Don't use vec_disp8 encoding with the .d32 suffix
[binutils-gdb.git] / gas / config / tc-i386.c
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2016 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifndef REGISTER_WARNINGS
37 #define REGISTER_WARNINGS 1
38 #endif
39
40 #ifndef INFER_ADDR_PREFIX
41 #define INFER_ADDR_PREFIX 1
42 #endif
43
44 #ifndef DEFAULT_ARCH
45 #define DEFAULT_ARCH "i386"
46 #endif
47
48 #ifndef INLINE
49 #if __GNUC__ >= 2
50 #define INLINE __inline__
51 #else
52 #define INLINE
53 #endif
54 #endif
55
56 /* Prefixes will be emitted in the order defined below.
57 WAIT_PREFIX must be the first prefix since FWAIT is really is an
58 instruction, and so must come before any prefixes.
59 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
60 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
61 #define WAIT_PREFIX 0
62 #define SEG_PREFIX 1
63 #define ADDR_PREFIX 2
64 #define DATA_PREFIX 3
65 #define REP_PREFIX 4
66 #define HLE_PREFIX REP_PREFIX
67 #define BND_PREFIX REP_PREFIX
68 #define LOCK_PREFIX 5
69 #define REX_PREFIX 6 /* must come last. */
70 #define MAX_PREFIXES 7 /* max prefixes per opcode */
71
72 /* we define the syntax here (modulo base,index,scale syntax) */
73 #define REGISTER_PREFIX '%'
74 #define IMMEDIATE_PREFIX '$'
75 #define ABSOLUTE_PREFIX '*'
76
77 /* these are the instruction mnemonic suffixes in AT&T syntax or
78 memory operand size in Intel syntax. */
79 #define WORD_MNEM_SUFFIX 'w'
80 #define BYTE_MNEM_SUFFIX 'b'
81 #define SHORT_MNEM_SUFFIX 's'
82 #define LONG_MNEM_SUFFIX 'l'
83 #define QWORD_MNEM_SUFFIX 'q'
84 #define XMMWORD_MNEM_SUFFIX 'x'
85 #define YMMWORD_MNEM_SUFFIX 'y'
86 #define ZMMWORD_MNEM_SUFFIX 'z'
87 /* Intel Syntax. Use a non-ascii letter since since it never appears
88 in instructions. */
89 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
90
91 #define END_OF_INSN '\0'
92
93 /*
94 'templates' is for grouping together 'template' structures for opcodes
95 of the same name. This is only used for storing the insns in the grand
96 ole hash table of insns.
97 The templates themselves start at START and range up to (but not including)
98 END.
99 */
100 typedef struct
101 {
102 const insn_template *start;
103 const insn_template *end;
104 }
105 templates;
106
107 /* 386 operand encoding bytes: see 386 book for details of this. */
108 typedef struct
109 {
110 unsigned int regmem; /* codes register or memory operand */
111 unsigned int reg; /* codes register operand (or extended opcode) */
112 unsigned int mode; /* how to interpret regmem & reg */
113 }
114 modrm_byte;
115
116 /* x86-64 extension prefix. */
117 typedef int rex_byte;
118
119 /* 386 opcode byte to code indirect addressing. */
120 typedef struct
121 {
122 unsigned base;
123 unsigned index;
124 unsigned scale;
125 }
126 sib_byte;
127
128 /* x86 arch names, types and features */
129 typedef struct
130 {
131 const char *name; /* arch name */
132 unsigned int len; /* arch string length */
133 enum processor_type type; /* arch type */
134 i386_cpu_flags flags; /* cpu feature flags */
135 unsigned int skip; /* show_arch should skip this. */
136 unsigned int negated; /* turn off indicated flags. */
137 }
138 arch_entry;
139
140 static void update_code_flag (int, int);
141 static void set_code_flag (int);
142 static void set_16bit_gcc_code_flag (int);
143 static void set_intel_syntax (int);
144 static void set_intel_mnemonic (int);
145 static void set_allow_index_reg (int);
146 static void set_check (int);
147 static void set_cpu_arch (int);
148 #ifdef TE_PE
149 static void pe_directive_secrel (int);
150 #endif
151 static void signed_cons (int);
152 static char *output_invalid (int c);
153 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
154 const char *);
155 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
156 const char *);
157 static int i386_att_operand (char *);
158 static int i386_intel_operand (char *, int);
159 static int i386_intel_simplify (expressionS *);
160 static int i386_intel_parse_name (const char *, expressionS *);
161 static const reg_entry *parse_register (char *, char **);
162 static char *parse_insn (char *, char *);
163 static char *parse_operands (char *, const char *);
164 static void swap_operands (void);
165 static void swap_2_operands (int, int);
166 static void optimize_imm (void);
167 static void optimize_disp (void);
168 static const insn_template *match_template (void);
169 static int check_string (void);
170 static int process_suffix (void);
171 static int check_byte_reg (void);
172 static int check_long_reg (void);
173 static int check_qword_reg (void);
174 static int check_word_reg (void);
175 static int finalize_imm (void);
176 static int process_operands (void);
177 static const seg_entry *build_modrm_byte (void);
178 static void output_insn (void);
179 static void output_imm (fragS *, offsetT);
180 static void output_disp (fragS *, offsetT);
181 #ifndef I386COFF
182 static void s_bss (int);
183 #endif
184 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
185 static void handle_large_common (int small ATTRIBUTE_UNUSED);
186 #endif
187
188 static const char *default_arch = DEFAULT_ARCH;
189
190 /* This struct describes rounding control and SAE in the instruction. */
191 struct RC_Operation
192 {
193 enum rc_type
194 {
195 rne = 0,
196 rd,
197 ru,
198 rz,
199 saeonly
200 } type;
201 int operand;
202 };
203
204 static struct RC_Operation rc_op;
205
206 /* The struct describes masking, applied to OPERAND in the instruction.
207 MASK is a pointer to the corresponding mask register. ZEROING tells
208 whether merging or zeroing mask is used. */
209 struct Mask_Operation
210 {
211 const reg_entry *mask;
212 unsigned int zeroing;
213 /* The operand where this operation is associated. */
214 int operand;
215 };
216
217 static struct Mask_Operation mask_op;
218
219 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
220 broadcast factor. */
221 struct Broadcast_Operation
222 {
223 /* Type of broadcast: no broadcast, {1to8}, or {1to16}. */
224 int type;
225
226 /* Index of broadcasted operand. */
227 int operand;
228 };
229
230 static struct Broadcast_Operation broadcast_op;
231
232 /* VEX prefix. */
233 typedef struct
234 {
235 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
236 unsigned char bytes[4];
237 unsigned int length;
238 /* Destination or source register specifier. */
239 const reg_entry *register_specifier;
240 } vex_prefix;
241
242 /* 'md_assemble ()' gathers together information and puts it into a
243 i386_insn. */
244
245 union i386_op
246 {
247 expressionS *disps;
248 expressionS *imms;
249 const reg_entry *regs;
250 };
251
252 enum i386_error
253 {
254 operand_size_mismatch,
255 operand_type_mismatch,
256 register_type_mismatch,
257 number_of_operands_mismatch,
258 invalid_instruction_suffix,
259 bad_imm4,
260 old_gcc_only,
261 unsupported_with_intel_mnemonic,
262 unsupported_syntax,
263 unsupported,
264 invalid_vsib_address,
265 invalid_vector_register_set,
266 unsupported_vector_index_register,
267 unsupported_broadcast,
268 broadcast_not_on_src_operand,
269 broadcast_needed,
270 unsupported_masking,
271 mask_not_on_destination,
272 no_default_mask,
273 unsupported_rc_sae,
274 rc_sae_operand_not_last_imm,
275 invalid_register_operand,
276 try_vector_disp8
277 };
278
279 struct _i386_insn
280 {
281 /* TM holds the template for the insn were currently assembling. */
282 insn_template tm;
283
284 /* SUFFIX holds the instruction size suffix for byte, word, dword
285 or qword, if given. */
286 char suffix;
287
288 /* OPERANDS gives the number of given operands. */
289 unsigned int operands;
290
291 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
292 of given register, displacement, memory operands and immediate
293 operands. */
294 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
295
296 /* TYPES [i] is the type (see above #defines) which tells us how to
297 use OP[i] for the corresponding operand. */
298 i386_operand_type types[MAX_OPERANDS];
299
300 /* Displacement expression, immediate expression, or register for each
301 operand. */
302 union i386_op op[MAX_OPERANDS];
303
304 /* Flags for operands. */
305 unsigned int flags[MAX_OPERANDS];
306 #define Operand_PCrel 1
307
308 /* Relocation type for operand */
309 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
310
311 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
312 the base index byte below. */
313 const reg_entry *base_reg;
314 const reg_entry *index_reg;
315 unsigned int log2_scale_factor;
316
317 /* SEG gives the seg_entries of this insn. They are zero unless
318 explicit segment overrides are given. */
319 const seg_entry *seg[2];
320
321 /* PREFIX holds all the given prefix opcodes (usually null).
322 PREFIXES is the number of prefix opcodes. */
323 unsigned int prefixes;
324 unsigned char prefix[MAX_PREFIXES];
325
326 /* RM and SIB are the modrm byte and the sib byte where the
327 addressing modes of this insn are encoded. */
328 modrm_byte rm;
329 rex_byte rex;
330 rex_byte vrex;
331 sib_byte sib;
332 vex_prefix vex;
333
334 /* Masking attributes. */
335 struct Mask_Operation *mask;
336
337 /* Rounding control and SAE attributes. */
338 struct RC_Operation *rounding;
339
340 /* Broadcasting attributes. */
341 struct Broadcast_Operation *broadcast;
342
343 /* Compressed disp8*N attribute. */
344 unsigned int memshift;
345
346 /* Swap operand in encoding. */
347 unsigned int swap_operand;
348
349 /* Prefer 8bit or 32bit displacement in encoding. */
350 enum
351 {
352 disp_encoding_default = 0,
353 disp_encoding_8bit,
354 disp_encoding_32bit
355 } disp_encoding;
356
357 /* REP prefix. */
358 const char *rep_prefix;
359
360 /* HLE prefix. */
361 const char *hle_prefix;
362
363 /* Have BND prefix. */
364 const char *bnd_prefix;
365
366 /* Need VREX to support upper 16 registers. */
367 int need_vrex;
368
369 /* Error message. */
370 enum i386_error error;
371 };
372
373 typedef struct _i386_insn i386_insn;
374
375 /* Link RC type with corresponding string, that'll be looked for in
376 asm. */
377 struct RC_name
378 {
379 enum rc_type type;
380 const char *name;
381 unsigned int len;
382 };
383
384 static const struct RC_name RC_NamesTable[] =
385 {
386 { rne, STRING_COMMA_LEN ("rn-sae") },
387 { rd, STRING_COMMA_LEN ("rd-sae") },
388 { ru, STRING_COMMA_LEN ("ru-sae") },
389 { rz, STRING_COMMA_LEN ("rz-sae") },
390 { saeonly, STRING_COMMA_LEN ("sae") },
391 };
392
393 /* List of chars besides those in app.c:symbol_chars that can start an
394 operand. Used to prevent the scrubber eating vital white-space. */
395 const char extra_symbol_chars[] = "*%-([{"
396 #ifdef LEX_AT
397 "@"
398 #endif
399 #ifdef LEX_QM
400 "?"
401 #endif
402 ;
403
404 #if (defined (TE_I386AIX) \
405 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
406 && !defined (TE_GNU) \
407 && !defined (TE_LINUX) \
408 && !defined (TE_NACL) \
409 && !defined (TE_NETWARE) \
410 && !defined (TE_FreeBSD) \
411 && !defined (TE_DragonFly) \
412 && !defined (TE_NetBSD)))
413 /* This array holds the chars that always start a comment. If the
414 pre-processor is disabled, these aren't very useful. The option
415 --divide will remove '/' from this list. */
416 const char *i386_comment_chars = "#/";
417 #define SVR4_COMMENT_CHARS 1
418 #define PREFIX_SEPARATOR '\\'
419
420 #else
421 const char *i386_comment_chars = "#";
422 #define PREFIX_SEPARATOR '/'
423 #endif
424
425 /* This array holds the chars that only start a comment at the beginning of
426 a line. If the line seems to have the form '# 123 filename'
427 .line and .file directives will appear in the pre-processed output.
428 Note that input_file.c hand checks for '#' at the beginning of the
429 first line of the input file. This is because the compiler outputs
430 #NO_APP at the beginning of its output.
431 Also note that comments started like this one will always work if
432 '/' isn't otherwise defined. */
433 const char line_comment_chars[] = "#/";
434
435 const char line_separator_chars[] = ";";
436
437 /* Chars that can be used to separate mant from exp in floating point
438 nums. */
439 const char EXP_CHARS[] = "eE";
440
441 /* Chars that mean this number is a floating point constant
442 As in 0f12.456
443 or 0d1.2345e12. */
444 const char FLT_CHARS[] = "fFdDxX";
445
446 /* Tables for lexical analysis. */
447 static char mnemonic_chars[256];
448 static char register_chars[256];
449 static char operand_chars[256];
450 static char identifier_chars[256];
451 static char digit_chars[256];
452
453 /* Lexical macros. */
454 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
455 #define is_operand_char(x) (operand_chars[(unsigned char) x])
456 #define is_register_char(x) (register_chars[(unsigned char) x])
457 #define is_space_char(x) ((x) == ' ')
458 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
459 #define is_digit_char(x) (digit_chars[(unsigned char) x])
460
461 /* All non-digit non-letter characters that may occur in an operand. */
462 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
463
464 /* md_assemble() always leaves the strings it's passed unaltered. To
465 effect this we maintain a stack of saved characters that we've smashed
466 with '\0's (indicating end of strings for various sub-fields of the
467 assembler instruction). */
468 static char save_stack[32];
469 static char *save_stack_p;
470 #define END_STRING_AND_SAVE(s) \
471 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
472 #define RESTORE_END_STRING(s) \
473 do { *(s) = *--save_stack_p; } while (0)
474
475 /* The instruction we're assembling. */
476 static i386_insn i;
477
478 /* Possible templates for current insn. */
479 static const templates *current_templates;
480
481 /* Per instruction expressionS buffers: max displacements & immediates. */
482 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
483 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
484
485 /* Current operand we are working on. */
486 static int this_operand = -1;
487
488 /* We support four different modes. FLAG_CODE variable is used to distinguish
489 these. */
490
491 enum flag_code {
492 CODE_32BIT,
493 CODE_16BIT,
494 CODE_64BIT };
495
496 static enum flag_code flag_code;
497 static unsigned int object_64bit;
498 static unsigned int disallow_64bit_reloc;
499 static int use_rela_relocations = 0;
500
501 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
502 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
503 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
504
505 /* The ELF ABI to use. */
506 enum x86_elf_abi
507 {
508 I386_ABI,
509 X86_64_ABI,
510 X86_64_X32_ABI
511 };
512
513 static enum x86_elf_abi x86_elf_abi = I386_ABI;
514 #endif
515
516 #if defined (TE_PE) || defined (TE_PEP)
517 /* Use big object file format. */
518 static int use_big_obj = 0;
519 #endif
520
521 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
522 /* 1 if generating code for a shared library. */
523 static int shared = 0;
524 #endif
525
526 /* 1 for intel syntax,
527 0 if att syntax. */
528 static int intel_syntax = 0;
529
530 /* 1 for intel mnemonic,
531 0 if att mnemonic. */
532 static int intel_mnemonic = !SYSV386_COMPAT;
533
534 /* 1 if support old (<= 2.8.1) versions of gcc. */
535 static int old_gcc = OLDGCC_COMPAT;
536
537 /* 1 if pseudo registers are permitted. */
538 static int allow_pseudo_reg = 0;
539
540 /* 1 if register prefix % not required. */
541 static int allow_naked_reg = 0;
542
543 /* 1 if the assembler should add BND prefix for all control-tranferring
544 instructions supporting it, even if this prefix wasn't specified
545 explicitly. */
546 static int add_bnd_prefix = 0;
547
548 /* 1 if pseudo index register, eiz/riz, is allowed . */
549 static int allow_index_reg = 0;
550
551 /* 1 if the assembler should ignore LOCK prefix, even if it was
552 specified explicitly. */
553 static int omit_lock_prefix = 0;
554
555 /* 1 if the assembler should encode lfence, mfence, and sfence as
556 "lock addl $0, (%{re}sp)". */
557 static int avoid_fence = 0;
558
559 /* 1 if the assembler should generate relax relocations. */
560
561 static int generate_relax_relocations
562 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
563
564 static enum check_kind
565 {
566 check_none = 0,
567 check_warning,
568 check_error
569 }
570 sse_check, operand_check = check_warning;
571
572 /* Register prefix used for error message. */
573 static const char *register_prefix = "%";
574
575 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
576 leave, push, and pop instructions so that gcc has the same stack
577 frame as in 32 bit mode. */
578 static char stackop_size = '\0';
579
580 /* Non-zero to optimize code alignment. */
581 int optimize_align_code = 1;
582
583 /* Non-zero to quieten some warnings. */
584 static int quiet_warnings = 0;
585
586 /* CPU name. */
587 static const char *cpu_arch_name = NULL;
588 static char *cpu_sub_arch_name = NULL;
589
590 /* CPU feature flags. */
591 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
592
593 /* If we have selected a cpu we are generating instructions for. */
594 static int cpu_arch_tune_set = 0;
595
596 /* Cpu we are generating instructions for. */
597 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
598
599 /* CPU feature flags of cpu we are generating instructions for. */
600 static i386_cpu_flags cpu_arch_tune_flags;
601
602 /* CPU instruction set architecture used. */
603 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
604
605 /* CPU feature flags of instruction set architecture used. */
606 i386_cpu_flags cpu_arch_isa_flags;
607
608 /* If set, conditional jumps are not automatically promoted to handle
609 larger than a byte offset. */
610 static unsigned int no_cond_jump_promotion = 0;
611
612 /* Encode SSE instructions with VEX prefix. */
613 static unsigned int sse2avx;
614
615 /* Encode scalar AVX instructions with specific vector length. */
616 static enum
617 {
618 vex128 = 0,
619 vex256
620 } avxscalar;
621
622 /* Encode scalar EVEX LIG instructions with specific vector length. */
623 static enum
624 {
625 evexl128 = 0,
626 evexl256,
627 evexl512
628 } evexlig;
629
630 /* Encode EVEX WIG instructions with specific evex.w. */
631 static enum
632 {
633 evexw0 = 0,
634 evexw1
635 } evexwig;
636
637 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
638 static enum rc_type evexrcig = rne;
639
640 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
641 static symbolS *GOT_symbol;
642
643 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
644 unsigned int x86_dwarf2_return_column;
645
646 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
647 int x86_cie_data_alignment;
648
649 /* Interface to relax_segment.
650 There are 3 major relax states for 386 jump insns because the
651 different types of jumps add different sizes to frags when we're
652 figuring out what sort of jump to choose to reach a given label. */
653
654 /* Types. */
655 #define UNCOND_JUMP 0
656 #define COND_JUMP 1
657 #define COND_JUMP86 2
658
659 /* Sizes. */
660 #define CODE16 1
661 #define SMALL 0
662 #define SMALL16 (SMALL | CODE16)
663 #define BIG 2
664 #define BIG16 (BIG | CODE16)
665
666 #ifndef INLINE
667 #ifdef __GNUC__
668 #define INLINE __inline__
669 #else
670 #define INLINE
671 #endif
672 #endif
673
674 #define ENCODE_RELAX_STATE(type, size) \
675 ((relax_substateT) (((type) << 2) | (size)))
676 #define TYPE_FROM_RELAX_STATE(s) \
677 ((s) >> 2)
678 #define DISP_SIZE_FROM_RELAX_STATE(s) \
679 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
680
681 /* This table is used by relax_frag to promote short jumps to long
682 ones where necessary. SMALL (short) jumps may be promoted to BIG
683 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
684 don't allow a short jump in a 32 bit code segment to be promoted to
685 a 16 bit offset jump because it's slower (requires data size
686 prefix), and doesn't work, unless the destination is in the bottom
687 64k of the code segment (The top 16 bits of eip are zeroed). */
688
689 const relax_typeS md_relax_table[] =
690 {
691 /* The fields are:
692 1) most positive reach of this state,
693 2) most negative reach of this state,
694 3) how many bytes this mode will have in the variable part of the frag
695 4) which index into the table to try if we can't fit into this one. */
696
697 /* UNCOND_JUMP states. */
698 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
699 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
700 /* dword jmp adds 4 bytes to frag:
701 0 extra opcode bytes, 4 displacement bytes. */
702 {0, 0, 4, 0},
703 /* word jmp adds 2 byte2 to frag:
704 0 extra opcode bytes, 2 displacement bytes. */
705 {0, 0, 2, 0},
706
707 /* COND_JUMP states. */
708 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
709 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
710 /* dword conditionals adds 5 bytes to frag:
711 1 extra opcode byte, 4 displacement bytes. */
712 {0, 0, 5, 0},
713 /* word conditionals add 3 bytes to frag:
714 1 extra opcode byte, 2 displacement bytes. */
715 {0, 0, 3, 0},
716
717 /* COND_JUMP86 states. */
718 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
719 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
720 /* dword conditionals adds 5 bytes to frag:
721 1 extra opcode byte, 4 displacement bytes. */
722 {0, 0, 5, 0},
723 /* word conditionals add 4 bytes to frag:
724 1 displacement byte and a 3 byte long branch insn. */
725 {0, 0, 4, 0}
726 };
727
728 static const arch_entry cpu_arch[] =
729 {
730 /* Do not replace the first two entries - i386_target_format()
731 relies on them being there in this order. */
732 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
733 CPU_GENERIC32_FLAGS, 0, 0 },
734 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
735 CPU_GENERIC64_FLAGS, 0, 0 },
736 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
737 CPU_NONE_FLAGS, 0, 0 },
738 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
739 CPU_I186_FLAGS, 0, 0 },
740 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
741 CPU_I286_FLAGS, 0, 0 },
742 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
743 CPU_I386_FLAGS, 0, 0 },
744 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
745 CPU_I486_FLAGS, 0, 0 },
746 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
747 CPU_I586_FLAGS, 0, 0 },
748 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
749 CPU_I686_FLAGS, 0, 0 },
750 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
751 CPU_I586_FLAGS, 0, 0 },
752 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
753 CPU_PENTIUMPRO_FLAGS, 0, 0 },
754 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
755 CPU_P2_FLAGS, 0, 0 },
756 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
757 CPU_P3_FLAGS, 0, 0 },
758 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
759 CPU_P4_FLAGS, 0, 0 },
760 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
761 CPU_CORE_FLAGS, 0, 0 },
762 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
763 CPU_NOCONA_FLAGS, 0, 0 },
764 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
765 CPU_CORE_FLAGS, 1, 0 },
766 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
767 CPU_CORE_FLAGS, 0, 0 },
768 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
769 CPU_CORE2_FLAGS, 1, 0 },
770 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
771 CPU_CORE2_FLAGS, 0, 0 },
772 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
773 CPU_COREI7_FLAGS, 0, 0 },
774 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
775 CPU_L1OM_FLAGS, 0, 0 },
776 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
777 CPU_K1OM_FLAGS, 0, 0 },
778 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
779 CPU_IAMCU_FLAGS, 0, 0 },
780 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
781 CPU_K6_FLAGS, 0, 0 },
782 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
783 CPU_K6_2_FLAGS, 0, 0 },
784 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
785 CPU_ATHLON_FLAGS, 0, 0 },
786 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
787 CPU_K8_FLAGS, 1, 0 },
788 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
789 CPU_K8_FLAGS, 0, 0 },
790 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
791 CPU_K8_FLAGS, 0, 0 },
792 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
793 CPU_AMDFAM10_FLAGS, 0, 0 },
794 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
795 CPU_BDVER1_FLAGS, 0, 0 },
796 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
797 CPU_BDVER2_FLAGS, 0, 0 },
798 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
799 CPU_BDVER3_FLAGS, 0, 0 },
800 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
801 CPU_BDVER4_FLAGS, 0, 0 },
802 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
803 CPU_ZNVER1_FLAGS, 0, 0 },
804 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
805 CPU_BTVER1_FLAGS, 0, 0 },
806 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
807 CPU_BTVER2_FLAGS, 0, 0 },
808 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
809 CPU_8087_FLAGS, 0, 0 },
810 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
811 CPU_287_FLAGS, 0, 0 },
812 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
813 CPU_387_FLAGS, 0, 0 },
814 { STRING_COMMA_LEN (".no87"), PROCESSOR_UNKNOWN,
815 CPU_ANY87_FLAGS, 0, 1 },
816 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
817 CPU_MMX_FLAGS, 0, 0 },
818 { STRING_COMMA_LEN (".nommx"), PROCESSOR_UNKNOWN,
819 CPU_3DNOWA_FLAGS, 0, 1 },
820 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
821 CPU_SSE_FLAGS, 0, 0 },
822 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
823 CPU_SSE2_FLAGS, 0, 0 },
824 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
825 CPU_SSE3_FLAGS, 0, 0 },
826 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
827 CPU_SSSE3_FLAGS, 0, 0 },
828 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
829 CPU_SSE4_1_FLAGS, 0, 0 },
830 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
831 CPU_SSE4_2_FLAGS, 0, 0 },
832 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
833 CPU_SSE4_2_FLAGS, 0, 0 },
834 { STRING_COMMA_LEN (".nosse"), PROCESSOR_UNKNOWN,
835 CPU_ANY_SSE_FLAGS, 0, 1 },
836 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
837 CPU_AVX_FLAGS, 0, 0 },
838 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
839 CPU_AVX2_FLAGS, 0, 0 },
840 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
841 CPU_AVX512F_FLAGS, 0, 0 },
842 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
843 CPU_AVX512CD_FLAGS, 0, 0 },
844 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
845 CPU_AVX512ER_FLAGS, 0, 0 },
846 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
847 CPU_AVX512PF_FLAGS, 0, 0 },
848 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
849 CPU_AVX512DQ_FLAGS, 0, 0 },
850 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
851 CPU_AVX512BW_FLAGS, 0, 0 },
852 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
853 CPU_AVX512VL_FLAGS, 0, 0 },
854 { STRING_COMMA_LEN (".noavx"), PROCESSOR_UNKNOWN,
855 CPU_ANY_AVX_FLAGS, 0, 1 },
856 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
857 CPU_VMX_FLAGS, 0, 0 },
858 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
859 CPU_VMFUNC_FLAGS, 0, 0 },
860 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
861 CPU_SMX_FLAGS, 0, 0 },
862 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
863 CPU_XSAVE_FLAGS, 0, 0 },
864 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
865 CPU_XSAVEOPT_FLAGS, 0, 0 },
866 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
867 CPU_XSAVEC_FLAGS, 0, 0 },
868 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
869 CPU_XSAVES_FLAGS, 0, 0 },
870 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
871 CPU_AES_FLAGS, 0, 0 },
872 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
873 CPU_PCLMUL_FLAGS, 0, 0 },
874 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
875 CPU_PCLMUL_FLAGS, 1, 0 },
876 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
877 CPU_FSGSBASE_FLAGS, 0, 0 },
878 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
879 CPU_RDRND_FLAGS, 0, 0 },
880 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
881 CPU_F16C_FLAGS, 0, 0 },
882 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
883 CPU_BMI2_FLAGS, 0, 0 },
884 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
885 CPU_FMA_FLAGS, 0, 0 },
886 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
887 CPU_FMA4_FLAGS, 0, 0 },
888 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
889 CPU_XOP_FLAGS, 0, 0 },
890 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
891 CPU_LWP_FLAGS, 0, 0 },
892 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
893 CPU_MOVBE_FLAGS, 0, 0 },
894 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
895 CPU_CX16_FLAGS, 0, 0 },
896 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
897 CPU_EPT_FLAGS, 0, 0 },
898 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
899 CPU_LZCNT_FLAGS, 0, 0 },
900 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
901 CPU_HLE_FLAGS, 0, 0 },
902 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
903 CPU_RTM_FLAGS, 0, 0 },
904 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
905 CPU_INVPCID_FLAGS, 0, 0 },
906 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
907 CPU_CLFLUSH_FLAGS, 0, 0 },
908 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
909 CPU_NOP_FLAGS, 0, 0 },
910 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
911 CPU_SYSCALL_FLAGS, 0, 0 },
912 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
913 CPU_RDTSCP_FLAGS, 0, 0 },
914 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
915 CPU_3DNOW_FLAGS, 0, 0 },
916 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
917 CPU_3DNOWA_FLAGS, 0, 0 },
918 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
919 CPU_PADLOCK_FLAGS, 0, 0 },
920 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
921 CPU_SVME_FLAGS, 1, 0 },
922 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
923 CPU_SVME_FLAGS, 0, 0 },
924 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
925 CPU_SSE4A_FLAGS, 0, 0 },
926 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
927 CPU_ABM_FLAGS, 0, 0 },
928 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
929 CPU_BMI_FLAGS, 0, 0 },
930 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
931 CPU_TBM_FLAGS, 0, 0 },
932 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
933 CPU_ADX_FLAGS, 0, 0 },
934 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
935 CPU_RDSEED_FLAGS, 0, 0 },
936 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
937 CPU_PRFCHW_FLAGS, 0, 0 },
938 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
939 CPU_SMAP_FLAGS, 0, 0 },
940 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
941 CPU_MPX_FLAGS, 0, 0 },
942 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
943 CPU_SHA_FLAGS, 0, 0 },
944 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
945 CPU_CLFLUSHOPT_FLAGS, 0, 0 },
946 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
947 CPU_PREFETCHWT1_FLAGS, 0, 0 },
948 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
949 CPU_SE1_FLAGS, 0, 0 },
950 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
951 CPU_CLWB_FLAGS, 0, 0 },
952 { STRING_COMMA_LEN (".pcommit"), PROCESSOR_UNKNOWN,
953 CPU_PCOMMIT_FLAGS, 0, 0 },
954 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
955 CPU_AVX512IFMA_FLAGS, 0, 0 },
956 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
957 CPU_AVX512VBMI_FLAGS, 0, 0 },
958 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
959 CPU_CLZERO_FLAGS, 0, 0 },
960 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
961 CPU_MWAITX_FLAGS, 0, 0 },
962 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
963 CPU_OSPKE_FLAGS, 0, 0 },
964 };
965
966 #ifdef I386COFF
967 /* Like s_lcomm_internal in gas/read.c but the alignment string
968 is allowed to be optional. */
969
970 static symbolS *
971 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
972 {
973 addressT align = 0;
974
975 SKIP_WHITESPACE ();
976
977 if (needs_align
978 && *input_line_pointer == ',')
979 {
980 align = parse_align (needs_align - 1);
981
982 if (align == (addressT) -1)
983 return NULL;
984 }
985 else
986 {
987 if (size >= 8)
988 align = 3;
989 else if (size >= 4)
990 align = 2;
991 else if (size >= 2)
992 align = 1;
993 else
994 align = 0;
995 }
996
997 bss_alloc (symbolP, size, align);
998 return symbolP;
999 }
1000
1001 static void
1002 pe_lcomm (int needs_align)
1003 {
1004 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1005 }
1006 #endif
1007
1008 const pseudo_typeS md_pseudo_table[] =
1009 {
1010 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1011 {"align", s_align_bytes, 0},
1012 #else
1013 {"align", s_align_ptwo, 0},
1014 #endif
1015 {"arch", set_cpu_arch, 0},
1016 #ifndef I386COFF
1017 {"bss", s_bss, 0},
1018 #else
1019 {"lcomm", pe_lcomm, 1},
1020 #endif
1021 {"ffloat", float_cons, 'f'},
1022 {"dfloat", float_cons, 'd'},
1023 {"tfloat", float_cons, 'x'},
1024 {"value", cons, 2},
1025 {"slong", signed_cons, 4},
1026 {"noopt", s_ignore, 0},
1027 {"optim", s_ignore, 0},
1028 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1029 {"code16", set_code_flag, CODE_16BIT},
1030 {"code32", set_code_flag, CODE_32BIT},
1031 {"code64", set_code_flag, CODE_64BIT},
1032 {"intel_syntax", set_intel_syntax, 1},
1033 {"att_syntax", set_intel_syntax, 0},
1034 {"intel_mnemonic", set_intel_mnemonic, 1},
1035 {"att_mnemonic", set_intel_mnemonic, 0},
1036 {"allow_index_reg", set_allow_index_reg, 1},
1037 {"disallow_index_reg", set_allow_index_reg, 0},
1038 {"sse_check", set_check, 0},
1039 {"operand_check", set_check, 1},
1040 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1041 {"largecomm", handle_large_common, 0},
1042 #else
1043 {"file", (void (*) (int)) dwarf2_directive_file, 0},
1044 {"loc", dwarf2_directive_loc, 0},
1045 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1046 #endif
1047 #ifdef TE_PE
1048 {"secrel32", pe_directive_secrel, 0},
1049 #endif
1050 {0, 0, 0}
1051 };
1052
1053 /* For interface with expression (). */
1054 extern char *input_line_pointer;
1055
1056 /* Hash table for instruction mnemonic lookup. */
1057 static struct hash_control *op_hash;
1058
1059 /* Hash table for register lookup. */
1060 static struct hash_control *reg_hash;
1061 \f
1062 void
1063 i386_align_code (fragS *fragP, int count)
1064 {
1065 /* Various efficient no-op patterns for aligning code labels.
1066 Note: Don't try to assemble the instructions in the comments.
1067 0L and 0w are not legal. */
1068 static const unsigned char f32_1[] =
1069 {0x90}; /* nop */
1070 static const unsigned char f32_2[] =
1071 {0x66,0x90}; /* xchg %ax,%ax */
1072 static const unsigned char f32_3[] =
1073 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1074 static const unsigned char f32_4[] =
1075 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1076 static const unsigned char f32_5[] =
1077 {0x90, /* nop */
1078 0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1079 static const unsigned char f32_6[] =
1080 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1081 static const unsigned char f32_7[] =
1082 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1083 static const unsigned char f32_8[] =
1084 {0x90, /* nop */
1085 0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1086 static const unsigned char f32_9[] =
1087 {0x89,0xf6, /* movl %esi,%esi */
1088 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
1089 static const unsigned char f32_10[] =
1090 {0x8d,0x76,0x00, /* leal 0(%esi),%esi */
1091 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
1092 static const unsigned char f32_11[] =
1093 {0x8d,0x74,0x26,0x00, /* leal 0(%esi,1),%esi */
1094 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
1095 static const unsigned char f32_12[] =
1096 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
1097 0x8d,0xbf,0x00,0x00,0x00,0x00}; /* leal 0L(%edi),%edi */
1098 static const unsigned char f32_13[] =
1099 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
1100 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
1101 static const unsigned char f32_14[] =
1102 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00, /* leal 0L(%esi,1),%esi */
1103 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
1104 static const unsigned char f16_3[] =
1105 {0x8d,0x74,0x00}; /* lea 0(%esi),%esi */
1106 static const unsigned char f16_4[] =
1107 {0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
1108 static const unsigned char f16_5[] =
1109 {0x90, /* nop */
1110 0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
1111 static const unsigned char f16_6[] =
1112 {0x89,0xf6, /* mov %si,%si */
1113 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
1114 static const unsigned char f16_7[] =
1115 {0x8d,0x74,0x00, /* lea 0(%si),%si */
1116 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
1117 static const unsigned char f16_8[] =
1118 {0x8d,0xb4,0x00,0x00, /* lea 0w(%si),%si */
1119 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
1120 static const unsigned char jump_31[] =
1121 {0xeb,0x1d,0x90,0x90,0x90,0x90,0x90, /* jmp .+31; lotsa nops */
1122 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90,
1123 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90,
1124 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90};
1125 static const unsigned char *const f32_patt[] = {
1126 f32_1, f32_2, f32_3, f32_4, f32_5, f32_6, f32_7, f32_8,
1127 f32_9, f32_10, f32_11, f32_12, f32_13, f32_14
1128 };
1129 static const unsigned char *const f16_patt[] = {
1130 f32_1, f32_2, f16_3, f16_4, f16_5, f16_6, f16_7, f16_8
1131 };
1132 /* nopl (%[re]ax) */
1133 static const unsigned char alt_3[] =
1134 {0x0f,0x1f,0x00};
1135 /* nopl 0(%[re]ax) */
1136 static const unsigned char alt_4[] =
1137 {0x0f,0x1f,0x40,0x00};
1138 /* nopl 0(%[re]ax,%[re]ax,1) */
1139 static const unsigned char alt_5[] =
1140 {0x0f,0x1f,0x44,0x00,0x00};
1141 /* nopw 0(%[re]ax,%[re]ax,1) */
1142 static const unsigned char alt_6[] =
1143 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1144 /* nopl 0L(%[re]ax) */
1145 static const unsigned char alt_7[] =
1146 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1147 /* nopl 0L(%[re]ax,%[re]ax,1) */
1148 static const unsigned char alt_8[] =
1149 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1150 /* nopw 0L(%[re]ax,%[re]ax,1) */
1151 static const unsigned char alt_9[] =
1152 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1153 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1154 static const unsigned char alt_10[] =
1155 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1156 static const unsigned char *const alt_patt[] = {
1157 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1158 alt_9, alt_10
1159 };
1160
1161 /* Only align for at least a positive non-zero boundary. */
1162 if (count <= 0 || count > MAX_MEM_FOR_RS_ALIGN_CODE)
1163 return;
1164
1165 /* We need to decide which NOP sequence to use for 32bit and
1166 64bit. When -mtune= is used:
1167
1168 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1169 PROCESSOR_GENERIC32, f32_patt will be used.
1170 2. For the rest, alt_patt will be used.
1171
1172 When -mtune= isn't used, alt_patt will be used if
1173 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1174 be used.
1175
1176 When -march= or .arch is used, we can't use anything beyond
1177 cpu_arch_isa_flags. */
1178
1179 if (flag_code == CODE_16BIT)
1180 {
1181 if (count > 8)
1182 {
1183 memcpy (fragP->fr_literal + fragP->fr_fix,
1184 jump_31, count);
1185 /* Adjust jump offset. */
1186 fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
1187 }
1188 else
1189 memcpy (fragP->fr_literal + fragP->fr_fix,
1190 f16_patt[count - 1], count);
1191 }
1192 else
1193 {
1194 const unsigned char *const *patt = NULL;
1195
1196 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1197 {
1198 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1199 switch (cpu_arch_tune)
1200 {
1201 case PROCESSOR_UNKNOWN:
1202 /* We use cpu_arch_isa_flags to check if we SHOULD
1203 optimize with nops. */
1204 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1205 patt = alt_patt;
1206 else
1207 patt = f32_patt;
1208 break;
1209 case PROCESSOR_PENTIUM4:
1210 case PROCESSOR_NOCONA:
1211 case PROCESSOR_CORE:
1212 case PROCESSOR_CORE2:
1213 case PROCESSOR_COREI7:
1214 case PROCESSOR_L1OM:
1215 case PROCESSOR_K1OM:
1216 case PROCESSOR_GENERIC64:
1217 case PROCESSOR_K6:
1218 case PROCESSOR_ATHLON:
1219 case PROCESSOR_K8:
1220 case PROCESSOR_AMDFAM10:
1221 case PROCESSOR_BD:
1222 case PROCESSOR_ZNVER:
1223 case PROCESSOR_BT:
1224 patt = alt_patt;
1225 break;
1226 case PROCESSOR_I386:
1227 case PROCESSOR_I486:
1228 case PROCESSOR_PENTIUM:
1229 case PROCESSOR_PENTIUMPRO:
1230 case PROCESSOR_IAMCU:
1231 case PROCESSOR_GENERIC32:
1232 patt = f32_patt;
1233 break;
1234 }
1235 }
1236 else
1237 {
1238 switch (fragP->tc_frag_data.tune)
1239 {
1240 case PROCESSOR_UNKNOWN:
1241 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1242 PROCESSOR_UNKNOWN. */
1243 abort ();
1244 break;
1245
1246 case PROCESSOR_I386:
1247 case PROCESSOR_I486:
1248 case PROCESSOR_PENTIUM:
1249 case PROCESSOR_IAMCU:
1250 case PROCESSOR_K6:
1251 case PROCESSOR_ATHLON:
1252 case PROCESSOR_K8:
1253 case PROCESSOR_AMDFAM10:
1254 case PROCESSOR_BD:
1255 case PROCESSOR_ZNVER:
1256 case PROCESSOR_BT:
1257 case PROCESSOR_GENERIC32:
1258 /* We use cpu_arch_isa_flags to check if we CAN optimize
1259 with nops. */
1260 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1261 patt = alt_patt;
1262 else
1263 patt = f32_patt;
1264 break;
1265 case PROCESSOR_PENTIUMPRO:
1266 case PROCESSOR_PENTIUM4:
1267 case PROCESSOR_NOCONA:
1268 case PROCESSOR_CORE:
1269 case PROCESSOR_CORE2:
1270 case PROCESSOR_COREI7:
1271 case PROCESSOR_L1OM:
1272 case PROCESSOR_K1OM:
1273 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1274 patt = alt_patt;
1275 else
1276 patt = f32_patt;
1277 break;
1278 case PROCESSOR_GENERIC64:
1279 patt = alt_patt;
1280 break;
1281 }
1282 }
1283
1284 if (patt == f32_patt)
1285 {
1286 /* If the padding is less than 15 bytes, we use the normal
1287 ones. Otherwise, we use a jump instruction and adjust
1288 its offset. */
1289 int limit;
1290
1291 /* For 64bit, the limit is 3 bytes. */
1292 if (flag_code == CODE_64BIT
1293 && fragP->tc_frag_data.isa_flags.bitfield.cpulm)
1294 limit = 3;
1295 else
1296 limit = 15;
1297 if (count < limit)
1298 memcpy (fragP->fr_literal + fragP->fr_fix,
1299 patt[count - 1], count);
1300 else
1301 {
1302 memcpy (fragP->fr_literal + fragP->fr_fix,
1303 jump_31, count);
1304 /* Adjust jump offset. */
1305 fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
1306 }
1307 }
1308 else
1309 {
1310 /* Maximum length of an instruction is 10 byte. If the
1311 padding is greater than 10 bytes and we don't use jump,
1312 we have to break it into smaller pieces. */
1313 int padding = count;
1314 while (padding > 10)
1315 {
1316 padding -= 10;
1317 memcpy (fragP->fr_literal + fragP->fr_fix + padding,
1318 patt [9], 10);
1319 }
1320
1321 if (padding)
1322 memcpy (fragP->fr_literal + fragP->fr_fix,
1323 patt [padding - 1], padding);
1324 }
1325 }
1326 fragP->fr_var = count;
1327 }
1328
1329 static INLINE int
1330 operand_type_all_zero (const union i386_operand_type *x)
1331 {
1332 switch (ARRAY_SIZE(x->array))
1333 {
1334 case 3:
1335 if (x->array[2])
1336 return 0;
1337 case 2:
1338 if (x->array[1])
1339 return 0;
1340 case 1:
1341 return !x->array[0];
1342 default:
1343 abort ();
1344 }
1345 }
1346
1347 static INLINE void
1348 operand_type_set (union i386_operand_type *x, unsigned int v)
1349 {
1350 switch (ARRAY_SIZE(x->array))
1351 {
1352 case 3:
1353 x->array[2] = v;
1354 case 2:
1355 x->array[1] = v;
1356 case 1:
1357 x->array[0] = v;
1358 break;
1359 default:
1360 abort ();
1361 }
1362 }
1363
1364 static INLINE int
1365 operand_type_equal (const union i386_operand_type *x,
1366 const union i386_operand_type *y)
1367 {
1368 switch (ARRAY_SIZE(x->array))
1369 {
1370 case 3:
1371 if (x->array[2] != y->array[2])
1372 return 0;
1373 case 2:
1374 if (x->array[1] != y->array[1])
1375 return 0;
1376 case 1:
1377 return x->array[0] == y->array[0];
1378 break;
1379 default:
1380 abort ();
1381 }
1382 }
1383
1384 static INLINE int
1385 cpu_flags_all_zero (const union i386_cpu_flags *x)
1386 {
1387 switch (ARRAY_SIZE(x->array))
1388 {
1389 case 3:
1390 if (x->array[2])
1391 return 0;
1392 case 2:
1393 if (x->array[1])
1394 return 0;
1395 case 1:
1396 return !x->array[0];
1397 default:
1398 abort ();
1399 }
1400 }
1401
1402 static INLINE int
1403 cpu_flags_equal (const union i386_cpu_flags *x,
1404 const union i386_cpu_flags *y)
1405 {
1406 switch (ARRAY_SIZE(x->array))
1407 {
1408 case 3:
1409 if (x->array[2] != y->array[2])
1410 return 0;
1411 case 2:
1412 if (x->array[1] != y->array[1])
1413 return 0;
1414 case 1:
1415 return x->array[0] == y->array[0];
1416 break;
1417 default:
1418 abort ();
1419 }
1420 }
1421
1422 static INLINE int
1423 cpu_flags_check_cpu64 (i386_cpu_flags f)
1424 {
1425 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1426 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1427 }
1428
1429 static INLINE i386_cpu_flags
1430 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1431 {
1432 switch (ARRAY_SIZE (x.array))
1433 {
1434 case 3:
1435 x.array [2] &= y.array [2];
1436 case 2:
1437 x.array [1] &= y.array [1];
1438 case 1:
1439 x.array [0] &= y.array [0];
1440 break;
1441 default:
1442 abort ();
1443 }
1444 return x;
1445 }
1446
1447 static INLINE i386_cpu_flags
1448 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1449 {
1450 switch (ARRAY_SIZE (x.array))
1451 {
1452 case 3:
1453 x.array [2] |= y.array [2];
1454 case 2:
1455 x.array [1] |= y.array [1];
1456 case 1:
1457 x.array [0] |= y.array [0];
1458 break;
1459 default:
1460 abort ();
1461 }
1462 return x;
1463 }
1464
1465 static INLINE i386_cpu_flags
1466 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1467 {
1468 switch (ARRAY_SIZE (x.array))
1469 {
1470 case 3:
1471 x.array [2] &= ~y.array [2];
1472 case 2:
1473 x.array [1] &= ~y.array [1];
1474 case 1:
1475 x.array [0] &= ~y.array [0];
1476 break;
1477 default:
1478 abort ();
1479 }
1480 return x;
1481 }
1482
1483 static int
1484 valid_iamcu_cpu_flags (const i386_cpu_flags *flags)
1485 {
1486 if (cpu_arch_isa == PROCESSOR_IAMCU)
1487 {
1488 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_COMPAT_FLAGS;
1489 i386_cpu_flags compat_flags;
1490 compat_flags = cpu_flags_and_not (*flags, iamcu_flags);
1491 return cpu_flags_all_zero (&compat_flags);
1492 }
1493 else
1494 return 1;
1495 }
1496
1497 #define CPU_FLAGS_ARCH_MATCH 0x1
1498 #define CPU_FLAGS_64BIT_MATCH 0x2
1499 #define CPU_FLAGS_AES_MATCH 0x4
1500 #define CPU_FLAGS_PCLMUL_MATCH 0x8
1501 #define CPU_FLAGS_AVX_MATCH 0x10
1502
1503 #define CPU_FLAGS_32BIT_MATCH \
1504 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_AES_MATCH \
1505 | CPU_FLAGS_PCLMUL_MATCH | CPU_FLAGS_AVX_MATCH)
1506 #define CPU_FLAGS_PERFECT_MATCH \
1507 (CPU_FLAGS_32BIT_MATCH | CPU_FLAGS_64BIT_MATCH)
1508
1509 /* Return CPU flags match bits. */
1510
1511 static int
1512 cpu_flags_match (const insn_template *t)
1513 {
1514 i386_cpu_flags x = t->cpu_flags;
1515 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1516
1517 x.bitfield.cpu64 = 0;
1518 x.bitfield.cpuno64 = 0;
1519
1520 if (cpu_flags_all_zero (&x))
1521 {
1522 /* This instruction is available on all archs. */
1523 match |= CPU_FLAGS_32BIT_MATCH;
1524 }
1525 else
1526 {
1527 /* This instruction is available only on some archs. */
1528 i386_cpu_flags cpu = cpu_arch_flags;
1529
1530 cpu.bitfield.cpu64 = 0;
1531 cpu.bitfield.cpuno64 = 0;
1532 cpu = cpu_flags_and (x, cpu);
1533 if (!cpu_flags_all_zero (&cpu))
1534 {
1535 if (x.bitfield.cpuavx)
1536 {
1537 /* We only need to check AES/PCLMUL/SSE2AVX with AVX. */
1538 if (cpu.bitfield.cpuavx)
1539 {
1540 /* Check SSE2AVX. */
1541 if (!t->opcode_modifier.sse2avx|| sse2avx)
1542 {
1543 match |= (CPU_FLAGS_ARCH_MATCH
1544 | CPU_FLAGS_AVX_MATCH);
1545 /* Check AES. */
1546 if (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1547 match |= CPU_FLAGS_AES_MATCH;
1548 /* Check PCLMUL. */
1549 if (!x.bitfield.cpupclmul
1550 || cpu.bitfield.cpupclmul)
1551 match |= CPU_FLAGS_PCLMUL_MATCH;
1552 }
1553 }
1554 else
1555 match |= CPU_FLAGS_ARCH_MATCH;
1556 }
1557 else
1558 match |= CPU_FLAGS_32BIT_MATCH;
1559 }
1560 }
1561 return match;
1562 }
1563
1564 static INLINE i386_operand_type
1565 operand_type_and (i386_operand_type x, i386_operand_type y)
1566 {
1567 switch (ARRAY_SIZE (x.array))
1568 {
1569 case 3:
1570 x.array [2] &= y.array [2];
1571 case 2:
1572 x.array [1] &= y.array [1];
1573 case 1:
1574 x.array [0] &= y.array [0];
1575 break;
1576 default:
1577 abort ();
1578 }
1579 return x;
1580 }
1581
1582 static INLINE i386_operand_type
1583 operand_type_or (i386_operand_type x, i386_operand_type y)
1584 {
1585 switch (ARRAY_SIZE (x.array))
1586 {
1587 case 3:
1588 x.array [2] |= y.array [2];
1589 case 2:
1590 x.array [1] |= y.array [1];
1591 case 1:
1592 x.array [0] |= y.array [0];
1593 break;
1594 default:
1595 abort ();
1596 }
1597 return x;
1598 }
1599
1600 static INLINE i386_operand_type
1601 operand_type_xor (i386_operand_type x, i386_operand_type y)
1602 {
1603 switch (ARRAY_SIZE (x.array))
1604 {
1605 case 3:
1606 x.array [2] ^= y.array [2];
1607 case 2:
1608 x.array [1] ^= y.array [1];
1609 case 1:
1610 x.array [0] ^= y.array [0];
1611 break;
1612 default:
1613 abort ();
1614 }
1615 return x;
1616 }
1617
1618 static const i386_operand_type acc32 = OPERAND_TYPE_ACC32;
1619 static const i386_operand_type acc64 = OPERAND_TYPE_ACC64;
1620 static const i386_operand_type control = OPERAND_TYPE_CONTROL;
1621 static const i386_operand_type inoutportreg
1622 = OPERAND_TYPE_INOUTPORTREG;
1623 static const i386_operand_type reg16_inoutportreg
1624 = OPERAND_TYPE_REG16_INOUTPORTREG;
1625 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
1626 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
1627 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
1628 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
1629 static const i386_operand_type anydisp
1630 = OPERAND_TYPE_ANYDISP;
1631 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
1632 static const i386_operand_type regymm = OPERAND_TYPE_REGYMM;
1633 static const i386_operand_type regzmm = OPERAND_TYPE_REGZMM;
1634 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
1635 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
1636 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
1637 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
1638 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
1639 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
1640 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
1641 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
1642 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
1643 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
1644 static const i386_operand_type vec_imm4 = OPERAND_TYPE_VEC_IMM4;
1645
1646 enum operand_type
1647 {
1648 reg,
1649 imm,
1650 disp,
1651 anymem
1652 };
1653
1654 static INLINE int
1655 operand_type_check (i386_operand_type t, enum operand_type c)
1656 {
1657 switch (c)
1658 {
1659 case reg:
1660 return (t.bitfield.reg8
1661 || t.bitfield.reg16
1662 || t.bitfield.reg32
1663 || t.bitfield.reg64);
1664
1665 case imm:
1666 return (t.bitfield.imm8
1667 || t.bitfield.imm8s
1668 || t.bitfield.imm16
1669 || t.bitfield.imm32
1670 || t.bitfield.imm32s
1671 || t.bitfield.imm64);
1672
1673 case disp:
1674 return (t.bitfield.disp8
1675 || t.bitfield.disp16
1676 || t.bitfield.disp32
1677 || t.bitfield.disp32s
1678 || t.bitfield.disp64);
1679
1680 case anymem:
1681 return (t.bitfield.disp8
1682 || t.bitfield.disp16
1683 || t.bitfield.disp32
1684 || t.bitfield.disp32s
1685 || t.bitfield.disp64
1686 || t.bitfield.baseindex);
1687
1688 default:
1689 abort ();
1690 }
1691
1692 return 0;
1693 }
1694
1695 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit on
1696 operand J for instruction template T. */
1697
1698 static INLINE int
1699 match_reg_size (const insn_template *t, unsigned int j)
1700 {
1701 return !((i.types[j].bitfield.byte
1702 && !t->operand_types[j].bitfield.byte)
1703 || (i.types[j].bitfield.word
1704 && !t->operand_types[j].bitfield.word)
1705 || (i.types[j].bitfield.dword
1706 && !t->operand_types[j].bitfield.dword)
1707 || (i.types[j].bitfield.qword
1708 && !t->operand_types[j].bitfield.qword));
1709 }
1710
1711 /* Return 1 if there is no conflict in any size on operand J for
1712 instruction template T. */
1713
1714 static INLINE int
1715 match_mem_size (const insn_template *t, unsigned int j)
1716 {
1717 return (match_reg_size (t, j)
1718 && !((i.types[j].bitfield.unspecified
1719 && !i.broadcast
1720 && !t->operand_types[j].bitfield.unspecified)
1721 || (i.types[j].bitfield.fword
1722 && !t->operand_types[j].bitfield.fword)
1723 || (i.types[j].bitfield.tbyte
1724 && !t->operand_types[j].bitfield.tbyte)
1725 || (i.types[j].bitfield.xmmword
1726 && !t->operand_types[j].bitfield.xmmword)
1727 || (i.types[j].bitfield.ymmword
1728 && !t->operand_types[j].bitfield.ymmword)
1729 || (i.types[j].bitfield.zmmword
1730 && !t->operand_types[j].bitfield.zmmword)));
1731 }
1732
1733 /* Return 1 if there is no size conflict on any operands for
1734 instruction template T. */
1735
1736 static INLINE int
1737 operand_size_match (const insn_template *t)
1738 {
1739 unsigned int j;
1740 int match = 1;
1741
1742 /* Don't check jump instructions. */
1743 if (t->opcode_modifier.jump
1744 || t->opcode_modifier.jumpbyte
1745 || t->opcode_modifier.jumpdword
1746 || t->opcode_modifier.jumpintersegment)
1747 return match;
1748
1749 /* Check memory and accumulator operand size. */
1750 for (j = 0; j < i.operands; j++)
1751 {
1752 if (t->operand_types[j].bitfield.anysize)
1753 continue;
1754
1755 if (t->operand_types[j].bitfield.acc && !match_reg_size (t, j))
1756 {
1757 match = 0;
1758 break;
1759 }
1760
1761 if (i.types[j].bitfield.mem && !match_mem_size (t, j))
1762 {
1763 match = 0;
1764 break;
1765 }
1766 }
1767
1768 if (match)
1769 return match;
1770 else if (!t->opcode_modifier.d && !t->opcode_modifier.floatd)
1771 {
1772 mismatch:
1773 i.error = operand_size_mismatch;
1774 return 0;
1775 }
1776
1777 /* Check reverse. */
1778 gas_assert (i.operands == 2);
1779
1780 match = 1;
1781 for (j = 0; j < 2; j++)
1782 {
1783 if (t->operand_types[j].bitfield.acc
1784 && !match_reg_size (t, j ? 0 : 1))
1785 goto mismatch;
1786
1787 if (i.types[j].bitfield.mem
1788 && !match_mem_size (t, j ? 0 : 1))
1789 goto mismatch;
1790 }
1791
1792 return match;
1793 }
1794
1795 static INLINE int
1796 operand_type_match (i386_operand_type overlap,
1797 i386_operand_type given)
1798 {
1799 i386_operand_type temp = overlap;
1800
1801 temp.bitfield.jumpabsolute = 0;
1802 temp.bitfield.unspecified = 0;
1803 temp.bitfield.byte = 0;
1804 temp.bitfield.word = 0;
1805 temp.bitfield.dword = 0;
1806 temp.bitfield.fword = 0;
1807 temp.bitfield.qword = 0;
1808 temp.bitfield.tbyte = 0;
1809 temp.bitfield.xmmword = 0;
1810 temp.bitfield.ymmword = 0;
1811 temp.bitfield.zmmword = 0;
1812 if (operand_type_all_zero (&temp))
1813 goto mismatch;
1814
1815 if (given.bitfield.baseindex == overlap.bitfield.baseindex
1816 && given.bitfield.jumpabsolute == overlap.bitfield.jumpabsolute)
1817 return 1;
1818
1819 mismatch:
1820 i.error = operand_type_mismatch;
1821 return 0;
1822 }
1823
1824 /* If given types g0 and g1 are registers they must be of the same type
1825 unless the expected operand type register overlap is null.
1826 Note that Acc in a template matches every size of reg. */
1827
1828 static INLINE int
1829 operand_type_register_match (i386_operand_type m0,
1830 i386_operand_type g0,
1831 i386_operand_type t0,
1832 i386_operand_type m1,
1833 i386_operand_type g1,
1834 i386_operand_type t1)
1835 {
1836 if (!operand_type_check (g0, reg))
1837 return 1;
1838
1839 if (!operand_type_check (g1, reg))
1840 return 1;
1841
1842 if (g0.bitfield.reg8 == g1.bitfield.reg8
1843 && g0.bitfield.reg16 == g1.bitfield.reg16
1844 && g0.bitfield.reg32 == g1.bitfield.reg32
1845 && g0.bitfield.reg64 == g1.bitfield.reg64)
1846 return 1;
1847
1848 if (m0.bitfield.acc)
1849 {
1850 t0.bitfield.reg8 = 1;
1851 t0.bitfield.reg16 = 1;
1852 t0.bitfield.reg32 = 1;
1853 t0.bitfield.reg64 = 1;
1854 }
1855
1856 if (m1.bitfield.acc)
1857 {
1858 t1.bitfield.reg8 = 1;
1859 t1.bitfield.reg16 = 1;
1860 t1.bitfield.reg32 = 1;
1861 t1.bitfield.reg64 = 1;
1862 }
1863
1864 if (!(t0.bitfield.reg8 & t1.bitfield.reg8)
1865 && !(t0.bitfield.reg16 & t1.bitfield.reg16)
1866 && !(t0.bitfield.reg32 & t1.bitfield.reg32)
1867 && !(t0.bitfield.reg64 & t1.bitfield.reg64))
1868 return 1;
1869
1870 i.error = register_type_mismatch;
1871
1872 return 0;
1873 }
1874
1875 static INLINE unsigned int
1876 register_number (const reg_entry *r)
1877 {
1878 unsigned int nr = r->reg_num;
1879
1880 if (r->reg_flags & RegRex)
1881 nr += 8;
1882
1883 if (r->reg_flags & RegVRex)
1884 nr += 16;
1885
1886 return nr;
1887 }
1888
1889 static INLINE unsigned int
1890 mode_from_disp_size (i386_operand_type t)
1891 {
1892 if (t.bitfield.disp8 || t.bitfield.vec_disp8)
1893 return 1;
1894 else if (t.bitfield.disp16
1895 || t.bitfield.disp32
1896 || t.bitfield.disp32s)
1897 return 2;
1898 else
1899 return 0;
1900 }
1901
1902 static INLINE int
1903 fits_in_signed_byte (addressT num)
1904 {
1905 return num + 0x80 <= 0xff;
1906 }
1907
1908 static INLINE int
1909 fits_in_unsigned_byte (addressT num)
1910 {
1911 return num <= 0xff;
1912 }
1913
1914 static INLINE int
1915 fits_in_unsigned_word (addressT num)
1916 {
1917 return num <= 0xffff;
1918 }
1919
1920 static INLINE int
1921 fits_in_signed_word (addressT num)
1922 {
1923 return num + 0x8000 <= 0xffff;
1924 }
1925
1926 static INLINE int
1927 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
1928 {
1929 #ifndef BFD64
1930 return 1;
1931 #else
1932 return num + 0x80000000 <= 0xffffffff;
1933 #endif
1934 } /* fits_in_signed_long() */
1935
1936 static INLINE int
1937 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
1938 {
1939 #ifndef BFD64
1940 return 1;
1941 #else
1942 return num <= 0xffffffff;
1943 #endif
1944 } /* fits_in_unsigned_long() */
1945
1946 static INLINE int
1947 fits_in_vec_disp8 (offsetT num)
1948 {
1949 int shift = i.memshift;
1950 unsigned int mask;
1951
1952 if (shift == -1)
1953 abort ();
1954
1955 mask = (1 << shift) - 1;
1956
1957 /* Return 0 if NUM isn't properly aligned. */
1958 if ((num & mask))
1959 return 0;
1960
1961 /* Check if NUM will fit in 8bit after shift. */
1962 return fits_in_signed_byte (num >> shift);
1963 }
1964
1965 static INLINE int
1966 fits_in_imm4 (offsetT num)
1967 {
1968 return (num & 0xf) == num;
1969 }
1970
1971 static i386_operand_type
1972 smallest_imm_type (offsetT num)
1973 {
1974 i386_operand_type t;
1975
1976 operand_type_set (&t, 0);
1977 t.bitfield.imm64 = 1;
1978
1979 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
1980 {
1981 /* This code is disabled on the 486 because all the Imm1 forms
1982 in the opcode table are slower on the i486. They're the
1983 versions with the implicitly specified single-position
1984 displacement, which has another syntax if you really want to
1985 use that form. */
1986 t.bitfield.imm1 = 1;
1987 t.bitfield.imm8 = 1;
1988 t.bitfield.imm8s = 1;
1989 t.bitfield.imm16 = 1;
1990 t.bitfield.imm32 = 1;
1991 t.bitfield.imm32s = 1;
1992 }
1993 else if (fits_in_signed_byte (num))
1994 {
1995 t.bitfield.imm8 = 1;
1996 t.bitfield.imm8s = 1;
1997 t.bitfield.imm16 = 1;
1998 t.bitfield.imm32 = 1;
1999 t.bitfield.imm32s = 1;
2000 }
2001 else if (fits_in_unsigned_byte (num))
2002 {
2003 t.bitfield.imm8 = 1;
2004 t.bitfield.imm16 = 1;
2005 t.bitfield.imm32 = 1;
2006 t.bitfield.imm32s = 1;
2007 }
2008 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2009 {
2010 t.bitfield.imm16 = 1;
2011 t.bitfield.imm32 = 1;
2012 t.bitfield.imm32s = 1;
2013 }
2014 else if (fits_in_signed_long (num))
2015 {
2016 t.bitfield.imm32 = 1;
2017 t.bitfield.imm32s = 1;
2018 }
2019 else if (fits_in_unsigned_long (num))
2020 t.bitfield.imm32 = 1;
2021
2022 return t;
2023 }
2024
2025 static offsetT
2026 offset_in_range (offsetT val, int size)
2027 {
2028 addressT mask;
2029
2030 switch (size)
2031 {
2032 case 1: mask = ((addressT) 1 << 8) - 1; break;
2033 case 2: mask = ((addressT) 1 << 16) - 1; break;
2034 case 4: mask = ((addressT) 2 << 31) - 1; break;
2035 #ifdef BFD64
2036 case 8: mask = ((addressT) 2 << 63) - 1; break;
2037 #endif
2038 default: abort ();
2039 }
2040
2041 #ifdef BFD64
2042 /* If BFD64, sign extend val for 32bit address mode. */
2043 if (flag_code != CODE_64BIT
2044 || i.prefix[ADDR_PREFIX])
2045 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2046 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2047 #endif
2048
2049 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2050 {
2051 char buf1[40], buf2[40];
2052
2053 sprint_value (buf1, val);
2054 sprint_value (buf2, val & mask);
2055 as_warn (_("%s shortened to %s"), buf1, buf2);
2056 }
2057 return val & mask;
2058 }
2059
2060 enum PREFIX_GROUP
2061 {
2062 PREFIX_EXIST = 0,
2063 PREFIX_LOCK,
2064 PREFIX_REP,
2065 PREFIX_OTHER
2066 };
2067
2068 /* Returns
2069 a. PREFIX_EXIST if attempting to add a prefix where one from the
2070 same class already exists.
2071 b. PREFIX_LOCK if lock prefix is added.
2072 c. PREFIX_REP if rep/repne prefix is added.
2073 d. PREFIX_OTHER if other prefix is added.
2074 */
2075
2076 static enum PREFIX_GROUP
2077 add_prefix (unsigned int prefix)
2078 {
2079 enum PREFIX_GROUP ret = PREFIX_OTHER;
2080 unsigned int q;
2081
2082 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2083 && flag_code == CODE_64BIT)
2084 {
2085 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2086 || ((i.prefix[REX_PREFIX] & (REX_R | REX_X | REX_B))
2087 && (prefix & (REX_R | REX_X | REX_B))))
2088 ret = PREFIX_EXIST;
2089 q = REX_PREFIX;
2090 }
2091 else
2092 {
2093 switch (prefix)
2094 {
2095 default:
2096 abort ();
2097
2098 case CS_PREFIX_OPCODE:
2099 case DS_PREFIX_OPCODE:
2100 case ES_PREFIX_OPCODE:
2101 case FS_PREFIX_OPCODE:
2102 case GS_PREFIX_OPCODE:
2103 case SS_PREFIX_OPCODE:
2104 q = SEG_PREFIX;
2105 break;
2106
2107 case REPNE_PREFIX_OPCODE:
2108 case REPE_PREFIX_OPCODE:
2109 q = REP_PREFIX;
2110 ret = PREFIX_REP;
2111 break;
2112
2113 case LOCK_PREFIX_OPCODE:
2114 q = LOCK_PREFIX;
2115 ret = PREFIX_LOCK;
2116 break;
2117
2118 case FWAIT_OPCODE:
2119 q = WAIT_PREFIX;
2120 break;
2121
2122 case ADDR_PREFIX_OPCODE:
2123 q = ADDR_PREFIX;
2124 break;
2125
2126 case DATA_PREFIX_OPCODE:
2127 q = DATA_PREFIX;
2128 break;
2129 }
2130 if (i.prefix[q] != 0)
2131 ret = PREFIX_EXIST;
2132 }
2133
2134 if (ret)
2135 {
2136 if (!i.prefix[q])
2137 ++i.prefixes;
2138 i.prefix[q] |= prefix;
2139 }
2140 else
2141 as_bad (_("same type of prefix used twice"));
2142
2143 return ret;
2144 }
2145
2146 static void
2147 update_code_flag (int value, int check)
2148 {
2149 PRINTF_LIKE ((*as_error));
2150
2151 flag_code = (enum flag_code) value;
2152 if (flag_code == CODE_64BIT)
2153 {
2154 cpu_arch_flags.bitfield.cpu64 = 1;
2155 cpu_arch_flags.bitfield.cpuno64 = 0;
2156 }
2157 else
2158 {
2159 cpu_arch_flags.bitfield.cpu64 = 0;
2160 cpu_arch_flags.bitfield.cpuno64 = 1;
2161 }
2162 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2163 {
2164 if (check)
2165 as_error = as_fatal;
2166 else
2167 as_error = as_bad;
2168 (*as_error) (_("64bit mode not supported on `%s'."),
2169 cpu_arch_name ? cpu_arch_name : default_arch);
2170 }
2171 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2172 {
2173 if (check)
2174 as_error = as_fatal;
2175 else
2176 as_error = as_bad;
2177 (*as_error) (_("32bit mode not supported on `%s'."),
2178 cpu_arch_name ? cpu_arch_name : default_arch);
2179 }
2180 stackop_size = '\0';
2181 }
2182
2183 static void
2184 set_code_flag (int value)
2185 {
2186 update_code_flag (value, 0);
2187 }
2188
2189 static void
2190 set_16bit_gcc_code_flag (int new_code_flag)
2191 {
2192 flag_code = (enum flag_code) new_code_flag;
2193 if (flag_code != CODE_16BIT)
2194 abort ();
2195 cpu_arch_flags.bitfield.cpu64 = 0;
2196 cpu_arch_flags.bitfield.cpuno64 = 1;
2197 stackop_size = LONG_MNEM_SUFFIX;
2198 }
2199
2200 static void
2201 set_intel_syntax (int syntax_flag)
2202 {
2203 /* Find out if register prefixing is specified. */
2204 int ask_naked_reg = 0;
2205
2206 SKIP_WHITESPACE ();
2207 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2208 {
2209 char *string;
2210 int e = get_symbol_name (&string);
2211
2212 if (strcmp (string, "prefix") == 0)
2213 ask_naked_reg = 1;
2214 else if (strcmp (string, "noprefix") == 0)
2215 ask_naked_reg = -1;
2216 else
2217 as_bad (_("bad argument to syntax directive."));
2218 (void) restore_line_pointer (e);
2219 }
2220 demand_empty_rest_of_line ();
2221
2222 intel_syntax = syntax_flag;
2223
2224 if (ask_naked_reg == 0)
2225 allow_naked_reg = (intel_syntax
2226 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2227 else
2228 allow_naked_reg = (ask_naked_reg < 0);
2229
2230 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2231
2232 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2233 identifier_chars['$'] = intel_syntax ? '$' : 0;
2234 register_prefix = allow_naked_reg ? "" : "%";
2235 }
2236
2237 static void
2238 set_intel_mnemonic (int mnemonic_flag)
2239 {
2240 intel_mnemonic = mnemonic_flag;
2241 }
2242
2243 static void
2244 set_allow_index_reg (int flag)
2245 {
2246 allow_index_reg = flag;
2247 }
2248
2249 static void
2250 set_check (int what)
2251 {
2252 enum check_kind *kind;
2253 const char *str;
2254
2255 if (what)
2256 {
2257 kind = &operand_check;
2258 str = "operand";
2259 }
2260 else
2261 {
2262 kind = &sse_check;
2263 str = "sse";
2264 }
2265
2266 SKIP_WHITESPACE ();
2267
2268 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2269 {
2270 char *string;
2271 int e = get_symbol_name (&string);
2272
2273 if (strcmp (string, "none") == 0)
2274 *kind = check_none;
2275 else if (strcmp (string, "warning") == 0)
2276 *kind = check_warning;
2277 else if (strcmp (string, "error") == 0)
2278 *kind = check_error;
2279 else
2280 as_bad (_("bad argument to %s_check directive."), str);
2281 (void) restore_line_pointer (e);
2282 }
2283 else
2284 as_bad (_("missing argument for %s_check directive"), str);
2285
2286 demand_empty_rest_of_line ();
2287 }
2288
2289 static void
2290 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2291 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2292 {
2293 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2294 static const char *arch;
2295
2296 /* Intel LIOM is only supported on ELF. */
2297 if (!IS_ELF)
2298 return;
2299
2300 if (!arch)
2301 {
2302 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2303 use default_arch. */
2304 arch = cpu_arch_name;
2305 if (!arch)
2306 arch = default_arch;
2307 }
2308
2309 /* If we are targeting Intel MCU, we must enable it. */
2310 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2311 || new_flag.bitfield.cpuiamcu)
2312 return;
2313
2314 /* If we are targeting Intel L1OM, we must enable it. */
2315 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2316 || new_flag.bitfield.cpul1om)
2317 return;
2318
2319 /* If we are targeting Intel K1OM, we must enable it. */
2320 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2321 || new_flag.bitfield.cpuk1om)
2322 return;
2323
2324 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2325 #endif
2326 }
2327
2328 static void
2329 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2330 {
2331 SKIP_WHITESPACE ();
2332
2333 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2334 {
2335 char *string;
2336 int e = get_symbol_name (&string);
2337 unsigned int j;
2338 i386_cpu_flags flags;
2339
2340 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2341 {
2342 if (strcmp (string, cpu_arch[j].name) == 0)
2343 {
2344 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2345
2346 if (*string != '.')
2347 {
2348 cpu_arch_name = cpu_arch[j].name;
2349 cpu_sub_arch_name = NULL;
2350 cpu_arch_flags = cpu_arch[j].flags;
2351 if (flag_code == CODE_64BIT)
2352 {
2353 cpu_arch_flags.bitfield.cpu64 = 1;
2354 cpu_arch_flags.bitfield.cpuno64 = 0;
2355 }
2356 else
2357 {
2358 cpu_arch_flags.bitfield.cpu64 = 0;
2359 cpu_arch_flags.bitfield.cpuno64 = 1;
2360 }
2361 cpu_arch_isa = cpu_arch[j].type;
2362 cpu_arch_isa_flags = cpu_arch[j].flags;
2363 if (!cpu_arch_tune_set)
2364 {
2365 cpu_arch_tune = cpu_arch_isa;
2366 cpu_arch_tune_flags = cpu_arch_isa_flags;
2367 }
2368 break;
2369 }
2370
2371 if (!cpu_arch[j].negated)
2372 flags = cpu_flags_or (cpu_arch_flags,
2373 cpu_arch[j].flags);
2374 else
2375 flags = cpu_flags_and_not (cpu_arch_flags,
2376 cpu_arch[j].flags);
2377
2378 if (!valid_iamcu_cpu_flags (&flags))
2379 as_fatal (_("`%s' isn't valid for Intel MCU"),
2380 cpu_arch[j].name);
2381 else if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2382 {
2383 if (cpu_sub_arch_name)
2384 {
2385 char *name = cpu_sub_arch_name;
2386 cpu_sub_arch_name = concat (name,
2387 cpu_arch[j].name,
2388 (const char *) NULL);
2389 free (name);
2390 }
2391 else
2392 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2393 cpu_arch_flags = flags;
2394 cpu_arch_isa_flags = flags;
2395 }
2396 (void) restore_line_pointer (e);
2397 demand_empty_rest_of_line ();
2398 return;
2399 }
2400 }
2401 if (j >= ARRAY_SIZE (cpu_arch))
2402 as_bad (_("no such architecture: `%s'"), string);
2403
2404 *input_line_pointer = e;
2405 }
2406 else
2407 as_bad (_("missing cpu architecture"));
2408
2409 no_cond_jump_promotion = 0;
2410 if (*input_line_pointer == ','
2411 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2412 {
2413 char *string;
2414 char e;
2415
2416 ++input_line_pointer;
2417 e = get_symbol_name (&string);
2418
2419 if (strcmp (string, "nojumps") == 0)
2420 no_cond_jump_promotion = 1;
2421 else if (strcmp (string, "jumps") == 0)
2422 ;
2423 else
2424 as_bad (_("no such architecture modifier: `%s'"), string);
2425
2426 (void) restore_line_pointer (e);
2427 }
2428
2429 demand_empty_rest_of_line ();
2430 }
2431
2432 enum bfd_architecture
2433 i386_arch (void)
2434 {
2435 if (cpu_arch_isa == PROCESSOR_L1OM)
2436 {
2437 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2438 || flag_code != CODE_64BIT)
2439 as_fatal (_("Intel L1OM is 64bit ELF only"));
2440 return bfd_arch_l1om;
2441 }
2442 else if (cpu_arch_isa == PROCESSOR_K1OM)
2443 {
2444 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2445 || flag_code != CODE_64BIT)
2446 as_fatal (_("Intel K1OM is 64bit ELF only"));
2447 return bfd_arch_k1om;
2448 }
2449 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2450 {
2451 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2452 || flag_code == CODE_64BIT)
2453 as_fatal (_("Intel MCU is 32bit ELF only"));
2454 return bfd_arch_iamcu;
2455 }
2456 else
2457 return bfd_arch_i386;
2458 }
2459
2460 unsigned long
2461 i386_mach (void)
2462 {
2463 if (!strncmp (default_arch, "x86_64", 6))
2464 {
2465 if (cpu_arch_isa == PROCESSOR_L1OM)
2466 {
2467 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2468 || default_arch[6] != '\0')
2469 as_fatal (_("Intel L1OM is 64bit ELF only"));
2470 return bfd_mach_l1om;
2471 }
2472 else if (cpu_arch_isa == PROCESSOR_K1OM)
2473 {
2474 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2475 || default_arch[6] != '\0')
2476 as_fatal (_("Intel K1OM is 64bit ELF only"));
2477 return bfd_mach_k1om;
2478 }
2479 else if (default_arch[6] == '\0')
2480 return bfd_mach_x86_64;
2481 else
2482 return bfd_mach_x64_32;
2483 }
2484 else if (!strcmp (default_arch, "i386")
2485 || !strcmp (default_arch, "iamcu"))
2486 {
2487 if (cpu_arch_isa == PROCESSOR_IAMCU)
2488 {
2489 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2490 as_fatal (_("Intel MCU is 32bit ELF only"));
2491 return bfd_mach_i386_iamcu;
2492 }
2493 else
2494 return bfd_mach_i386_i386;
2495 }
2496 else
2497 as_fatal (_("unknown architecture"));
2498 }
2499 \f
2500 void
2501 md_begin (void)
2502 {
2503 const char *hash_err;
2504
2505 /* Initialize op_hash hash table. */
2506 op_hash = hash_new ();
2507
2508 {
2509 const insn_template *optab;
2510 templates *core_optab;
2511
2512 /* Setup for loop. */
2513 optab = i386_optab;
2514 core_optab = (templates *) xmalloc (sizeof (templates));
2515 core_optab->start = optab;
2516
2517 while (1)
2518 {
2519 ++optab;
2520 if (optab->name == NULL
2521 || strcmp (optab->name, (optab - 1)->name) != 0)
2522 {
2523 /* different name --> ship out current template list;
2524 add to hash table; & begin anew. */
2525 core_optab->end = optab;
2526 hash_err = hash_insert (op_hash,
2527 (optab - 1)->name,
2528 (void *) core_optab);
2529 if (hash_err)
2530 {
2531 as_fatal (_("can't hash %s: %s"),
2532 (optab - 1)->name,
2533 hash_err);
2534 }
2535 if (optab->name == NULL)
2536 break;
2537 core_optab = (templates *) xmalloc (sizeof (templates));
2538 core_optab->start = optab;
2539 }
2540 }
2541 }
2542
2543 /* Initialize reg_hash hash table. */
2544 reg_hash = hash_new ();
2545 {
2546 const reg_entry *regtab;
2547 unsigned int regtab_size = i386_regtab_size;
2548
2549 for (regtab = i386_regtab; regtab_size--; regtab++)
2550 {
2551 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
2552 if (hash_err)
2553 as_fatal (_("can't hash %s: %s"),
2554 regtab->reg_name,
2555 hash_err);
2556 }
2557 }
2558
2559 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
2560 {
2561 int c;
2562 char *p;
2563
2564 for (c = 0; c < 256; c++)
2565 {
2566 if (ISDIGIT (c))
2567 {
2568 digit_chars[c] = c;
2569 mnemonic_chars[c] = c;
2570 register_chars[c] = c;
2571 operand_chars[c] = c;
2572 }
2573 else if (ISLOWER (c))
2574 {
2575 mnemonic_chars[c] = c;
2576 register_chars[c] = c;
2577 operand_chars[c] = c;
2578 }
2579 else if (ISUPPER (c))
2580 {
2581 mnemonic_chars[c] = TOLOWER (c);
2582 register_chars[c] = mnemonic_chars[c];
2583 operand_chars[c] = c;
2584 }
2585 else if (c == '{' || c == '}')
2586 operand_chars[c] = c;
2587
2588 if (ISALPHA (c) || ISDIGIT (c))
2589 identifier_chars[c] = c;
2590 else if (c >= 128)
2591 {
2592 identifier_chars[c] = c;
2593 operand_chars[c] = c;
2594 }
2595 }
2596
2597 #ifdef LEX_AT
2598 identifier_chars['@'] = '@';
2599 #endif
2600 #ifdef LEX_QM
2601 identifier_chars['?'] = '?';
2602 operand_chars['?'] = '?';
2603 #endif
2604 digit_chars['-'] = '-';
2605 mnemonic_chars['_'] = '_';
2606 mnemonic_chars['-'] = '-';
2607 mnemonic_chars['.'] = '.';
2608 identifier_chars['_'] = '_';
2609 identifier_chars['.'] = '.';
2610
2611 for (p = operand_special_chars; *p != '\0'; p++)
2612 operand_chars[(unsigned char) *p] = *p;
2613 }
2614
2615 if (flag_code == CODE_64BIT)
2616 {
2617 #if defined (OBJ_COFF) && defined (TE_PE)
2618 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
2619 ? 32 : 16);
2620 #else
2621 x86_dwarf2_return_column = 16;
2622 #endif
2623 x86_cie_data_alignment = -8;
2624 }
2625 else
2626 {
2627 x86_dwarf2_return_column = 8;
2628 x86_cie_data_alignment = -4;
2629 }
2630 }
2631
2632 void
2633 i386_print_statistics (FILE *file)
2634 {
2635 hash_print_statistics (file, "i386 opcode", op_hash);
2636 hash_print_statistics (file, "i386 register", reg_hash);
2637 }
2638 \f
2639 #ifdef DEBUG386
2640
2641 /* Debugging routines for md_assemble. */
2642 static void pte (insn_template *);
2643 static void pt (i386_operand_type);
2644 static void pe (expressionS *);
2645 static void ps (symbolS *);
2646
2647 static void
2648 pi (char *line, i386_insn *x)
2649 {
2650 unsigned int j;
2651
2652 fprintf (stdout, "%s: template ", line);
2653 pte (&x->tm);
2654 fprintf (stdout, " address: base %s index %s scale %x\n",
2655 x->base_reg ? x->base_reg->reg_name : "none",
2656 x->index_reg ? x->index_reg->reg_name : "none",
2657 x->log2_scale_factor);
2658 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
2659 x->rm.mode, x->rm.reg, x->rm.regmem);
2660 fprintf (stdout, " sib: base %x index %x scale %x\n",
2661 x->sib.base, x->sib.index, x->sib.scale);
2662 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
2663 (x->rex & REX_W) != 0,
2664 (x->rex & REX_R) != 0,
2665 (x->rex & REX_X) != 0,
2666 (x->rex & REX_B) != 0);
2667 for (j = 0; j < x->operands; j++)
2668 {
2669 fprintf (stdout, " #%d: ", j + 1);
2670 pt (x->types[j]);
2671 fprintf (stdout, "\n");
2672 if (x->types[j].bitfield.reg8
2673 || x->types[j].bitfield.reg16
2674 || x->types[j].bitfield.reg32
2675 || x->types[j].bitfield.reg64
2676 || x->types[j].bitfield.regmmx
2677 || x->types[j].bitfield.regxmm
2678 || x->types[j].bitfield.regymm
2679 || x->types[j].bitfield.regzmm
2680 || x->types[j].bitfield.sreg2
2681 || x->types[j].bitfield.sreg3
2682 || x->types[j].bitfield.control
2683 || x->types[j].bitfield.debug
2684 || x->types[j].bitfield.test)
2685 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
2686 if (operand_type_check (x->types[j], imm))
2687 pe (x->op[j].imms);
2688 if (operand_type_check (x->types[j], disp))
2689 pe (x->op[j].disps);
2690 }
2691 }
2692
2693 static void
2694 pte (insn_template *t)
2695 {
2696 unsigned int j;
2697 fprintf (stdout, " %d operands ", t->operands);
2698 fprintf (stdout, "opcode %x ", t->base_opcode);
2699 if (t->extension_opcode != None)
2700 fprintf (stdout, "ext %x ", t->extension_opcode);
2701 if (t->opcode_modifier.d)
2702 fprintf (stdout, "D");
2703 if (t->opcode_modifier.w)
2704 fprintf (stdout, "W");
2705 fprintf (stdout, "\n");
2706 for (j = 0; j < t->operands; j++)
2707 {
2708 fprintf (stdout, " #%d type ", j + 1);
2709 pt (t->operand_types[j]);
2710 fprintf (stdout, "\n");
2711 }
2712 }
2713
2714 static void
2715 pe (expressionS *e)
2716 {
2717 fprintf (stdout, " operation %d\n", e->X_op);
2718 fprintf (stdout, " add_number %ld (%lx)\n",
2719 (long) e->X_add_number, (long) e->X_add_number);
2720 if (e->X_add_symbol)
2721 {
2722 fprintf (stdout, " add_symbol ");
2723 ps (e->X_add_symbol);
2724 fprintf (stdout, "\n");
2725 }
2726 if (e->X_op_symbol)
2727 {
2728 fprintf (stdout, " op_symbol ");
2729 ps (e->X_op_symbol);
2730 fprintf (stdout, "\n");
2731 }
2732 }
2733
2734 static void
2735 ps (symbolS *s)
2736 {
2737 fprintf (stdout, "%s type %s%s",
2738 S_GET_NAME (s),
2739 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
2740 segment_name (S_GET_SEGMENT (s)));
2741 }
2742
2743 static struct type_name
2744 {
2745 i386_operand_type mask;
2746 const char *name;
2747 }
2748 const type_names[] =
2749 {
2750 { OPERAND_TYPE_REG8, "r8" },
2751 { OPERAND_TYPE_REG16, "r16" },
2752 { OPERAND_TYPE_REG32, "r32" },
2753 { OPERAND_TYPE_REG64, "r64" },
2754 { OPERAND_TYPE_IMM8, "i8" },
2755 { OPERAND_TYPE_IMM8, "i8s" },
2756 { OPERAND_TYPE_IMM16, "i16" },
2757 { OPERAND_TYPE_IMM32, "i32" },
2758 { OPERAND_TYPE_IMM32S, "i32s" },
2759 { OPERAND_TYPE_IMM64, "i64" },
2760 { OPERAND_TYPE_IMM1, "i1" },
2761 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
2762 { OPERAND_TYPE_DISP8, "d8" },
2763 { OPERAND_TYPE_DISP16, "d16" },
2764 { OPERAND_TYPE_DISP32, "d32" },
2765 { OPERAND_TYPE_DISP32S, "d32s" },
2766 { OPERAND_TYPE_DISP64, "d64" },
2767 { OPERAND_TYPE_VEC_DISP8, "Vector d8" },
2768 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
2769 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
2770 { OPERAND_TYPE_CONTROL, "control reg" },
2771 { OPERAND_TYPE_TEST, "test reg" },
2772 { OPERAND_TYPE_DEBUG, "debug reg" },
2773 { OPERAND_TYPE_FLOATREG, "FReg" },
2774 { OPERAND_TYPE_FLOATACC, "FAcc" },
2775 { OPERAND_TYPE_SREG2, "SReg2" },
2776 { OPERAND_TYPE_SREG3, "SReg3" },
2777 { OPERAND_TYPE_ACC, "Acc" },
2778 { OPERAND_TYPE_JUMPABSOLUTE, "Jump Absolute" },
2779 { OPERAND_TYPE_REGMMX, "rMMX" },
2780 { OPERAND_TYPE_REGXMM, "rXMM" },
2781 { OPERAND_TYPE_REGYMM, "rYMM" },
2782 { OPERAND_TYPE_REGZMM, "rZMM" },
2783 { OPERAND_TYPE_REGMASK, "Mask reg" },
2784 { OPERAND_TYPE_ESSEG, "es" },
2785 };
2786
2787 static void
2788 pt (i386_operand_type t)
2789 {
2790 unsigned int j;
2791 i386_operand_type a;
2792
2793 for (j = 0; j < ARRAY_SIZE (type_names); j++)
2794 {
2795 a = operand_type_and (t, type_names[j].mask);
2796 if (!operand_type_all_zero (&a))
2797 fprintf (stdout, "%s, ", type_names[j].name);
2798 }
2799 fflush (stdout);
2800 }
2801
2802 #endif /* DEBUG386 */
2803 \f
2804 static bfd_reloc_code_real_type
2805 reloc (unsigned int size,
2806 int pcrel,
2807 int sign,
2808 bfd_reloc_code_real_type other)
2809 {
2810 if (other != NO_RELOC)
2811 {
2812 reloc_howto_type *rel;
2813
2814 if (size == 8)
2815 switch (other)
2816 {
2817 case BFD_RELOC_X86_64_GOT32:
2818 return BFD_RELOC_X86_64_GOT64;
2819 break;
2820 case BFD_RELOC_X86_64_GOTPLT64:
2821 return BFD_RELOC_X86_64_GOTPLT64;
2822 break;
2823 case BFD_RELOC_X86_64_PLTOFF64:
2824 return BFD_RELOC_X86_64_PLTOFF64;
2825 break;
2826 case BFD_RELOC_X86_64_GOTPC32:
2827 other = BFD_RELOC_X86_64_GOTPC64;
2828 break;
2829 case BFD_RELOC_X86_64_GOTPCREL:
2830 other = BFD_RELOC_X86_64_GOTPCREL64;
2831 break;
2832 case BFD_RELOC_X86_64_TPOFF32:
2833 other = BFD_RELOC_X86_64_TPOFF64;
2834 break;
2835 case BFD_RELOC_X86_64_DTPOFF32:
2836 other = BFD_RELOC_X86_64_DTPOFF64;
2837 break;
2838 default:
2839 break;
2840 }
2841
2842 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2843 if (other == BFD_RELOC_SIZE32)
2844 {
2845 if (size == 8)
2846 other = BFD_RELOC_SIZE64;
2847 if (pcrel)
2848 {
2849 as_bad (_("there are no pc-relative size relocations"));
2850 return NO_RELOC;
2851 }
2852 }
2853 #endif
2854
2855 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
2856 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
2857 sign = -1;
2858
2859 rel = bfd_reloc_type_lookup (stdoutput, other);
2860 if (!rel)
2861 as_bad (_("unknown relocation (%u)"), other);
2862 else if (size != bfd_get_reloc_size (rel))
2863 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
2864 bfd_get_reloc_size (rel),
2865 size);
2866 else if (pcrel && !rel->pc_relative)
2867 as_bad (_("non-pc-relative relocation for pc-relative field"));
2868 else if ((rel->complain_on_overflow == complain_overflow_signed
2869 && !sign)
2870 || (rel->complain_on_overflow == complain_overflow_unsigned
2871 && sign > 0))
2872 as_bad (_("relocated field and relocation type differ in signedness"));
2873 else
2874 return other;
2875 return NO_RELOC;
2876 }
2877
2878 if (pcrel)
2879 {
2880 if (!sign)
2881 as_bad (_("there are no unsigned pc-relative relocations"));
2882 switch (size)
2883 {
2884 case 1: return BFD_RELOC_8_PCREL;
2885 case 2: return BFD_RELOC_16_PCREL;
2886 case 4: return BFD_RELOC_32_PCREL;
2887 case 8: return BFD_RELOC_64_PCREL;
2888 }
2889 as_bad (_("cannot do %u byte pc-relative relocation"), size);
2890 }
2891 else
2892 {
2893 if (sign > 0)
2894 switch (size)
2895 {
2896 case 4: return BFD_RELOC_X86_64_32S;
2897 }
2898 else
2899 switch (size)
2900 {
2901 case 1: return BFD_RELOC_8;
2902 case 2: return BFD_RELOC_16;
2903 case 4: return BFD_RELOC_32;
2904 case 8: return BFD_RELOC_64;
2905 }
2906 as_bad (_("cannot do %s %u byte relocation"),
2907 sign > 0 ? "signed" : "unsigned", size);
2908 }
2909
2910 return NO_RELOC;
2911 }
2912
2913 /* Here we decide which fixups can be adjusted to make them relative to
2914 the beginning of the section instead of the symbol. Basically we need
2915 to make sure that the dynamic relocations are done correctly, so in
2916 some cases we force the original symbol to be used. */
2917
2918 int
2919 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
2920 {
2921 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2922 if (!IS_ELF)
2923 return 1;
2924
2925 /* Don't adjust pc-relative references to merge sections in 64-bit
2926 mode. */
2927 if (use_rela_relocations
2928 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
2929 && fixP->fx_pcrel)
2930 return 0;
2931
2932 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
2933 and changed later by validate_fix. */
2934 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
2935 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
2936 return 0;
2937
2938 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
2939 for size relocations. */
2940 if (fixP->fx_r_type == BFD_RELOC_SIZE32
2941 || fixP->fx_r_type == BFD_RELOC_SIZE64
2942 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
2943 || fixP->fx_r_type == BFD_RELOC_386_PLT32
2944 || fixP->fx_r_type == BFD_RELOC_386_GOT32
2945 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
2946 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
2947 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
2948 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
2949 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
2950 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
2951 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
2952 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
2953 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
2954 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
2955 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
2956 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
2957 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
2958 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
2959 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
2960 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
2961 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
2962 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
2963 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
2964 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
2965 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
2966 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
2967 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
2968 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
2969 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
2970 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
2971 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
2972 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
2973 return 0;
2974 #endif
2975 return 1;
2976 }
2977
2978 static int
2979 intel_float_operand (const char *mnemonic)
2980 {
2981 /* Note that the value returned is meaningful only for opcodes with (memory)
2982 operands, hence the code here is free to improperly handle opcodes that
2983 have no operands (for better performance and smaller code). */
2984
2985 if (mnemonic[0] != 'f')
2986 return 0; /* non-math */
2987
2988 switch (mnemonic[1])
2989 {
2990 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
2991 the fs segment override prefix not currently handled because no
2992 call path can make opcodes without operands get here */
2993 case 'i':
2994 return 2 /* integer op */;
2995 case 'l':
2996 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
2997 return 3; /* fldcw/fldenv */
2998 break;
2999 case 'n':
3000 if (mnemonic[2] != 'o' /* fnop */)
3001 return 3; /* non-waiting control op */
3002 break;
3003 case 'r':
3004 if (mnemonic[2] == 's')
3005 return 3; /* frstor/frstpm */
3006 break;
3007 case 's':
3008 if (mnemonic[2] == 'a')
3009 return 3; /* fsave */
3010 if (mnemonic[2] == 't')
3011 {
3012 switch (mnemonic[3])
3013 {
3014 case 'c': /* fstcw */
3015 case 'd': /* fstdw */
3016 case 'e': /* fstenv */
3017 case 's': /* fsts[gw] */
3018 return 3;
3019 }
3020 }
3021 break;
3022 case 'x':
3023 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3024 return 0; /* fxsave/fxrstor are not really math ops */
3025 break;
3026 }
3027
3028 return 1;
3029 }
3030
3031 /* Build the VEX prefix. */
3032
3033 static void
3034 build_vex_prefix (const insn_template *t)
3035 {
3036 unsigned int register_specifier;
3037 unsigned int implied_prefix;
3038 unsigned int vector_length;
3039
3040 /* Check register specifier. */
3041 if (i.vex.register_specifier)
3042 {
3043 register_specifier =
3044 ~register_number (i.vex.register_specifier) & 0xf;
3045 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3046 }
3047 else
3048 register_specifier = 0xf;
3049
3050 /* Use 2-byte VEX prefix by swappping destination and source
3051 operand. */
3052 if (!i.swap_operand
3053 && i.operands == i.reg_operands
3054 && i.tm.opcode_modifier.vexopcode == VEX0F
3055 && i.tm.opcode_modifier.s
3056 && i.rex == REX_B)
3057 {
3058 unsigned int xchg = i.operands - 1;
3059 union i386_op temp_op;
3060 i386_operand_type temp_type;
3061
3062 temp_type = i.types[xchg];
3063 i.types[xchg] = i.types[0];
3064 i.types[0] = temp_type;
3065 temp_op = i.op[xchg];
3066 i.op[xchg] = i.op[0];
3067 i.op[0] = temp_op;
3068
3069 gas_assert (i.rm.mode == 3);
3070
3071 i.rex = REX_R;
3072 xchg = i.rm.regmem;
3073 i.rm.regmem = i.rm.reg;
3074 i.rm.reg = xchg;
3075
3076 /* Use the next insn. */
3077 i.tm = t[1];
3078 }
3079
3080 if (i.tm.opcode_modifier.vex == VEXScalar)
3081 vector_length = avxscalar;
3082 else
3083 vector_length = i.tm.opcode_modifier.vex == VEX256 ? 1 : 0;
3084
3085 switch ((i.tm.base_opcode >> 8) & 0xff)
3086 {
3087 case 0:
3088 implied_prefix = 0;
3089 break;
3090 case DATA_PREFIX_OPCODE:
3091 implied_prefix = 1;
3092 break;
3093 case REPE_PREFIX_OPCODE:
3094 implied_prefix = 2;
3095 break;
3096 case REPNE_PREFIX_OPCODE:
3097 implied_prefix = 3;
3098 break;
3099 default:
3100 abort ();
3101 }
3102
3103 /* Use 2-byte VEX prefix if possible. */
3104 if (i.tm.opcode_modifier.vexopcode == VEX0F
3105 && i.tm.opcode_modifier.vexw != VEXW1
3106 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3107 {
3108 /* 2-byte VEX prefix. */
3109 unsigned int r;
3110
3111 i.vex.length = 2;
3112 i.vex.bytes[0] = 0xc5;
3113
3114 /* Check the REX.R bit. */
3115 r = (i.rex & REX_R) ? 0 : 1;
3116 i.vex.bytes[1] = (r << 7
3117 | register_specifier << 3
3118 | vector_length << 2
3119 | implied_prefix);
3120 }
3121 else
3122 {
3123 /* 3-byte VEX prefix. */
3124 unsigned int m, w;
3125
3126 i.vex.length = 3;
3127
3128 switch (i.tm.opcode_modifier.vexopcode)
3129 {
3130 case VEX0F:
3131 m = 0x1;
3132 i.vex.bytes[0] = 0xc4;
3133 break;
3134 case VEX0F38:
3135 m = 0x2;
3136 i.vex.bytes[0] = 0xc4;
3137 break;
3138 case VEX0F3A:
3139 m = 0x3;
3140 i.vex.bytes[0] = 0xc4;
3141 break;
3142 case XOP08:
3143 m = 0x8;
3144 i.vex.bytes[0] = 0x8f;
3145 break;
3146 case XOP09:
3147 m = 0x9;
3148 i.vex.bytes[0] = 0x8f;
3149 break;
3150 case XOP0A:
3151 m = 0xa;
3152 i.vex.bytes[0] = 0x8f;
3153 break;
3154 default:
3155 abort ();
3156 }
3157
3158 /* The high 3 bits of the second VEX byte are 1's compliment
3159 of RXB bits from REX. */
3160 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3161
3162 /* Check the REX.W bit. */
3163 w = (i.rex & REX_W) ? 1 : 0;
3164 if (i.tm.opcode_modifier.vexw == VEXW1)
3165 w = 1;
3166
3167 i.vex.bytes[2] = (w << 7
3168 | register_specifier << 3
3169 | vector_length << 2
3170 | implied_prefix);
3171 }
3172 }
3173
3174 /* Build the EVEX prefix. */
3175
3176 static void
3177 build_evex_prefix (void)
3178 {
3179 unsigned int register_specifier;
3180 unsigned int implied_prefix;
3181 unsigned int m, w;
3182 rex_byte vrex_used = 0;
3183
3184 /* Check register specifier. */
3185 if (i.vex.register_specifier)
3186 {
3187 gas_assert ((i.vrex & REX_X) == 0);
3188
3189 register_specifier = i.vex.register_specifier->reg_num;
3190 if ((i.vex.register_specifier->reg_flags & RegRex))
3191 register_specifier += 8;
3192 /* The upper 16 registers are encoded in the fourth byte of the
3193 EVEX prefix. */
3194 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3195 i.vex.bytes[3] = 0x8;
3196 register_specifier = ~register_specifier & 0xf;
3197 }
3198 else
3199 {
3200 register_specifier = 0xf;
3201
3202 /* Encode upper 16 vector index register in the fourth byte of
3203 the EVEX prefix. */
3204 if (!(i.vrex & REX_X))
3205 i.vex.bytes[3] = 0x8;
3206 else
3207 vrex_used |= REX_X;
3208 }
3209
3210 switch ((i.tm.base_opcode >> 8) & 0xff)
3211 {
3212 case 0:
3213 implied_prefix = 0;
3214 break;
3215 case DATA_PREFIX_OPCODE:
3216 implied_prefix = 1;
3217 break;
3218 case REPE_PREFIX_OPCODE:
3219 implied_prefix = 2;
3220 break;
3221 case REPNE_PREFIX_OPCODE:
3222 implied_prefix = 3;
3223 break;
3224 default:
3225 abort ();
3226 }
3227
3228 /* 4 byte EVEX prefix. */
3229 i.vex.length = 4;
3230 i.vex.bytes[0] = 0x62;
3231
3232 /* mmmm bits. */
3233 switch (i.tm.opcode_modifier.vexopcode)
3234 {
3235 case VEX0F:
3236 m = 1;
3237 break;
3238 case VEX0F38:
3239 m = 2;
3240 break;
3241 case VEX0F3A:
3242 m = 3;
3243 break;
3244 default:
3245 abort ();
3246 break;
3247 }
3248
3249 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3250 bits from REX. */
3251 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3252
3253 /* The fifth bit of the second EVEX byte is 1's compliment of the
3254 REX_R bit in VREX. */
3255 if (!(i.vrex & REX_R))
3256 i.vex.bytes[1] |= 0x10;
3257 else
3258 vrex_used |= REX_R;
3259
3260 if ((i.reg_operands + i.imm_operands) == i.operands)
3261 {
3262 /* When all operands are registers, the REX_X bit in REX is not
3263 used. We reuse it to encode the upper 16 registers, which is
3264 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3265 as 1's compliment. */
3266 if ((i.vrex & REX_B))
3267 {
3268 vrex_used |= REX_B;
3269 i.vex.bytes[1] &= ~0x40;
3270 }
3271 }
3272
3273 /* EVEX instructions shouldn't need the REX prefix. */
3274 i.vrex &= ~vrex_used;
3275 gas_assert (i.vrex == 0);
3276
3277 /* Check the REX.W bit. */
3278 w = (i.rex & REX_W) ? 1 : 0;
3279 if (i.tm.opcode_modifier.vexw)
3280 {
3281 if (i.tm.opcode_modifier.vexw == VEXW1)
3282 w = 1;
3283 }
3284 /* If w is not set it means we are dealing with WIG instruction. */
3285 else if (!w)
3286 {
3287 if (evexwig == evexw1)
3288 w = 1;
3289 }
3290
3291 /* Encode the U bit. */
3292 implied_prefix |= 0x4;
3293
3294 /* The third byte of the EVEX prefix. */
3295 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3296
3297 /* The fourth byte of the EVEX prefix. */
3298 /* The zeroing-masking bit. */
3299 if (i.mask && i.mask->zeroing)
3300 i.vex.bytes[3] |= 0x80;
3301
3302 /* Don't always set the broadcast bit if there is no RC. */
3303 if (!i.rounding)
3304 {
3305 /* Encode the vector length. */
3306 unsigned int vec_length;
3307
3308 switch (i.tm.opcode_modifier.evex)
3309 {
3310 case EVEXLIG: /* LL' is ignored */
3311 vec_length = evexlig << 5;
3312 break;
3313 case EVEX128:
3314 vec_length = 0 << 5;
3315 break;
3316 case EVEX256:
3317 vec_length = 1 << 5;
3318 break;
3319 case EVEX512:
3320 vec_length = 2 << 5;
3321 break;
3322 default:
3323 abort ();
3324 break;
3325 }
3326 i.vex.bytes[3] |= vec_length;
3327 /* Encode the broadcast bit. */
3328 if (i.broadcast)
3329 i.vex.bytes[3] |= 0x10;
3330 }
3331 else
3332 {
3333 if (i.rounding->type != saeonly)
3334 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3335 else
3336 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3337 }
3338
3339 if (i.mask && i.mask->mask)
3340 i.vex.bytes[3] |= i.mask->mask->reg_num;
3341 }
3342
3343 static void
3344 process_immext (void)
3345 {
3346 expressionS *exp;
3347
3348 if ((i.tm.cpu_flags.bitfield.cpusse3 || i.tm.cpu_flags.bitfield.cpusvme)
3349 && i.operands > 0)
3350 {
3351 /* MONITOR/MWAIT as well as SVME instructions have fixed operands
3352 with an opcode suffix which is coded in the same place as an
3353 8-bit immediate field would be.
3354 Here we check those operands and remove them afterwards. */
3355 unsigned int x;
3356
3357 for (x = 0; x < i.operands; x++)
3358 if (register_number (i.op[x].regs) != x)
3359 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3360 register_prefix, i.op[x].regs->reg_name, x + 1,
3361 i.tm.name);
3362
3363 i.operands = 0;
3364 }
3365
3366 if (i.tm.cpu_flags.bitfield.cpumwaitx && i.operands > 0)
3367 {
3368 /* MONITORX/MWAITX instructions have fixed operands with an opcode
3369 suffix which is coded in the same place as an 8-bit immediate
3370 field would be.
3371 Here we check those operands and remove them afterwards. */
3372 unsigned int x;
3373
3374 if (i.operands != 3)
3375 abort();
3376
3377 for (x = 0; x < 2; x++)
3378 if (register_number (i.op[x].regs) != x)
3379 goto bad_register_operand;
3380
3381 /* Check for third operand for mwaitx/monitorx insn. */
3382 if (register_number (i.op[x].regs)
3383 != (x + (i.tm.extension_opcode == 0xfb)))
3384 {
3385 bad_register_operand:
3386 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3387 register_prefix, i.op[x].regs->reg_name, x+1,
3388 i.tm.name);
3389 }
3390
3391 i.operands = 0;
3392 }
3393
3394 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3395 which is coded in the same place as an 8-bit immediate field
3396 would be. Here we fake an 8-bit immediate operand from the
3397 opcode suffix stored in tm.extension_opcode.
3398
3399 AVX instructions also use this encoding, for some of
3400 3 argument instructions. */
3401
3402 gas_assert (i.imm_operands <= 1
3403 && (i.operands <= 2
3404 || ((i.tm.opcode_modifier.vex
3405 || i.tm.opcode_modifier.evex)
3406 && i.operands <= 4)));
3407
3408 exp = &im_expressions[i.imm_operands++];
3409 i.op[i.operands].imms = exp;
3410 i.types[i.operands] = imm8;
3411 i.operands++;
3412 exp->X_op = O_constant;
3413 exp->X_add_number = i.tm.extension_opcode;
3414 i.tm.extension_opcode = None;
3415 }
3416
3417
3418 static int
3419 check_hle (void)
3420 {
3421 switch (i.tm.opcode_modifier.hleprefixok)
3422 {
3423 default:
3424 abort ();
3425 case HLEPrefixNone:
3426 as_bad (_("invalid instruction `%s' after `%s'"),
3427 i.tm.name, i.hle_prefix);
3428 return 0;
3429 case HLEPrefixLock:
3430 if (i.prefix[LOCK_PREFIX])
3431 return 1;
3432 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3433 return 0;
3434 case HLEPrefixAny:
3435 return 1;
3436 case HLEPrefixRelease:
3437 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3438 {
3439 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3440 i.tm.name);
3441 return 0;
3442 }
3443 if (i.mem_operands == 0
3444 || !operand_type_check (i.types[i.operands - 1], anymem))
3445 {
3446 as_bad (_("memory destination needed for instruction `%s'"
3447 " after `xrelease'"), i.tm.name);
3448 return 0;
3449 }
3450 return 1;
3451 }
3452 }
3453
3454 /* This is the guts of the machine-dependent assembler. LINE points to a
3455 machine dependent instruction. This function is supposed to emit
3456 the frags/bytes it assembles to. */
3457
3458 void
3459 md_assemble (char *line)
3460 {
3461 unsigned int j;
3462 char mnemonic[MAX_MNEM_SIZE];
3463 const insn_template *t;
3464
3465 /* Initialize globals. */
3466 memset (&i, '\0', sizeof (i));
3467 for (j = 0; j < MAX_OPERANDS; j++)
3468 i.reloc[j] = NO_RELOC;
3469 memset (disp_expressions, '\0', sizeof (disp_expressions));
3470 memset (im_expressions, '\0', sizeof (im_expressions));
3471 save_stack_p = save_stack;
3472
3473 /* First parse an instruction mnemonic & call i386_operand for the operands.
3474 We assume that the scrubber has arranged it so that line[0] is the valid
3475 start of a (possibly prefixed) mnemonic. */
3476
3477 line = parse_insn (line, mnemonic);
3478 if (line == NULL)
3479 return;
3480
3481 line = parse_operands (line, mnemonic);
3482 this_operand = -1;
3483 if (line == NULL)
3484 return;
3485
3486 /* Now we've parsed the mnemonic into a set of templates, and have the
3487 operands at hand. */
3488
3489 /* All intel opcodes have reversed operands except for "bound" and
3490 "enter". We also don't reverse intersegment "jmp" and "call"
3491 instructions with 2 immediate operands so that the immediate segment
3492 precedes the offset, as it does when in AT&T mode. */
3493 if (intel_syntax
3494 && i.operands > 1
3495 && (strcmp (mnemonic, "bound") != 0)
3496 && (strcmp (mnemonic, "invlpga") != 0)
3497 && !(operand_type_check (i.types[0], imm)
3498 && operand_type_check (i.types[1], imm)))
3499 swap_operands ();
3500
3501 /* The order of the immediates should be reversed
3502 for 2 immediates extrq and insertq instructions */
3503 if (i.imm_operands == 2
3504 && (strcmp (mnemonic, "extrq") == 0
3505 || strcmp (mnemonic, "insertq") == 0))
3506 swap_2_operands (0, 1);
3507
3508 if (i.imm_operands)
3509 optimize_imm ();
3510
3511 /* Don't optimize displacement for movabs since it only takes 64bit
3512 displacement. */
3513 if (i.disp_operands
3514 && i.disp_encoding != disp_encoding_32bit
3515 && (flag_code != CODE_64BIT
3516 || strcmp (mnemonic, "movabs") != 0))
3517 optimize_disp ();
3518
3519 /* Next, we find a template that matches the given insn,
3520 making sure the overlap of the given operands types is consistent
3521 with the template operand types. */
3522
3523 if (!(t = match_template ()))
3524 return;
3525
3526 if (sse_check != check_none
3527 && !i.tm.opcode_modifier.noavx
3528 && (i.tm.cpu_flags.bitfield.cpusse
3529 || i.tm.cpu_flags.bitfield.cpusse2
3530 || i.tm.cpu_flags.bitfield.cpusse3
3531 || i.tm.cpu_flags.bitfield.cpussse3
3532 || i.tm.cpu_flags.bitfield.cpusse4_1
3533 || i.tm.cpu_flags.bitfield.cpusse4_2))
3534 {
3535 (sse_check == check_warning
3536 ? as_warn
3537 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
3538 }
3539
3540 /* Zap movzx and movsx suffix. The suffix has been set from
3541 "word ptr" or "byte ptr" on the source operand in Intel syntax
3542 or extracted from mnemonic in AT&T syntax. But we'll use
3543 the destination register to choose the suffix for encoding. */
3544 if ((i.tm.base_opcode & ~9) == 0x0fb6)
3545 {
3546 /* In Intel syntax, there must be a suffix. In AT&T syntax, if
3547 there is no suffix, the default will be byte extension. */
3548 if (i.reg_operands != 2
3549 && !i.suffix
3550 && intel_syntax)
3551 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
3552
3553 i.suffix = 0;
3554 }
3555
3556 if (i.tm.opcode_modifier.fwait)
3557 if (!add_prefix (FWAIT_OPCODE))
3558 return;
3559
3560 /* Check if REP prefix is OK. */
3561 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
3562 {
3563 as_bad (_("invalid instruction `%s' after `%s'"),
3564 i.tm.name, i.rep_prefix);
3565 return;
3566 }
3567
3568 /* Check for lock without a lockable instruction. Destination operand
3569 must be memory unless it is xchg (0x86). */
3570 if (i.prefix[LOCK_PREFIX]
3571 && (!i.tm.opcode_modifier.islockable
3572 || i.mem_operands == 0
3573 || (i.tm.base_opcode != 0x86
3574 && !operand_type_check (i.types[i.operands - 1], anymem))))
3575 {
3576 as_bad (_("expecting lockable instruction after `lock'"));
3577 return;
3578 }
3579
3580 /* Check if HLE prefix is OK. */
3581 if (i.hle_prefix && !check_hle ())
3582 return;
3583
3584 /* Check BND prefix. */
3585 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
3586 as_bad (_("expecting valid branch instruction after `bnd'"));
3587
3588 if (i.tm.cpu_flags.bitfield.cpumpx
3589 && flag_code == CODE_64BIT
3590 && i.prefix[ADDR_PREFIX])
3591 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
3592
3593 /* Insert BND prefix. */
3594 if (add_bnd_prefix
3595 && i.tm.opcode_modifier.bndprefixok
3596 && !i.prefix[BND_PREFIX])
3597 add_prefix (BND_PREFIX_OPCODE);
3598
3599 /* Check string instruction segment overrides. */
3600 if (i.tm.opcode_modifier.isstring && i.mem_operands != 0)
3601 {
3602 if (!check_string ())
3603 return;
3604 i.disp_operands = 0;
3605 }
3606
3607 if (!process_suffix ())
3608 return;
3609
3610 /* Update operand types. */
3611 for (j = 0; j < i.operands; j++)
3612 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
3613
3614 /* Make still unresolved immediate matches conform to size of immediate
3615 given in i.suffix. */
3616 if (!finalize_imm ())
3617 return;
3618
3619 if (i.types[0].bitfield.imm1)
3620 i.imm_operands = 0; /* kludge for shift insns. */
3621
3622 /* We only need to check those implicit registers for instructions
3623 with 3 operands or less. */
3624 if (i.operands <= 3)
3625 for (j = 0; j < i.operands; j++)
3626 if (i.types[j].bitfield.inoutportreg
3627 || i.types[j].bitfield.shiftcount
3628 || i.types[j].bitfield.acc
3629 || i.types[j].bitfield.floatacc)
3630 i.reg_operands--;
3631
3632 /* ImmExt should be processed after SSE2AVX. */
3633 if (!i.tm.opcode_modifier.sse2avx
3634 && i.tm.opcode_modifier.immext)
3635 process_immext ();
3636
3637 /* For insns with operands there are more diddles to do to the opcode. */
3638 if (i.operands)
3639 {
3640 if (!process_operands ())
3641 return;
3642 }
3643 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
3644 {
3645 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
3646 as_warn (_("translating to `%sp'"), i.tm.name);
3647 }
3648
3649 if (i.tm.opcode_modifier.vex || i.tm.opcode_modifier.evex)
3650 {
3651 if (flag_code == CODE_16BIT)
3652 {
3653 as_bad (_("instruction `%s' isn't supported in 16-bit mode."),
3654 i.tm.name);
3655 return;
3656 }
3657
3658 if (i.tm.opcode_modifier.vex)
3659 build_vex_prefix (t);
3660 else
3661 build_evex_prefix ();
3662 }
3663
3664 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
3665 instructions may define INT_OPCODE as well, so avoid this corner
3666 case for those instructions that use MODRM. */
3667 if (i.tm.base_opcode == INT_OPCODE
3668 && !i.tm.opcode_modifier.modrm
3669 && i.op[0].imms->X_add_number == 3)
3670 {
3671 i.tm.base_opcode = INT3_OPCODE;
3672 i.imm_operands = 0;
3673 }
3674
3675 if ((i.tm.opcode_modifier.jump
3676 || i.tm.opcode_modifier.jumpbyte
3677 || i.tm.opcode_modifier.jumpdword)
3678 && i.op[0].disps->X_op == O_constant)
3679 {
3680 /* Convert "jmp constant" (and "call constant") to a jump (call) to
3681 the absolute address given by the constant. Since ix86 jumps and
3682 calls are pc relative, we need to generate a reloc. */
3683 i.op[0].disps->X_add_symbol = &abs_symbol;
3684 i.op[0].disps->X_op = O_symbol;
3685 }
3686
3687 if (i.tm.opcode_modifier.rex64)
3688 i.rex |= REX_W;
3689
3690 /* For 8 bit registers we need an empty rex prefix. Also if the
3691 instruction already has a prefix, we need to convert old
3692 registers to new ones. */
3693
3694 if ((i.types[0].bitfield.reg8
3695 && (i.op[0].regs->reg_flags & RegRex64) != 0)
3696 || (i.types[1].bitfield.reg8
3697 && (i.op[1].regs->reg_flags & RegRex64) != 0)
3698 || ((i.types[0].bitfield.reg8
3699 || i.types[1].bitfield.reg8)
3700 && i.rex != 0))
3701 {
3702 int x;
3703
3704 i.rex |= REX_OPCODE;
3705 for (x = 0; x < 2; x++)
3706 {
3707 /* Look for 8 bit operand that uses old registers. */
3708 if (i.types[x].bitfield.reg8
3709 && (i.op[x].regs->reg_flags & RegRex64) == 0)
3710 {
3711 /* In case it is "hi" register, give up. */
3712 if (i.op[x].regs->reg_num > 3)
3713 as_bad (_("can't encode register '%s%s' in an "
3714 "instruction requiring REX prefix."),
3715 register_prefix, i.op[x].regs->reg_name);
3716
3717 /* Otherwise it is equivalent to the extended register.
3718 Since the encoding doesn't change this is merely
3719 cosmetic cleanup for debug output. */
3720
3721 i.op[x].regs = i.op[x].regs + 8;
3722 }
3723 }
3724 }
3725
3726 if (i.rex != 0)
3727 add_prefix (REX_OPCODE | i.rex);
3728
3729 /* We are ready to output the insn. */
3730 output_insn ();
3731 }
3732
3733 static char *
3734 parse_insn (char *line, char *mnemonic)
3735 {
3736 char *l = line;
3737 char *token_start = l;
3738 char *mnem_p;
3739 int supported;
3740 const insn_template *t;
3741 char *dot_p = NULL;
3742
3743 while (1)
3744 {
3745 mnem_p = mnemonic;
3746 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
3747 {
3748 if (*mnem_p == '.')
3749 dot_p = mnem_p;
3750 mnem_p++;
3751 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
3752 {
3753 as_bad (_("no such instruction: `%s'"), token_start);
3754 return NULL;
3755 }
3756 l++;
3757 }
3758 if (!is_space_char (*l)
3759 && *l != END_OF_INSN
3760 && (intel_syntax
3761 || (*l != PREFIX_SEPARATOR
3762 && *l != ',')))
3763 {
3764 as_bad (_("invalid character %s in mnemonic"),
3765 output_invalid (*l));
3766 return NULL;
3767 }
3768 if (token_start == l)
3769 {
3770 if (!intel_syntax && *l == PREFIX_SEPARATOR)
3771 as_bad (_("expecting prefix; got nothing"));
3772 else
3773 as_bad (_("expecting mnemonic; got nothing"));
3774 return NULL;
3775 }
3776
3777 /* Look up instruction (or prefix) via hash table. */
3778 current_templates = (const templates *) hash_find (op_hash, mnemonic);
3779
3780 if (*l != END_OF_INSN
3781 && (!is_space_char (*l) || l[1] != END_OF_INSN)
3782 && current_templates
3783 && current_templates->start->opcode_modifier.isprefix)
3784 {
3785 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
3786 {
3787 as_bad ((flag_code != CODE_64BIT
3788 ? _("`%s' is only supported in 64-bit mode")
3789 : _("`%s' is not supported in 64-bit mode")),
3790 current_templates->start->name);
3791 return NULL;
3792 }
3793 /* If we are in 16-bit mode, do not allow addr16 or data16.
3794 Similarly, in 32-bit mode, do not allow addr32 or data32. */
3795 if ((current_templates->start->opcode_modifier.size16
3796 || current_templates->start->opcode_modifier.size32)
3797 && flag_code != CODE_64BIT
3798 && (current_templates->start->opcode_modifier.size32
3799 ^ (flag_code == CODE_16BIT)))
3800 {
3801 as_bad (_("redundant %s prefix"),
3802 current_templates->start->name);
3803 return NULL;
3804 }
3805 /* Add prefix, checking for repeated prefixes. */
3806 switch (add_prefix (current_templates->start->base_opcode))
3807 {
3808 case PREFIX_EXIST:
3809 return NULL;
3810 case PREFIX_REP:
3811 if (current_templates->start->cpu_flags.bitfield.cpuhle)
3812 i.hle_prefix = current_templates->start->name;
3813 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
3814 i.bnd_prefix = current_templates->start->name;
3815 else
3816 i.rep_prefix = current_templates->start->name;
3817 break;
3818 default:
3819 break;
3820 }
3821 /* Skip past PREFIX_SEPARATOR and reset token_start. */
3822 token_start = ++l;
3823 }
3824 else
3825 break;
3826 }
3827
3828 if (!current_templates)
3829 {
3830 /* Check if we should swap operand or force 32bit displacement in
3831 encoding. */
3832 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
3833 i.swap_operand = 1;
3834 else if (mnem_p - 3 == dot_p
3835 && dot_p[1] == 'd'
3836 && dot_p[2] == '8')
3837 i.disp_encoding = disp_encoding_8bit;
3838 else if (mnem_p - 4 == dot_p
3839 && dot_p[1] == 'd'
3840 && dot_p[2] == '3'
3841 && dot_p[3] == '2')
3842 i.disp_encoding = disp_encoding_32bit;
3843 else
3844 goto check_suffix;
3845 mnem_p = dot_p;
3846 *dot_p = '\0';
3847 current_templates = (const templates *) hash_find (op_hash, mnemonic);
3848 }
3849
3850 if (!current_templates)
3851 {
3852 check_suffix:
3853 /* See if we can get a match by trimming off a suffix. */
3854 switch (mnem_p[-1])
3855 {
3856 case WORD_MNEM_SUFFIX:
3857 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
3858 i.suffix = SHORT_MNEM_SUFFIX;
3859 else
3860 case BYTE_MNEM_SUFFIX:
3861 case QWORD_MNEM_SUFFIX:
3862 i.suffix = mnem_p[-1];
3863 mnem_p[-1] = '\0';
3864 current_templates = (const templates *) hash_find (op_hash,
3865 mnemonic);
3866 break;
3867 case SHORT_MNEM_SUFFIX:
3868 case LONG_MNEM_SUFFIX:
3869 if (!intel_syntax)
3870 {
3871 i.suffix = mnem_p[-1];
3872 mnem_p[-1] = '\0';
3873 current_templates = (const templates *) hash_find (op_hash,
3874 mnemonic);
3875 }
3876 break;
3877
3878 /* Intel Syntax. */
3879 case 'd':
3880 if (intel_syntax)
3881 {
3882 if (intel_float_operand (mnemonic) == 1)
3883 i.suffix = SHORT_MNEM_SUFFIX;
3884 else
3885 i.suffix = LONG_MNEM_SUFFIX;
3886 mnem_p[-1] = '\0';
3887 current_templates = (const templates *) hash_find (op_hash,
3888 mnemonic);
3889 }
3890 break;
3891 }
3892 if (!current_templates)
3893 {
3894 as_bad (_("no such instruction: `%s'"), token_start);
3895 return NULL;
3896 }
3897 }
3898
3899 if (current_templates->start->opcode_modifier.jump
3900 || current_templates->start->opcode_modifier.jumpbyte)
3901 {
3902 /* Check for a branch hint. We allow ",pt" and ",pn" for
3903 predict taken and predict not taken respectively.
3904 I'm not sure that branch hints actually do anything on loop
3905 and jcxz insns (JumpByte) for current Pentium4 chips. They
3906 may work in the future and it doesn't hurt to accept them
3907 now. */
3908 if (l[0] == ',' && l[1] == 'p')
3909 {
3910 if (l[2] == 't')
3911 {
3912 if (!add_prefix (DS_PREFIX_OPCODE))
3913 return NULL;
3914 l += 3;
3915 }
3916 else if (l[2] == 'n')
3917 {
3918 if (!add_prefix (CS_PREFIX_OPCODE))
3919 return NULL;
3920 l += 3;
3921 }
3922 }
3923 }
3924 /* Any other comma loses. */
3925 if (*l == ',')
3926 {
3927 as_bad (_("invalid character %s in mnemonic"),
3928 output_invalid (*l));
3929 return NULL;
3930 }
3931
3932 /* Check if instruction is supported on specified architecture. */
3933 supported = 0;
3934 for (t = current_templates->start; t < current_templates->end; ++t)
3935 {
3936 supported |= cpu_flags_match (t);
3937 if (supported == CPU_FLAGS_PERFECT_MATCH)
3938 goto skip;
3939 }
3940
3941 if (!(supported & CPU_FLAGS_64BIT_MATCH))
3942 {
3943 as_bad (flag_code == CODE_64BIT
3944 ? _("`%s' is not supported in 64-bit mode")
3945 : _("`%s' is only supported in 64-bit mode"),
3946 current_templates->start->name);
3947 return NULL;
3948 }
3949 if (supported != CPU_FLAGS_PERFECT_MATCH)
3950 {
3951 as_bad (_("`%s' is not supported on `%s%s'"),
3952 current_templates->start->name,
3953 cpu_arch_name ? cpu_arch_name : default_arch,
3954 cpu_sub_arch_name ? cpu_sub_arch_name : "");
3955 return NULL;
3956 }
3957
3958 skip:
3959 if (!cpu_arch_flags.bitfield.cpui386
3960 && (flag_code != CODE_16BIT))
3961 {
3962 as_warn (_("use .code16 to ensure correct addressing mode"));
3963 }
3964
3965 return l;
3966 }
3967
3968 static char *
3969 parse_operands (char *l, const char *mnemonic)
3970 {
3971 char *token_start;
3972
3973 /* 1 if operand is pending after ','. */
3974 unsigned int expecting_operand = 0;
3975
3976 /* Non-zero if operand parens not balanced. */
3977 unsigned int paren_not_balanced;
3978
3979 while (*l != END_OF_INSN)
3980 {
3981 /* Skip optional white space before operand. */
3982 if (is_space_char (*l))
3983 ++l;
3984 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
3985 {
3986 as_bad (_("invalid character %s before operand %d"),
3987 output_invalid (*l),
3988 i.operands + 1);
3989 return NULL;
3990 }
3991 token_start = l; /* After white space. */
3992 paren_not_balanced = 0;
3993 while (paren_not_balanced || *l != ',')
3994 {
3995 if (*l == END_OF_INSN)
3996 {
3997 if (paren_not_balanced)
3998 {
3999 if (!intel_syntax)
4000 as_bad (_("unbalanced parenthesis in operand %d."),
4001 i.operands + 1);
4002 else
4003 as_bad (_("unbalanced brackets in operand %d."),
4004 i.operands + 1);
4005 return NULL;
4006 }
4007 else
4008 break; /* we are done */
4009 }
4010 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4011 {
4012 as_bad (_("invalid character %s in operand %d"),
4013 output_invalid (*l),
4014 i.operands + 1);
4015 return NULL;
4016 }
4017 if (!intel_syntax)
4018 {
4019 if (*l == '(')
4020 ++paren_not_balanced;
4021 if (*l == ')')
4022 --paren_not_balanced;
4023 }
4024 else
4025 {
4026 if (*l == '[')
4027 ++paren_not_balanced;
4028 if (*l == ']')
4029 --paren_not_balanced;
4030 }
4031 l++;
4032 }
4033 if (l != token_start)
4034 { /* Yes, we've read in another operand. */
4035 unsigned int operand_ok;
4036 this_operand = i.operands++;
4037 i.types[this_operand].bitfield.unspecified = 1;
4038 if (i.operands > MAX_OPERANDS)
4039 {
4040 as_bad (_("spurious operands; (%d operands/instruction max)"),
4041 MAX_OPERANDS);
4042 return NULL;
4043 }
4044 /* Now parse operand adding info to 'i' as we go along. */
4045 END_STRING_AND_SAVE (l);
4046
4047 if (intel_syntax)
4048 operand_ok =
4049 i386_intel_operand (token_start,
4050 intel_float_operand (mnemonic));
4051 else
4052 operand_ok = i386_att_operand (token_start);
4053
4054 RESTORE_END_STRING (l);
4055 if (!operand_ok)
4056 return NULL;
4057 }
4058 else
4059 {
4060 if (expecting_operand)
4061 {
4062 expecting_operand_after_comma:
4063 as_bad (_("expecting operand after ','; got nothing"));
4064 return NULL;
4065 }
4066 if (*l == ',')
4067 {
4068 as_bad (_("expecting operand before ','; got nothing"));
4069 return NULL;
4070 }
4071 }
4072
4073 /* Now *l must be either ',' or END_OF_INSN. */
4074 if (*l == ',')
4075 {
4076 if (*++l == END_OF_INSN)
4077 {
4078 /* Just skip it, if it's \n complain. */
4079 goto expecting_operand_after_comma;
4080 }
4081 expecting_operand = 1;
4082 }
4083 }
4084 return l;
4085 }
4086
4087 static void
4088 swap_2_operands (int xchg1, int xchg2)
4089 {
4090 union i386_op temp_op;
4091 i386_operand_type temp_type;
4092 enum bfd_reloc_code_real temp_reloc;
4093
4094 temp_type = i.types[xchg2];
4095 i.types[xchg2] = i.types[xchg1];
4096 i.types[xchg1] = temp_type;
4097 temp_op = i.op[xchg2];
4098 i.op[xchg2] = i.op[xchg1];
4099 i.op[xchg1] = temp_op;
4100 temp_reloc = i.reloc[xchg2];
4101 i.reloc[xchg2] = i.reloc[xchg1];
4102 i.reloc[xchg1] = temp_reloc;
4103
4104 if (i.mask)
4105 {
4106 if (i.mask->operand == xchg1)
4107 i.mask->operand = xchg2;
4108 else if (i.mask->operand == xchg2)
4109 i.mask->operand = xchg1;
4110 }
4111 if (i.broadcast)
4112 {
4113 if (i.broadcast->operand == xchg1)
4114 i.broadcast->operand = xchg2;
4115 else if (i.broadcast->operand == xchg2)
4116 i.broadcast->operand = xchg1;
4117 }
4118 if (i.rounding)
4119 {
4120 if (i.rounding->operand == xchg1)
4121 i.rounding->operand = xchg2;
4122 else if (i.rounding->operand == xchg2)
4123 i.rounding->operand = xchg1;
4124 }
4125 }
4126
4127 static void
4128 swap_operands (void)
4129 {
4130 switch (i.operands)
4131 {
4132 case 5:
4133 case 4:
4134 swap_2_operands (1, i.operands - 2);
4135 case 3:
4136 case 2:
4137 swap_2_operands (0, i.operands - 1);
4138 break;
4139 default:
4140 abort ();
4141 }
4142
4143 if (i.mem_operands == 2)
4144 {
4145 const seg_entry *temp_seg;
4146 temp_seg = i.seg[0];
4147 i.seg[0] = i.seg[1];
4148 i.seg[1] = temp_seg;
4149 }
4150 }
4151
4152 /* Try to ensure constant immediates are represented in the smallest
4153 opcode possible. */
4154 static void
4155 optimize_imm (void)
4156 {
4157 char guess_suffix = 0;
4158 int op;
4159
4160 if (i.suffix)
4161 guess_suffix = i.suffix;
4162 else if (i.reg_operands)
4163 {
4164 /* Figure out a suffix from the last register operand specified.
4165 We can't do this properly yet, ie. excluding InOutPortReg,
4166 but the following works for instructions with immediates.
4167 In any case, we can't set i.suffix yet. */
4168 for (op = i.operands; --op >= 0;)
4169 if (i.types[op].bitfield.reg8)
4170 {
4171 guess_suffix = BYTE_MNEM_SUFFIX;
4172 break;
4173 }
4174 else if (i.types[op].bitfield.reg16)
4175 {
4176 guess_suffix = WORD_MNEM_SUFFIX;
4177 break;
4178 }
4179 else if (i.types[op].bitfield.reg32)
4180 {
4181 guess_suffix = LONG_MNEM_SUFFIX;
4182 break;
4183 }
4184 else if (i.types[op].bitfield.reg64)
4185 {
4186 guess_suffix = QWORD_MNEM_SUFFIX;
4187 break;
4188 }
4189 }
4190 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
4191 guess_suffix = WORD_MNEM_SUFFIX;
4192
4193 for (op = i.operands; --op >= 0;)
4194 if (operand_type_check (i.types[op], imm))
4195 {
4196 switch (i.op[op].imms->X_op)
4197 {
4198 case O_constant:
4199 /* If a suffix is given, this operand may be shortened. */
4200 switch (guess_suffix)
4201 {
4202 case LONG_MNEM_SUFFIX:
4203 i.types[op].bitfield.imm32 = 1;
4204 i.types[op].bitfield.imm64 = 1;
4205 break;
4206 case WORD_MNEM_SUFFIX:
4207 i.types[op].bitfield.imm16 = 1;
4208 i.types[op].bitfield.imm32 = 1;
4209 i.types[op].bitfield.imm32s = 1;
4210 i.types[op].bitfield.imm64 = 1;
4211 break;
4212 case BYTE_MNEM_SUFFIX:
4213 i.types[op].bitfield.imm8 = 1;
4214 i.types[op].bitfield.imm8s = 1;
4215 i.types[op].bitfield.imm16 = 1;
4216 i.types[op].bitfield.imm32 = 1;
4217 i.types[op].bitfield.imm32s = 1;
4218 i.types[op].bitfield.imm64 = 1;
4219 break;
4220 }
4221
4222 /* If this operand is at most 16 bits, convert it
4223 to a signed 16 bit number before trying to see
4224 whether it will fit in an even smaller size.
4225 This allows a 16-bit operand such as $0xffe0 to
4226 be recognised as within Imm8S range. */
4227 if ((i.types[op].bitfield.imm16)
4228 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
4229 {
4230 i.op[op].imms->X_add_number =
4231 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
4232 }
4233 #ifdef BFD64
4234 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
4235 if ((i.types[op].bitfield.imm32)
4236 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
4237 == 0))
4238 {
4239 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
4240 ^ ((offsetT) 1 << 31))
4241 - ((offsetT) 1 << 31));
4242 }
4243 #endif
4244 i.types[op]
4245 = operand_type_or (i.types[op],
4246 smallest_imm_type (i.op[op].imms->X_add_number));
4247
4248 /* We must avoid matching of Imm32 templates when 64bit
4249 only immediate is available. */
4250 if (guess_suffix == QWORD_MNEM_SUFFIX)
4251 i.types[op].bitfield.imm32 = 0;
4252 break;
4253
4254 case O_absent:
4255 case O_register:
4256 abort ();
4257
4258 /* Symbols and expressions. */
4259 default:
4260 /* Convert symbolic operand to proper sizes for matching, but don't
4261 prevent matching a set of insns that only supports sizes other
4262 than those matching the insn suffix. */
4263 {
4264 i386_operand_type mask, allowed;
4265 const insn_template *t;
4266
4267 operand_type_set (&mask, 0);
4268 operand_type_set (&allowed, 0);
4269
4270 for (t = current_templates->start;
4271 t < current_templates->end;
4272 ++t)
4273 allowed = operand_type_or (allowed,
4274 t->operand_types[op]);
4275 switch (guess_suffix)
4276 {
4277 case QWORD_MNEM_SUFFIX:
4278 mask.bitfield.imm64 = 1;
4279 mask.bitfield.imm32s = 1;
4280 break;
4281 case LONG_MNEM_SUFFIX:
4282 mask.bitfield.imm32 = 1;
4283 break;
4284 case WORD_MNEM_SUFFIX:
4285 mask.bitfield.imm16 = 1;
4286 break;
4287 case BYTE_MNEM_SUFFIX:
4288 mask.bitfield.imm8 = 1;
4289 break;
4290 default:
4291 break;
4292 }
4293 allowed = operand_type_and (mask, allowed);
4294 if (!operand_type_all_zero (&allowed))
4295 i.types[op] = operand_type_and (i.types[op], mask);
4296 }
4297 break;
4298 }
4299 }
4300 }
4301
4302 /* Try to use the smallest displacement type too. */
4303 static void
4304 optimize_disp (void)
4305 {
4306 int op;
4307
4308 for (op = i.operands; --op >= 0;)
4309 if (operand_type_check (i.types[op], disp))
4310 {
4311 if (i.op[op].disps->X_op == O_constant)
4312 {
4313 offsetT op_disp = i.op[op].disps->X_add_number;
4314
4315 if (i.types[op].bitfield.disp16
4316 && (op_disp & ~(offsetT) 0xffff) == 0)
4317 {
4318 /* If this operand is at most 16 bits, convert
4319 to a signed 16 bit number and don't use 64bit
4320 displacement. */
4321 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
4322 i.types[op].bitfield.disp64 = 0;
4323 }
4324 #ifdef BFD64
4325 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
4326 if (i.types[op].bitfield.disp32
4327 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
4328 {
4329 /* If this operand is at most 32 bits, convert
4330 to a signed 32 bit number and don't use 64bit
4331 displacement. */
4332 op_disp &= (((offsetT) 2 << 31) - 1);
4333 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
4334 i.types[op].bitfield.disp64 = 0;
4335 }
4336 #endif
4337 if (!op_disp && i.types[op].bitfield.baseindex)
4338 {
4339 i.types[op].bitfield.disp8 = 0;
4340 i.types[op].bitfield.disp16 = 0;
4341 i.types[op].bitfield.disp32 = 0;
4342 i.types[op].bitfield.disp32s = 0;
4343 i.types[op].bitfield.disp64 = 0;
4344 i.op[op].disps = 0;
4345 i.disp_operands--;
4346 }
4347 else if (flag_code == CODE_64BIT)
4348 {
4349 if (fits_in_signed_long (op_disp))
4350 {
4351 i.types[op].bitfield.disp64 = 0;
4352 i.types[op].bitfield.disp32s = 1;
4353 }
4354 if (i.prefix[ADDR_PREFIX]
4355 && fits_in_unsigned_long (op_disp))
4356 i.types[op].bitfield.disp32 = 1;
4357 }
4358 if ((i.types[op].bitfield.disp32
4359 || i.types[op].bitfield.disp32s
4360 || i.types[op].bitfield.disp16)
4361 && fits_in_signed_byte (op_disp))
4362 i.types[op].bitfield.disp8 = 1;
4363 }
4364 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
4365 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
4366 {
4367 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
4368 i.op[op].disps, 0, i.reloc[op]);
4369 i.types[op].bitfield.disp8 = 0;
4370 i.types[op].bitfield.disp16 = 0;
4371 i.types[op].bitfield.disp32 = 0;
4372 i.types[op].bitfield.disp32s = 0;
4373 i.types[op].bitfield.disp64 = 0;
4374 }
4375 else
4376 /* We only support 64bit displacement on constants. */
4377 i.types[op].bitfield.disp64 = 0;
4378 }
4379 }
4380
4381 /* Check if operands are valid for the instruction. */
4382
4383 static int
4384 check_VecOperands (const insn_template *t)
4385 {
4386 unsigned int op;
4387
4388 /* Without VSIB byte, we can't have a vector register for index. */
4389 if (!t->opcode_modifier.vecsib
4390 && i.index_reg
4391 && (i.index_reg->reg_type.bitfield.regxmm
4392 || i.index_reg->reg_type.bitfield.regymm
4393 || i.index_reg->reg_type.bitfield.regzmm))
4394 {
4395 i.error = unsupported_vector_index_register;
4396 return 1;
4397 }
4398
4399 /* Check if default mask is allowed. */
4400 if (t->opcode_modifier.nodefmask
4401 && (!i.mask || i.mask->mask->reg_num == 0))
4402 {
4403 i.error = no_default_mask;
4404 return 1;
4405 }
4406
4407 /* For VSIB byte, we need a vector register for index, and all vector
4408 registers must be distinct. */
4409 if (t->opcode_modifier.vecsib)
4410 {
4411 if (!i.index_reg
4412 || !((t->opcode_modifier.vecsib == VecSIB128
4413 && i.index_reg->reg_type.bitfield.regxmm)
4414 || (t->opcode_modifier.vecsib == VecSIB256
4415 && i.index_reg->reg_type.bitfield.regymm)
4416 || (t->opcode_modifier.vecsib == VecSIB512
4417 && i.index_reg->reg_type.bitfield.regzmm)))
4418 {
4419 i.error = invalid_vsib_address;
4420 return 1;
4421 }
4422
4423 gas_assert (i.reg_operands == 2 || i.mask);
4424 if (i.reg_operands == 2 && !i.mask)
4425 {
4426 gas_assert (i.types[0].bitfield.regxmm
4427 || i.types[0].bitfield.regymm);
4428 gas_assert (i.types[2].bitfield.regxmm
4429 || i.types[2].bitfield.regymm);
4430 if (operand_check == check_none)
4431 return 0;
4432 if (register_number (i.op[0].regs)
4433 != register_number (i.index_reg)
4434 && register_number (i.op[2].regs)
4435 != register_number (i.index_reg)
4436 && register_number (i.op[0].regs)
4437 != register_number (i.op[2].regs))
4438 return 0;
4439 if (operand_check == check_error)
4440 {
4441 i.error = invalid_vector_register_set;
4442 return 1;
4443 }
4444 as_warn (_("mask, index, and destination registers should be distinct"));
4445 }
4446 else if (i.reg_operands == 1 && i.mask)
4447 {
4448 if ((i.types[1].bitfield.regymm
4449 || i.types[1].bitfield.regzmm)
4450 && (register_number (i.op[1].regs)
4451 == register_number (i.index_reg)))
4452 {
4453 if (operand_check == check_error)
4454 {
4455 i.error = invalid_vector_register_set;
4456 return 1;
4457 }
4458 if (operand_check != check_none)
4459 as_warn (_("index and destination registers should be distinct"));
4460 }
4461 }
4462 }
4463
4464 /* Check if broadcast is supported by the instruction and is applied
4465 to the memory operand. */
4466 if (i.broadcast)
4467 {
4468 int broadcasted_opnd_size;
4469
4470 /* Check if specified broadcast is supported in this instruction,
4471 and it's applied to memory operand of DWORD or QWORD type,
4472 depending on VecESize. */
4473 if (i.broadcast->type != t->opcode_modifier.broadcast
4474 || !i.types[i.broadcast->operand].bitfield.mem
4475 || (t->opcode_modifier.vecesize == 0
4476 && !i.types[i.broadcast->operand].bitfield.dword
4477 && !i.types[i.broadcast->operand].bitfield.unspecified)
4478 || (t->opcode_modifier.vecesize == 1
4479 && !i.types[i.broadcast->operand].bitfield.qword
4480 && !i.types[i.broadcast->operand].bitfield.unspecified))
4481 goto bad_broadcast;
4482
4483 broadcasted_opnd_size = t->opcode_modifier.vecesize ? 64 : 32;
4484 if (i.broadcast->type == BROADCAST_1TO16)
4485 broadcasted_opnd_size <<= 4; /* Broadcast 1to16. */
4486 else if (i.broadcast->type == BROADCAST_1TO8)
4487 broadcasted_opnd_size <<= 3; /* Broadcast 1to8. */
4488 else if (i.broadcast->type == BROADCAST_1TO4)
4489 broadcasted_opnd_size <<= 2; /* Broadcast 1to4. */
4490 else if (i.broadcast->type == BROADCAST_1TO2)
4491 broadcasted_opnd_size <<= 1; /* Broadcast 1to2. */
4492 else
4493 goto bad_broadcast;
4494
4495 if ((broadcasted_opnd_size == 256
4496 && !t->operand_types[i.broadcast->operand].bitfield.ymmword)
4497 || (broadcasted_opnd_size == 512
4498 && !t->operand_types[i.broadcast->operand].bitfield.zmmword))
4499 {
4500 bad_broadcast:
4501 i.error = unsupported_broadcast;
4502 return 1;
4503 }
4504 }
4505 /* If broadcast is supported in this instruction, we need to check if
4506 operand of one-element size isn't specified without broadcast. */
4507 else if (t->opcode_modifier.broadcast && i.mem_operands)
4508 {
4509 /* Find memory operand. */
4510 for (op = 0; op < i.operands; op++)
4511 if (operand_type_check (i.types[op], anymem))
4512 break;
4513 gas_assert (op < i.operands);
4514 /* Check size of the memory operand. */
4515 if ((t->opcode_modifier.vecesize == 0
4516 && i.types[op].bitfield.dword)
4517 || (t->opcode_modifier.vecesize == 1
4518 && i.types[op].bitfield.qword))
4519 {
4520 i.error = broadcast_needed;
4521 return 1;
4522 }
4523 }
4524
4525 /* Check if requested masking is supported. */
4526 if (i.mask
4527 && (!t->opcode_modifier.masking
4528 || (i.mask->zeroing
4529 && t->opcode_modifier.masking == MERGING_MASKING)))
4530 {
4531 i.error = unsupported_masking;
4532 return 1;
4533 }
4534
4535 /* Check if masking is applied to dest operand. */
4536 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
4537 {
4538 i.error = mask_not_on_destination;
4539 return 1;
4540 }
4541
4542 /* Check RC/SAE. */
4543 if (i.rounding)
4544 {
4545 if ((i.rounding->type != saeonly
4546 && !t->opcode_modifier.staticrounding)
4547 || (i.rounding->type == saeonly
4548 && (t->opcode_modifier.staticrounding
4549 || !t->opcode_modifier.sae)))
4550 {
4551 i.error = unsupported_rc_sae;
4552 return 1;
4553 }
4554 /* If the instruction has several immediate operands and one of
4555 them is rounding, the rounding operand should be the last
4556 immediate operand. */
4557 if (i.imm_operands > 1
4558 && i.rounding->operand != (int) (i.imm_operands - 1))
4559 {
4560 i.error = rc_sae_operand_not_last_imm;
4561 return 1;
4562 }
4563 }
4564
4565 /* Check vector Disp8 operand. */
4566 if (t->opcode_modifier.disp8memshift)
4567 {
4568 if (i.broadcast)
4569 i.memshift = t->opcode_modifier.vecesize ? 3 : 2;
4570 else
4571 i.memshift = t->opcode_modifier.disp8memshift;
4572
4573 for (op = 0; op < i.operands; op++)
4574 if (operand_type_check (i.types[op], disp)
4575 && i.op[op].disps->X_op == O_constant)
4576 {
4577 offsetT value = i.op[op].disps->X_add_number;
4578 int vec_disp8_ok
4579 = (i.disp_encoding != disp_encoding_32bit
4580 && fits_in_vec_disp8 (value));
4581 if (t->operand_types [op].bitfield.vec_disp8)
4582 {
4583 if (vec_disp8_ok)
4584 i.types[op].bitfield.vec_disp8 = 1;
4585 else
4586 {
4587 /* Vector insn can only have Vec_Disp8/Disp32 in
4588 32/64bit modes, and Vec_Disp8/Disp16 in 16bit
4589 mode. */
4590 i.types[op].bitfield.disp8 = 0;
4591 if (flag_code != CODE_16BIT)
4592 i.types[op].bitfield.disp16 = 0;
4593 }
4594 }
4595 else if (flag_code != CODE_16BIT)
4596 {
4597 /* One form of this instruction supports vector Disp8.
4598 Try vector Disp8 if we need to use Disp32. */
4599 if (vec_disp8_ok && !fits_in_signed_byte (value))
4600 {
4601 i.error = try_vector_disp8;
4602 return 1;
4603 }
4604 }
4605 }
4606 }
4607 else
4608 i.memshift = -1;
4609
4610 return 0;
4611 }
4612
4613 /* Check if operands are valid for the instruction. Update VEX
4614 operand types. */
4615
4616 static int
4617 VEX_check_operands (const insn_template *t)
4618 {
4619 /* VREX is only valid with EVEX prefix. */
4620 if (i.need_vrex && !t->opcode_modifier.evex)
4621 {
4622 i.error = invalid_register_operand;
4623 return 1;
4624 }
4625
4626 if (!t->opcode_modifier.vex)
4627 return 0;
4628
4629 /* Only check VEX_Imm4, which must be the first operand. */
4630 if (t->operand_types[0].bitfield.vec_imm4)
4631 {
4632 if (i.op[0].imms->X_op != O_constant
4633 || !fits_in_imm4 (i.op[0].imms->X_add_number))
4634 {
4635 i.error = bad_imm4;
4636 return 1;
4637 }
4638
4639 /* Turn off Imm8 so that update_imm won't complain. */
4640 i.types[0] = vec_imm4;
4641 }
4642
4643 return 0;
4644 }
4645
4646 static const insn_template *
4647 match_template (void)
4648 {
4649 /* Points to template once we've found it. */
4650 const insn_template *t;
4651 i386_operand_type overlap0, overlap1, overlap2, overlap3;
4652 i386_operand_type overlap4;
4653 unsigned int found_reverse_match;
4654 i386_opcode_modifier suffix_check;
4655 i386_operand_type operand_types [MAX_OPERANDS];
4656 int addr_prefix_disp;
4657 unsigned int j;
4658 unsigned int found_cpu_match;
4659 unsigned int check_register;
4660 enum i386_error specific_error = 0;
4661
4662 #if MAX_OPERANDS != 5
4663 # error "MAX_OPERANDS must be 5."
4664 #endif
4665
4666 found_reverse_match = 0;
4667 addr_prefix_disp = -1;
4668
4669 memset (&suffix_check, 0, sizeof (suffix_check));
4670 if (i.suffix == BYTE_MNEM_SUFFIX)
4671 suffix_check.no_bsuf = 1;
4672 else if (i.suffix == WORD_MNEM_SUFFIX)
4673 suffix_check.no_wsuf = 1;
4674 else if (i.suffix == SHORT_MNEM_SUFFIX)
4675 suffix_check.no_ssuf = 1;
4676 else if (i.suffix == LONG_MNEM_SUFFIX)
4677 suffix_check.no_lsuf = 1;
4678 else if (i.suffix == QWORD_MNEM_SUFFIX)
4679 suffix_check.no_qsuf = 1;
4680 else if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
4681 suffix_check.no_ldsuf = 1;
4682
4683 /* Must have right number of operands. */
4684 i.error = number_of_operands_mismatch;
4685
4686 for (t = current_templates->start; t < current_templates->end; t++)
4687 {
4688 addr_prefix_disp = -1;
4689
4690 if (i.operands != t->operands)
4691 continue;
4692
4693 /* Check processor support. */
4694 i.error = unsupported;
4695 found_cpu_match = (cpu_flags_match (t)
4696 == CPU_FLAGS_PERFECT_MATCH);
4697 if (!found_cpu_match)
4698 continue;
4699
4700 /* Check old gcc support. */
4701 i.error = old_gcc_only;
4702 if (!old_gcc && t->opcode_modifier.oldgcc)
4703 continue;
4704
4705 /* Check AT&T mnemonic. */
4706 i.error = unsupported_with_intel_mnemonic;
4707 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
4708 continue;
4709
4710 /* Check AT&T/Intel syntax. */
4711 i.error = unsupported_syntax;
4712 if ((intel_syntax && t->opcode_modifier.attsyntax)
4713 || (!intel_syntax && t->opcode_modifier.intelsyntax))
4714 continue;
4715
4716 /* Check the suffix, except for some instructions in intel mode. */
4717 i.error = invalid_instruction_suffix;
4718 if ((!intel_syntax || !t->opcode_modifier.ignoresize)
4719 && ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
4720 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
4721 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
4722 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
4723 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
4724 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf)))
4725 continue;
4726
4727 if (!operand_size_match (t))
4728 continue;
4729
4730 for (j = 0; j < MAX_OPERANDS; j++)
4731 operand_types[j] = t->operand_types[j];
4732
4733 /* In general, don't allow 64-bit operands in 32-bit mode. */
4734 if (i.suffix == QWORD_MNEM_SUFFIX
4735 && flag_code != CODE_64BIT
4736 && (intel_syntax
4737 ? (!t->opcode_modifier.ignoresize
4738 && !intel_float_operand (t->name))
4739 : intel_float_operand (t->name) != 2)
4740 && ((!operand_types[0].bitfield.regmmx
4741 && !operand_types[0].bitfield.regxmm
4742 && !operand_types[0].bitfield.regymm
4743 && !operand_types[0].bitfield.regzmm)
4744 || (!operand_types[t->operands > 1].bitfield.regmmx
4745 && operand_types[t->operands > 1].bitfield.regxmm
4746 && operand_types[t->operands > 1].bitfield.regymm
4747 && operand_types[t->operands > 1].bitfield.regzmm))
4748 && (t->base_opcode != 0x0fc7
4749 || t->extension_opcode != 1 /* cmpxchg8b */))
4750 continue;
4751
4752 /* In general, don't allow 32-bit operands on pre-386. */
4753 else if (i.suffix == LONG_MNEM_SUFFIX
4754 && !cpu_arch_flags.bitfield.cpui386
4755 && (intel_syntax
4756 ? (!t->opcode_modifier.ignoresize
4757 && !intel_float_operand (t->name))
4758 : intel_float_operand (t->name) != 2)
4759 && ((!operand_types[0].bitfield.regmmx
4760 && !operand_types[0].bitfield.regxmm)
4761 || (!operand_types[t->operands > 1].bitfield.regmmx
4762 && operand_types[t->operands > 1].bitfield.regxmm)))
4763 continue;
4764
4765 /* Do not verify operands when there are none. */
4766 else
4767 {
4768 if (!t->operands)
4769 /* We've found a match; break out of loop. */
4770 break;
4771 }
4772
4773 /* Address size prefix will turn Disp64/Disp32/Disp16 operand
4774 into Disp32/Disp16/Disp32 operand. */
4775 if (i.prefix[ADDR_PREFIX] != 0)
4776 {
4777 /* There should be only one Disp operand. */
4778 switch (flag_code)
4779 {
4780 case CODE_16BIT:
4781 for (j = 0; j < MAX_OPERANDS; j++)
4782 {
4783 if (operand_types[j].bitfield.disp16)
4784 {
4785 addr_prefix_disp = j;
4786 operand_types[j].bitfield.disp32 = 1;
4787 operand_types[j].bitfield.disp16 = 0;
4788 break;
4789 }
4790 }
4791 break;
4792 case CODE_32BIT:
4793 for (j = 0; j < MAX_OPERANDS; j++)
4794 {
4795 if (operand_types[j].bitfield.disp32)
4796 {
4797 addr_prefix_disp = j;
4798 operand_types[j].bitfield.disp32 = 0;
4799 operand_types[j].bitfield.disp16 = 1;
4800 break;
4801 }
4802 }
4803 break;
4804 case CODE_64BIT:
4805 for (j = 0; j < MAX_OPERANDS; j++)
4806 {
4807 if (operand_types[j].bitfield.disp64)
4808 {
4809 addr_prefix_disp = j;
4810 operand_types[j].bitfield.disp64 = 0;
4811 operand_types[j].bitfield.disp32 = 1;
4812 break;
4813 }
4814 }
4815 break;
4816 }
4817 }
4818
4819 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
4820 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
4821 continue;
4822
4823 /* We check register size if needed. */
4824 check_register = t->opcode_modifier.checkregsize;
4825 overlap0 = operand_type_and (i.types[0], operand_types[0]);
4826 switch (t->operands)
4827 {
4828 case 1:
4829 if (!operand_type_match (overlap0, i.types[0]))
4830 continue;
4831 break;
4832 case 2:
4833 /* xchg %eax, %eax is a special case. It is an aliase for nop
4834 only in 32bit mode and we can use opcode 0x90. In 64bit
4835 mode, we can't use 0x90 for xchg %eax, %eax since it should
4836 zero-extend %eax to %rax. */
4837 if (flag_code == CODE_64BIT
4838 && t->base_opcode == 0x90
4839 && operand_type_equal (&i.types [0], &acc32)
4840 && operand_type_equal (&i.types [1], &acc32))
4841 continue;
4842 if (i.swap_operand)
4843 {
4844 /* If we swap operand in encoding, we either match
4845 the next one or reverse direction of operands. */
4846 if (t->opcode_modifier.s)
4847 continue;
4848 else if (t->opcode_modifier.d)
4849 goto check_reverse;
4850 }
4851
4852 case 3:
4853 /* If we swap operand in encoding, we match the next one. */
4854 if (i.swap_operand && t->opcode_modifier.s)
4855 continue;
4856 case 4:
4857 case 5:
4858 overlap1 = operand_type_and (i.types[1], operand_types[1]);
4859 if (!operand_type_match (overlap0, i.types[0])
4860 || !operand_type_match (overlap1, i.types[1])
4861 || (check_register
4862 && !operand_type_register_match (overlap0, i.types[0],
4863 operand_types[0],
4864 overlap1, i.types[1],
4865 operand_types[1])))
4866 {
4867 /* Check if other direction is valid ... */
4868 if (!t->opcode_modifier.d && !t->opcode_modifier.floatd)
4869 continue;
4870
4871 check_reverse:
4872 /* Try reversing direction of operands. */
4873 overlap0 = operand_type_and (i.types[0], operand_types[1]);
4874 overlap1 = operand_type_and (i.types[1], operand_types[0]);
4875 if (!operand_type_match (overlap0, i.types[0])
4876 || !operand_type_match (overlap1, i.types[1])
4877 || (check_register
4878 && !operand_type_register_match (overlap0,
4879 i.types[0],
4880 operand_types[1],
4881 overlap1,
4882 i.types[1],
4883 operand_types[0])))
4884 {
4885 /* Does not match either direction. */
4886 continue;
4887 }
4888 /* found_reverse_match holds which of D or FloatDR
4889 we've found. */
4890 if (t->opcode_modifier.d)
4891 found_reverse_match = Opcode_D;
4892 else if (t->opcode_modifier.floatd)
4893 found_reverse_match = Opcode_FloatD;
4894 else
4895 found_reverse_match = 0;
4896 if (t->opcode_modifier.floatr)
4897 found_reverse_match |= Opcode_FloatR;
4898 }
4899 else
4900 {
4901 /* Found a forward 2 operand match here. */
4902 switch (t->operands)
4903 {
4904 case 5:
4905 overlap4 = operand_type_and (i.types[4],
4906 operand_types[4]);
4907 case 4:
4908 overlap3 = operand_type_and (i.types[3],
4909 operand_types[3]);
4910 case 3:
4911 overlap2 = operand_type_and (i.types[2],
4912 operand_types[2]);
4913 break;
4914 }
4915
4916 switch (t->operands)
4917 {
4918 case 5:
4919 if (!operand_type_match (overlap4, i.types[4])
4920 || !operand_type_register_match (overlap3,
4921 i.types[3],
4922 operand_types[3],
4923 overlap4,
4924 i.types[4],
4925 operand_types[4]))
4926 continue;
4927 case 4:
4928 if (!operand_type_match (overlap3, i.types[3])
4929 || (check_register
4930 && !operand_type_register_match (overlap2,
4931 i.types[2],
4932 operand_types[2],
4933 overlap3,
4934 i.types[3],
4935 operand_types[3])))
4936 continue;
4937 case 3:
4938 /* Here we make use of the fact that there are no
4939 reverse match 3 operand instructions, and all 3
4940 operand instructions only need to be checked for
4941 register consistency between operands 2 and 3. */
4942 if (!operand_type_match (overlap2, i.types[2])
4943 || (check_register
4944 && !operand_type_register_match (overlap1,
4945 i.types[1],
4946 operand_types[1],
4947 overlap2,
4948 i.types[2],
4949 operand_types[2])))
4950 continue;
4951 break;
4952 }
4953 }
4954 /* Found either forward/reverse 2, 3 or 4 operand match here:
4955 slip through to break. */
4956 }
4957 if (!found_cpu_match)
4958 {
4959 found_reverse_match = 0;
4960 continue;
4961 }
4962
4963 /* Check if vector and VEX operands are valid. */
4964 if (check_VecOperands (t) || VEX_check_operands (t))
4965 {
4966 specific_error = i.error;
4967 continue;
4968 }
4969
4970 /* We've found a match; break out of loop. */
4971 break;
4972 }
4973
4974 if (t == current_templates->end)
4975 {
4976 /* We found no match. */
4977 const char *err_msg;
4978 switch (specific_error ? specific_error : i.error)
4979 {
4980 default:
4981 abort ();
4982 case operand_size_mismatch:
4983 err_msg = _("operand size mismatch");
4984 break;
4985 case operand_type_mismatch:
4986 err_msg = _("operand type mismatch");
4987 break;
4988 case register_type_mismatch:
4989 err_msg = _("register type mismatch");
4990 break;
4991 case number_of_operands_mismatch:
4992 err_msg = _("number of operands mismatch");
4993 break;
4994 case invalid_instruction_suffix:
4995 err_msg = _("invalid instruction suffix");
4996 break;
4997 case bad_imm4:
4998 err_msg = _("constant doesn't fit in 4 bits");
4999 break;
5000 case old_gcc_only:
5001 err_msg = _("only supported with old gcc");
5002 break;
5003 case unsupported_with_intel_mnemonic:
5004 err_msg = _("unsupported with Intel mnemonic");
5005 break;
5006 case unsupported_syntax:
5007 err_msg = _("unsupported syntax");
5008 break;
5009 case unsupported:
5010 as_bad (_("unsupported instruction `%s'"),
5011 current_templates->start->name);
5012 return NULL;
5013 case invalid_vsib_address:
5014 err_msg = _("invalid VSIB address");
5015 break;
5016 case invalid_vector_register_set:
5017 err_msg = _("mask, index, and destination registers must be distinct");
5018 break;
5019 case unsupported_vector_index_register:
5020 err_msg = _("unsupported vector index register");
5021 break;
5022 case unsupported_broadcast:
5023 err_msg = _("unsupported broadcast");
5024 break;
5025 case broadcast_not_on_src_operand:
5026 err_msg = _("broadcast not on source memory operand");
5027 break;
5028 case broadcast_needed:
5029 err_msg = _("broadcast is needed for operand of such type");
5030 break;
5031 case unsupported_masking:
5032 err_msg = _("unsupported masking");
5033 break;
5034 case mask_not_on_destination:
5035 err_msg = _("mask not on destination operand");
5036 break;
5037 case no_default_mask:
5038 err_msg = _("default mask isn't allowed");
5039 break;
5040 case unsupported_rc_sae:
5041 err_msg = _("unsupported static rounding/sae");
5042 break;
5043 case rc_sae_operand_not_last_imm:
5044 if (intel_syntax)
5045 err_msg = _("RC/SAE operand must precede immediate operands");
5046 else
5047 err_msg = _("RC/SAE operand must follow immediate operands");
5048 break;
5049 case invalid_register_operand:
5050 err_msg = _("invalid register operand");
5051 break;
5052 }
5053 as_bad (_("%s for `%s'"), err_msg,
5054 current_templates->start->name);
5055 return NULL;
5056 }
5057
5058 if (!quiet_warnings)
5059 {
5060 if (!intel_syntax
5061 && (i.types[0].bitfield.jumpabsolute
5062 != operand_types[0].bitfield.jumpabsolute))
5063 {
5064 as_warn (_("indirect %s without `*'"), t->name);
5065 }
5066
5067 if (t->opcode_modifier.isprefix
5068 && t->opcode_modifier.ignoresize)
5069 {
5070 /* Warn them that a data or address size prefix doesn't
5071 affect assembly of the next line of code. */
5072 as_warn (_("stand-alone `%s' prefix"), t->name);
5073 }
5074 }
5075
5076 /* Copy the template we found. */
5077 i.tm = *t;
5078
5079 if (addr_prefix_disp != -1)
5080 i.tm.operand_types[addr_prefix_disp]
5081 = operand_types[addr_prefix_disp];
5082
5083 if (found_reverse_match)
5084 {
5085 /* If we found a reverse match we must alter the opcode
5086 direction bit. found_reverse_match holds bits to change
5087 (different for int & float insns). */
5088
5089 i.tm.base_opcode ^= found_reverse_match;
5090
5091 i.tm.operand_types[0] = operand_types[1];
5092 i.tm.operand_types[1] = operand_types[0];
5093 }
5094
5095 return t;
5096 }
5097
5098 static int
5099 check_string (void)
5100 {
5101 int mem_op = operand_type_check (i.types[0], anymem) ? 0 : 1;
5102 if (i.tm.operand_types[mem_op].bitfield.esseg)
5103 {
5104 if (i.seg[0] != NULL && i.seg[0] != &es)
5105 {
5106 as_bad (_("`%s' operand %d must use `%ses' segment"),
5107 i.tm.name,
5108 mem_op + 1,
5109 register_prefix);
5110 return 0;
5111 }
5112 /* There's only ever one segment override allowed per instruction.
5113 This instruction possibly has a legal segment override on the
5114 second operand, so copy the segment to where non-string
5115 instructions store it, allowing common code. */
5116 i.seg[0] = i.seg[1];
5117 }
5118 else if (i.tm.operand_types[mem_op + 1].bitfield.esseg)
5119 {
5120 if (i.seg[1] != NULL && i.seg[1] != &es)
5121 {
5122 as_bad (_("`%s' operand %d must use `%ses' segment"),
5123 i.tm.name,
5124 mem_op + 2,
5125 register_prefix);
5126 return 0;
5127 }
5128 }
5129 return 1;
5130 }
5131
5132 static int
5133 process_suffix (void)
5134 {
5135 /* If matched instruction specifies an explicit instruction mnemonic
5136 suffix, use it. */
5137 if (i.tm.opcode_modifier.size16)
5138 i.suffix = WORD_MNEM_SUFFIX;
5139 else if (i.tm.opcode_modifier.size32)
5140 i.suffix = LONG_MNEM_SUFFIX;
5141 else if (i.tm.opcode_modifier.size64)
5142 i.suffix = QWORD_MNEM_SUFFIX;
5143 else if (i.reg_operands)
5144 {
5145 /* If there's no instruction mnemonic suffix we try to invent one
5146 based on register operands. */
5147 if (!i.suffix)
5148 {
5149 /* We take i.suffix from the last register operand specified,
5150 Destination register type is more significant than source
5151 register type. crc32 in SSE4.2 prefers source register
5152 type. */
5153 if (i.tm.base_opcode == 0xf20f38f1)
5154 {
5155 if (i.types[0].bitfield.reg16)
5156 i.suffix = WORD_MNEM_SUFFIX;
5157 else if (i.types[0].bitfield.reg32)
5158 i.suffix = LONG_MNEM_SUFFIX;
5159 else if (i.types[0].bitfield.reg64)
5160 i.suffix = QWORD_MNEM_SUFFIX;
5161 }
5162 else if (i.tm.base_opcode == 0xf20f38f0)
5163 {
5164 if (i.types[0].bitfield.reg8)
5165 i.suffix = BYTE_MNEM_SUFFIX;
5166 }
5167
5168 if (!i.suffix)
5169 {
5170 int op;
5171
5172 if (i.tm.base_opcode == 0xf20f38f1
5173 || i.tm.base_opcode == 0xf20f38f0)
5174 {
5175 /* We have to know the operand size for crc32. */
5176 as_bad (_("ambiguous memory operand size for `%s`"),
5177 i.tm.name);
5178 return 0;
5179 }
5180
5181 for (op = i.operands; --op >= 0;)
5182 if (!i.tm.operand_types[op].bitfield.inoutportreg)
5183 {
5184 if (i.types[op].bitfield.reg8)
5185 {
5186 i.suffix = BYTE_MNEM_SUFFIX;
5187 break;
5188 }
5189 else if (i.types[op].bitfield.reg16)
5190 {
5191 i.suffix = WORD_MNEM_SUFFIX;
5192 break;
5193 }
5194 else if (i.types[op].bitfield.reg32)
5195 {
5196 i.suffix = LONG_MNEM_SUFFIX;
5197 break;
5198 }
5199 else if (i.types[op].bitfield.reg64)
5200 {
5201 i.suffix = QWORD_MNEM_SUFFIX;
5202 break;
5203 }
5204 }
5205 }
5206 }
5207 else if (i.suffix == BYTE_MNEM_SUFFIX)
5208 {
5209 if (intel_syntax
5210 && i.tm.opcode_modifier.ignoresize
5211 && i.tm.opcode_modifier.no_bsuf)
5212 i.suffix = 0;
5213 else if (!check_byte_reg ())
5214 return 0;
5215 }
5216 else if (i.suffix == LONG_MNEM_SUFFIX)
5217 {
5218 if (intel_syntax
5219 && i.tm.opcode_modifier.ignoresize
5220 && i.tm.opcode_modifier.no_lsuf)
5221 i.suffix = 0;
5222 else if (!check_long_reg ())
5223 return 0;
5224 }
5225 else if (i.suffix == QWORD_MNEM_SUFFIX)
5226 {
5227 if (intel_syntax
5228 && i.tm.opcode_modifier.ignoresize
5229 && i.tm.opcode_modifier.no_qsuf)
5230 i.suffix = 0;
5231 else if (!check_qword_reg ())
5232 return 0;
5233 }
5234 else if (i.suffix == WORD_MNEM_SUFFIX)
5235 {
5236 if (intel_syntax
5237 && i.tm.opcode_modifier.ignoresize
5238 && i.tm.opcode_modifier.no_wsuf)
5239 i.suffix = 0;
5240 else if (!check_word_reg ())
5241 return 0;
5242 }
5243 else if (i.suffix == XMMWORD_MNEM_SUFFIX
5244 || i.suffix == YMMWORD_MNEM_SUFFIX
5245 || i.suffix == ZMMWORD_MNEM_SUFFIX)
5246 {
5247 /* Skip if the instruction has x/y/z suffix. match_template
5248 should check if it is a valid suffix. */
5249 }
5250 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
5251 /* Do nothing if the instruction is going to ignore the prefix. */
5252 ;
5253 else
5254 abort ();
5255 }
5256 else if (i.tm.opcode_modifier.defaultsize
5257 && !i.suffix
5258 /* exclude fldenv/frstor/fsave/fstenv */
5259 && i.tm.opcode_modifier.no_ssuf)
5260 {
5261 i.suffix = stackop_size;
5262 }
5263 else if (intel_syntax
5264 && !i.suffix
5265 && (i.tm.operand_types[0].bitfield.jumpabsolute
5266 || i.tm.opcode_modifier.jumpbyte
5267 || i.tm.opcode_modifier.jumpintersegment
5268 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
5269 && i.tm.extension_opcode <= 3)))
5270 {
5271 switch (flag_code)
5272 {
5273 case CODE_64BIT:
5274 if (!i.tm.opcode_modifier.no_qsuf)
5275 {
5276 i.suffix = QWORD_MNEM_SUFFIX;
5277 break;
5278 }
5279 case CODE_32BIT:
5280 if (!i.tm.opcode_modifier.no_lsuf)
5281 i.suffix = LONG_MNEM_SUFFIX;
5282 break;
5283 case CODE_16BIT:
5284 if (!i.tm.opcode_modifier.no_wsuf)
5285 i.suffix = WORD_MNEM_SUFFIX;
5286 break;
5287 }
5288 }
5289
5290 if (!i.suffix)
5291 {
5292 if (!intel_syntax)
5293 {
5294 if (i.tm.opcode_modifier.w)
5295 {
5296 as_bad (_("no instruction mnemonic suffix given and "
5297 "no register operands; can't size instruction"));
5298 return 0;
5299 }
5300 }
5301 else
5302 {
5303 unsigned int suffixes;
5304
5305 suffixes = !i.tm.opcode_modifier.no_bsuf;
5306 if (!i.tm.opcode_modifier.no_wsuf)
5307 suffixes |= 1 << 1;
5308 if (!i.tm.opcode_modifier.no_lsuf)
5309 suffixes |= 1 << 2;
5310 if (!i.tm.opcode_modifier.no_ldsuf)
5311 suffixes |= 1 << 3;
5312 if (!i.tm.opcode_modifier.no_ssuf)
5313 suffixes |= 1 << 4;
5314 if (!i.tm.opcode_modifier.no_qsuf)
5315 suffixes |= 1 << 5;
5316
5317 /* There are more than suffix matches. */
5318 if (i.tm.opcode_modifier.w
5319 || ((suffixes & (suffixes - 1))
5320 && !i.tm.opcode_modifier.defaultsize
5321 && !i.tm.opcode_modifier.ignoresize))
5322 {
5323 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
5324 return 0;
5325 }
5326 }
5327 }
5328
5329 /* Change the opcode based on the operand size given by i.suffix;
5330 We don't need to change things for byte insns. */
5331
5332 if (i.suffix
5333 && i.suffix != BYTE_MNEM_SUFFIX
5334 && i.suffix != XMMWORD_MNEM_SUFFIX
5335 && i.suffix != YMMWORD_MNEM_SUFFIX
5336 && i.suffix != ZMMWORD_MNEM_SUFFIX)
5337 {
5338 /* It's not a byte, select word/dword operation. */
5339 if (i.tm.opcode_modifier.w)
5340 {
5341 if (i.tm.opcode_modifier.shortform)
5342 i.tm.base_opcode |= 8;
5343 else
5344 i.tm.base_opcode |= 1;
5345 }
5346
5347 /* Now select between word & dword operations via the operand
5348 size prefix, except for instructions that will ignore this
5349 prefix anyway. */
5350 if (i.tm.opcode_modifier.addrprefixop0)
5351 {
5352 /* The address size override prefix changes the size of the
5353 first operand. */
5354 if ((flag_code == CODE_32BIT
5355 && i.op->regs[0].reg_type.bitfield.reg16)
5356 || (flag_code != CODE_32BIT
5357 && i.op->regs[0].reg_type.bitfield.reg32))
5358 if (!add_prefix (ADDR_PREFIX_OPCODE))
5359 return 0;
5360 }
5361 else if (i.suffix != QWORD_MNEM_SUFFIX
5362 && i.suffix != LONG_DOUBLE_MNEM_SUFFIX
5363 && !i.tm.opcode_modifier.ignoresize
5364 && !i.tm.opcode_modifier.floatmf
5365 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
5366 || (flag_code == CODE_64BIT
5367 && i.tm.opcode_modifier.jumpbyte)))
5368 {
5369 unsigned int prefix = DATA_PREFIX_OPCODE;
5370
5371 if (i.tm.opcode_modifier.jumpbyte) /* jcxz, loop */
5372 prefix = ADDR_PREFIX_OPCODE;
5373
5374 if (!add_prefix (prefix))
5375 return 0;
5376 }
5377
5378 /* Set mode64 for an operand. */
5379 if (i.suffix == QWORD_MNEM_SUFFIX
5380 && flag_code == CODE_64BIT
5381 && !i.tm.opcode_modifier.norex64)
5382 {
5383 /* Special case for xchg %rax,%rax. It is NOP and doesn't
5384 need rex64. cmpxchg8b is also a special case. */
5385 if (! (i.operands == 2
5386 && i.tm.base_opcode == 0x90
5387 && i.tm.extension_opcode == None
5388 && operand_type_equal (&i.types [0], &acc64)
5389 && operand_type_equal (&i.types [1], &acc64))
5390 && ! (i.operands == 1
5391 && i.tm.base_opcode == 0xfc7
5392 && i.tm.extension_opcode == 1
5393 && !operand_type_check (i.types [0], reg)
5394 && operand_type_check (i.types [0], anymem)))
5395 i.rex |= REX_W;
5396 }
5397
5398 /* Size floating point instruction. */
5399 if (i.suffix == LONG_MNEM_SUFFIX)
5400 if (i.tm.opcode_modifier.floatmf)
5401 i.tm.base_opcode ^= 4;
5402 }
5403
5404 return 1;
5405 }
5406
5407 static int
5408 check_byte_reg (void)
5409 {
5410 int op;
5411
5412 for (op = i.operands; --op >= 0;)
5413 {
5414 /* If this is an eight bit register, it's OK. If it's the 16 or
5415 32 bit version of an eight bit register, we will just use the
5416 low portion, and that's OK too. */
5417 if (i.types[op].bitfield.reg8)
5418 continue;
5419
5420 /* I/O port address operands are OK too. */
5421 if (i.tm.operand_types[op].bitfield.inoutportreg)
5422 continue;
5423
5424 /* crc32 doesn't generate this warning. */
5425 if (i.tm.base_opcode == 0xf20f38f0)
5426 continue;
5427
5428 if ((i.types[op].bitfield.reg16
5429 || i.types[op].bitfield.reg32
5430 || i.types[op].bitfield.reg64)
5431 && i.op[op].regs->reg_num < 4
5432 /* Prohibit these changes in 64bit mode, since the lowering
5433 would be more complicated. */
5434 && flag_code != CODE_64BIT)
5435 {
5436 #if REGISTER_WARNINGS
5437 if (!quiet_warnings)
5438 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5439 register_prefix,
5440 (i.op[op].regs + (i.types[op].bitfield.reg16
5441 ? REGNAM_AL - REGNAM_AX
5442 : REGNAM_AL - REGNAM_EAX))->reg_name,
5443 register_prefix,
5444 i.op[op].regs->reg_name,
5445 i.suffix);
5446 #endif
5447 continue;
5448 }
5449 /* Any other register is bad. */
5450 if (i.types[op].bitfield.reg16
5451 || i.types[op].bitfield.reg32
5452 || i.types[op].bitfield.reg64
5453 || i.types[op].bitfield.regmmx
5454 || i.types[op].bitfield.regxmm
5455 || i.types[op].bitfield.regymm
5456 || i.types[op].bitfield.regzmm
5457 || i.types[op].bitfield.sreg2
5458 || i.types[op].bitfield.sreg3
5459 || i.types[op].bitfield.control
5460 || i.types[op].bitfield.debug
5461 || i.types[op].bitfield.test
5462 || i.types[op].bitfield.floatreg
5463 || i.types[op].bitfield.floatacc)
5464 {
5465 as_bad (_("`%s%s' not allowed with `%s%c'"),
5466 register_prefix,
5467 i.op[op].regs->reg_name,
5468 i.tm.name,
5469 i.suffix);
5470 return 0;
5471 }
5472 }
5473 return 1;
5474 }
5475
5476 static int
5477 check_long_reg (void)
5478 {
5479 int op;
5480
5481 for (op = i.operands; --op >= 0;)
5482 /* Reject eight bit registers, except where the template requires
5483 them. (eg. movzb) */
5484 if (i.types[op].bitfield.reg8
5485 && (i.tm.operand_types[op].bitfield.reg16
5486 || i.tm.operand_types[op].bitfield.reg32
5487 || i.tm.operand_types[op].bitfield.acc))
5488 {
5489 as_bad (_("`%s%s' not allowed with `%s%c'"),
5490 register_prefix,
5491 i.op[op].regs->reg_name,
5492 i.tm.name,
5493 i.suffix);
5494 return 0;
5495 }
5496 /* Warn if the e prefix on a general reg is missing. */
5497 else if ((!quiet_warnings || flag_code == CODE_64BIT)
5498 && i.types[op].bitfield.reg16
5499 && (i.tm.operand_types[op].bitfield.reg32
5500 || i.tm.operand_types[op].bitfield.acc))
5501 {
5502 /* Prohibit these changes in the 64bit mode, since the
5503 lowering is more complicated. */
5504 if (flag_code == CODE_64BIT)
5505 {
5506 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5507 register_prefix, i.op[op].regs->reg_name,
5508 i.suffix);
5509 return 0;
5510 }
5511 #if REGISTER_WARNINGS
5512 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5513 register_prefix,
5514 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
5515 register_prefix, i.op[op].regs->reg_name, i.suffix);
5516 #endif
5517 }
5518 /* Warn if the r prefix on a general reg is present. */
5519 else if (i.types[op].bitfield.reg64
5520 && (i.tm.operand_types[op].bitfield.reg32
5521 || i.tm.operand_types[op].bitfield.acc))
5522 {
5523 if (intel_syntax
5524 && i.tm.opcode_modifier.toqword
5525 && !i.types[0].bitfield.regxmm)
5526 {
5527 /* Convert to QWORD. We want REX byte. */
5528 i.suffix = QWORD_MNEM_SUFFIX;
5529 }
5530 else
5531 {
5532 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5533 register_prefix, i.op[op].regs->reg_name,
5534 i.suffix);
5535 return 0;
5536 }
5537 }
5538 return 1;
5539 }
5540
5541 static int
5542 check_qword_reg (void)
5543 {
5544 int op;
5545
5546 for (op = i.operands; --op >= 0; )
5547 /* Reject eight bit registers, except where the template requires
5548 them. (eg. movzb) */
5549 if (i.types[op].bitfield.reg8
5550 && (i.tm.operand_types[op].bitfield.reg16
5551 || i.tm.operand_types[op].bitfield.reg32
5552 || i.tm.operand_types[op].bitfield.acc))
5553 {
5554 as_bad (_("`%s%s' not allowed with `%s%c'"),
5555 register_prefix,
5556 i.op[op].regs->reg_name,
5557 i.tm.name,
5558 i.suffix);
5559 return 0;
5560 }
5561 /* Warn if the r prefix on a general reg is missing. */
5562 else if ((i.types[op].bitfield.reg16
5563 || i.types[op].bitfield.reg32)
5564 && (i.tm.operand_types[op].bitfield.reg32
5565 || i.tm.operand_types[op].bitfield.acc))
5566 {
5567 /* Prohibit these changes in the 64bit mode, since the
5568 lowering is more complicated. */
5569 if (intel_syntax
5570 && i.tm.opcode_modifier.todword
5571 && !i.types[0].bitfield.regxmm)
5572 {
5573 /* Convert to DWORD. We don't want REX byte. */
5574 i.suffix = LONG_MNEM_SUFFIX;
5575 }
5576 else
5577 {
5578 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5579 register_prefix, i.op[op].regs->reg_name,
5580 i.suffix);
5581 return 0;
5582 }
5583 }
5584 return 1;
5585 }
5586
5587 static int
5588 check_word_reg (void)
5589 {
5590 int op;
5591 for (op = i.operands; --op >= 0;)
5592 /* Reject eight bit registers, except where the template requires
5593 them. (eg. movzb) */
5594 if (i.types[op].bitfield.reg8
5595 && (i.tm.operand_types[op].bitfield.reg16
5596 || i.tm.operand_types[op].bitfield.reg32
5597 || i.tm.operand_types[op].bitfield.acc))
5598 {
5599 as_bad (_("`%s%s' not allowed with `%s%c'"),
5600 register_prefix,
5601 i.op[op].regs->reg_name,
5602 i.tm.name,
5603 i.suffix);
5604 return 0;
5605 }
5606 /* Warn if the e or r prefix on a general reg is present. */
5607 else if ((!quiet_warnings || flag_code == CODE_64BIT)
5608 && (i.types[op].bitfield.reg32
5609 || i.types[op].bitfield.reg64)
5610 && (i.tm.operand_types[op].bitfield.reg16
5611 || i.tm.operand_types[op].bitfield.acc))
5612 {
5613 /* Prohibit these changes in the 64bit mode, since the
5614 lowering is more complicated. */
5615 if (flag_code == CODE_64BIT)
5616 {
5617 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5618 register_prefix, i.op[op].regs->reg_name,
5619 i.suffix);
5620 return 0;
5621 }
5622 #if REGISTER_WARNINGS
5623 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5624 register_prefix,
5625 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
5626 register_prefix, i.op[op].regs->reg_name, i.suffix);
5627 #endif
5628 }
5629 return 1;
5630 }
5631
5632 static int
5633 update_imm (unsigned int j)
5634 {
5635 i386_operand_type overlap = i.types[j];
5636 if ((overlap.bitfield.imm8
5637 || overlap.bitfield.imm8s
5638 || overlap.bitfield.imm16
5639 || overlap.bitfield.imm32
5640 || overlap.bitfield.imm32s
5641 || overlap.bitfield.imm64)
5642 && !operand_type_equal (&overlap, &imm8)
5643 && !operand_type_equal (&overlap, &imm8s)
5644 && !operand_type_equal (&overlap, &imm16)
5645 && !operand_type_equal (&overlap, &imm32)
5646 && !operand_type_equal (&overlap, &imm32s)
5647 && !operand_type_equal (&overlap, &imm64))
5648 {
5649 if (i.suffix)
5650 {
5651 i386_operand_type temp;
5652
5653 operand_type_set (&temp, 0);
5654 if (i.suffix == BYTE_MNEM_SUFFIX)
5655 {
5656 temp.bitfield.imm8 = overlap.bitfield.imm8;
5657 temp.bitfield.imm8s = overlap.bitfield.imm8s;
5658 }
5659 else if (i.suffix == WORD_MNEM_SUFFIX)
5660 temp.bitfield.imm16 = overlap.bitfield.imm16;
5661 else if (i.suffix == QWORD_MNEM_SUFFIX)
5662 {
5663 temp.bitfield.imm64 = overlap.bitfield.imm64;
5664 temp.bitfield.imm32s = overlap.bitfield.imm32s;
5665 }
5666 else
5667 temp.bitfield.imm32 = overlap.bitfield.imm32;
5668 overlap = temp;
5669 }
5670 else if (operand_type_equal (&overlap, &imm16_32_32s)
5671 || operand_type_equal (&overlap, &imm16_32)
5672 || operand_type_equal (&overlap, &imm16_32s))
5673 {
5674 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5675 overlap = imm16;
5676 else
5677 overlap = imm32s;
5678 }
5679 if (!operand_type_equal (&overlap, &imm8)
5680 && !operand_type_equal (&overlap, &imm8s)
5681 && !operand_type_equal (&overlap, &imm16)
5682 && !operand_type_equal (&overlap, &imm32)
5683 && !operand_type_equal (&overlap, &imm32s)
5684 && !operand_type_equal (&overlap, &imm64))
5685 {
5686 as_bad (_("no instruction mnemonic suffix given; "
5687 "can't determine immediate size"));
5688 return 0;
5689 }
5690 }
5691 i.types[j] = overlap;
5692
5693 return 1;
5694 }
5695
5696 static int
5697 finalize_imm (void)
5698 {
5699 unsigned int j, n;
5700
5701 /* Update the first 2 immediate operands. */
5702 n = i.operands > 2 ? 2 : i.operands;
5703 if (n)
5704 {
5705 for (j = 0; j < n; j++)
5706 if (update_imm (j) == 0)
5707 return 0;
5708
5709 /* The 3rd operand can't be immediate operand. */
5710 gas_assert (operand_type_check (i.types[2], imm) == 0);
5711 }
5712
5713 return 1;
5714 }
5715
5716 static int
5717 bad_implicit_operand (int xmm)
5718 {
5719 const char *ireg = xmm ? "xmm0" : "ymm0";
5720
5721 if (intel_syntax)
5722 as_bad (_("the last operand of `%s' must be `%s%s'"),
5723 i.tm.name, register_prefix, ireg);
5724 else
5725 as_bad (_("the first operand of `%s' must be `%s%s'"),
5726 i.tm.name, register_prefix, ireg);
5727 return 0;
5728 }
5729
5730 static int
5731 process_operands (void)
5732 {
5733 /* Default segment register this instruction will use for memory
5734 accesses. 0 means unknown. This is only for optimizing out
5735 unnecessary segment overrides. */
5736 const seg_entry *default_seg = 0;
5737
5738 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
5739 {
5740 unsigned int dupl = i.operands;
5741 unsigned int dest = dupl - 1;
5742 unsigned int j;
5743
5744 /* The destination must be an xmm register. */
5745 gas_assert (i.reg_operands
5746 && MAX_OPERANDS > dupl
5747 && operand_type_equal (&i.types[dest], &regxmm));
5748
5749 if (i.tm.opcode_modifier.firstxmm0)
5750 {
5751 /* The first operand is implicit and must be xmm0. */
5752 gas_assert (operand_type_equal (&i.types[0], &regxmm));
5753 if (register_number (i.op[0].regs) != 0)
5754 return bad_implicit_operand (1);
5755
5756 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
5757 {
5758 /* Keep xmm0 for instructions with VEX prefix and 3
5759 sources. */
5760 goto duplicate;
5761 }
5762 else
5763 {
5764 /* We remove the first xmm0 and keep the number of
5765 operands unchanged, which in fact duplicates the
5766 destination. */
5767 for (j = 1; j < i.operands; j++)
5768 {
5769 i.op[j - 1] = i.op[j];
5770 i.types[j - 1] = i.types[j];
5771 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
5772 }
5773 }
5774 }
5775 else if (i.tm.opcode_modifier.implicit1stxmm0)
5776 {
5777 gas_assert ((MAX_OPERANDS - 1) > dupl
5778 && (i.tm.opcode_modifier.vexsources
5779 == VEX3SOURCES));
5780
5781 /* Add the implicit xmm0 for instructions with VEX prefix
5782 and 3 sources. */
5783 for (j = i.operands; j > 0; j--)
5784 {
5785 i.op[j] = i.op[j - 1];
5786 i.types[j] = i.types[j - 1];
5787 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
5788 }
5789 i.op[0].regs
5790 = (const reg_entry *) hash_find (reg_hash, "xmm0");
5791 i.types[0] = regxmm;
5792 i.tm.operand_types[0] = regxmm;
5793
5794 i.operands += 2;
5795 i.reg_operands += 2;
5796 i.tm.operands += 2;
5797
5798 dupl++;
5799 dest++;
5800 i.op[dupl] = i.op[dest];
5801 i.types[dupl] = i.types[dest];
5802 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
5803 }
5804 else
5805 {
5806 duplicate:
5807 i.operands++;
5808 i.reg_operands++;
5809 i.tm.operands++;
5810
5811 i.op[dupl] = i.op[dest];
5812 i.types[dupl] = i.types[dest];
5813 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
5814 }
5815
5816 if (i.tm.opcode_modifier.immext)
5817 process_immext ();
5818 }
5819 else if (i.tm.opcode_modifier.firstxmm0)
5820 {
5821 unsigned int j;
5822
5823 /* The first operand is implicit and must be xmm0/ymm0/zmm0. */
5824 gas_assert (i.reg_operands
5825 && (operand_type_equal (&i.types[0], &regxmm)
5826 || operand_type_equal (&i.types[0], &regymm)
5827 || operand_type_equal (&i.types[0], &regzmm)));
5828 if (register_number (i.op[0].regs) != 0)
5829 return bad_implicit_operand (i.types[0].bitfield.regxmm);
5830
5831 for (j = 1; j < i.operands; j++)
5832 {
5833 i.op[j - 1] = i.op[j];
5834 i.types[j - 1] = i.types[j];
5835
5836 /* We need to adjust fields in i.tm since they are used by
5837 build_modrm_byte. */
5838 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
5839 }
5840
5841 i.operands--;
5842 i.reg_operands--;
5843 i.tm.operands--;
5844 }
5845 else if (i.tm.opcode_modifier.regkludge)
5846 {
5847 /* The imul $imm, %reg instruction is converted into
5848 imul $imm, %reg, %reg, and the clr %reg instruction
5849 is converted into xor %reg, %reg. */
5850
5851 unsigned int first_reg_op;
5852
5853 if (operand_type_check (i.types[0], reg))
5854 first_reg_op = 0;
5855 else
5856 first_reg_op = 1;
5857 /* Pretend we saw the extra register operand. */
5858 gas_assert (i.reg_operands == 1
5859 && i.op[first_reg_op + 1].regs == 0);
5860 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
5861 i.types[first_reg_op + 1] = i.types[first_reg_op];
5862 i.operands++;
5863 i.reg_operands++;
5864 }
5865
5866 if (i.tm.opcode_modifier.shortform)
5867 {
5868 if (i.types[0].bitfield.sreg2
5869 || i.types[0].bitfield.sreg3)
5870 {
5871 if (i.tm.base_opcode == POP_SEG_SHORT
5872 && i.op[0].regs->reg_num == 1)
5873 {
5874 as_bad (_("you can't `pop %scs'"), register_prefix);
5875 return 0;
5876 }
5877 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
5878 if ((i.op[0].regs->reg_flags & RegRex) != 0)
5879 i.rex |= REX_B;
5880 }
5881 else
5882 {
5883 /* The register or float register operand is in operand
5884 0 or 1. */
5885 unsigned int op;
5886
5887 if (i.types[0].bitfield.floatreg
5888 || operand_type_check (i.types[0], reg))
5889 op = 0;
5890 else
5891 op = 1;
5892 /* Register goes in low 3 bits of opcode. */
5893 i.tm.base_opcode |= i.op[op].regs->reg_num;
5894 if ((i.op[op].regs->reg_flags & RegRex) != 0)
5895 i.rex |= REX_B;
5896 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
5897 {
5898 /* Warn about some common errors, but press on regardless.
5899 The first case can be generated by gcc (<= 2.8.1). */
5900 if (i.operands == 2)
5901 {
5902 /* Reversed arguments on faddp, fsubp, etc. */
5903 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
5904 register_prefix, i.op[!intel_syntax].regs->reg_name,
5905 register_prefix, i.op[intel_syntax].regs->reg_name);
5906 }
5907 else
5908 {
5909 /* Extraneous `l' suffix on fp insn. */
5910 as_warn (_("translating to `%s %s%s'"), i.tm.name,
5911 register_prefix, i.op[0].regs->reg_name);
5912 }
5913 }
5914 }
5915 }
5916 else if (i.tm.opcode_modifier.modrm)
5917 {
5918 /* The opcode is completed (modulo i.tm.extension_opcode which
5919 must be put into the modrm byte). Now, we make the modrm and
5920 index base bytes based on all the info we've collected. */
5921
5922 default_seg = build_modrm_byte ();
5923 }
5924 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
5925 {
5926 default_seg = &ds;
5927 }
5928 else if (i.tm.opcode_modifier.isstring)
5929 {
5930 /* For the string instructions that allow a segment override
5931 on one of their operands, the default segment is ds. */
5932 default_seg = &ds;
5933 }
5934
5935 if (i.tm.base_opcode == 0x8d /* lea */
5936 && i.seg[0]
5937 && !quiet_warnings)
5938 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
5939
5940 /* If a segment was explicitly specified, and the specified segment
5941 is not the default, use an opcode prefix to select it. If we
5942 never figured out what the default segment is, then default_seg
5943 will be zero at this point, and the specified segment prefix will
5944 always be used. */
5945 if ((i.seg[0]) && (i.seg[0] != default_seg))
5946 {
5947 if (!add_prefix (i.seg[0]->seg_prefix))
5948 return 0;
5949 }
5950 return 1;
5951 }
5952
5953 static const seg_entry *
5954 build_modrm_byte (void)
5955 {
5956 const seg_entry *default_seg = 0;
5957 unsigned int source, dest;
5958 int vex_3_sources;
5959
5960 /* The first operand of instructions with VEX prefix and 3 sources
5961 must be VEX_Imm4. */
5962 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
5963 if (vex_3_sources)
5964 {
5965 unsigned int nds, reg_slot;
5966 expressionS *exp;
5967
5968 if (i.tm.opcode_modifier.veximmext
5969 && i.tm.opcode_modifier.immext)
5970 {
5971 dest = i.operands - 2;
5972 gas_assert (dest == 3);
5973 }
5974 else
5975 dest = i.operands - 1;
5976 nds = dest - 1;
5977
5978 /* There are 2 kinds of instructions:
5979 1. 5 operands: 4 register operands or 3 register operands
5980 plus 1 memory operand plus one Vec_Imm4 operand, VexXDS, and
5981 VexW0 or VexW1. The destination must be either XMM, YMM or
5982 ZMM register.
5983 2. 4 operands: 4 register operands or 3 register operands
5984 plus 1 memory operand, VexXDS, and VexImmExt */
5985 gas_assert ((i.reg_operands == 4
5986 || (i.reg_operands == 3 && i.mem_operands == 1))
5987 && i.tm.opcode_modifier.vexvvvv == VEXXDS
5988 && (i.tm.opcode_modifier.veximmext
5989 || (i.imm_operands == 1
5990 && i.types[0].bitfield.vec_imm4
5991 && (i.tm.opcode_modifier.vexw == VEXW0
5992 || i.tm.opcode_modifier.vexw == VEXW1)
5993 && (operand_type_equal (&i.tm.operand_types[dest], &regxmm)
5994 || operand_type_equal (&i.tm.operand_types[dest], &regymm)
5995 || operand_type_equal (&i.tm.operand_types[dest], &regzmm)))));
5996
5997 if (i.imm_operands == 0)
5998 {
5999 /* When there is no immediate operand, generate an 8bit
6000 immediate operand to encode the first operand. */
6001 exp = &im_expressions[i.imm_operands++];
6002 i.op[i.operands].imms = exp;
6003 i.types[i.operands] = imm8;
6004 i.operands++;
6005 /* If VexW1 is set, the first operand is the source and
6006 the second operand is encoded in the immediate operand. */
6007 if (i.tm.opcode_modifier.vexw == VEXW1)
6008 {
6009 source = 0;
6010 reg_slot = 1;
6011 }
6012 else
6013 {
6014 source = 1;
6015 reg_slot = 0;
6016 }
6017
6018 /* FMA swaps REG and NDS. */
6019 if (i.tm.cpu_flags.bitfield.cpufma)
6020 {
6021 unsigned int tmp;
6022 tmp = reg_slot;
6023 reg_slot = nds;
6024 nds = tmp;
6025 }
6026
6027 gas_assert (operand_type_equal (&i.tm.operand_types[reg_slot],
6028 &regxmm)
6029 || operand_type_equal (&i.tm.operand_types[reg_slot],
6030 &regymm)
6031 || operand_type_equal (&i.tm.operand_types[reg_slot],
6032 &regzmm));
6033 exp->X_op = O_constant;
6034 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
6035 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
6036 }
6037 else
6038 {
6039 unsigned int imm_slot;
6040
6041 if (i.tm.opcode_modifier.vexw == VEXW0)
6042 {
6043 /* If VexW0 is set, the third operand is the source and
6044 the second operand is encoded in the immediate
6045 operand. */
6046 source = 2;
6047 reg_slot = 1;
6048 }
6049 else
6050 {
6051 /* VexW1 is set, the second operand is the source and
6052 the third operand is encoded in the immediate
6053 operand. */
6054 source = 1;
6055 reg_slot = 2;
6056 }
6057
6058 if (i.tm.opcode_modifier.immext)
6059 {
6060 /* When ImmExt is set, the immdiate byte is the last
6061 operand. */
6062 imm_slot = i.operands - 1;
6063 source--;
6064 reg_slot--;
6065 }
6066 else
6067 {
6068 imm_slot = 0;
6069
6070 /* Turn on Imm8 so that output_imm will generate it. */
6071 i.types[imm_slot].bitfield.imm8 = 1;
6072 }
6073
6074 gas_assert (operand_type_equal (&i.tm.operand_types[reg_slot],
6075 &regxmm)
6076 || operand_type_equal (&i.tm.operand_types[reg_slot],
6077 &regymm)
6078 || operand_type_equal (&i.tm.operand_types[reg_slot],
6079 &regzmm));
6080 i.op[imm_slot].imms->X_add_number
6081 |= register_number (i.op[reg_slot].regs) << 4;
6082 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
6083 }
6084
6085 gas_assert (operand_type_equal (&i.tm.operand_types[nds], &regxmm)
6086 || operand_type_equal (&i.tm.operand_types[nds],
6087 &regymm)
6088 || operand_type_equal (&i.tm.operand_types[nds],
6089 &regzmm));
6090 i.vex.register_specifier = i.op[nds].regs;
6091 }
6092 else
6093 source = dest = 0;
6094
6095 /* i.reg_operands MUST be the number of real register operands;
6096 implicit registers do not count. If there are 3 register
6097 operands, it must be a instruction with VexNDS. For a
6098 instruction with VexNDD, the destination register is encoded
6099 in VEX prefix. If there are 4 register operands, it must be
6100 a instruction with VEX prefix and 3 sources. */
6101 if (i.mem_operands == 0
6102 && ((i.reg_operands == 2
6103 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
6104 || (i.reg_operands == 3
6105 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
6106 || (i.reg_operands == 4 && vex_3_sources)))
6107 {
6108 switch (i.operands)
6109 {
6110 case 2:
6111 source = 0;
6112 break;
6113 case 3:
6114 /* When there are 3 operands, one of them may be immediate,
6115 which may be the first or the last operand. Otherwise,
6116 the first operand must be shift count register (cl) or it
6117 is an instruction with VexNDS. */
6118 gas_assert (i.imm_operands == 1
6119 || (i.imm_operands == 0
6120 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
6121 || i.types[0].bitfield.shiftcount)));
6122 if (operand_type_check (i.types[0], imm)
6123 || i.types[0].bitfield.shiftcount)
6124 source = 1;
6125 else
6126 source = 0;
6127 break;
6128 case 4:
6129 /* When there are 4 operands, the first two must be 8bit
6130 immediate operands. The source operand will be the 3rd
6131 one.
6132
6133 For instructions with VexNDS, if the first operand
6134 an imm8, the source operand is the 2nd one. If the last
6135 operand is imm8, the source operand is the first one. */
6136 gas_assert ((i.imm_operands == 2
6137 && i.types[0].bitfield.imm8
6138 && i.types[1].bitfield.imm8)
6139 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
6140 && i.imm_operands == 1
6141 && (i.types[0].bitfield.imm8
6142 || i.types[i.operands - 1].bitfield.imm8
6143 || i.rounding)));
6144 if (i.imm_operands == 2)
6145 source = 2;
6146 else
6147 {
6148 if (i.types[0].bitfield.imm8)
6149 source = 1;
6150 else
6151 source = 0;
6152 }
6153 break;
6154 case 5:
6155 if (i.tm.opcode_modifier.evex)
6156 {
6157 /* For EVEX instructions, when there are 5 operands, the
6158 first one must be immediate operand. If the second one
6159 is immediate operand, the source operand is the 3th
6160 one. If the last one is immediate operand, the source
6161 operand is the 2nd one. */
6162 gas_assert (i.imm_operands == 2
6163 && i.tm.opcode_modifier.sae
6164 && operand_type_check (i.types[0], imm));
6165 if (operand_type_check (i.types[1], imm))
6166 source = 2;
6167 else if (operand_type_check (i.types[4], imm))
6168 source = 1;
6169 else
6170 abort ();
6171 }
6172 break;
6173 default:
6174 abort ();
6175 }
6176
6177 if (!vex_3_sources)
6178 {
6179 dest = source + 1;
6180
6181 /* RC/SAE operand could be between DEST and SRC. That happens
6182 when one operand is GPR and the other one is XMM/YMM/ZMM
6183 register. */
6184 if (i.rounding && i.rounding->operand == (int) dest)
6185 dest++;
6186
6187 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
6188 {
6189 /* For instructions with VexNDS, the register-only source
6190 operand must be 32/64bit integer, XMM, YMM or ZMM
6191 register. It is encoded in VEX prefix. We need to
6192 clear RegMem bit before calling operand_type_equal. */
6193
6194 i386_operand_type op;
6195 unsigned int vvvv;
6196
6197 /* Check register-only source operand when two source
6198 operands are swapped. */
6199 if (!i.tm.operand_types[source].bitfield.baseindex
6200 && i.tm.operand_types[dest].bitfield.baseindex)
6201 {
6202 vvvv = source;
6203 source = dest;
6204 }
6205 else
6206 vvvv = dest;
6207
6208 op = i.tm.operand_types[vvvv];
6209 op.bitfield.regmem = 0;
6210 if ((dest + 1) >= i.operands
6211 || (!op.bitfield.reg32
6212 && op.bitfield.reg64
6213 && !operand_type_equal (&op, &regxmm)
6214 && !operand_type_equal (&op, &regymm)
6215 && !operand_type_equal (&op, &regzmm)
6216 && !operand_type_equal (&op, &regmask)))
6217 abort ();
6218 i.vex.register_specifier = i.op[vvvv].regs;
6219 dest++;
6220 }
6221 }
6222
6223 i.rm.mode = 3;
6224 /* One of the register operands will be encoded in the i.tm.reg
6225 field, the other in the combined i.tm.mode and i.tm.regmem
6226 fields. If no form of this instruction supports a memory
6227 destination operand, then we assume the source operand may
6228 sometimes be a memory operand and so we need to store the
6229 destination in the i.rm.reg field. */
6230 if (!i.tm.operand_types[dest].bitfield.regmem
6231 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
6232 {
6233 i.rm.reg = i.op[dest].regs->reg_num;
6234 i.rm.regmem = i.op[source].regs->reg_num;
6235 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
6236 i.rex |= REX_R;
6237 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
6238 i.vrex |= REX_R;
6239 if ((i.op[source].regs->reg_flags & RegRex) != 0)
6240 i.rex |= REX_B;
6241 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
6242 i.vrex |= REX_B;
6243 }
6244 else
6245 {
6246 i.rm.reg = i.op[source].regs->reg_num;
6247 i.rm.regmem = i.op[dest].regs->reg_num;
6248 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
6249 i.rex |= REX_B;
6250 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
6251 i.vrex |= REX_B;
6252 if ((i.op[source].regs->reg_flags & RegRex) != 0)
6253 i.rex |= REX_R;
6254 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
6255 i.vrex |= REX_R;
6256 }
6257 if (flag_code != CODE_64BIT && (i.rex & (REX_R | REX_B)))
6258 {
6259 if (!i.types[0].bitfield.control
6260 && !i.types[1].bitfield.control)
6261 abort ();
6262 i.rex &= ~(REX_R | REX_B);
6263 add_prefix (LOCK_PREFIX_OPCODE);
6264 }
6265 }
6266 else
6267 { /* If it's not 2 reg operands... */
6268 unsigned int mem;
6269
6270 if (i.mem_operands)
6271 {
6272 unsigned int fake_zero_displacement = 0;
6273 unsigned int op;
6274
6275 for (op = 0; op < i.operands; op++)
6276 if (operand_type_check (i.types[op], anymem))
6277 break;
6278 gas_assert (op < i.operands);
6279
6280 if (i.tm.opcode_modifier.vecsib)
6281 {
6282 if (i.index_reg->reg_num == RegEiz
6283 || i.index_reg->reg_num == RegRiz)
6284 abort ();
6285
6286 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6287 if (!i.base_reg)
6288 {
6289 i.sib.base = NO_BASE_REGISTER;
6290 i.sib.scale = i.log2_scale_factor;
6291 /* No Vec_Disp8 if there is no base. */
6292 i.types[op].bitfield.vec_disp8 = 0;
6293 i.types[op].bitfield.disp8 = 0;
6294 i.types[op].bitfield.disp16 = 0;
6295 i.types[op].bitfield.disp64 = 0;
6296 if (flag_code != CODE_64BIT)
6297 {
6298 /* Must be 32 bit */
6299 i.types[op].bitfield.disp32 = 1;
6300 i.types[op].bitfield.disp32s = 0;
6301 }
6302 else
6303 {
6304 i.types[op].bitfield.disp32 = 0;
6305 i.types[op].bitfield.disp32s = 1;
6306 }
6307 }
6308 i.sib.index = i.index_reg->reg_num;
6309 if ((i.index_reg->reg_flags & RegRex) != 0)
6310 i.rex |= REX_X;
6311 if ((i.index_reg->reg_flags & RegVRex) != 0)
6312 i.vrex |= REX_X;
6313 }
6314
6315 default_seg = &ds;
6316
6317 if (i.base_reg == 0)
6318 {
6319 i.rm.mode = 0;
6320 if (!i.disp_operands)
6321 {
6322 fake_zero_displacement = 1;
6323 /* Instructions with VSIB byte need 32bit displacement
6324 if there is no base register. */
6325 if (i.tm.opcode_modifier.vecsib)
6326 i.types[op].bitfield.disp32 = 1;
6327 }
6328 if (i.index_reg == 0)
6329 {
6330 gas_assert (!i.tm.opcode_modifier.vecsib);
6331 /* Operand is just <disp> */
6332 if (flag_code == CODE_64BIT)
6333 {
6334 /* 64bit mode overwrites the 32bit absolute
6335 addressing by RIP relative addressing and
6336 absolute addressing is encoded by one of the
6337 redundant SIB forms. */
6338 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6339 i.sib.base = NO_BASE_REGISTER;
6340 i.sib.index = NO_INDEX_REGISTER;
6341 i.types[op] = ((i.prefix[ADDR_PREFIX] == 0)
6342 ? disp32s : disp32);
6343 }
6344 else if ((flag_code == CODE_16BIT)
6345 ^ (i.prefix[ADDR_PREFIX] != 0))
6346 {
6347 i.rm.regmem = NO_BASE_REGISTER_16;
6348 i.types[op] = disp16;
6349 }
6350 else
6351 {
6352 i.rm.regmem = NO_BASE_REGISTER;
6353 i.types[op] = disp32;
6354 }
6355 }
6356 else if (!i.tm.opcode_modifier.vecsib)
6357 {
6358 /* !i.base_reg && i.index_reg */
6359 if (i.index_reg->reg_num == RegEiz
6360 || i.index_reg->reg_num == RegRiz)
6361 i.sib.index = NO_INDEX_REGISTER;
6362 else
6363 i.sib.index = i.index_reg->reg_num;
6364 i.sib.base = NO_BASE_REGISTER;
6365 i.sib.scale = i.log2_scale_factor;
6366 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6367 /* No Vec_Disp8 if there is no base. */
6368 i.types[op].bitfield.vec_disp8 = 0;
6369 i.types[op].bitfield.disp8 = 0;
6370 i.types[op].bitfield.disp16 = 0;
6371 i.types[op].bitfield.disp64 = 0;
6372 if (flag_code != CODE_64BIT)
6373 {
6374 /* Must be 32 bit */
6375 i.types[op].bitfield.disp32 = 1;
6376 i.types[op].bitfield.disp32s = 0;
6377 }
6378 else
6379 {
6380 i.types[op].bitfield.disp32 = 0;
6381 i.types[op].bitfield.disp32s = 1;
6382 }
6383 if ((i.index_reg->reg_flags & RegRex) != 0)
6384 i.rex |= REX_X;
6385 }
6386 }
6387 /* RIP addressing for 64bit mode. */
6388 else if (i.base_reg->reg_num == RegRip ||
6389 i.base_reg->reg_num == RegEip)
6390 {
6391 gas_assert (!i.tm.opcode_modifier.vecsib);
6392 i.rm.regmem = NO_BASE_REGISTER;
6393 i.types[op].bitfield.disp8 = 0;
6394 i.types[op].bitfield.disp16 = 0;
6395 i.types[op].bitfield.disp32 = 0;
6396 i.types[op].bitfield.disp32s = 1;
6397 i.types[op].bitfield.disp64 = 0;
6398 i.types[op].bitfield.vec_disp8 = 0;
6399 i.flags[op] |= Operand_PCrel;
6400 if (! i.disp_operands)
6401 fake_zero_displacement = 1;
6402 }
6403 else if (i.base_reg->reg_type.bitfield.reg16)
6404 {
6405 gas_assert (!i.tm.opcode_modifier.vecsib);
6406 switch (i.base_reg->reg_num)
6407 {
6408 case 3: /* (%bx) */
6409 if (i.index_reg == 0)
6410 i.rm.regmem = 7;
6411 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
6412 i.rm.regmem = i.index_reg->reg_num - 6;
6413 break;
6414 case 5: /* (%bp) */
6415 default_seg = &ss;
6416 if (i.index_reg == 0)
6417 {
6418 i.rm.regmem = 6;
6419 if (operand_type_check (i.types[op], disp) == 0)
6420 {
6421 /* fake (%bp) into 0(%bp) */
6422 if (i.tm.operand_types[op].bitfield.vec_disp8)
6423 i.types[op].bitfield.vec_disp8 = 1;
6424 else
6425 i.types[op].bitfield.disp8 = 1;
6426 fake_zero_displacement = 1;
6427 }
6428 }
6429 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
6430 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
6431 break;
6432 default: /* (%si) -> 4 or (%di) -> 5 */
6433 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
6434 }
6435 i.rm.mode = mode_from_disp_size (i.types[op]);
6436 }
6437 else /* i.base_reg and 32/64 bit mode */
6438 {
6439 if (flag_code == CODE_64BIT
6440 && operand_type_check (i.types[op], disp))
6441 {
6442 i386_operand_type temp;
6443 operand_type_set (&temp, 0);
6444 temp.bitfield.disp8 = i.types[op].bitfield.disp8;
6445 temp.bitfield.vec_disp8
6446 = i.types[op].bitfield.vec_disp8;
6447 i.types[op] = temp;
6448 if (i.prefix[ADDR_PREFIX] == 0)
6449 i.types[op].bitfield.disp32s = 1;
6450 else
6451 i.types[op].bitfield.disp32 = 1;
6452 }
6453
6454 if (!i.tm.opcode_modifier.vecsib)
6455 i.rm.regmem = i.base_reg->reg_num;
6456 if ((i.base_reg->reg_flags & RegRex) != 0)
6457 i.rex |= REX_B;
6458 i.sib.base = i.base_reg->reg_num;
6459 /* x86-64 ignores REX prefix bit here to avoid decoder
6460 complications. */
6461 if (!(i.base_reg->reg_flags & RegRex)
6462 && (i.base_reg->reg_num == EBP_REG_NUM
6463 || i.base_reg->reg_num == ESP_REG_NUM))
6464 default_seg = &ss;
6465 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
6466 {
6467 fake_zero_displacement = 1;
6468 if (i.tm.operand_types [op].bitfield.vec_disp8)
6469 i.types[op].bitfield.vec_disp8 = 1;
6470 else
6471 i.types[op].bitfield.disp8 = 1;
6472 }
6473 i.sib.scale = i.log2_scale_factor;
6474 if (i.index_reg == 0)
6475 {
6476 gas_assert (!i.tm.opcode_modifier.vecsib);
6477 /* <disp>(%esp) becomes two byte modrm with no index
6478 register. We've already stored the code for esp
6479 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
6480 Any base register besides %esp will not use the
6481 extra modrm byte. */
6482 i.sib.index = NO_INDEX_REGISTER;
6483 }
6484 else if (!i.tm.opcode_modifier.vecsib)
6485 {
6486 if (i.index_reg->reg_num == RegEiz
6487 || i.index_reg->reg_num == RegRiz)
6488 i.sib.index = NO_INDEX_REGISTER;
6489 else
6490 i.sib.index = i.index_reg->reg_num;
6491 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6492 if ((i.index_reg->reg_flags & RegRex) != 0)
6493 i.rex |= REX_X;
6494 }
6495
6496 if (i.disp_operands
6497 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
6498 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
6499 i.rm.mode = 0;
6500 else
6501 {
6502 if (!fake_zero_displacement
6503 && !i.disp_operands
6504 && i.disp_encoding)
6505 {
6506 fake_zero_displacement = 1;
6507 if (i.disp_encoding == disp_encoding_8bit)
6508 i.types[op].bitfield.disp8 = 1;
6509 else
6510 i.types[op].bitfield.disp32 = 1;
6511 }
6512 i.rm.mode = mode_from_disp_size (i.types[op]);
6513 }
6514 }
6515
6516 if (fake_zero_displacement)
6517 {
6518 /* Fakes a zero displacement assuming that i.types[op]
6519 holds the correct displacement size. */
6520 expressionS *exp;
6521
6522 gas_assert (i.op[op].disps == 0);
6523 exp = &disp_expressions[i.disp_operands++];
6524 i.op[op].disps = exp;
6525 exp->X_op = O_constant;
6526 exp->X_add_number = 0;
6527 exp->X_add_symbol = (symbolS *) 0;
6528 exp->X_op_symbol = (symbolS *) 0;
6529 }
6530
6531 mem = op;
6532 }
6533 else
6534 mem = ~0;
6535
6536 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
6537 {
6538 if (operand_type_check (i.types[0], imm))
6539 i.vex.register_specifier = NULL;
6540 else
6541 {
6542 /* VEX.vvvv encodes one of the sources when the first
6543 operand is not an immediate. */
6544 if (i.tm.opcode_modifier.vexw == VEXW0)
6545 i.vex.register_specifier = i.op[0].regs;
6546 else
6547 i.vex.register_specifier = i.op[1].regs;
6548 }
6549
6550 /* Destination is a XMM register encoded in the ModRM.reg
6551 and VEX.R bit. */
6552 i.rm.reg = i.op[2].regs->reg_num;
6553 if ((i.op[2].regs->reg_flags & RegRex) != 0)
6554 i.rex |= REX_R;
6555
6556 /* ModRM.rm and VEX.B encodes the other source. */
6557 if (!i.mem_operands)
6558 {
6559 i.rm.mode = 3;
6560
6561 if (i.tm.opcode_modifier.vexw == VEXW0)
6562 i.rm.regmem = i.op[1].regs->reg_num;
6563 else
6564 i.rm.regmem = i.op[0].regs->reg_num;
6565
6566 if ((i.op[1].regs->reg_flags & RegRex) != 0)
6567 i.rex |= REX_B;
6568 }
6569 }
6570 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
6571 {
6572 i.vex.register_specifier = i.op[2].regs;
6573 if (!i.mem_operands)
6574 {
6575 i.rm.mode = 3;
6576 i.rm.regmem = i.op[1].regs->reg_num;
6577 if ((i.op[1].regs->reg_flags & RegRex) != 0)
6578 i.rex |= REX_B;
6579 }
6580 }
6581 /* Fill in i.rm.reg or i.rm.regmem field with register operand
6582 (if any) based on i.tm.extension_opcode. Again, we must be
6583 careful to make sure that segment/control/debug/test/MMX
6584 registers are coded into the i.rm.reg field. */
6585 else if (i.reg_operands)
6586 {
6587 unsigned int op;
6588 unsigned int vex_reg = ~0;
6589
6590 for (op = 0; op < i.operands; op++)
6591 if (i.types[op].bitfield.reg8
6592 || i.types[op].bitfield.reg16
6593 || i.types[op].bitfield.reg32
6594 || i.types[op].bitfield.reg64
6595 || i.types[op].bitfield.regmmx
6596 || i.types[op].bitfield.regxmm
6597 || i.types[op].bitfield.regymm
6598 || i.types[op].bitfield.regbnd
6599 || i.types[op].bitfield.regzmm
6600 || i.types[op].bitfield.regmask
6601 || i.types[op].bitfield.sreg2
6602 || i.types[op].bitfield.sreg3
6603 || i.types[op].bitfield.control
6604 || i.types[op].bitfield.debug
6605 || i.types[op].bitfield.test)
6606 break;
6607
6608 if (vex_3_sources)
6609 op = dest;
6610 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
6611 {
6612 /* For instructions with VexNDS, the register-only
6613 source operand is encoded in VEX prefix. */
6614 gas_assert (mem != (unsigned int) ~0);
6615
6616 if (op > mem)
6617 {
6618 vex_reg = op++;
6619 gas_assert (op < i.operands);
6620 }
6621 else
6622 {
6623 /* Check register-only source operand when two source
6624 operands are swapped. */
6625 if (!i.tm.operand_types[op].bitfield.baseindex
6626 && i.tm.operand_types[op + 1].bitfield.baseindex)
6627 {
6628 vex_reg = op;
6629 op += 2;
6630 gas_assert (mem == (vex_reg + 1)
6631 && op < i.operands);
6632 }
6633 else
6634 {
6635 vex_reg = op + 1;
6636 gas_assert (vex_reg < i.operands);
6637 }
6638 }
6639 }
6640 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
6641 {
6642 /* For instructions with VexNDD, the register destination
6643 is encoded in VEX prefix. */
6644 if (i.mem_operands == 0)
6645 {
6646 /* There is no memory operand. */
6647 gas_assert ((op + 2) == i.operands);
6648 vex_reg = op + 1;
6649 }
6650 else
6651 {
6652 /* There are only 2 operands. */
6653 gas_assert (op < 2 && i.operands == 2);
6654 vex_reg = 1;
6655 }
6656 }
6657 else
6658 gas_assert (op < i.operands);
6659
6660 if (vex_reg != (unsigned int) ~0)
6661 {
6662 i386_operand_type *type = &i.tm.operand_types[vex_reg];
6663
6664 if (type->bitfield.reg32 != 1
6665 && type->bitfield.reg64 != 1
6666 && !operand_type_equal (type, &regxmm)
6667 && !operand_type_equal (type, &regymm)
6668 && !operand_type_equal (type, &regzmm)
6669 && !operand_type_equal (type, &regmask))
6670 abort ();
6671
6672 i.vex.register_specifier = i.op[vex_reg].regs;
6673 }
6674
6675 /* Don't set OP operand twice. */
6676 if (vex_reg != op)
6677 {
6678 /* If there is an extension opcode to put here, the
6679 register number must be put into the regmem field. */
6680 if (i.tm.extension_opcode != None)
6681 {
6682 i.rm.regmem = i.op[op].regs->reg_num;
6683 if ((i.op[op].regs->reg_flags & RegRex) != 0)
6684 i.rex |= REX_B;
6685 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
6686 i.vrex |= REX_B;
6687 }
6688 else
6689 {
6690 i.rm.reg = i.op[op].regs->reg_num;
6691 if ((i.op[op].regs->reg_flags & RegRex) != 0)
6692 i.rex |= REX_R;
6693 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
6694 i.vrex |= REX_R;
6695 }
6696 }
6697
6698 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
6699 must set it to 3 to indicate this is a register operand
6700 in the regmem field. */
6701 if (!i.mem_operands)
6702 i.rm.mode = 3;
6703 }
6704
6705 /* Fill in i.rm.reg field with extension opcode (if any). */
6706 if (i.tm.extension_opcode != None)
6707 i.rm.reg = i.tm.extension_opcode;
6708 }
6709 return default_seg;
6710 }
6711
6712 static void
6713 output_branch (void)
6714 {
6715 char *p;
6716 int size;
6717 int code16;
6718 int prefix;
6719 relax_substateT subtype;
6720 symbolS *sym;
6721 offsetT off;
6722
6723 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
6724 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
6725
6726 prefix = 0;
6727 if (i.prefix[DATA_PREFIX] != 0)
6728 {
6729 prefix = 1;
6730 i.prefixes -= 1;
6731 code16 ^= CODE16;
6732 }
6733 /* Pentium4 branch hints. */
6734 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
6735 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
6736 {
6737 prefix++;
6738 i.prefixes--;
6739 }
6740 if (i.prefix[REX_PREFIX] != 0)
6741 {
6742 prefix++;
6743 i.prefixes--;
6744 }
6745
6746 /* BND prefixed jump. */
6747 if (i.prefix[BND_PREFIX] != 0)
6748 {
6749 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
6750 i.prefixes -= 1;
6751 }
6752
6753 if (i.prefixes != 0 && !intel_syntax)
6754 as_warn (_("skipping prefixes on this instruction"));
6755
6756 /* It's always a symbol; End frag & setup for relax.
6757 Make sure there is enough room in this frag for the largest
6758 instruction we may generate in md_convert_frag. This is 2
6759 bytes for the opcode and room for the prefix and largest
6760 displacement. */
6761 frag_grow (prefix + 2 + 4);
6762 /* Prefix and 1 opcode byte go in fr_fix. */
6763 p = frag_more (prefix + 1);
6764 if (i.prefix[DATA_PREFIX] != 0)
6765 *p++ = DATA_PREFIX_OPCODE;
6766 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
6767 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
6768 *p++ = i.prefix[SEG_PREFIX];
6769 if (i.prefix[REX_PREFIX] != 0)
6770 *p++ = i.prefix[REX_PREFIX];
6771 *p = i.tm.base_opcode;
6772
6773 if ((unsigned char) *p == JUMP_PC_RELATIVE)
6774 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
6775 else if (cpu_arch_flags.bitfield.cpui386)
6776 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
6777 else
6778 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
6779 subtype |= code16;
6780
6781 sym = i.op[0].disps->X_add_symbol;
6782 off = i.op[0].disps->X_add_number;
6783
6784 if (i.op[0].disps->X_op != O_constant
6785 && i.op[0].disps->X_op != O_symbol)
6786 {
6787 /* Handle complex expressions. */
6788 sym = make_expr_symbol (i.op[0].disps);
6789 off = 0;
6790 }
6791
6792 /* 1 possible extra opcode + 4 byte displacement go in var part.
6793 Pass reloc in fr_var. */
6794 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
6795 }
6796
6797 static void
6798 output_jump (void)
6799 {
6800 char *p;
6801 int size;
6802 fixS *fixP;
6803
6804 if (i.tm.opcode_modifier.jumpbyte)
6805 {
6806 /* This is a loop or jecxz type instruction. */
6807 size = 1;
6808 if (i.prefix[ADDR_PREFIX] != 0)
6809 {
6810 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
6811 i.prefixes -= 1;
6812 }
6813 /* Pentium4 branch hints. */
6814 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
6815 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
6816 {
6817 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
6818 i.prefixes--;
6819 }
6820 }
6821 else
6822 {
6823 int code16;
6824
6825 code16 = 0;
6826 if (flag_code == CODE_16BIT)
6827 code16 = CODE16;
6828
6829 if (i.prefix[DATA_PREFIX] != 0)
6830 {
6831 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
6832 i.prefixes -= 1;
6833 code16 ^= CODE16;
6834 }
6835
6836 size = 4;
6837 if (code16)
6838 size = 2;
6839 }
6840
6841 if (i.prefix[REX_PREFIX] != 0)
6842 {
6843 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
6844 i.prefixes -= 1;
6845 }
6846
6847 /* BND prefixed jump. */
6848 if (i.prefix[BND_PREFIX] != 0)
6849 {
6850 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
6851 i.prefixes -= 1;
6852 }
6853
6854 if (i.prefixes != 0 && !intel_syntax)
6855 as_warn (_("skipping prefixes on this instruction"));
6856
6857 p = frag_more (i.tm.opcode_length + size);
6858 switch (i.tm.opcode_length)
6859 {
6860 case 2:
6861 *p++ = i.tm.base_opcode >> 8;
6862 case 1:
6863 *p++ = i.tm.base_opcode;
6864 break;
6865 default:
6866 abort ();
6867 }
6868
6869 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
6870 i.op[0].disps, 1, reloc (size, 1, 1, i.reloc[0]));
6871
6872 /* All jumps handled here are signed, but don't use a signed limit
6873 check for 32 and 16 bit jumps as we want to allow wrap around at
6874 4G and 64k respectively. */
6875 if (size == 1)
6876 fixP->fx_signed = 1;
6877 }
6878
6879 static void
6880 output_interseg_jump (void)
6881 {
6882 char *p;
6883 int size;
6884 int prefix;
6885 int code16;
6886
6887 code16 = 0;
6888 if (flag_code == CODE_16BIT)
6889 code16 = CODE16;
6890
6891 prefix = 0;
6892 if (i.prefix[DATA_PREFIX] != 0)
6893 {
6894 prefix = 1;
6895 i.prefixes -= 1;
6896 code16 ^= CODE16;
6897 }
6898 if (i.prefix[REX_PREFIX] != 0)
6899 {
6900 prefix++;
6901 i.prefixes -= 1;
6902 }
6903
6904 size = 4;
6905 if (code16)
6906 size = 2;
6907
6908 if (i.prefixes != 0 && !intel_syntax)
6909 as_warn (_("skipping prefixes on this instruction"));
6910
6911 /* 1 opcode; 2 segment; offset */
6912 p = frag_more (prefix + 1 + 2 + size);
6913
6914 if (i.prefix[DATA_PREFIX] != 0)
6915 *p++ = DATA_PREFIX_OPCODE;
6916
6917 if (i.prefix[REX_PREFIX] != 0)
6918 *p++ = i.prefix[REX_PREFIX];
6919
6920 *p++ = i.tm.base_opcode;
6921 if (i.op[1].imms->X_op == O_constant)
6922 {
6923 offsetT n = i.op[1].imms->X_add_number;
6924
6925 if (size == 2
6926 && !fits_in_unsigned_word (n)
6927 && !fits_in_signed_word (n))
6928 {
6929 as_bad (_("16-bit jump out of range"));
6930 return;
6931 }
6932 md_number_to_chars (p, n, size);
6933 }
6934 else
6935 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
6936 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
6937 if (i.op[0].imms->X_op != O_constant)
6938 as_bad (_("can't handle non absolute segment in `%s'"),
6939 i.tm.name);
6940 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
6941 }
6942
6943 static void
6944 output_insn (void)
6945 {
6946 fragS *insn_start_frag;
6947 offsetT insn_start_off;
6948
6949 /* Tie dwarf2 debug info to the address at the start of the insn.
6950 We can't do this after the insn has been output as the current
6951 frag may have been closed off. eg. by frag_var. */
6952 dwarf2_emit_insn (0);
6953
6954 insn_start_frag = frag_now;
6955 insn_start_off = frag_now_fix ();
6956
6957 /* Output jumps. */
6958 if (i.tm.opcode_modifier.jump)
6959 output_branch ();
6960 else if (i.tm.opcode_modifier.jumpbyte
6961 || i.tm.opcode_modifier.jumpdword)
6962 output_jump ();
6963 else if (i.tm.opcode_modifier.jumpintersegment)
6964 output_interseg_jump ();
6965 else
6966 {
6967 /* Output normal instructions here. */
6968 char *p;
6969 unsigned char *q;
6970 unsigned int j;
6971 unsigned int prefix;
6972
6973 if (avoid_fence
6974 && i.tm.base_opcode == 0xfae
6975 && i.operands == 1
6976 && i.imm_operands == 1
6977 && (i.op[0].imms->X_add_number == 0xe8
6978 || i.op[0].imms->X_add_number == 0xf0
6979 || i.op[0].imms->X_add_number == 0xf8))
6980 {
6981 /* Encode lfence, mfence, and sfence as
6982 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
6983 offsetT val = 0x240483f0ULL;
6984 p = frag_more (5);
6985 md_number_to_chars (p, val, 5);
6986 return;
6987 }
6988
6989 /* Some processors fail on LOCK prefix. This options makes
6990 assembler ignore LOCK prefix and serves as a workaround. */
6991 if (omit_lock_prefix)
6992 {
6993 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
6994 return;
6995 i.prefix[LOCK_PREFIX] = 0;
6996 }
6997
6998 /* Since the VEX/EVEX prefix contains the implicit prefix, we
6999 don't need the explicit prefix. */
7000 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
7001 {
7002 switch (i.tm.opcode_length)
7003 {
7004 case 3:
7005 if (i.tm.base_opcode & 0xff000000)
7006 {
7007 prefix = (i.tm.base_opcode >> 24) & 0xff;
7008 goto check_prefix;
7009 }
7010 break;
7011 case 2:
7012 if ((i.tm.base_opcode & 0xff0000) != 0)
7013 {
7014 prefix = (i.tm.base_opcode >> 16) & 0xff;
7015 if (i.tm.cpu_flags.bitfield.cpupadlock)
7016 {
7017 check_prefix:
7018 if (prefix != REPE_PREFIX_OPCODE
7019 || (i.prefix[REP_PREFIX]
7020 != REPE_PREFIX_OPCODE))
7021 add_prefix (prefix);
7022 }
7023 else
7024 add_prefix (prefix);
7025 }
7026 break;
7027 case 1:
7028 break;
7029 default:
7030 abort ();
7031 }
7032
7033 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
7034 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
7035 R_X86_64_GOTTPOFF relocation so that linker can safely
7036 perform IE->LE optimization. */
7037 if (x86_elf_abi == X86_64_X32_ABI
7038 && i.operands == 2
7039 && i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
7040 && i.prefix[REX_PREFIX] == 0)
7041 add_prefix (REX_OPCODE);
7042 #endif
7043
7044 /* The prefix bytes. */
7045 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
7046 if (*q)
7047 FRAG_APPEND_1_CHAR (*q);
7048 }
7049 else
7050 {
7051 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
7052 if (*q)
7053 switch (j)
7054 {
7055 case REX_PREFIX:
7056 /* REX byte is encoded in VEX prefix. */
7057 break;
7058 case SEG_PREFIX:
7059 case ADDR_PREFIX:
7060 FRAG_APPEND_1_CHAR (*q);
7061 break;
7062 default:
7063 /* There should be no other prefixes for instructions
7064 with VEX prefix. */
7065 abort ();
7066 }
7067
7068 /* For EVEX instructions i.vrex should become 0 after
7069 build_evex_prefix. For VEX instructions upper 16 registers
7070 aren't available, so VREX should be 0. */
7071 if (i.vrex)
7072 abort ();
7073 /* Now the VEX prefix. */
7074 p = frag_more (i.vex.length);
7075 for (j = 0; j < i.vex.length; j++)
7076 p[j] = i.vex.bytes[j];
7077 }
7078
7079 /* Now the opcode; be careful about word order here! */
7080 if (i.tm.opcode_length == 1)
7081 {
7082 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
7083 }
7084 else
7085 {
7086 switch (i.tm.opcode_length)
7087 {
7088 case 4:
7089 p = frag_more (4);
7090 *p++ = (i.tm.base_opcode >> 24) & 0xff;
7091 *p++ = (i.tm.base_opcode >> 16) & 0xff;
7092 break;
7093 case 3:
7094 p = frag_more (3);
7095 *p++ = (i.tm.base_opcode >> 16) & 0xff;
7096 break;
7097 case 2:
7098 p = frag_more (2);
7099 break;
7100 default:
7101 abort ();
7102 break;
7103 }
7104
7105 /* Put out high byte first: can't use md_number_to_chars! */
7106 *p++ = (i.tm.base_opcode >> 8) & 0xff;
7107 *p = i.tm.base_opcode & 0xff;
7108 }
7109
7110 /* Now the modrm byte and sib byte (if present). */
7111 if (i.tm.opcode_modifier.modrm)
7112 {
7113 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
7114 | i.rm.reg << 3
7115 | i.rm.mode << 6));
7116 /* If i.rm.regmem == ESP (4)
7117 && i.rm.mode != (Register mode)
7118 && not 16 bit
7119 ==> need second modrm byte. */
7120 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
7121 && i.rm.mode != 3
7122 && !(i.base_reg && i.base_reg->reg_type.bitfield.reg16))
7123 FRAG_APPEND_1_CHAR ((i.sib.base << 0
7124 | i.sib.index << 3
7125 | i.sib.scale << 6));
7126 }
7127
7128 if (i.disp_operands)
7129 output_disp (insn_start_frag, insn_start_off);
7130
7131 if (i.imm_operands)
7132 output_imm (insn_start_frag, insn_start_off);
7133 }
7134
7135 #ifdef DEBUG386
7136 if (flag_debug)
7137 {
7138 pi ("" /*line*/, &i);
7139 }
7140 #endif /* DEBUG386 */
7141 }
7142
7143 /* Return the size of the displacement operand N. */
7144
7145 static int
7146 disp_size (unsigned int n)
7147 {
7148 int size = 4;
7149
7150 /* Vec_Disp8 has to be 8bit. */
7151 if (i.types[n].bitfield.vec_disp8)
7152 size = 1;
7153 else if (i.types[n].bitfield.disp64)
7154 size = 8;
7155 else if (i.types[n].bitfield.disp8)
7156 size = 1;
7157 else if (i.types[n].bitfield.disp16)
7158 size = 2;
7159 return size;
7160 }
7161
7162 /* Return the size of the immediate operand N. */
7163
7164 static int
7165 imm_size (unsigned int n)
7166 {
7167 int size = 4;
7168 if (i.types[n].bitfield.imm64)
7169 size = 8;
7170 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
7171 size = 1;
7172 else if (i.types[n].bitfield.imm16)
7173 size = 2;
7174 return size;
7175 }
7176
7177 static void
7178 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
7179 {
7180 char *p;
7181 unsigned int n;
7182
7183 for (n = 0; n < i.operands; n++)
7184 {
7185 if (i.types[n].bitfield.vec_disp8
7186 || operand_type_check (i.types[n], disp))
7187 {
7188 if (i.op[n].disps->X_op == O_constant)
7189 {
7190 int size = disp_size (n);
7191 offsetT val = i.op[n].disps->X_add_number;
7192
7193 if (i.types[n].bitfield.vec_disp8)
7194 val >>= i.memshift;
7195 val = offset_in_range (val, size);
7196 p = frag_more (size);
7197 md_number_to_chars (p, val, size);
7198 }
7199 else
7200 {
7201 enum bfd_reloc_code_real reloc_type;
7202 int size = disp_size (n);
7203 int sign = i.types[n].bitfield.disp32s;
7204 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
7205 fixS *fixP;
7206
7207 /* We can't have 8 bit displacement here. */
7208 gas_assert (!i.types[n].bitfield.disp8);
7209
7210 /* The PC relative address is computed relative
7211 to the instruction boundary, so in case immediate
7212 fields follows, we need to adjust the value. */
7213 if (pcrel && i.imm_operands)
7214 {
7215 unsigned int n1;
7216 int sz = 0;
7217
7218 for (n1 = 0; n1 < i.operands; n1++)
7219 if (operand_type_check (i.types[n1], imm))
7220 {
7221 /* Only one immediate is allowed for PC
7222 relative address. */
7223 gas_assert (sz == 0);
7224 sz = imm_size (n1);
7225 i.op[n].disps->X_add_number -= sz;
7226 }
7227 /* We should find the immediate. */
7228 gas_assert (sz != 0);
7229 }
7230
7231 p = frag_more (size);
7232 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
7233 if (GOT_symbol
7234 && GOT_symbol == i.op[n].disps->X_add_symbol
7235 && (((reloc_type == BFD_RELOC_32
7236 || reloc_type == BFD_RELOC_X86_64_32S
7237 || (reloc_type == BFD_RELOC_64
7238 && object_64bit))
7239 && (i.op[n].disps->X_op == O_symbol
7240 || (i.op[n].disps->X_op == O_add
7241 && ((symbol_get_value_expression
7242 (i.op[n].disps->X_op_symbol)->X_op)
7243 == O_subtract))))
7244 || reloc_type == BFD_RELOC_32_PCREL))
7245 {
7246 offsetT add;
7247
7248 if (insn_start_frag == frag_now)
7249 add = (p - frag_now->fr_literal) - insn_start_off;
7250 else
7251 {
7252 fragS *fr;
7253
7254 add = insn_start_frag->fr_fix - insn_start_off;
7255 for (fr = insn_start_frag->fr_next;
7256 fr && fr != frag_now; fr = fr->fr_next)
7257 add += fr->fr_fix;
7258 add += p - frag_now->fr_literal;
7259 }
7260
7261 if (!object_64bit)
7262 {
7263 reloc_type = BFD_RELOC_386_GOTPC;
7264 i.op[n].imms->X_add_number += add;
7265 }
7266 else if (reloc_type == BFD_RELOC_64)
7267 reloc_type = BFD_RELOC_X86_64_GOTPC64;
7268 else
7269 /* Don't do the adjustment for x86-64, as there
7270 the pcrel addressing is relative to the _next_
7271 insn, and that is taken care of in other code. */
7272 reloc_type = BFD_RELOC_X86_64_GOTPC32;
7273 }
7274 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
7275 size, i.op[n].disps, pcrel,
7276 reloc_type);
7277 /* Check for "call/jmp *mem", "mov mem, %reg",
7278 "test %reg, mem" and "binop mem, %reg" where binop
7279 is one of adc, add, and, cmp, or, sbb, sub, xor
7280 instructions. Always generate R_386_GOT32X for
7281 "sym*GOT" operand in 32-bit mode. */
7282 if ((generate_relax_relocations
7283 || (!object_64bit
7284 && i.rm.mode == 0
7285 && i.rm.regmem == 5))
7286 && (i.rm.mode == 2
7287 || (i.rm.mode == 0 && i.rm.regmem == 5))
7288 && ((i.operands == 1
7289 && i.tm.base_opcode == 0xff
7290 && (i.rm.reg == 2 || i.rm.reg == 4))
7291 || (i.operands == 2
7292 && (i.tm.base_opcode == 0x8b
7293 || i.tm.base_opcode == 0x85
7294 || (i.tm.base_opcode & 0xc7) == 0x03))))
7295 {
7296 if (object_64bit)
7297 {
7298 fixP->fx_tcbit = i.rex != 0;
7299 if (i.base_reg
7300 && (i.base_reg->reg_num == RegRip
7301 || i.base_reg->reg_num == RegEip))
7302 fixP->fx_tcbit2 = 1;
7303 }
7304 else
7305 fixP->fx_tcbit2 = 1;
7306 }
7307 }
7308 }
7309 }
7310 }
7311
7312 static void
7313 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
7314 {
7315 char *p;
7316 unsigned int n;
7317
7318 for (n = 0; n < i.operands; n++)
7319 {
7320 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
7321 if (i.rounding && (int) n == i.rounding->operand)
7322 continue;
7323
7324 if (operand_type_check (i.types[n], imm))
7325 {
7326 if (i.op[n].imms->X_op == O_constant)
7327 {
7328 int size = imm_size (n);
7329 offsetT val;
7330
7331 val = offset_in_range (i.op[n].imms->X_add_number,
7332 size);
7333 p = frag_more (size);
7334 md_number_to_chars (p, val, size);
7335 }
7336 else
7337 {
7338 /* Not absolute_section.
7339 Need a 32-bit fixup (don't support 8bit
7340 non-absolute imms). Try to support other
7341 sizes ... */
7342 enum bfd_reloc_code_real reloc_type;
7343 int size = imm_size (n);
7344 int sign;
7345
7346 if (i.types[n].bitfield.imm32s
7347 && (i.suffix == QWORD_MNEM_SUFFIX
7348 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
7349 sign = 1;
7350 else
7351 sign = 0;
7352
7353 p = frag_more (size);
7354 reloc_type = reloc (size, 0, sign, i.reloc[n]);
7355
7356 /* This is tough to explain. We end up with this one if we
7357 * have operands that look like
7358 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
7359 * obtain the absolute address of the GOT, and it is strongly
7360 * preferable from a performance point of view to avoid using
7361 * a runtime relocation for this. The actual sequence of
7362 * instructions often look something like:
7363 *
7364 * call .L66
7365 * .L66:
7366 * popl %ebx
7367 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
7368 *
7369 * The call and pop essentially return the absolute address
7370 * of the label .L66 and store it in %ebx. The linker itself
7371 * will ultimately change the first operand of the addl so
7372 * that %ebx points to the GOT, but to keep things simple, the
7373 * .o file must have this operand set so that it generates not
7374 * the absolute address of .L66, but the absolute address of
7375 * itself. This allows the linker itself simply treat a GOTPC
7376 * relocation as asking for a pcrel offset to the GOT to be
7377 * added in, and the addend of the relocation is stored in the
7378 * operand field for the instruction itself.
7379 *
7380 * Our job here is to fix the operand so that it would add
7381 * the correct offset so that %ebx would point to itself. The
7382 * thing that is tricky is that .-.L66 will point to the
7383 * beginning of the instruction, so we need to further modify
7384 * the operand so that it will point to itself. There are
7385 * other cases where you have something like:
7386 *
7387 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
7388 *
7389 * and here no correction would be required. Internally in
7390 * the assembler we treat operands of this form as not being
7391 * pcrel since the '.' is explicitly mentioned, and I wonder
7392 * whether it would simplify matters to do it this way. Who
7393 * knows. In earlier versions of the PIC patches, the
7394 * pcrel_adjust field was used to store the correction, but
7395 * since the expression is not pcrel, I felt it would be
7396 * confusing to do it this way. */
7397
7398 if ((reloc_type == BFD_RELOC_32
7399 || reloc_type == BFD_RELOC_X86_64_32S
7400 || reloc_type == BFD_RELOC_64)
7401 && GOT_symbol
7402 && GOT_symbol == i.op[n].imms->X_add_symbol
7403 && (i.op[n].imms->X_op == O_symbol
7404 || (i.op[n].imms->X_op == O_add
7405 && ((symbol_get_value_expression
7406 (i.op[n].imms->X_op_symbol)->X_op)
7407 == O_subtract))))
7408 {
7409 offsetT add;
7410
7411 if (insn_start_frag == frag_now)
7412 add = (p - frag_now->fr_literal) - insn_start_off;
7413 else
7414 {
7415 fragS *fr;
7416
7417 add = insn_start_frag->fr_fix - insn_start_off;
7418 for (fr = insn_start_frag->fr_next;
7419 fr && fr != frag_now; fr = fr->fr_next)
7420 add += fr->fr_fix;
7421 add += p - frag_now->fr_literal;
7422 }
7423
7424 if (!object_64bit)
7425 reloc_type = BFD_RELOC_386_GOTPC;
7426 else if (size == 4)
7427 reloc_type = BFD_RELOC_X86_64_GOTPC32;
7428 else if (size == 8)
7429 reloc_type = BFD_RELOC_X86_64_GOTPC64;
7430 i.op[n].imms->X_add_number += add;
7431 }
7432 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7433 i.op[n].imms, 0, reloc_type);
7434 }
7435 }
7436 }
7437 }
7438 \f
7439 /* x86_cons_fix_new is called via the expression parsing code when a
7440 reloc is needed. We use this hook to get the correct .got reloc. */
7441 static int cons_sign = -1;
7442
7443 void
7444 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
7445 expressionS *exp, bfd_reloc_code_real_type r)
7446 {
7447 r = reloc (len, 0, cons_sign, r);
7448
7449 #ifdef TE_PE
7450 if (exp->X_op == O_secrel)
7451 {
7452 exp->X_op = O_symbol;
7453 r = BFD_RELOC_32_SECREL;
7454 }
7455 #endif
7456
7457 fix_new_exp (frag, off, len, exp, 0, r);
7458 }
7459
7460 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
7461 purpose of the `.dc.a' internal pseudo-op. */
7462
7463 int
7464 x86_address_bytes (void)
7465 {
7466 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
7467 return 4;
7468 return stdoutput->arch_info->bits_per_address / 8;
7469 }
7470
7471 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
7472 || defined (LEX_AT)
7473 # define lex_got(reloc, adjust, types) NULL
7474 #else
7475 /* Parse operands of the form
7476 <symbol>@GOTOFF+<nnn>
7477 and similar .plt or .got references.
7478
7479 If we find one, set up the correct relocation in RELOC and copy the
7480 input string, minus the `@GOTOFF' into a malloc'd buffer for
7481 parsing by the calling routine. Return this buffer, and if ADJUST
7482 is non-null set it to the length of the string we removed from the
7483 input line. Otherwise return NULL. */
7484 static char *
7485 lex_got (enum bfd_reloc_code_real *rel,
7486 int *adjust,
7487 i386_operand_type *types)
7488 {
7489 /* Some of the relocations depend on the size of what field is to
7490 be relocated. But in our callers i386_immediate and i386_displacement
7491 we don't yet know the operand size (this will be set by insn
7492 matching). Hence we record the word32 relocation here,
7493 and adjust the reloc according to the real size in reloc(). */
7494 static const struct {
7495 const char *str;
7496 int len;
7497 const enum bfd_reloc_code_real rel[2];
7498 const i386_operand_type types64;
7499 } gotrel[] = {
7500 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7501 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
7502 BFD_RELOC_SIZE32 },
7503 OPERAND_TYPE_IMM32_64 },
7504 #endif
7505 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
7506 BFD_RELOC_X86_64_PLTOFF64 },
7507 OPERAND_TYPE_IMM64 },
7508 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
7509 BFD_RELOC_X86_64_PLT32 },
7510 OPERAND_TYPE_IMM32_32S_DISP32 },
7511 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
7512 BFD_RELOC_X86_64_GOTPLT64 },
7513 OPERAND_TYPE_IMM64_DISP64 },
7514 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
7515 BFD_RELOC_X86_64_GOTOFF64 },
7516 OPERAND_TYPE_IMM64_DISP64 },
7517 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
7518 BFD_RELOC_X86_64_GOTPCREL },
7519 OPERAND_TYPE_IMM32_32S_DISP32 },
7520 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
7521 BFD_RELOC_X86_64_TLSGD },
7522 OPERAND_TYPE_IMM32_32S_DISP32 },
7523 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
7524 _dummy_first_bfd_reloc_code_real },
7525 OPERAND_TYPE_NONE },
7526 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
7527 BFD_RELOC_X86_64_TLSLD },
7528 OPERAND_TYPE_IMM32_32S_DISP32 },
7529 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
7530 BFD_RELOC_X86_64_GOTTPOFF },
7531 OPERAND_TYPE_IMM32_32S_DISP32 },
7532 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
7533 BFD_RELOC_X86_64_TPOFF32 },
7534 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7535 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
7536 _dummy_first_bfd_reloc_code_real },
7537 OPERAND_TYPE_NONE },
7538 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
7539 BFD_RELOC_X86_64_DTPOFF32 },
7540 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7541 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
7542 _dummy_first_bfd_reloc_code_real },
7543 OPERAND_TYPE_NONE },
7544 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
7545 _dummy_first_bfd_reloc_code_real },
7546 OPERAND_TYPE_NONE },
7547 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
7548 BFD_RELOC_X86_64_GOT32 },
7549 OPERAND_TYPE_IMM32_32S_64_DISP32 },
7550 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
7551 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
7552 OPERAND_TYPE_IMM32_32S_DISP32 },
7553 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
7554 BFD_RELOC_X86_64_TLSDESC_CALL },
7555 OPERAND_TYPE_IMM32_32S_DISP32 },
7556 };
7557 char *cp;
7558 unsigned int j;
7559
7560 #if defined (OBJ_MAYBE_ELF)
7561 if (!IS_ELF)
7562 return NULL;
7563 #endif
7564
7565 for (cp = input_line_pointer; *cp != '@'; cp++)
7566 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
7567 return NULL;
7568
7569 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
7570 {
7571 int len = gotrel[j].len;
7572 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
7573 {
7574 if (gotrel[j].rel[object_64bit] != 0)
7575 {
7576 int first, second;
7577 char *tmpbuf, *past_reloc;
7578
7579 *rel = gotrel[j].rel[object_64bit];
7580
7581 if (types)
7582 {
7583 if (flag_code != CODE_64BIT)
7584 {
7585 types->bitfield.imm32 = 1;
7586 types->bitfield.disp32 = 1;
7587 }
7588 else
7589 *types = gotrel[j].types64;
7590 }
7591
7592 if (j != 0 && GOT_symbol == NULL)
7593 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
7594
7595 /* The length of the first part of our input line. */
7596 first = cp - input_line_pointer;
7597
7598 /* The second part goes from after the reloc token until
7599 (and including) an end_of_line char or comma. */
7600 past_reloc = cp + 1 + len;
7601 cp = past_reloc;
7602 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
7603 ++cp;
7604 second = cp + 1 - past_reloc;
7605
7606 /* Allocate and copy string. The trailing NUL shouldn't
7607 be necessary, but be safe. */
7608 tmpbuf = (char *) xmalloc (first + second + 2);
7609 memcpy (tmpbuf, input_line_pointer, first);
7610 if (second != 0 && *past_reloc != ' ')
7611 /* Replace the relocation token with ' ', so that
7612 errors like foo@GOTOFF1 will be detected. */
7613 tmpbuf[first++] = ' ';
7614 else
7615 /* Increment length by 1 if the relocation token is
7616 removed. */
7617 len++;
7618 if (adjust)
7619 *adjust = len;
7620 memcpy (tmpbuf + first, past_reloc, second);
7621 tmpbuf[first + second] = '\0';
7622 return tmpbuf;
7623 }
7624
7625 as_bad (_("@%s reloc is not supported with %d-bit output format"),
7626 gotrel[j].str, 1 << (5 + object_64bit));
7627 return NULL;
7628 }
7629 }
7630
7631 /* Might be a symbol version string. Don't as_bad here. */
7632 return NULL;
7633 }
7634 #endif
7635
7636 #ifdef TE_PE
7637 #ifdef lex_got
7638 #undef lex_got
7639 #endif
7640 /* Parse operands of the form
7641 <symbol>@SECREL32+<nnn>
7642
7643 If we find one, set up the correct relocation in RELOC and copy the
7644 input string, minus the `@SECREL32' into a malloc'd buffer for
7645 parsing by the calling routine. Return this buffer, and if ADJUST
7646 is non-null set it to the length of the string we removed from the
7647 input line. Otherwise return NULL.
7648
7649 This function is copied from the ELF version above adjusted for PE targets. */
7650
7651 static char *
7652 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
7653 int *adjust ATTRIBUTE_UNUSED,
7654 i386_operand_type *types)
7655 {
7656 static const struct
7657 {
7658 const char *str;
7659 int len;
7660 const enum bfd_reloc_code_real rel[2];
7661 const i386_operand_type types64;
7662 }
7663 gotrel[] =
7664 {
7665 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
7666 BFD_RELOC_32_SECREL },
7667 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7668 };
7669
7670 char *cp;
7671 unsigned j;
7672
7673 for (cp = input_line_pointer; *cp != '@'; cp++)
7674 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
7675 return NULL;
7676
7677 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
7678 {
7679 int len = gotrel[j].len;
7680
7681 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
7682 {
7683 if (gotrel[j].rel[object_64bit] != 0)
7684 {
7685 int first, second;
7686 char *tmpbuf, *past_reloc;
7687
7688 *rel = gotrel[j].rel[object_64bit];
7689 if (adjust)
7690 *adjust = len;
7691
7692 if (types)
7693 {
7694 if (flag_code != CODE_64BIT)
7695 {
7696 types->bitfield.imm32 = 1;
7697 types->bitfield.disp32 = 1;
7698 }
7699 else
7700 *types = gotrel[j].types64;
7701 }
7702
7703 /* The length of the first part of our input line. */
7704 first = cp - input_line_pointer;
7705
7706 /* The second part goes from after the reloc token until
7707 (and including) an end_of_line char or comma. */
7708 past_reloc = cp + 1 + len;
7709 cp = past_reloc;
7710 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
7711 ++cp;
7712 second = cp + 1 - past_reloc;
7713
7714 /* Allocate and copy string. The trailing NUL shouldn't
7715 be necessary, but be safe. */
7716 tmpbuf = (char *) xmalloc (first + second + 2);
7717 memcpy (tmpbuf, input_line_pointer, first);
7718 if (second != 0 && *past_reloc != ' ')
7719 /* Replace the relocation token with ' ', so that
7720 errors like foo@SECLREL321 will be detected. */
7721 tmpbuf[first++] = ' ';
7722 memcpy (tmpbuf + first, past_reloc, second);
7723 tmpbuf[first + second] = '\0';
7724 return tmpbuf;
7725 }
7726
7727 as_bad (_("@%s reloc is not supported with %d-bit output format"),
7728 gotrel[j].str, 1 << (5 + object_64bit));
7729 return NULL;
7730 }
7731 }
7732
7733 /* Might be a symbol version string. Don't as_bad here. */
7734 return NULL;
7735 }
7736
7737 #endif /* TE_PE */
7738
7739 bfd_reloc_code_real_type
7740 x86_cons (expressionS *exp, int size)
7741 {
7742 bfd_reloc_code_real_type got_reloc = NO_RELOC;
7743
7744 intel_syntax = -intel_syntax;
7745
7746 exp->X_md = 0;
7747 if (size == 4 || (object_64bit && size == 8))
7748 {
7749 /* Handle @GOTOFF and the like in an expression. */
7750 char *save;
7751 char *gotfree_input_line;
7752 int adjust = 0;
7753
7754 save = input_line_pointer;
7755 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
7756 if (gotfree_input_line)
7757 input_line_pointer = gotfree_input_line;
7758
7759 expression (exp);
7760
7761 if (gotfree_input_line)
7762 {
7763 /* expression () has merrily parsed up to the end of line,
7764 or a comma - in the wrong buffer. Transfer how far
7765 input_line_pointer has moved to the right buffer. */
7766 input_line_pointer = (save
7767 + (input_line_pointer - gotfree_input_line)
7768 + adjust);
7769 free (gotfree_input_line);
7770 if (exp->X_op == O_constant
7771 || exp->X_op == O_absent
7772 || exp->X_op == O_illegal
7773 || exp->X_op == O_register
7774 || exp->X_op == O_big)
7775 {
7776 char c = *input_line_pointer;
7777 *input_line_pointer = 0;
7778 as_bad (_("missing or invalid expression `%s'"), save);
7779 *input_line_pointer = c;
7780 }
7781 }
7782 }
7783 else
7784 expression (exp);
7785
7786 intel_syntax = -intel_syntax;
7787
7788 if (intel_syntax)
7789 i386_intel_simplify (exp);
7790
7791 return got_reloc;
7792 }
7793
7794 static void
7795 signed_cons (int size)
7796 {
7797 if (flag_code == CODE_64BIT)
7798 cons_sign = 1;
7799 cons (size);
7800 cons_sign = -1;
7801 }
7802
7803 #ifdef TE_PE
7804 static void
7805 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
7806 {
7807 expressionS exp;
7808
7809 do
7810 {
7811 expression (&exp);
7812 if (exp.X_op == O_symbol)
7813 exp.X_op = O_secrel;
7814
7815 emit_expr (&exp, 4);
7816 }
7817 while (*input_line_pointer++ == ',');
7818
7819 input_line_pointer--;
7820 demand_empty_rest_of_line ();
7821 }
7822 #endif
7823
7824 /* Handle Vector operations. */
7825
7826 static char *
7827 check_VecOperations (char *op_string, char *op_end)
7828 {
7829 const reg_entry *mask;
7830 const char *saved;
7831 char *end_op;
7832
7833 while (*op_string
7834 && (op_end == NULL || op_string < op_end))
7835 {
7836 saved = op_string;
7837 if (*op_string == '{')
7838 {
7839 op_string++;
7840
7841 /* Check broadcasts. */
7842 if (strncmp (op_string, "1to", 3) == 0)
7843 {
7844 int bcst_type;
7845
7846 if (i.broadcast)
7847 goto duplicated_vec_op;
7848
7849 op_string += 3;
7850 if (*op_string == '8')
7851 bcst_type = BROADCAST_1TO8;
7852 else if (*op_string == '4')
7853 bcst_type = BROADCAST_1TO4;
7854 else if (*op_string == '2')
7855 bcst_type = BROADCAST_1TO2;
7856 else if (*op_string == '1'
7857 && *(op_string+1) == '6')
7858 {
7859 bcst_type = BROADCAST_1TO16;
7860 op_string++;
7861 }
7862 else
7863 {
7864 as_bad (_("Unsupported broadcast: `%s'"), saved);
7865 return NULL;
7866 }
7867 op_string++;
7868
7869 broadcast_op.type = bcst_type;
7870 broadcast_op.operand = this_operand;
7871 i.broadcast = &broadcast_op;
7872 }
7873 /* Check masking operation. */
7874 else if ((mask = parse_register (op_string, &end_op)) != NULL)
7875 {
7876 /* k0 can't be used for write mask. */
7877 if (mask->reg_num == 0)
7878 {
7879 as_bad (_("`%s' can't be used for write mask"),
7880 op_string);
7881 return NULL;
7882 }
7883
7884 if (!i.mask)
7885 {
7886 mask_op.mask = mask;
7887 mask_op.zeroing = 0;
7888 mask_op.operand = this_operand;
7889 i.mask = &mask_op;
7890 }
7891 else
7892 {
7893 if (i.mask->mask)
7894 goto duplicated_vec_op;
7895
7896 i.mask->mask = mask;
7897
7898 /* Only "{z}" is allowed here. No need to check
7899 zeroing mask explicitly. */
7900 if (i.mask->operand != this_operand)
7901 {
7902 as_bad (_("invalid write mask `%s'"), saved);
7903 return NULL;
7904 }
7905 }
7906
7907 op_string = end_op;
7908 }
7909 /* Check zeroing-flag for masking operation. */
7910 else if (*op_string == 'z')
7911 {
7912 if (!i.mask)
7913 {
7914 mask_op.mask = NULL;
7915 mask_op.zeroing = 1;
7916 mask_op.operand = this_operand;
7917 i.mask = &mask_op;
7918 }
7919 else
7920 {
7921 if (i.mask->zeroing)
7922 {
7923 duplicated_vec_op:
7924 as_bad (_("duplicated `%s'"), saved);
7925 return NULL;
7926 }
7927
7928 i.mask->zeroing = 1;
7929
7930 /* Only "{%k}" is allowed here. No need to check mask
7931 register explicitly. */
7932 if (i.mask->operand != this_operand)
7933 {
7934 as_bad (_("invalid zeroing-masking `%s'"),
7935 saved);
7936 return NULL;
7937 }
7938 }
7939
7940 op_string++;
7941 }
7942 else
7943 goto unknown_vec_op;
7944
7945 if (*op_string != '}')
7946 {
7947 as_bad (_("missing `}' in `%s'"), saved);
7948 return NULL;
7949 }
7950 op_string++;
7951 continue;
7952 }
7953 unknown_vec_op:
7954 /* We don't know this one. */
7955 as_bad (_("unknown vector operation: `%s'"), saved);
7956 return NULL;
7957 }
7958
7959 return op_string;
7960 }
7961
7962 static int
7963 i386_immediate (char *imm_start)
7964 {
7965 char *save_input_line_pointer;
7966 char *gotfree_input_line;
7967 segT exp_seg = 0;
7968 expressionS *exp;
7969 i386_operand_type types;
7970
7971 operand_type_set (&types, ~0);
7972
7973 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
7974 {
7975 as_bad (_("at most %d immediate operands are allowed"),
7976 MAX_IMMEDIATE_OPERANDS);
7977 return 0;
7978 }
7979
7980 exp = &im_expressions[i.imm_operands++];
7981 i.op[this_operand].imms = exp;
7982
7983 if (is_space_char (*imm_start))
7984 ++imm_start;
7985
7986 save_input_line_pointer = input_line_pointer;
7987 input_line_pointer = imm_start;
7988
7989 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
7990 if (gotfree_input_line)
7991 input_line_pointer = gotfree_input_line;
7992
7993 exp_seg = expression (exp);
7994
7995 SKIP_WHITESPACE ();
7996
7997 /* Handle vector operations. */
7998 if (*input_line_pointer == '{')
7999 {
8000 input_line_pointer = check_VecOperations (input_line_pointer,
8001 NULL);
8002 if (input_line_pointer == NULL)
8003 return 0;
8004 }
8005
8006 if (*input_line_pointer)
8007 as_bad (_("junk `%s' after expression"), input_line_pointer);
8008
8009 input_line_pointer = save_input_line_pointer;
8010 if (gotfree_input_line)
8011 {
8012 free (gotfree_input_line);
8013
8014 if (exp->X_op == O_constant || exp->X_op == O_register)
8015 exp->X_op = O_illegal;
8016 }
8017
8018 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
8019 }
8020
8021 static int
8022 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
8023 i386_operand_type types, const char *imm_start)
8024 {
8025 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
8026 {
8027 if (imm_start)
8028 as_bad (_("missing or invalid immediate expression `%s'"),
8029 imm_start);
8030 return 0;
8031 }
8032 else if (exp->X_op == O_constant)
8033 {
8034 /* Size it properly later. */
8035 i.types[this_operand].bitfield.imm64 = 1;
8036 /* If not 64bit, sign extend val. */
8037 if (flag_code != CODE_64BIT
8038 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
8039 exp->X_add_number
8040 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
8041 }
8042 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
8043 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
8044 && exp_seg != absolute_section
8045 && exp_seg != text_section
8046 && exp_seg != data_section
8047 && exp_seg != bss_section
8048 && exp_seg != undefined_section
8049 && !bfd_is_com_section (exp_seg))
8050 {
8051 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
8052 return 0;
8053 }
8054 #endif
8055 else if (!intel_syntax && exp_seg == reg_section)
8056 {
8057 if (imm_start)
8058 as_bad (_("illegal immediate register operand %s"), imm_start);
8059 return 0;
8060 }
8061 else
8062 {
8063 /* This is an address. The size of the address will be
8064 determined later, depending on destination register,
8065 suffix, or the default for the section. */
8066 i.types[this_operand].bitfield.imm8 = 1;
8067 i.types[this_operand].bitfield.imm16 = 1;
8068 i.types[this_operand].bitfield.imm32 = 1;
8069 i.types[this_operand].bitfield.imm32s = 1;
8070 i.types[this_operand].bitfield.imm64 = 1;
8071 i.types[this_operand] = operand_type_and (i.types[this_operand],
8072 types);
8073 }
8074
8075 return 1;
8076 }
8077
8078 static char *
8079 i386_scale (char *scale)
8080 {
8081 offsetT val;
8082 char *save = input_line_pointer;
8083
8084 input_line_pointer = scale;
8085 val = get_absolute_expression ();
8086
8087 switch (val)
8088 {
8089 case 1:
8090 i.log2_scale_factor = 0;
8091 break;
8092 case 2:
8093 i.log2_scale_factor = 1;
8094 break;
8095 case 4:
8096 i.log2_scale_factor = 2;
8097 break;
8098 case 8:
8099 i.log2_scale_factor = 3;
8100 break;
8101 default:
8102 {
8103 char sep = *input_line_pointer;
8104
8105 *input_line_pointer = '\0';
8106 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
8107 scale);
8108 *input_line_pointer = sep;
8109 input_line_pointer = save;
8110 return NULL;
8111 }
8112 }
8113 if (i.log2_scale_factor != 0 && i.index_reg == 0)
8114 {
8115 as_warn (_("scale factor of %d without an index register"),
8116 1 << i.log2_scale_factor);
8117 i.log2_scale_factor = 0;
8118 }
8119 scale = input_line_pointer;
8120 input_line_pointer = save;
8121 return scale;
8122 }
8123
8124 static int
8125 i386_displacement (char *disp_start, char *disp_end)
8126 {
8127 expressionS *exp;
8128 segT exp_seg = 0;
8129 char *save_input_line_pointer;
8130 char *gotfree_input_line;
8131 int override;
8132 i386_operand_type bigdisp, types = anydisp;
8133 int ret;
8134
8135 if (i.disp_operands == MAX_MEMORY_OPERANDS)
8136 {
8137 as_bad (_("at most %d displacement operands are allowed"),
8138 MAX_MEMORY_OPERANDS);
8139 return 0;
8140 }
8141
8142 operand_type_set (&bigdisp, 0);
8143 if ((i.types[this_operand].bitfield.jumpabsolute)
8144 || (!current_templates->start->opcode_modifier.jump
8145 && !current_templates->start->opcode_modifier.jumpdword))
8146 {
8147 bigdisp.bitfield.disp32 = 1;
8148 override = (i.prefix[ADDR_PREFIX] != 0);
8149 if (flag_code == CODE_64BIT)
8150 {
8151 if (!override)
8152 {
8153 bigdisp.bitfield.disp32s = 1;
8154 bigdisp.bitfield.disp64 = 1;
8155 }
8156 }
8157 else if ((flag_code == CODE_16BIT) ^ override)
8158 {
8159 bigdisp.bitfield.disp32 = 0;
8160 bigdisp.bitfield.disp16 = 1;
8161 }
8162 }
8163 else
8164 {
8165 /* For PC-relative branches, the width of the displacement
8166 is dependent upon data size, not address size. */
8167 override = (i.prefix[DATA_PREFIX] != 0);
8168 if (flag_code == CODE_64BIT)
8169 {
8170 if (override || i.suffix == WORD_MNEM_SUFFIX)
8171 bigdisp.bitfield.disp16 = 1;
8172 else
8173 {
8174 bigdisp.bitfield.disp32 = 1;
8175 bigdisp.bitfield.disp32s = 1;
8176 }
8177 }
8178 else
8179 {
8180 if (!override)
8181 override = (i.suffix == (flag_code != CODE_16BIT
8182 ? WORD_MNEM_SUFFIX
8183 : LONG_MNEM_SUFFIX));
8184 bigdisp.bitfield.disp32 = 1;
8185 if ((flag_code == CODE_16BIT) ^ override)
8186 {
8187 bigdisp.bitfield.disp32 = 0;
8188 bigdisp.bitfield.disp16 = 1;
8189 }
8190 }
8191 }
8192 i.types[this_operand] = operand_type_or (i.types[this_operand],
8193 bigdisp);
8194
8195 exp = &disp_expressions[i.disp_operands];
8196 i.op[this_operand].disps = exp;
8197 i.disp_operands++;
8198 save_input_line_pointer = input_line_pointer;
8199 input_line_pointer = disp_start;
8200 END_STRING_AND_SAVE (disp_end);
8201
8202 #ifndef GCC_ASM_O_HACK
8203 #define GCC_ASM_O_HACK 0
8204 #endif
8205 #if GCC_ASM_O_HACK
8206 END_STRING_AND_SAVE (disp_end + 1);
8207 if (i.types[this_operand].bitfield.baseIndex
8208 && displacement_string_end[-1] == '+')
8209 {
8210 /* This hack is to avoid a warning when using the "o"
8211 constraint within gcc asm statements.
8212 For instance:
8213
8214 #define _set_tssldt_desc(n,addr,limit,type) \
8215 __asm__ __volatile__ ( \
8216 "movw %w2,%0\n\t" \
8217 "movw %w1,2+%0\n\t" \
8218 "rorl $16,%1\n\t" \
8219 "movb %b1,4+%0\n\t" \
8220 "movb %4,5+%0\n\t" \
8221 "movb $0,6+%0\n\t" \
8222 "movb %h1,7+%0\n\t" \
8223 "rorl $16,%1" \
8224 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
8225
8226 This works great except that the output assembler ends
8227 up looking a bit weird if it turns out that there is
8228 no offset. You end up producing code that looks like:
8229
8230 #APP
8231 movw $235,(%eax)
8232 movw %dx,2+(%eax)
8233 rorl $16,%edx
8234 movb %dl,4+(%eax)
8235 movb $137,5+(%eax)
8236 movb $0,6+(%eax)
8237 movb %dh,7+(%eax)
8238 rorl $16,%edx
8239 #NO_APP
8240
8241 So here we provide the missing zero. */
8242
8243 *displacement_string_end = '0';
8244 }
8245 #endif
8246 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
8247 if (gotfree_input_line)
8248 input_line_pointer = gotfree_input_line;
8249
8250 exp_seg = expression (exp);
8251
8252 SKIP_WHITESPACE ();
8253 if (*input_line_pointer)
8254 as_bad (_("junk `%s' after expression"), input_line_pointer);
8255 #if GCC_ASM_O_HACK
8256 RESTORE_END_STRING (disp_end + 1);
8257 #endif
8258 input_line_pointer = save_input_line_pointer;
8259 if (gotfree_input_line)
8260 {
8261 free (gotfree_input_line);
8262
8263 if (exp->X_op == O_constant || exp->X_op == O_register)
8264 exp->X_op = O_illegal;
8265 }
8266
8267 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
8268
8269 RESTORE_END_STRING (disp_end);
8270
8271 return ret;
8272 }
8273
8274 static int
8275 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
8276 i386_operand_type types, const char *disp_start)
8277 {
8278 i386_operand_type bigdisp;
8279 int ret = 1;
8280
8281 /* We do this to make sure that the section symbol is in
8282 the symbol table. We will ultimately change the relocation
8283 to be relative to the beginning of the section. */
8284 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
8285 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
8286 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
8287 {
8288 if (exp->X_op != O_symbol)
8289 goto inv_disp;
8290
8291 if (S_IS_LOCAL (exp->X_add_symbol)
8292 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
8293 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
8294 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
8295 exp->X_op = O_subtract;
8296 exp->X_op_symbol = GOT_symbol;
8297 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
8298 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
8299 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
8300 i.reloc[this_operand] = BFD_RELOC_64;
8301 else
8302 i.reloc[this_operand] = BFD_RELOC_32;
8303 }
8304
8305 else if (exp->X_op == O_absent
8306 || exp->X_op == O_illegal
8307 || exp->X_op == O_big)
8308 {
8309 inv_disp:
8310 as_bad (_("missing or invalid displacement expression `%s'"),
8311 disp_start);
8312 ret = 0;
8313 }
8314
8315 else if (flag_code == CODE_64BIT
8316 && !i.prefix[ADDR_PREFIX]
8317 && exp->X_op == O_constant)
8318 {
8319 /* Since displacement is signed extended to 64bit, don't allow
8320 disp32 and turn off disp32s if they are out of range. */
8321 i.types[this_operand].bitfield.disp32 = 0;
8322 if (!fits_in_signed_long (exp->X_add_number))
8323 {
8324 i.types[this_operand].bitfield.disp32s = 0;
8325 if (i.types[this_operand].bitfield.baseindex)
8326 {
8327 as_bad (_("0x%lx out range of signed 32bit displacement"),
8328 (long) exp->X_add_number);
8329 ret = 0;
8330 }
8331 }
8332 }
8333
8334 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
8335 else if (exp->X_op != O_constant
8336 && OUTPUT_FLAVOR == bfd_target_aout_flavour
8337 && exp_seg != absolute_section
8338 && exp_seg != text_section
8339 && exp_seg != data_section
8340 && exp_seg != bss_section
8341 && exp_seg != undefined_section
8342 && !bfd_is_com_section (exp_seg))
8343 {
8344 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
8345 ret = 0;
8346 }
8347 #endif
8348
8349 /* Check if this is a displacement only operand. */
8350 bigdisp = i.types[this_operand];
8351 bigdisp.bitfield.disp8 = 0;
8352 bigdisp.bitfield.disp16 = 0;
8353 bigdisp.bitfield.disp32 = 0;
8354 bigdisp.bitfield.disp32s = 0;
8355 bigdisp.bitfield.disp64 = 0;
8356 if (operand_type_all_zero (&bigdisp))
8357 i.types[this_operand] = operand_type_and (i.types[this_operand],
8358 types);
8359
8360 return ret;
8361 }
8362
8363 /* Make sure the memory operand we've been dealt is valid.
8364 Return 1 on success, 0 on a failure. */
8365
8366 static int
8367 i386_index_check (const char *operand_string)
8368 {
8369 const char *kind = "base/index";
8370 enum flag_code addr_mode;
8371
8372 if (i.prefix[ADDR_PREFIX])
8373 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
8374 else
8375 {
8376 addr_mode = flag_code;
8377
8378 #if INFER_ADDR_PREFIX
8379 if (i.mem_operands == 0)
8380 {
8381 /* Infer address prefix from the first memory operand. */
8382 const reg_entry *addr_reg = i.base_reg;
8383
8384 if (addr_reg == NULL)
8385 addr_reg = i.index_reg;
8386
8387 if (addr_reg)
8388 {
8389 if (addr_reg->reg_num == RegEip
8390 || addr_reg->reg_num == RegEiz
8391 || addr_reg->reg_type.bitfield.reg32)
8392 addr_mode = CODE_32BIT;
8393 else if (flag_code != CODE_64BIT
8394 && addr_reg->reg_type.bitfield.reg16)
8395 addr_mode = CODE_16BIT;
8396
8397 if (addr_mode != flag_code)
8398 {
8399 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
8400 i.prefixes += 1;
8401 /* Change the size of any displacement too. At most one
8402 of Disp16 or Disp32 is set.
8403 FIXME. There doesn't seem to be any real need for
8404 separate Disp16 and Disp32 flags. The same goes for
8405 Imm16 and Imm32. Removing them would probably clean
8406 up the code quite a lot. */
8407 if (flag_code != CODE_64BIT
8408 && (i.types[this_operand].bitfield.disp16
8409 || i.types[this_operand].bitfield.disp32))
8410 i.types[this_operand]
8411 = operand_type_xor (i.types[this_operand], disp16_32);
8412 }
8413 }
8414 }
8415 #endif
8416 }
8417
8418 if (current_templates->start->opcode_modifier.isstring
8419 && !current_templates->start->opcode_modifier.immext
8420 && (current_templates->end[-1].opcode_modifier.isstring
8421 || i.mem_operands))
8422 {
8423 /* Memory operands of string insns are special in that they only allow
8424 a single register (rDI, rSI, or rBX) as their memory address. */
8425 const reg_entry *expected_reg;
8426 static const char *di_si[][2] =
8427 {
8428 { "esi", "edi" },
8429 { "si", "di" },
8430 { "rsi", "rdi" }
8431 };
8432 static const char *bx[] = { "ebx", "bx", "rbx" };
8433
8434 kind = "string address";
8435
8436 if (current_templates->start->opcode_modifier.w)
8437 {
8438 i386_operand_type type = current_templates->end[-1].operand_types[0];
8439
8440 if (!type.bitfield.baseindex
8441 || ((!i.mem_operands != !intel_syntax)
8442 && current_templates->end[-1].operand_types[1]
8443 .bitfield.baseindex))
8444 type = current_templates->end[-1].operand_types[1];
8445 expected_reg = hash_find (reg_hash,
8446 di_si[addr_mode][type.bitfield.esseg]);
8447
8448 }
8449 else
8450 expected_reg = hash_find (reg_hash, bx[addr_mode]);
8451
8452 if (i.base_reg != expected_reg
8453 || i.index_reg
8454 || operand_type_check (i.types[this_operand], disp))
8455 {
8456 /* The second memory operand must have the same size as
8457 the first one. */
8458 if (i.mem_operands
8459 && i.base_reg
8460 && !((addr_mode == CODE_64BIT
8461 && i.base_reg->reg_type.bitfield.reg64)
8462 || (addr_mode == CODE_32BIT
8463 ? i.base_reg->reg_type.bitfield.reg32
8464 : i.base_reg->reg_type.bitfield.reg16)))
8465 goto bad_address;
8466
8467 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
8468 operand_string,
8469 intel_syntax ? '[' : '(',
8470 register_prefix,
8471 expected_reg->reg_name,
8472 intel_syntax ? ']' : ')');
8473 return 1;
8474 }
8475 else
8476 return 1;
8477
8478 bad_address:
8479 as_bad (_("`%s' is not a valid %s expression"),
8480 operand_string, kind);
8481 return 0;
8482 }
8483 else
8484 {
8485 if (addr_mode != CODE_16BIT)
8486 {
8487 /* 32-bit/64-bit checks. */
8488 if ((i.base_reg
8489 && (addr_mode == CODE_64BIT
8490 ? !i.base_reg->reg_type.bitfield.reg64
8491 : !i.base_reg->reg_type.bitfield.reg32)
8492 && (i.index_reg
8493 || (i.base_reg->reg_num
8494 != (addr_mode == CODE_64BIT ? RegRip : RegEip))))
8495 || (i.index_reg
8496 && !i.index_reg->reg_type.bitfield.regxmm
8497 && !i.index_reg->reg_type.bitfield.regymm
8498 && !i.index_reg->reg_type.bitfield.regzmm
8499 && ((addr_mode == CODE_64BIT
8500 ? !(i.index_reg->reg_type.bitfield.reg64
8501 || i.index_reg->reg_num == RegRiz)
8502 : !(i.index_reg->reg_type.bitfield.reg32
8503 || i.index_reg->reg_num == RegEiz))
8504 || !i.index_reg->reg_type.bitfield.baseindex)))
8505 goto bad_address;
8506 }
8507 else
8508 {
8509 /* 16-bit checks. */
8510 if ((i.base_reg
8511 && (!i.base_reg->reg_type.bitfield.reg16
8512 || !i.base_reg->reg_type.bitfield.baseindex))
8513 || (i.index_reg
8514 && (!i.index_reg->reg_type.bitfield.reg16
8515 || !i.index_reg->reg_type.bitfield.baseindex
8516 || !(i.base_reg
8517 && i.base_reg->reg_num < 6
8518 && i.index_reg->reg_num >= 6
8519 && i.log2_scale_factor == 0))))
8520 goto bad_address;
8521 }
8522 }
8523 return 1;
8524 }
8525
8526 /* Handle vector immediates. */
8527
8528 static int
8529 RC_SAE_immediate (const char *imm_start)
8530 {
8531 unsigned int match_found, j;
8532 const char *pstr = imm_start;
8533 expressionS *exp;
8534
8535 if (*pstr != '{')
8536 return 0;
8537
8538 pstr++;
8539 match_found = 0;
8540 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
8541 {
8542 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
8543 {
8544 if (!i.rounding)
8545 {
8546 rc_op.type = RC_NamesTable[j].type;
8547 rc_op.operand = this_operand;
8548 i.rounding = &rc_op;
8549 }
8550 else
8551 {
8552 as_bad (_("duplicated `%s'"), imm_start);
8553 return 0;
8554 }
8555 pstr += RC_NamesTable[j].len;
8556 match_found = 1;
8557 break;
8558 }
8559 }
8560 if (!match_found)
8561 return 0;
8562
8563 if (*pstr++ != '}')
8564 {
8565 as_bad (_("Missing '}': '%s'"), imm_start);
8566 return 0;
8567 }
8568 /* RC/SAE immediate string should contain nothing more. */;
8569 if (*pstr != 0)
8570 {
8571 as_bad (_("Junk after '}': '%s'"), imm_start);
8572 return 0;
8573 }
8574
8575 exp = &im_expressions[i.imm_operands++];
8576 i.op[this_operand].imms = exp;
8577
8578 exp->X_op = O_constant;
8579 exp->X_add_number = 0;
8580 exp->X_add_symbol = (symbolS *) 0;
8581 exp->X_op_symbol = (symbolS *) 0;
8582
8583 i.types[this_operand].bitfield.imm8 = 1;
8584 return 1;
8585 }
8586
8587 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
8588 on error. */
8589
8590 static int
8591 i386_att_operand (char *operand_string)
8592 {
8593 const reg_entry *r;
8594 char *end_op;
8595 char *op_string = operand_string;
8596
8597 if (is_space_char (*op_string))
8598 ++op_string;
8599
8600 /* We check for an absolute prefix (differentiating,
8601 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
8602 if (*op_string == ABSOLUTE_PREFIX)
8603 {
8604 ++op_string;
8605 if (is_space_char (*op_string))
8606 ++op_string;
8607 i.types[this_operand].bitfield.jumpabsolute = 1;
8608 }
8609
8610 /* Check if operand is a register. */
8611 if ((r = parse_register (op_string, &end_op)) != NULL)
8612 {
8613 i386_operand_type temp;
8614
8615 /* Check for a segment override by searching for ':' after a
8616 segment register. */
8617 op_string = end_op;
8618 if (is_space_char (*op_string))
8619 ++op_string;
8620 if (*op_string == ':'
8621 && (r->reg_type.bitfield.sreg2
8622 || r->reg_type.bitfield.sreg3))
8623 {
8624 switch (r->reg_num)
8625 {
8626 case 0:
8627 i.seg[i.mem_operands] = &es;
8628 break;
8629 case 1:
8630 i.seg[i.mem_operands] = &cs;
8631 break;
8632 case 2:
8633 i.seg[i.mem_operands] = &ss;
8634 break;
8635 case 3:
8636 i.seg[i.mem_operands] = &ds;
8637 break;
8638 case 4:
8639 i.seg[i.mem_operands] = &fs;
8640 break;
8641 case 5:
8642 i.seg[i.mem_operands] = &gs;
8643 break;
8644 }
8645
8646 /* Skip the ':' and whitespace. */
8647 ++op_string;
8648 if (is_space_char (*op_string))
8649 ++op_string;
8650
8651 if (!is_digit_char (*op_string)
8652 && !is_identifier_char (*op_string)
8653 && *op_string != '('
8654 && *op_string != ABSOLUTE_PREFIX)
8655 {
8656 as_bad (_("bad memory operand `%s'"), op_string);
8657 return 0;
8658 }
8659 /* Handle case of %es:*foo. */
8660 if (*op_string == ABSOLUTE_PREFIX)
8661 {
8662 ++op_string;
8663 if (is_space_char (*op_string))
8664 ++op_string;
8665 i.types[this_operand].bitfield.jumpabsolute = 1;
8666 }
8667 goto do_memory_reference;
8668 }
8669
8670 /* Handle vector operations. */
8671 if (*op_string == '{')
8672 {
8673 op_string = check_VecOperations (op_string, NULL);
8674 if (op_string == NULL)
8675 return 0;
8676 }
8677
8678 if (*op_string)
8679 {
8680 as_bad (_("junk `%s' after register"), op_string);
8681 return 0;
8682 }
8683 temp = r->reg_type;
8684 temp.bitfield.baseindex = 0;
8685 i.types[this_operand] = operand_type_or (i.types[this_operand],
8686 temp);
8687 i.types[this_operand].bitfield.unspecified = 0;
8688 i.op[this_operand].regs = r;
8689 i.reg_operands++;
8690 }
8691 else if (*op_string == REGISTER_PREFIX)
8692 {
8693 as_bad (_("bad register name `%s'"), op_string);
8694 return 0;
8695 }
8696 else if (*op_string == IMMEDIATE_PREFIX)
8697 {
8698 ++op_string;
8699 if (i.types[this_operand].bitfield.jumpabsolute)
8700 {
8701 as_bad (_("immediate operand illegal with absolute jump"));
8702 return 0;
8703 }
8704 if (!i386_immediate (op_string))
8705 return 0;
8706 }
8707 else if (RC_SAE_immediate (operand_string))
8708 {
8709 /* If it is a RC or SAE immediate, do nothing. */
8710 ;
8711 }
8712 else if (is_digit_char (*op_string)
8713 || is_identifier_char (*op_string)
8714 || *op_string == '"'
8715 || *op_string == '(')
8716 {
8717 /* This is a memory reference of some sort. */
8718 char *base_string;
8719
8720 /* Start and end of displacement string expression (if found). */
8721 char *displacement_string_start;
8722 char *displacement_string_end;
8723 char *vop_start;
8724
8725 do_memory_reference:
8726 if ((i.mem_operands == 1
8727 && !current_templates->start->opcode_modifier.isstring)
8728 || i.mem_operands == 2)
8729 {
8730 as_bad (_("too many memory references for `%s'"),
8731 current_templates->start->name);
8732 return 0;
8733 }
8734
8735 /* Check for base index form. We detect the base index form by
8736 looking for an ')' at the end of the operand, searching
8737 for the '(' matching it, and finding a REGISTER_PREFIX or ','
8738 after the '('. */
8739 base_string = op_string + strlen (op_string);
8740
8741 /* Handle vector operations. */
8742 vop_start = strchr (op_string, '{');
8743 if (vop_start && vop_start < base_string)
8744 {
8745 if (check_VecOperations (vop_start, base_string) == NULL)
8746 return 0;
8747 base_string = vop_start;
8748 }
8749
8750 --base_string;
8751 if (is_space_char (*base_string))
8752 --base_string;
8753
8754 /* If we only have a displacement, set-up for it to be parsed later. */
8755 displacement_string_start = op_string;
8756 displacement_string_end = base_string + 1;
8757
8758 if (*base_string == ')')
8759 {
8760 char *temp_string;
8761 unsigned int parens_balanced = 1;
8762 /* We've already checked that the number of left & right ()'s are
8763 equal, so this loop will not be infinite. */
8764 do
8765 {
8766 base_string--;
8767 if (*base_string == ')')
8768 parens_balanced++;
8769 if (*base_string == '(')
8770 parens_balanced--;
8771 }
8772 while (parens_balanced);
8773
8774 temp_string = base_string;
8775
8776 /* Skip past '(' and whitespace. */
8777 ++base_string;
8778 if (is_space_char (*base_string))
8779 ++base_string;
8780
8781 if (*base_string == ','
8782 || ((i.base_reg = parse_register (base_string, &end_op))
8783 != NULL))
8784 {
8785 displacement_string_end = temp_string;
8786
8787 i.types[this_operand].bitfield.baseindex = 1;
8788
8789 if (i.base_reg)
8790 {
8791 base_string = end_op;
8792 if (is_space_char (*base_string))
8793 ++base_string;
8794 }
8795
8796 /* There may be an index reg or scale factor here. */
8797 if (*base_string == ',')
8798 {
8799 ++base_string;
8800 if (is_space_char (*base_string))
8801 ++base_string;
8802
8803 if ((i.index_reg = parse_register (base_string, &end_op))
8804 != NULL)
8805 {
8806 base_string = end_op;
8807 if (is_space_char (*base_string))
8808 ++base_string;
8809 if (*base_string == ',')
8810 {
8811 ++base_string;
8812 if (is_space_char (*base_string))
8813 ++base_string;
8814 }
8815 else if (*base_string != ')')
8816 {
8817 as_bad (_("expecting `,' or `)' "
8818 "after index register in `%s'"),
8819 operand_string);
8820 return 0;
8821 }
8822 }
8823 else if (*base_string == REGISTER_PREFIX)
8824 {
8825 end_op = strchr (base_string, ',');
8826 if (end_op)
8827 *end_op = '\0';
8828 as_bad (_("bad register name `%s'"), base_string);
8829 return 0;
8830 }
8831
8832 /* Check for scale factor. */
8833 if (*base_string != ')')
8834 {
8835 char *end_scale = i386_scale (base_string);
8836
8837 if (!end_scale)
8838 return 0;
8839
8840 base_string = end_scale;
8841 if (is_space_char (*base_string))
8842 ++base_string;
8843 if (*base_string != ')')
8844 {
8845 as_bad (_("expecting `)' "
8846 "after scale factor in `%s'"),
8847 operand_string);
8848 return 0;
8849 }
8850 }
8851 else if (!i.index_reg)
8852 {
8853 as_bad (_("expecting index register or scale factor "
8854 "after `,'; got '%c'"),
8855 *base_string);
8856 return 0;
8857 }
8858 }
8859 else if (*base_string != ')')
8860 {
8861 as_bad (_("expecting `,' or `)' "
8862 "after base register in `%s'"),
8863 operand_string);
8864 return 0;
8865 }
8866 }
8867 else if (*base_string == REGISTER_PREFIX)
8868 {
8869 end_op = strchr (base_string, ',');
8870 if (end_op)
8871 *end_op = '\0';
8872 as_bad (_("bad register name `%s'"), base_string);
8873 return 0;
8874 }
8875 }
8876
8877 /* If there's an expression beginning the operand, parse it,
8878 assuming displacement_string_start and
8879 displacement_string_end are meaningful. */
8880 if (displacement_string_start != displacement_string_end)
8881 {
8882 if (!i386_displacement (displacement_string_start,
8883 displacement_string_end))
8884 return 0;
8885 }
8886
8887 /* Special case for (%dx) while doing input/output op. */
8888 if (i.base_reg
8889 && operand_type_equal (&i.base_reg->reg_type,
8890 &reg16_inoutportreg)
8891 && i.index_reg == 0
8892 && i.log2_scale_factor == 0
8893 && i.seg[i.mem_operands] == 0
8894 && !operand_type_check (i.types[this_operand], disp))
8895 {
8896 i.types[this_operand] = inoutportreg;
8897 return 1;
8898 }
8899
8900 if (i386_index_check (operand_string) == 0)
8901 return 0;
8902 i.types[this_operand].bitfield.mem = 1;
8903 i.mem_operands++;
8904 }
8905 else
8906 {
8907 /* It's not a memory operand; argh! */
8908 as_bad (_("invalid char %s beginning operand %d `%s'"),
8909 output_invalid (*op_string),
8910 this_operand + 1,
8911 op_string);
8912 return 0;
8913 }
8914 return 1; /* Normal return. */
8915 }
8916 \f
8917 /* Calculate the maximum variable size (i.e., excluding fr_fix)
8918 that an rs_machine_dependent frag may reach. */
8919
8920 unsigned int
8921 i386_frag_max_var (fragS *frag)
8922 {
8923 /* The only relaxable frags are for jumps.
8924 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
8925 gas_assert (frag->fr_type == rs_machine_dependent);
8926 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
8927 }
8928
8929 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8930 static int
8931 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
8932 {
8933 /* STT_GNU_IFUNC symbol must go through PLT. */
8934 if ((symbol_get_bfdsym (fr_symbol)->flags
8935 & BSF_GNU_INDIRECT_FUNCTION) != 0)
8936 return 0;
8937
8938 if (!S_IS_EXTERNAL (fr_symbol))
8939 /* Symbol may be weak or local. */
8940 return !S_IS_WEAK (fr_symbol);
8941
8942 /* Global symbols with non-default visibility can't be preempted. */
8943 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
8944 return 1;
8945
8946 if (fr_var != NO_RELOC)
8947 switch ((enum bfd_reloc_code_real) fr_var)
8948 {
8949 case BFD_RELOC_386_PLT32:
8950 case BFD_RELOC_X86_64_PLT32:
8951 /* Symbol with PLT relocatin may be preempted. */
8952 return 0;
8953 default:
8954 abort ();
8955 }
8956
8957 /* Global symbols with default visibility in a shared library may be
8958 preempted by another definition. */
8959 return !shared;
8960 }
8961 #endif
8962
8963 /* md_estimate_size_before_relax()
8964
8965 Called just before relax() for rs_machine_dependent frags. The x86
8966 assembler uses these frags to handle variable size jump
8967 instructions.
8968
8969 Any symbol that is now undefined will not become defined.
8970 Return the correct fr_subtype in the frag.
8971 Return the initial "guess for variable size of frag" to caller.
8972 The guess is actually the growth beyond the fixed part. Whatever
8973 we do to grow the fixed or variable part contributes to our
8974 returned value. */
8975
8976 int
8977 md_estimate_size_before_relax (fragS *fragP, segT segment)
8978 {
8979 /* We've already got fragP->fr_subtype right; all we have to do is
8980 check for un-relaxable symbols. On an ELF system, we can't relax
8981 an externally visible symbol, because it may be overridden by a
8982 shared library. */
8983 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
8984 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8985 || (IS_ELF
8986 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
8987 fragP->fr_var))
8988 #endif
8989 #if defined (OBJ_COFF) && defined (TE_PE)
8990 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
8991 && S_IS_WEAK (fragP->fr_symbol))
8992 #endif
8993 )
8994 {
8995 /* Symbol is undefined in this segment, or we need to keep a
8996 reloc so that weak symbols can be overridden. */
8997 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
8998 enum bfd_reloc_code_real reloc_type;
8999 unsigned char *opcode;
9000 int old_fr_fix;
9001
9002 if (fragP->fr_var != NO_RELOC)
9003 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
9004 else if (size == 2)
9005 reloc_type = BFD_RELOC_16_PCREL;
9006 else
9007 reloc_type = BFD_RELOC_32_PCREL;
9008
9009 old_fr_fix = fragP->fr_fix;
9010 opcode = (unsigned char *) fragP->fr_opcode;
9011
9012 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
9013 {
9014 case UNCOND_JUMP:
9015 /* Make jmp (0xeb) a (d)word displacement jump. */
9016 opcode[0] = 0xe9;
9017 fragP->fr_fix += size;
9018 fix_new (fragP, old_fr_fix, size,
9019 fragP->fr_symbol,
9020 fragP->fr_offset, 1,
9021 reloc_type);
9022 break;
9023
9024 case COND_JUMP86:
9025 if (size == 2
9026 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
9027 {
9028 /* Negate the condition, and branch past an
9029 unconditional jump. */
9030 opcode[0] ^= 1;
9031 opcode[1] = 3;
9032 /* Insert an unconditional jump. */
9033 opcode[2] = 0xe9;
9034 /* We added two extra opcode bytes, and have a two byte
9035 offset. */
9036 fragP->fr_fix += 2 + 2;
9037 fix_new (fragP, old_fr_fix + 2, 2,
9038 fragP->fr_symbol,
9039 fragP->fr_offset, 1,
9040 reloc_type);
9041 break;
9042 }
9043 /* Fall through. */
9044
9045 case COND_JUMP:
9046 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
9047 {
9048 fixS *fixP;
9049
9050 fragP->fr_fix += 1;
9051 fixP = fix_new (fragP, old_fr_fix, 1,
9052 fragP->fr_symbol,
9053 fragP->fr_offset, 1,
9054 BFD_RELOC_8_PCREL);
9055 fixP->fx_signed = 1;
9056 break;
9057 }
9058
9059 /* This changes the byte-displacement jump 0x7N
9060 to the (d)word-displacement jump 0x0f,0x8N. */
9061 opcode[1] = opcode[0] + 0x10;
9062 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9063 /* We've added an opcode byte. */
9064 fragP->fr_fix += 1 + size;
9065 fix_new (fragP, old_fr_fix + 1, size,
9066 fragP->fr_symbol,
9067 fragP->fr_offset, 1,
9068 reloc_type);
9069 break;
9070
9071 default:
9072 BAD_CASE (fragP->fr_subtype);
9073 break;
9074 }
9075 frag_wane (fragP);
9076 return fragP->fr_fix - old_fr_fix;
9077 }
9078
9079 /* Guess size depending on current relax state. Initially the relax
9080 state will correspond to a short jump and we return 1, because
9081 the variable part of the frag (the branch offset) is one byte
9082 long. However, we can relax a section more than once and in that
9083 case we must either set fr_subtype back to the unrelaxed state,
9084 or return the value for the appropriate branch. */
9085 return md_relax_table[fragP->fr_subtype].rlx_length;
9086 }
9087
9088 /* Called after relax() is finished.
9089
9090 In: Address of frag.
9091 fr_type == rs_machine_dependent.
9092 fr_subtype is what the address relaxed to.
9093
9094 Out: Any fixSs and constants are set up.
9095 Caller will turn frag into a ".space 0". */
9096
9097 void
9098 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
9099 fragS *fragP)
9100 {
9101 unsigned char *opcode;
9102 unsigned char *where_to_put_displacement = NULL;
9103 offsetT target_address;
9104 offsetT opcode_address;
9105 unsigned int extension = 0;
9106 offsetT displacement_from_opcode_start;
9107
9108 opcode = (unsigned char *) fragP->fr_opcode;
9109
9110 /* Address we want to reach in file space. */
9111 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
9112
9113 /* Address opcode resides at in file space. */
9114 opcode_address = fragP->fr_address + fragP->fr_fix;
9115
9116 /* Displacement from opcode start to fill into instruction. */
9117 displacement_from_opcode_start = target_address - opcode_address;
9118
9119 if ((fragP->fr_subtype & BIG) == 0)
9120 {
9121 /* Don't have to change opcode. */
9122 extension = 1; /* 1 opcode + 1 displacement */
9123 where_to_put_displacement = &opcode[1];
9124 }
9125 else
9126 {
9127 if (no_cond_jump_promotion
9128 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
9129 as_warn_where (fragP->fr_file, fragP->fr_line,
9130 _("long jump required"));
9131
9132 switch (fragP->fr_subtype)
9133 {
9134 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
9135 extension = 4; /* 1 opcode + 4 displacement */
9136 opcode[0] = 0xe9;
9137 where_to_put_displacement = &opcode[1];
9138 break;
9139
9140 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
9141 extension = 2; /* 1 opcode + 2 displacement */
9142 opcode[0] = 0xe9;
9143 where_to_put_displacement = &opcode[1];
9144 break;
9145
9146 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
9147 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
9148 extension = 5; /* 2 opcode + 4 displacement */
9149 opcode[1] = opcode[0] + 0x10;
9150 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9151 where_to_put_displacement = &opcode[2];
9152 break;
9153
9154 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
9155 extension = 3; /* 2 opcode + 2 displacement */
9156 opcode[1] = opcode[0] + 0x10;
9157 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9158 where_to_put_displacement = &opcode[2];
9159 break;
9160
9161 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
9162 extension = 4;
9163 opcode[0] ^= 1;
9164 opcode[1] = 3;
9165 opcode[2] = 0xe9;
9166 where_to_put_displacement = &opcode[3];
9167 break;
9168
9169 default:
9170 BAD_CASE (fragP->fr_subtype);
9171 break;
9172 }
9173 }
9174
9175 /* If size if less then four we are sure that the operand fits,
9176 but if it's 4, then it could be that the displacement is larger
9177 then -/+ 2GB. */
9178 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
9179 && object_64bit
9180 && ((addressT) (displacement_from_opcode_start - extension
9181 + ((addressT) 1 << 31))
9182 > (((addressT) 2 << 31) - 1)))
9183 {
9184 as_bad_where (fragP->fr_file, fragP->fr_line,
9185 _("jump target out of range"));
9186 /* Make us emit 0. */
9187 displacement_from_opcode_start = extension;
9188 }
9189 /* Now put displacement after opcode. */
9190 md_number_to_chars ((char *) where_to_put_displacement,
9191 (valueT) (displacement_from_opcode_start - extension),
9192 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
9193 fragP->fr_fix += extension;
9194 }
9195 \f
9196 /* Apply a fixup (fixP) to segment data, once it has been determined
9197 by our caller that we have all the info we need to fix it up.
9198
9199 Parameter valP is the pointer to the value of the bits.
9200
9201 On the 386, immediates, displacements, and data pointers are all in
9202 the same (little-endian) format, so we don't need to care about which
9203 we are handling. */
9204
9205 void
9206 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
9207 {
9208 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
9209 valueT value = *valP;
9210
9211 #if !defined (TE_Mach)
9212 if (fixP->fx_pcrel)
9213 {
9214 switch (fixP->fx_r_type)
9215 {
9216 default:
9217 break;
9218
9219 case BFD_RELOC_64:
9220 fixP->fx_r_type = BFD_RELOC_64_PCREL;
9221 break;
9222 case BFD_RELOC_32:
9223 case BFD_RELOC_X86_64_32S:
9224 fixP->fx_r_type = BFD_RELOC_32_PCREL;
9225 break;
9226 case BFD_RELOC_16:
9227 fixP->fx_r_type = BFD_RELOC_16_PCREL;
9228 break;
9229 case BFD_RELOC_8:
9230 fixP->fx_r_type = BFD_RELOC_8_PCREL;
9231 break;
9232 }
9233 }
9234
9235 if (fixP->fx_addsy != NULL
9236 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
9237 || fixP->fx_r_type == BFD_RELOC_64_PCREL
9238 || fixP->fx_r_type == BFD_RELOC_16_PCREL
9239 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
9240 && !use_rela_relocations)
9241 {
9242 /* This is a hack. There should be a better way to handle this.
9243 This covers for the fact that bfd_install_relocation will
9244 subtract the current location (for partial_inplace, PC relative
9245 relocations); see more below. */
9246 #ifndef OBJ_AOUT
9247 if (IS_ELF
9248 #ifdef TE_PE
9249 || OUTPUT_FLAVOR == bfd_target_coff_flavour
9250 #endif
9251 )
9252 value += fixP->fx_where + fixP->fx_frag->fr_address;
9253 #endif
9254 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9255 if (IS_ELF)
9256 {
9257 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
9258
9259 if ((sym_seg == seg
9260 || (symbol_section_p (fixP->fx_addsy)
9261 && sym_seg != absolute_section))
9262 && !generic_force_reloc (fixP))
9263 {
9264 /* Yes, we add the values in twice. This is because
9265 bfd_install_relocation subtracts them out again. I think
9266 bfd_install_relocation is broken, but I don't dare change
9267 it. FIXME. */
9268 value += fixP->fx_where + fixP->fx_frag->fr_address;
9269 }
9270 }
9271 #endif
9272 #if defined (OBJ_COFF) && defined (TE_PE)
9273 /* For some reason, the PE format does not store a
9274 section address offset for a PC relative symbol. */
9275 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
9276 || S_IS_WEAK (fixP->fx_addsy))
9277 value += md_pcrel_from (fixP);
9278 #endif
9279 }
9280 #if defined (OBJ_COFF) && defined (TE_PE)
9281 if (fixP->fx_addsy != NULL
9282 && S_IS_WEAK (fixP->fx_addsy)
9283 /* PR 16858: Do not modify weak function references. */
9284 && ! fixP->fx_pcrel)
9285 {
9286 #if !defined (TE_PEP)
9287 /* For x86 PE weak function symbols are neither PC-relative
9288 nor do they set S_IS_FUNCTION. So the only reliable way
9289 to detect them is to check the flags of their containing
9290 section. */
9291 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
9292 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
9293 ;
9294 else
9295 #endif
9296 value -= S_GET_VALUE (fixP->fx_addsy);
9297 }
9298 #endif
9299
9300 /* Fix a few things - the dynamic linker expects certain values here,
9301 and we must not disappoint it. */
9302 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9303 if (IS_ELF && fixP->fx_addsy)
9304 switch (fixP->fx_r_type)
9305 {
9306 case BFD_RELOC_386_PLT32:
9307 case BFD_RELOC_X86_64_PLT32:
9308 /* Make the jump instruction point to the address of the operand. At
9309 runtime we merely add the offset to the actual PLT entry. */
9310 value = -4;
9311 break;
9312
9313 case BFD_RELOC_386_TLS_GD:
9314 case BFD_RELOC_386_TLS_LDM:
9315 case BFD_RELOC_386_TLS_IE_32:
9316 case BFD_RELOC_386_TLS_IE:
9317 case BFD_RELOC_386_TLS_GOTIE:
9318 case BFD_RELOC_386_TLS_GOTDESC:
9319 case BFD_RELOC_X86_64_TLSGD:
9320 case BFD_RELOC_X86_64_TLSLD:
9321 case BFD_RELOC_X86_64_GOTTPOFF:
9322 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9323 value = 0; /* Fully resolved at runtime. No addend. */
9324 /* Fallthrough */
9325 case BFD_RELOC_386_TLS_LE:
9326 case BFD_RELOC_386_TLS_LDO_32:
9327 case BFD_RELOC_386_TLS_LE_32:
9328 case BFD_RELOC_X86_64_DTPOFF32:
9329 case BFD_RELOC_X86_64_DTPOFF64:
9330 case BFD_RELOC_X86_64_TPOFF32:
9331 case BFD_RELOC_X86_64_TPOFF64:
9332 S_SET_THREAD_LOCAL (fixP->fx_addsy);
9333 break;
9334
9335 case BFD_RELOC_386_TLS_DESC_CALL:
9336 case BFD_RELOC_X86_64_TLSDESC_CALL:
9337 value = 0; /* Fully resolved at runtime. No addend. */
9338 S_SET_THREAD_LOCAL (fixP->fx_addsy);
9339 fixP->fx_done = 0;
9340 return;
9341
9342 case BFD_RELOC_386_GOT32:
9343 case BFD_RELOC_X86_64_GOT32:
9344 value = 0; /* Fully resolved at runtime. No addend. */
9345 break;
9346
9347 case BFD_RELOC_VTABLE_INHERIT:
9348 case BFD_RELOC_VTABLE_ENTRY:
9349 fixP->fx_done = 0;
9350 return;
9351
9352 default:
9353 break;
9354 }
9355 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
9356 *valP = value;
9357 #endif /* !defined (TE_Mach) */
9358
9359 /* Are we finished with this relocation now? */
9360 if (fixP->fx_addsy == NULL)
9361 fixP->fx_done = 1;
9362 #if defined (OBJ_COFF) && defined (TE_PE)
9363 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
9364 {
9365 fixP->fx_done = 0;
9366 /* Remember value for tc_gen_reloc. */
9367 fixP->fx_addnumber = value;
9368 /* Clear out the frag for now. */
9369 value = 0;
9370 }
9371 #endif
9372 else if (use_rela_relocations)
9373 {
9374 fixP->fx_no_overflow = 1;
9375 /* Remember value for tc_gen_reloc. */
9376 fixP->fx_addnumber = value;
9377 value = 0;
9378 }
9379
9380 md_number_to_chars (p, value, fixP->fx_size);
9381 }
9382 \f
9383 const char *
9384 md_atof (int type, char *litP, int *sizeP)
9385 {
9386 /* This outputs the LITTLENUMs in REVERSE order;
9387 in accord with the bigendian 386. */
9388 return ieee_md_atof (type, litP, sizeP, FALSE);
9389 }
9390 \f
9391 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
9392
9393 static char *
9394 output_invalid (int c)
9395 {
9396 if (ISPRINT (c))
9397 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
9398 "'%c'", c);
9399 else
9400 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
9401 "(0x%x)", (unsigned char) c);
9402 return output_invalid_buf;
9403 }
9404
9405 /* REG_STRING starts *before* REGISTER_PREFIX. */
9406
9407 static const reg_entry *
9408 parse_real_register (char *reg_string, char **end_op)
9409 {
9410 char *s = reg_string;
9411 char *p;
9412 char reg_name_given[MAX_REG_NAME_SIZE + 1];
9413 const reg_entry *r;
9414
9415 /* Skip possible REGISTER_PREFIX and possible whitespace. */
9416 if (*s == REGISTER_PREFIX)
9417 ++s;
9418
9419 if (is_space_char (*s))
9420 ++s;
9421
9422 p = reg_name_given;
9423 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
9424 {
9425 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
9426 return (const reg_entry *) NULL;
9427 s++;
9428 }
9429
9430 /* For naked regs, make sure that we are not dealing with an identifier.
9431 This prevents confusing an identifier like `eax_var' with register
9432 `eax'. */
9433 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
9434 return (const reg_entry *) NULL;
9435
9436 *end_op = s;
9437
9438 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
9439
9440 /* Handle floating point regs, allowing spaces in the (i) part. */
9441 if (r == i386_regtab /* %st is first entry of table */)
9442 {
9443 if (is_space_char (*s))
9444 ++s;
9445 if (*s == '(')
9446 {
9447 ++s;
9448 if (is_space_char (*s))
9449 ++s;
9450 if (*s >= '0' && *s <= '7')
9451 {
9452 int fpr = *s - '0';
9453 ++s;
9454 if (is_space_char (*s))
9455 ++s;
9456 if (*s == ')')
9457 {
9458 *end_op = s + 1;
9459 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
9460 know (r);
9461 return r + fpr;
9462 }
9463 }
9464 /* We have "%st(" then garbage. */
9465 return (const reg_entry *) NULL;
9466 }
9467 }
9468
9469 if (r == NULL || allow_pseudo_reg)
9470 return r;
9471
9472 if (operand_type_all_zero (&r->reg_type))
9473 return (const reg_entry *) NULL;
9474
9475 if ((r->reg_type.bitfield.reg32
9476 || r->reg_type.bitfield.sreg3
9477 || r->reg_type.bitfield.control
9478 || r->reg_type.bitfield.debug
9479 || r->reg_type.bitfield.test)
9480 && !cpu_arch_flags.bitfield.cpui386)
9481 return (const reg_entry *) NULL;
9482
9483 if (r->reg_type.bitfield.floatreg
9484 && !cpu_arch_flags.bitfield.cpu8087
9485 && !cpu_arch_flags.bitfield.cpu287
9486 && !cpu_arch_flags.bitfield.cpu387)
9487 return (const reg_entry *) NULL;
9488
9489 if (r->reg_type.bitfield.regmmx && !cpu_arch_flags.bitfield.cpummx)
9490 return (const reg_entry *) NULL;
9491
9492 if (r->reg_type.bitfield.regxmm && !cpu_arch_flags.bitfield.cpusse)
9493 return (const reg_entry *) NULL;
9494
9495 if (r->reg_type.bitfield.regymm && !cpu_arch_flags.bitfield.cpuavx)
9496 return (const reg_entry *) NULL;
9497
9498 if ((r->reg_type.bitfield.regzmm || r->reg_type.bitfield.regmask)
9499 && !cpu_arch_flags.bitfield.cpuavx512f)
9500 return (const reg_entry *) NULL;
9501
9502 /* Don't allow fake index register unless allow_index_reg isn't 0. */
9503 if (!allow_index_reg
9504 && (r->reg_num == RegEiz || r->reg_num == RegRiz))
9505 return (const reg_entry *) NULL;
9506
9507 /* Upper 16 vector register is only available with VREX in 64bit
9508 mode. */
9509 if ((r->reg_flags & RegVRex))
9510 {
9511 if (!cpu_arch_flags.bitfield.cpuvrex
9512 || flag_code != CODE_64BIT)
9513 return (const reg_entry *) NULL;
9514
9515 i.need_vrex = 1;
9516 }
9517
9518 if (((r->reg_flags & (RegRex64 | RegRex))
9519 || r->reg_type.bitfield.reg64)
9520 && (!cpu_arch_flags.bitfield.cpulm
9521 || !operand_type_equal (&r->reg_type, &control))
9522 && flag_code != CODE_64BIT)
9523 return (const reg_entry *) NULL;
9524
9525 if (r->reg_type.bitfield.sreg3 && r->reg_num == RegFlat && !intel_syntax)
9526 return (const reg_entry *) NULL;
9527
9528 return r;
9529 }
9530
9531 /* REG_STRING starts *before* REGISTER_PREFIX. */
9532
9533 static const reg_entry *
9534 parse_register (char *reg_string, char **end_op)
9535 {
9536 const reg_entry *r;
9537
9538 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
9539 r = parse_real_register (reg_string, end_op);
9540 else
9541 r = NULL;
9542 if (!r)
9543 {
9544 char *save = input_line_pointer;
9545 char c;
9546 symbolS *symbolP;
9547
9548 input_line_pointer = reg_string;
9549 c = get_symbol_name (&reg_string);
9550 symbolP = symbol_find (reg_string);
9551 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
9552 {
9553 const expressionS *e = symbol_get_value_expression (symbolP);
9554
9555 know (e->X_op == O_register);
9556 know (e->X_add_number >= 0
9557 && (valueT) e->X_add_number < i386_regtab_size);
9558 r = i386_regtab + e->X_add_number;
9559 if ((r->reg_flags & RegVRex))
9560 i.need_vrex = 1;
9561 *end_op = input_line_pointer;
9562 }
9563 *input_line_pointer = c;
9564 input_line_pointer = save;
9565 }
9566 return r;
9567 }
9568
9569 int
9570 i386_parse_name (char *name, expressionS *e, char *nextcharP)
9571 {
9572 const reg_entry *r;
9573 char *end = input_line_pointer;
9574
9575 *end = *nextcharP;
9576 r = parse_register (name, &input_line_pointer);
9577 if (r && end <= input_line_pointer)
9578 {
9579 *nextcharP = *input_line_pointer;
9580 *input_line_pointer = 0;
9581 e->X_op = O_register;
9582 e->X_add_number = r - i386_regtab;
9583 return 1;
9584 }
9585 input_line_pointer = end;
9586 *end = 0;
9587 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
9588 }
9589
9590 void
9591 md_operand (expressionS *e)
9592 {
9593 char *end;
9594 const reg_entry *r;
9595
9596 switch (*input_line_pointer)
9597 {
9598 case REGISTER_PREFIX:
9599 r = parse_real_register (input_line_pointer, &end);
9600 if (r)
9601 {
9602 e->X_op = O_register;
9603 e->X_add_number = r - i386_regtab;
9604 input_line_pointer = end;
9605 }
9606 break;
9607
9608 case '[':
9609 gas_assert (intel_syntax);
9610 end = input_line_pointer++;
9611 expression (e);
9612 if (*input_line_pointer == ']')
9613 {
9614 ++input_line_pointer;
9615 e->X_op_symbol = make_expr_symbol (e);
9616 e->X_add_symbol = NULL;
9617 e->X_add_number = 0;
9618 e->X_op = O_index;
9619 }
9620 else
9621 {
9622 e->X_op = O_absent;
9623 input_line_pointer = end;
9624 }
9625 break;
9626 }
9627 }
9628
9629 \f
9630 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9631 const char *md_shortopts = "kVQ:sqn";
9632 #else
9633 const char *md_shortopts = "qn";
9634 #endif
9635
9636 #define OPTION_32 (OPTION_MD_BASE + 0)
9637 #define OPTION_64 (OPTION_MD_BASE + 1)
9638 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
9639 #define OPTION_MARCH (OPTION_MD_BASE + 3)
9640 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
9641 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
9642 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
9643 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
9644 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
9645 #define OPTION_MOLD_GCC (OPTION_MD_BASE + 9)
9646 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
9647 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
9648 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
9649 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
9650 #define OPTION_X32 (OPTION_MD_BASE + 14)
9651 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
9652 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
9653 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
9654 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
9655 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
9656 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
9657 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
9658 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
9659 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
9660 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
9661 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 25)
9662
9663 struct option md_longopts[] =
9664 {
9665 {"32", no_argument, NULL, OPTION_32},
9666 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
9667 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
9668 {"64", no_argument, NULL, OPTION_64},
9669 #endif
9670 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9671 {"x32", no_argument, NULL, OPTION_X32},
9672 {"mshared", no_argument, NULL, OPTION_MSHARED},
9673 #endif
9674 {"divide", no_argument, NULL, OPTION_DIVIDE},
9675 {"march", required_argument, NULL, OPTION_MARCH},
9676 {"mtune", required_argument, NULL, OPTION_MTUNE},
9677 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
9678 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
9679 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
9680 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
9681 {"mold-gcc", no_argument, NULL, OPTION_MOLD_GCC},
9682 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
9683 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
9684 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
9685 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
9686 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
9687 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
9688 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
9689 # if defined (TE_PE) || defined (TE_PEP)
9690 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
9691 #endif
9692 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
9693 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
9694 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
9695 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
9696 {"mamd64", no_argument, NULL, OPTION_MAMD64},
9697 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
9698 {NULL, no_argument, NULL, 0}
9699 };
9700 size_t md_longopts_size = sizeof (md_longopts);
9701
9702 int
9703 md_parse_option (int c, const char *arg)
9704 {
9705 unsigned int j;
9706 char *arch, *next;
9707
9708 switch (c)
9709 {
9710 case 'n':
9711 optimize_align_code = 0;
9712 break;
9713
9714 case 'q':
9715 quiet_warnings = 1;
9716 break;
9717
9718 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9719 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
9720 should be emitted or not. FIXME: Not implemented. */
9721 case 'Q':
9722 break;
9723
9724 /* -V: SVR4 argument to print version ID. */
9725 case 'V':
9726 print_version_id ();
9727 break;
9728
9729 /* -k: Ignore for FreeBSD compatibility. */
9730 case 'k':
9731 break;
9732
9733 case 's':
9734 /* -s: On i386 Solaris, this tells the native assembler to use
9735 .stab instead of .stab.excl. We always use .stab anyhow. */
9736 break;
9737
9738 case OPTION_MSHARED:
9739 shared = 1;
9740 break;
9741 #endif
9742 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
9743 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
9744 case OPTION_64:
9745 {
9746 const char **list, **l;
9747
9748 list = bfd_target_list ();
9749 for (l = list; *l != NULL; l++)
9750 if (CONST_STRNEQ (*l, "elf64-x86-64")
9751 || strcmp (*l, "coff-x86-64") == 0
9752 || strcmp (*l, "pe-x86-64") == 0
9753 || strcmp (*l, "pei-x86-64") == 0
9754 || strcmp (*l, "mach-o-x86-64") == 0)
9755 {
9756 default_arch = "x86_64";
9757 break;
9758 }
9759 if (*l == NULL)
9760 as_fatal (_("no compiled in support for x86_64"));
9761 free (list);
9762 }
9763 break;
9764 #endif
9765
9766 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9767 case OPTION_X32:
9768 if (IS_ELF)
9769 {
9770 const char **list, **l;
9771
9772 list = bfd_target_list ();
9773 for (l = list; *l != NULL; l++)
9774 if (CONST_STRNEQ (*l, "elf32-x86-64"))
9775 {
9776 default_arch = "x86_64:32";
9777 break;
9778 }
9779 if (*l == NULL)
9780 as_fatal (_("no compiled in support for 32bit x86_64"));
9781 free (list);
9782 }
9783 else
9784 as_fatal (_("32bit x86_64 is only supported for ELF"));
9785 break;
9786 #endif
9787
9788 case OPTION_32:
9789 default_arch = "i386";
9790 break;
9791
9792 case OPTION_DIVIDE:
9793 #ifdef SVR4_COMMENT_CHARS
9794 {
9795 char *n, *t;
9796 const char *s;
9797
9798 n = (char *) xmalloc (strlen (i386_comment_chars) + 1);
9799 t = n;
9800 for (s = i386_comment_chars; *s != '\0'; s++)
9801 if (*s != '/')
9802 *t++ = *s;
9803 *t = '\0';
9804 i386_comment_chars = n;
9805 }
9806 #endif
9807 break;
9808
9809 case OPTION_MARCH:
9810 arch = xstrdup (arg);
9811 do
9812 {
9813 if (*arch == '.')
9814 as_fatal (_("invalid -march= option: `%s'"), arg);
9815 next = strchr (arch, '+');
9816 if (next)
9817 *next++ = '\0';
9818 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9819 {
9820 if (strcmp (arch, cpu_arch [j].name) == 0)
9821 {
9822 /* Processor. */
9823 if (! cpu_arch[j].flags.bitfield.cpui386)
9824 continue;
9825
9826 cpu_arch_name = cpu_arch[j].name;
9827 cpu_sub_arch_name = NULL;
9828 cpu_arch_flags = cpu_arch[j].flags;
9829 cpu_arch_isa = cpu_arch[j].type;
9830 cpu_arch_isa_flags = cpu_arch[j].flags;
9831 if (!cpu_arch_tune_set)
9832 {
9833 cpu_arch_tune = cpu_arch_isa;
9834 cpu_arch_tune_flags = cpu_arch_isa_flags;
9835 }
9836 break;
9837 }
9838 else if (*cpu_arch [j].name == '.'
9839 && strcmp (arch, cpu_arch [j].name + 1) == 0)
9840 {
9841 /* ISA entension. */
9842 i386_cpu_flags flags;
9843
9844 if (!cpu_arch[j].negated)
9845 flags = cpu_flags_or (cpu_arch_flags,
9846 cpu_arch[j].flags);
9847 else
9848 flags = cpu_flags_and_not (cpu_arch_flags,
9849 cpu_arch[j].flags);
9850
9851 if (!valid_iamcu_cpu_flags (&flags))
9852 as_fatal (_("`%s' isn't valid for Intel MCU"), arch);
9853 else if (!cpu_flags_equal (&flags, &cpu_arch_flags))
9854 {
9855 if (cpu_sub_arch_name)
9856 {
9857 char *name = cpu_sub_arch_name;
9858 cpu_sub_arch_name = concat (name,
9859 cpu_arch[j].name,
9860 (const char *) NULL);
9861 free (name);
9862 }
9863 else
9864 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
9865 cpu_arch_flags = flags;
9866 cpu_arch_isa_flags = flags;
9867 }
9868 break;
9869 }
9870 }
9871
9872 if (j >= ARRAY_SIZE (cpu_arch))
9873 as_fatal (_("invalid -march= option: `%s'"), arg);
9874
9875 arch = next;
9876 }
9877 while (next != NULL );
9878 break;
9879
9880 case OPTION_MTUNE:
9881 if (*arg == '.')
9882 as_fatal (_("invalid -mtune= option: `%s'"), arg);
9883 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9884 {
9885 if (strcmp (arg, cpu_arch [j].name) == 0)
9886 {
9887 cpu_arch_tune_set = 1;
9888 cpu_arch_tune = cpu_arch [j].type;
9889 cpu_arch_tune_flags = cpu_arch[j].flags;
9890 break;
9891 }
9892 }
9893 if (j >= ARRAY_SIZE (cpu_arch))
9894 as_fatal (_("invalid -mtune= option: `%s'"), arg);
9895 break;
9896
9897 case OPTION_MMNEMONIC:
9898 if (strcasecmp (arg, "att") == 0)
9899 intel_mnemonic = 0;
9900 else if (strcasecmp (arg, "intel") == 0)
9901 intel_mnemonic = 1;
9902 else
9903 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
9904 break;
9905
9906 case OPTION_MSYNTAX:
9907 if (strcasecmp (arg, "att") == 0)
9908 intel_syntax = 0;
9909 else if (strcasecmp (arg, "intel") == 0)
9910 intel_syntax = 1;
9911 else
9912 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
9913 break;
9914
9915 case OPTION_MINDEX_REG:
9916 allow_index_reg = 1;
9917 break;
9918
9919 case OPTION_MNAKED_REG:
9920 allow_naked_reg = 1;
9921 break;
9922
9923 case OPTION_MOLD_GCC:
9924 old_gcc = 1;
9925 break;
9926
9927 case OPTION_MSSE2AVX:
9928 sse2avx = 1;
9929 break;
9930
9931 case OPTION_MSSE_CHECK:
9932 if (strcasecmp (arg, "error") == 0)
9933 sse_check = check_error;
9934 else if (strcasecmp (arg, "warning") == 0)
9935 sse_check = check_warning;
9936 else if (strcasecmp (arg, "none") == 0)
9937 sse_check = check_none;
9938 else
9939 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
9940 break;
9941
9942 case OPTION_MOPERAND_CHECK:
9943 if (strcasecmp (arg, "error") == 0)
9944 operand_check = check_error;
9945 else if (strcasecmp (arg, "warning") == 0)
9946 operand_check = check_warning;
9947 else if (strcasecmp (arg, "none") == 0)
9948 operand_check = check_none;
9949 else
9950 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
9951 break;
9952
9953 case OPTION_MAVXSCALAR:
9954 if (strcasecmp (arg, "128") == 0)
9955 avxscalar = vex128;
9956 else if (strcasecmp (arg, "256") == 0)
9957 avxscalar = vex256;
9958 else
9959 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
9960 break;
9961
9962 case OPTION_MADD_BND_PREFIX:
9963 add_bnd_prefix = 1;
9964 break;
9965
9966 case OPTION_MEVEXLIG:
9967 if (strcmp (arg, "128") == 0)
9968 evexlig = evexl128;
9969 else if (strcmp (arg, "256") == 0)
9970 evexlig = evexl256;
9971 else if (strcmp (arg, "512") == 0)
9972 evexlig = evexl512;
9973 else
9974 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
9975 break;
9976
9977 case OPTION_MEVEXRCIG:
9978 if (strcmp (arg, "rne") == 0)
9979 evexrcig = rne;
9980 else if (strcmp (arg, "rd") == 0)
9981 evexrcig = rd;
9982 else if (strcmp (arg, "ru") == 0)
9983 evexrcig = ru;
9984 else if (strcmp (arg, "rz") == 0)
9985 evexrcig = rz;
9986 else
9987 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
9988 break;
9989
9990 case OPTION_MEVEXWIG:
9991 if (strcmp (arg, "0") == 0)
9992 evexwig = evexw0;
9993 else if (strcmp (arg, "1") == 0)
9994 evexwig = evexw1;
9995 else
9996 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
9997 break;
9998
9999 # if defined (TE_PE) || defined (TE_PEP)
10000 case OPTION_MBIG_OBJ:
10001 use_big_obj = 1;
10002 break;
10003 #endif
10004
10005 case OPTION_MOMIT_LOCK_PREFIX:
10006 if (strcasecmp (arg, "yes") == 0)
10007 omit_lock_prefix = 1;
10008 else if (strcasecmp (arg, "no") == 0)
10009 omit_lock_prefix = 0;
10010 else
10011 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
10012 break;
10013
10014 case OPTION_MFENCE_AS_LOCK_ADD:
10015 if (strcasecmp (arg, "yes") == 0)
10016 avoid_fence = 1;
10017 else if (strcasecmp (arg, "no") == 0)
10018 avoid_fence = 0;
10019 else
10020 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
10021 break;
10022
10023 case OPTION_MRELAX_RELOCATIONS:
10024 if (strcasecmp (arg, "yes") == 0)
10025 generate_relax_relocations = 1;
10026 else if (strcasecmp (arg, "no") == 0)
10027 generate_relax_relocations = 0;
10028 else
10029 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
10030 break;
10031
10032 case OPTION_MAMD64:
10033 cpu_arch_flags.bitfield.cpuamd64 = 1;
10034 cpu_arch_flags.bitfield.cpuintel64 = 0;
10035 cpu_arch_isa_flags.bitfield.cpuamd64 = 1;
10036 cpu_arch_isa_flags.bitfield.cpuintel64 = 0;
10037 break;
10038
10039 case OPTION_MINTEL64:
10040 cpu_arch_flags.bitfield.cpuamd64 = 0;
10041 cpu_arch_flags.bitfield.cpuintel64 = 1;
10042 cpu_arch_isa_flags.bitfield.cpuamd64 = 0;
10043 cpu_arch_isa_flags.bitfield.cpuintel64 = 1;
10044 break;
10045
10046 default:
10047 return 0;
10048 }
10049 return 1;
10050 }
10051
10052 #define MESSAGE_TEMPLATE \
10053 " "
10054
10055 static void
10056 show_arch (FILE *stream, int ext, int check)
10057 {
10058 static char message[] = MESSAGE_TEMPLATE;
10059 char *start = message + 27;
10060 char *p;
10061 int size = sizeof (MESSAGE_TEMPLATE);
10062 int left;
10063 const char *name;
10064 int len;
10065 unsigned int j;
10066
10067 p = start;
10068 left = size - (start - message);
10069 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
10070 {
10071 /* Should it be skipped? */
10072 if (cpu_arch [j].skip)
10073 continue;
10074
10075 name = cpu_arch [j].name;
10076 len = cpu_arch [j].len;
10077 if (*name == '.')
10078 {
10079 /* It is an extension. Skip if we aren't asked to show it. */
10080 if (ext)
10081 {
10082 name++;
10083 len--;
10084 }
10085 else
10086 continue;
10087 }
10088 else if (ext)
10089 {
10090 /* It is an processor. Skip if we show only extension. */
10091 continue;
10092 }
10093 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
10094 {
10095 /* It is an impossible processor - skip. */
10096 continue;
10097 }
10098
10099 /* Reserve 2 spaces for ", " or ",\0" */
10100 left -= len + 2;
10101
10102 /* Check if there is any room. */
10103 if (left >= 0)
10104 {
10105 if (p != start)
10106 {
10107 *p++ = ',';
10108 *p++ = ' ';
10109 }
10110 p = mempcpy (p, name, len);
10111 }
10112 else
10113 {
10114 /* Output the current message now and start a new one. */
10115 *p++ = ',';
10116 *p = '\0';
10117 fprintf (stream, "%s\n", message);
10118 p = start;
10119 left = size - (start - message) - len - 2;
10120
10121 gas_assert (left >= 0);
10122
10123 p = mempcpy (p, name, len);
10124 }
10125 }
10126
10127 *p = '\0';
10128 fprintf (stream, "%s\n", message);
10129 }
10130
10131 void
10132 md_show_usage (FILE *stream)
10133 {
10134 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10135 fprintf (stream, _("\
10136 -Q ignored\n\
10137 -V print assembler version number\n\
10138 -k ignored\n"));
10139 #endif
10140 fprintf (stream, _("\
10141 -n Do not optimize code alignment\n\
10142 -q quieten some warnings\n"));
10143 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10144 fprintf (stream, _("\
10145 -s ignored\n"));
10146 #endif
10147 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
10148 || defined (TE_PE) || defined (TE_PEP))
10149 fprintf (stream, _("\
10150 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
10151 #endif
10152 #ifdef SVR4_COMMENT_CHARS
10153 fprintf (stream, _("\
10154 --divide do not treat `/' as a comment character\n"));
10155 #else
10156 fprintf (stream, _("\
10157 --divide ignored\n"));
10158 #endif
10159 fprintf (stream, _("\
10160 -march=CPU[,+EXTENSION...]\n\
10161 generate code for CPU and EXTENSION, CPU is one of:\n"));
10162 show_arch (stream, 0, 1);
10163 fprintf (stream, _("\
10164 EXTENSION is combination of:\n"));
10165 show_arch (stream, 1, 0);
10166 fprintf (stream, _("\
10167 -mtune=CPU optimize for CPU, CPU is one of:\n"));
10168 show_arch (stream, 0, 0);
10169 fprintf (stream, _("\
10170 -msse2avx encode SSE instructions with VEX prefix\n"));
10171 fprintf (stream, _("\
10172 -msse-check=[none|error|warning]\n\
10173 check SSE instructions\n"));
10174 fprintf (stream, _("\
10175 -moperand-check=[none|error|warning]\n\
10176 check operand combinations for validity\n"));
10177 fprintf (stream, _("\
10178 -mavxscalar=[128|256] encode scalar AVX instructions with specific vector\n\
10179 length\n"));
10180 fprintf (stream, _("\
10181 -mevexlig=[128|256|512] encode scalar EVEX instructions with specific vector\n\
10182 length\n"));
10183 fprintf (stream, _("\
10184 -mevexwig=[0|1] encode EVEX instructions with specific EVEX.W value\n\
10185 for EVEX.W bit ignored instructions\n"));
10186 fprintf (stream, _("\
10187 -mevexrcig=[rne|rd|ru|rz]\n\
10188 encode EVEX instructions with specific EVEX.RC value\n\
10189 for SAE-only ignored instructions\n"));
10190 fprintf (stream, _("\
10191 -mmnemonic=[att|intel] use AT&T/Intel mnemonic\n"));
10192 fprintf (stream, _("\
10193 -msyntax=[att|intel] use AT&T/Intel syntax\n"));
10194 fprintf (stream, _("\
10195 -mindex-reg support pseudo index registers\n"));
10196 fprintf (stream, _("\
10197 -mnaked-reg don't require `%%' prefix for registers\n"));
10198 fprintf (stream, _("\
10199 -mold-gcc support old (<= 2.8.1) versions of gcc\n"));
10200 fprintf (stream, _("\
10201 -madd-bnd-prefix add BND prefix for all valid branches\n"));
10202 fprintf (stream, _("\
10203 -mshared disable branch optimization for shared code\n"));
10204 # if defined (TE_PE) || defined (TE_PEP)
10205 fprintf (stream, _("\
10206 -mbig-obj generate big object files\n"));
10207 #endif
10208 fprintf (stream, _("\
10209 -momit-lock-prefix=[no|yes]\n\
10210 strip all lock prefixes\n"));
10211 fprintf (stream, _("\
10212 -mfence-as-lock-add=[no|yes]\n\
10213 encode lfence, mfence and sfence as\n\
10214 lock addl $0x0, (%%{re}sp)\n"));
10215 fprintf (stream, _("\
10216 -mrelax-relocations=[no|yes]\n\
10217 generate relax relocations\n"));
10218 fprintf (stream, _("\
10219 -mamd64 accept only AMD64 ISA\n"));
10220 fprintf (stream, _("\
10221 -mintel64 accept only Intel64 ISA\n"));
10222 }
10223
10224 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
10225 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
10226 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
10227
10228 /* Pick the target format to use. */
10229
10230 const char *
10231 i386_target_format (void)
10232 {
10233 if (!strncmp (default_arch, "x86_64", 6))
10234 {
10235 update_code_flag (CODE_64BIT, 1);
10236 if (default_arch[6] == '\0')
10237 x86_elf_abi = X86_64_ABI;
10238 else
10239 x86_elf_abi = X86_64_X32_ABI;
10240 }
10241 else if (!strcmp (default_arch, "i386"))
10242 update_code_flag (CODE_32BIT, 1);
10243 else if (!strcmp (default_arch, "iamcu"))
10244 {
10245 update_code_flag (CODE_32BIT, 1);
10246 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
10247 {
10248 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
10249 cpu_arch_name = "iamcu";
10250 cpu_sub_arch_name = NULL;
10251 cpu_arch_flags = iamcu_flags;
10252 cpu_arch_isa = PROCESSOR_IAMCU;
10253 cpu_arch_isa_flags = iamcu_flags;
10254 if (!cpu_arch_tune_set)
10255 {
10256 cpu_arch_tune = cpu_arch_isa;
10257 cpu_arch_tune_flags = cpu_arch_isa_flags;
10258 }
10259 }
10260 else
10261 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
10262 cpu_arch_name);
10263 }
10264 else
10265 as_fatal (_("unknown architecture"));
10266
10267 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
10268 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
10269 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
10270 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
10271
10272 switch (OUTPUT_FLAVOR)
10273 {
10274 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
10275 case bfd_target_aout_flavour:
10276 return AOUT_TARGET_FORMAT;
10277 #endif
10278 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
10279 # if defined (TE_PE) || defined (TE_PEP)
10280 case bfd_target_coff_flavour:
10281 if (flag_code == CODE_64BIT)
10282 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
10283 else
10284 return "pe-i386";
10285 # elif defined (TE_GO32)
10286 case bfd_target_coff_flavour:
10287 return "coff-go32";
10288 # else
10289 case bfd_target_coff_flavour:
10290 return "coff-i386";
10291 # endif
10292 #endif
10293 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
10294 case bfd_target_elf_flavour:
10295 {
10296 const char *format;
10297
10298 switch (x86_elf_abi)
10299 {
10300 default:
10301 format = ELF_TARGET_FORMAT;
10302 break;
10303 case X86_64_ABI:
10304 use_rela_relocations = 1;
10305 object_64bit = 1;
10306 format = ELF_TARGET_FORMAT64;
10307 break;
10308 case X86_64_X32_ABI:
10309 use_rela_relocations = 1;
10310 object_64bit = 1;
10311 disallow_64bit_reloc = 1;
10312 format = ELF_TARGET_FORMAT32;
10313 break;
10314 }
10315 if (cpu_arch_isa == PROCESSOR_L1OM)
10316 {
10317 if (x86_elf_abi != X86_64_ABI)
10318 as_fatal (_("Intel L1OM is 64bit only"));
10319 return ELF_TARGET_L1OM_FORMAT;
10320 }
10321 else if (cpu_arch_isa == PROCESSOR_K1OM)
10322 {
10323 if (x86_elf_abi != X86_64_ABI)
10324 as_fatal (_("Intel K1OM is 64bit only"));
10325 return ELF_TARGET_K1OM_FORMAT;
10326 }
10327 else if (cpu_arch_isa == PROCESSOR_IAMCU)
10328 {
10329 if (x86_elf_abi != I386_ABI)
10330 as_fatal (_("Intel MCU is 32bit only"));
10331 return ELF_TARGET_IAMCU_FORMAT;
10332 }
10333 else
10334 return format;
10335 }
10336 #endif
10337 #if defined (OBJ_MACH_O)
10338 case bfd_target_mach_o_flavour:
10339 if (flag_code == CODE_64BIT)
10340 {
10341 use_rela_relocations = 1;
10342 object_64bit = 1;
10343 return "mach-o-x86-64";
10344 }
10345 else
10346 return "mach-o-i386";
10347 #endif
10348 default:
10349 abort ();
10350 return NULL;
10351 }
10352 }
10353
10354 #endif /* OBJ_MAYBE_ more than one */
10355 \f
10356 symbolS *
10357 md_undefined_symbol (char *name)
10358 {
10359 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
10360 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
10361 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
10362 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
10363 {
10364 if (!GOT_symbol)
10365 {
10366 if (symbol_find (name))
10367 as_bad (_("GOT already in symbol table"));
10368 GOT_symbol = symbol_new (name, undefined_section,
10369 (valueT) 0, &zero_address_frag);
10370 };
10371 return GOT_symbol;
10372 }
10373 return 0;
10374 }
10375
10376 /* Round up a section size to the appropriate boundary. */
10377
10378 valueT
10379 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
10380 {
10381 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10382 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
10383 {
10384 /* For a.out, force the section size to be aligned. If we don't do
10385 this, BFD will align it for us, but it will not write out the
10386 final bytes of the section. This may be a bug in BFD, but it is
10387 easier to fix it here since that is how the other a.out targets
10388 work. */
10389 int align;
10390
10391 align = bfd_get_section_alignment (stdoutput, segment);
10392 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
10393 }
10394 #endif
10395
10396 return size;
10397 }
10398
10399 /* On the i386, PC-relative offsets are relative to the start of the
10400 next instruction. That is, the address of the offset, plus its
10401 size, since the offset is always the last part of the insn. */
10402
10403 long
10404 md_pcrel_from (fixS *fixP)
10405 {
10406 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
10407 }
10408
10409 #ifndef I386COFF
10410
10411 static void
10412 s_bss (int ignore ATTRIBUTE_UNUSED)
10413 {
10414 int temp;
10415
10416 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10417 if (IS_ELF)
10418 obj_elf_section_change_hook ();
10419 #endif
10420 temp = get_absolute_expression ();
10421 subseg_set (bss_section, (subsegT) temp);
10422 demand_empty_rest_of_line ();
10423 }
10424
10425 #endif
10426
10427 void
10428 i386_validate_fix (fixS *fixp)
10429 {
10430 if (fixp->fx_subsy)
10431 {
10432 if (fixp->fx_subsy == GOT_symbol)
10433 {
10434 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
10435 {
10436 if (!object_64bit)
10437 abort ();
10438 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10439 if (fixp->fx_tcbit2)
10440 fixp->fx_r_type = (fixp->fx_tcbit
10441 ? BFD_RELOC_X86_64_REX_GOTPCRELX
10442 : BFD_RELOC_X86_64_GOTPCRELX);
10443 else
10444 #endif
10445 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
10446 }
10447 else
10448 {
10449 if (!object_64bit)
10450 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
10451 else
10452 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
10453 }
10454 fixp->fx_subsy = 0;
10455 }
10456 }
10457 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10458 else if (!object_64bit)
10459 {
10460 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
10461 && fixp->fx_tcbit2)
10462 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
10463 }
10464 #endif
10465 }
10466
10467 arelent *
10468 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
10469 {
10470 arelent *rel;
10471 bfd_reloc_code_real_type code;
10472
10473 switch (fixp->fx_r_type)
10474 {
10475 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10476 case BFD_RELOC_SIZE32:
10477 case BFD_RELOC_SIZE64:
10478 if (S_IS_DEFINED (fixp->fx_addsy)
10479 && !S_IS_EXTERNAL (fixp->fx_addsy))
10480 {
10481 /* Resolve size relocation against local symbol to size of
10482 the symbol plus addend. */
10483 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
10484 if (fixp->fx_r_type == BFD_RELOC_SIZE32
10485 && !fits_in_unsigned_long (value))
10486 as_bad_where (fixp->fx_file, fixp->fx_line,
10487 _("symbol size computation overflow"));
10488 fixp->fx_addsy = NULL;
10489 fixp->fx_subsy = NULL;
10490 md_apply_fix (fixp, (valueT *) &value, NULL);
10491 return NULL;
10492 }
10493 #endif
10494
10495 case BFD_RELOC_X86_64_PLT32:
10496 case BFD_RELOC_X86_64_GOT32:
10497 case BFD_RELOC_X86_64_GOTPCREL:
10498 case BFD_RELOC_X86_64_GOTPCRELX:
10499 case BFD_RELOC_X86_64_REX_GOTPCRELX:
10500 case BFD_RELOC_386_PLT32:
10501 case BFD_RELOC_386_GOT32:
10502 case BFD_RELOC_386_GOT32X:
10503 case BFD_RELOC_386_GOTOFF:
10504 case BFD_RELOC_386_GOTPC:
10505 case BFD_RELOC_386_TLS_GD:
10506 case BFD_RELOC_386_TLS_LDM:
10507 case BFD_RELOC_386_TLS_LDO_32:
10508 case BFD_RELOC_386_TLS_IE_32:
10509 case BFD_RELOC_386_TLS_IE:
10510 case BFD_RELOC_386_TLS_GOTIE:
10511 case BFD_RELOC_386_TLS_LE_32:
10512 case BFD_RELOC_386_TLS_LE:
10513 case BFD_RELOC_386_TLS_GOTDESC:
10514 case BFD_RELOC_386_TLS_DESC_CALL:
10515 case BFD_RELOC_X86_64_TLSGD:
10516 case BFD_RELOC_X86_64_TLSLD:
10517 case BFD_RELOC_X86_64_DTPOFF32:
10518 case BFD_RELOC_X86_64_DTPOFF64:
10519 case BFD_RELOC_X86_64_GOTTPOFF:
10520 case BFD_RELOC_X86_64_TPOFF32:
10521 case BFD_RELOC_X86_64_TPOFF64:
10522 case BFD_RELOC_X86_64_GOTOFF64:
10523 case BFD_RELOC_X86_64_GOTPC32:
10524 case BFD_RELOC_X86_64_GOT64:
10525 case BFD_RELOC_X86_64_GOTPCREL64:
10526 case BFD_RELOC_X86_64_GOTPC64:
10527 case BFD_RELOC_X86_64_GOTPLT64:
10528 case BFD_RELOC_X86_64_PLTOFF64:
10529 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10530 case BFD_RELOC_X86_64_TLSDESC_CALL:
10531 case BFD_RELOC_RVA:
10532 case BFD_RELOC_VTABLE_ENTRY:
10533 case BFD_RELOC_VTABLE_INHERIT:
10534 #ifdef TE_PE
10535 case BFD_RELOC_32_SECREL:
10536 #endif
10537 code = fixp->fx_r_type;
10538 break;
10539 case BFD_RELOC_X86_64_32S:
10540 if (!fixp->fx_pcrel)
10541 {
10542 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
10543 code = fixp->fx_r_type;
10544 break;
10545 }
10546 default:
10547 if (fixp->fx_pcrel)
10548 {
10549 switch (fixp->fx_size)
10550 {
10551 default:
10552 as_bad_where (fixp->fx_file, fixp->fx_line,
10553 _("can not do %d byte pc-relative relocation"),
10554 fixp->fx_size);
10555 code = BFD_RELOC_32_PCREL;
10556 break;
10557 case 1: code = BFD_RELOC_8_PCREL; break;
10558 case 2: code = BFD_RELOC_16_PCREL; break;
10559 case 4: code = BFD_RELOC_32_PCREL; break;
10560 #ifdef BFD64
10561 case 8: code = BFD_RELOC_64_PCREL; break;
10562 #endif
10563 }
10564 }
10565 else
10566 {
10567 switch (fixp->fx_size)
10568 {
10569 default:
10570 as_bad_where (fixp->fx_file, fixp->fx_line,
10571 _("can not do %d byte relocation"),
10572 fixp->fx_size);
10573 code = BFD_RELOC_32;
10574 break;
10575 case 1: code = BFD_RELOC_8; break;
10576 case 2: code = BFD_RELOC_16; break;
10577 case 4: code = BFD_RELOC_32; break;
10578 #ifdef BFD64
10579 case 8: code = BFD_RELOC_64; break;
10580 #endif
10581 }
10582 }
10583 break;
10584 }
10585
10586 if ((code == BFD_RELOC_32
10587 || code == BFD_RELOC_32_PCREL
10588 || code == BFD_RELOC_X86_64_32S)
10589 && GOT_symbol
10590 && fixp->fx_addsy == GOT_symbol)
10591 {
10592 if (!object_64bit)
10593 code = BFD_RELOC_386_GOTPC;
10594 else
10595 code = BFD_RELOC_X86_64_GOTPC32;
10596 }
10597 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
10598 && GOT_symbol
10599 && fixp->fx_addsy == GOT_symbol)
10600 {
10601 code = BFD_RELOC_X86_64_GOTPC64;
10602 }
10603
10604 rel = (arelent *) xmalloc (sizeof (arelent));
10605 rel->sym_ptr_ptr = (asymbol **) xmalloc (sizeof (asymbol *));
10606 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
10607
10608 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
10609
10610 if (!use_rela_relocations)
10611 {
10612 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
10613 vtable entry to be used in the relocation's section offset. */
10614 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
10615 rel->address = fixp->fx_offset;
10616 #if defined (OBJ_COFF) && defined (TE_PE)
10617 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
10618 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
10619 else
10620 #endif
10621 rel->addend = 0;
10622 }
10623 /* Use the rela in 64bit mode. */
10624 else
10625 {
10626 if (disallow_64bit_reloc)
10627 switch (code)
10628 {
10629 case BFD_RELOC_X86_64_DTPOFF64:
10630 case BFD_RELOC_X86_64_TPOFF64:
10631 case BFD_RELOC_64_PCREL:
10632 case BFD_RELOC_X86_64_GOTOFF64:
10633 case BFD_RELOC_X86_64_GOT64:
10634 case BFD_RELOC_X86_64_GOTPCREL64:
10635 case BFD_RELOC_X86_64_GOTPC64:
10636 case BFD_RELOC_X86_64_GOTPLT64:
10637 case BFD_RELOC_X86_64_PLTOFF64:
10638 as_bad_where (fixp->fx_file, fixp->fx_line,
10639 _("cannot represent relocation type %s in x32 mode"),
10640 bfd_get_reloc_code_name (code));
10641 break;
10642 default:
10643 break;
10644 }
10645
10646 if (!fixp->fx_pcrel)
10647 rel->addend = fixp->fx_offset;
10648 else
10649 switch (code)
10650 {
10651 case BFD_RELOC_X86_64_PLT32:
10652 case BFD_RELOC_X86_64_GOT32:
10653 case BFD_RELOC_X86_64_GOTPCREL:
10654 case BFD_RELOC_X86_64_GOTPCRELX:
10655 case BFD_RELOC_X86_64_REX_GOTPCRELX:
10656 case BFD_RELOC_X86_64_TLSGD:
10657 case BFD_RELOC_X86_64_TLSLD:
10658 case BFD_RELOC_X86_64_GOTTPOFF:
10659 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10660 case BFD_RELOC_X86_64_TLSDESC_CALL:
10661 rel->addend = fixp->fx_offset - fixp->fx_size;
10662 break;
10663 default:
10664 rel->addend = (section->vma
10665 - fixp->fx_size
10666 + fixp->fx_addnumber
10667 + md_pcrel_from (fixp));
10668 break;
10669 }
10670 }
10671
10672 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
10673 if (rel->howto == NULL)
10674 {
10675 as_bad_where (fixp->fx_file, fixp->fx_line,
10676 _("cannot represent relocation type %s"),
10677 bfd_get_reloc_code_name (code));
10678 /* Set howto to a garbage value so that we can keep going. */
10679 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
10680 gas_assert (rel->howto != NULL);
10681 }
10682
10683 return rel;
10684 }
10685
10686 #include "tc-i386-intel.c"
10687
10688 void
10689 tc_x86_parse_to_dw2regnum (expressionS *exp)
10690 {
10691 int saved_naked_reg;
10692 char saved_register_dot;
10693
10694 saved_naked_reg = allow_naked_reg;
10695 allow_naked_reg = 1;
10696 saved_register_dot = register_chars['.'];
10697 register_chars['.'] = '.';
10698 allow_pseudo_reg = 1;
10699 expression_and_evaluate (exp);
10700 allow_pseudo_reg = 0;
10701 register_chars['.'] = saved_register_dot;
10702 allow_naked_reg = saved_naked_reg;
10703
10704 if (exp->X_op == O_register && exp->X_add_number >= 0)
10705 {
10706 if ((addressT) exp->X_add_number < i386_regtab_size)
10707 {
10708 exp->X_op = O_constant;
10709 exp->X_add_number = i386_regtab[exp->X_add_number]
10710 .dw2_regnum[flag_code >> 1];
10711 }
10712 else
10713 exp->X_op = O_illegal;
10714 }
10715 }
10716
10717 void
10718 tc_x86_frame_initial_instructions (void)
10719 {
10720 static unsigned int sp_regno[2];
10721
10722 if (!sp_regno[flag_code >> 1])
10723 {
10724 char *saved_input = input_line_pointer;
10725 char sp[][4] = {"esp", "rsp"};
10726 expressionS exp;
10727
10728 input_line_pointer = sp[flag_code >> 1];
10729 tc_x86_parse_to_dw2regnum (&exp);
10730 gas_assert (exp.X_op == O_constant);
10731 sp_regno[flag_code >> 1] = exp.X_add_number;
10732 input_line_pointer = saved_input;
10733 }
10734
10735 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
10736 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
10737 }
10738
10739 int
10740 x86_dwarf2_addr_size (void)
10741 {
10742 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
10743 if (x86_elf_abi == X86_64_X32_ABI)
10744 return 4;
10745 #endif
10746 return bfd_arch_bits_per_address (stdoutput) / 8;
10747 }
10748
10749 int
10750 i386_elf_section_type (const char *str, size_t len)
10751 {
10752 if (flag_code == CODE_64BIT
10753 && len == sizeof ("unwind") - 1
10754 && strncmp (str, "unwind", 6) == 0)
10755 return SHT_X86_64_UNWIND;
10756
10757 return -1;
10758 }
10759
10760 #ifdef TE_SOLARIS
10761 void
10762 i386_solaris_fix_up_eh_frame (segT sec)
10763 {
10764 if (flag_code == CODE_64BIT)
10765 elf_section_type (sec) = SHT_X86_64_UNWIND;
10766 }
10767 #endif
10768
10769 #ifdef TE_PE
10770 void
10771 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
10772 {
10773 expressionS exp;
10774
10775 exp.X_op = O_secrel;
10776 exp.X_add_symbol = symbol;
10777 exp.X_add_number = 0;
10778 emit_expr (&exp, size);
10779 }
10780 #endif
10781
10782 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10783 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
10784
10785 bfd_vma
10786 x86_64_section_letter (int letter, const char **ptr_msg)
10787 {
10788 if (flag_code == CODE_64BIT)
10789 {
10790 if (letter == 'l')
10791 return SHF_X86_64_LARGE;
10792
10793 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
10794 }
10795 else
10796 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
10797 return -1;
10798 }
10799
10800 bfd_vma
10801 x86_64_section_word (char *str, size_t len)
10802 {
10803 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
10804 return SHF_X86_64_LARGE;
10805
10806 return -1;
10807 }
10808
10809 static void
10810 handle_large_common (int small ATTRIBUTE_UNUSED)
10811 {
10812 if (flag_code != CODE_64BIT)
10813 {
10814 s_comm_internal (0, elf_common_parse);
10815 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
10816 }
10817 else
10818 {
10819 static segT lbss_section;
10820 asection *saved_com_section_ptr = elf_com_section_ptr;
10821 asection *saved_bss_section = bss_section;
10822
10823 if (lbss_section == NULL)
10824 {
10825 flagword applicable;
10826 segT seg = now_seg;
10827 subsegT subseg = now_subseg;
10828
10829 /* The .lbss section is for local .largecomm symbols. */
10830 lbss_section = subseg_new (".lbss", 0);
10831 applicable = bfd_applicable_section_flags (stdoutput);
10832 bfd_set_section_flags (stdoutput, lbss_section,
10833 applicable & SEC_ALLOC);
10834 seg_info (lbss_section)->bss = 1;
10835
10836 subseg_set (seg, subseg);
10837 }
10838
10839 elf_com_section_ptr = &_bfd_elf_large_com_section;
10840 bss_section = lbss_section;
10841
10842 s_comm_internal (0, elf_common_parse);
10843
10844 elf_com_section_ptr = saved_com_section_ptr;
10845 bss_section = saved_bss_section;
10846 }
10847 }
10848 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */