1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
4 This file is part of GAS, the GNU Assembler.
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
21 /* Intel 80386 machine specific gas.
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
29 #include "safe-ctype.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
47 #ifndef REGISTER_WARNINGS
48 #define REGISTER_WARNINGS 1
51 #ifndef INFER_ADDR_PREFIX
52 #define INFER_ADDR_PREFIX 1
56 #define DEFAULT_ARCH "i386"
61 #define INLINE __inline__
67 /* Prefixes will be emitted in the order defined below.
68 WAIT_PREFIX must be the first prefix since FWAIT is really is an
69 instruction, and so must come before any prefixes.
70 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
71 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
77 #define HLE_PREFIX REP_PREFIX
78 #define BND_PREFIX REP_PREFIX
80 #define REX_PREFIX 6 /* must come last. */
81 #define MAX_PREFIXES 7 /* max prefixes per opcode */
83 /* we define the syntax here (modulo base,index,scale syntax) */
84 #define REGISTER_PREFIX '%'
85 #define IMMEDIATE_PREFIX '$'
86 #define ABSOLUTE_PREFIX '*'
88 /* these are the instruction mnemonic suffixes in AT&T syntax or
89 memory operand size in Intel syntax. */
90 #define WORD_MNEM_SUFFIX 'w'
91 #define BYTE_MNEM_SUFFIX 'b'
92 #define SHORT_MNEM_SUFFIX 's'
93 #define LONG_MNEM_SUFFIX 'l'
94 #define QWORD_MNEM_SUFFIX 'q'
95 /* Intel Syntax. Use a non-ascii letter since since it never appears
97 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
99 #define END_OF_INSN '\0'
101 /* This matches the C -> StaticRounding alias in the opcode table. */
102 #define commutative staticrounding
105 'templates' is for grouping together 'template' structures for opcodes
106 of the same name. This is only used for storing the insns in the grand
107 ole hash table of insns.
108 The templates themselves start at START and range up to (but not including)
113 const insn_template *start;
114 const insn_template *end;
118 /* 386 operand encoding bytes: see 386 book for details of this. */
121 unsigned int regmem; /* codes register or memory operand */
122 unsigned int reg; /* codes register operand (or extended opcode) */
123 unsigned int mode; /* how to interpret regmem & reg */
127 /* x86-64 extension prefix. */
128 typedef int rex_byte;
130 /* 386 opcode byte to code indirect addressing. */
139 /* x86 arch names, types and features */
142 const char *name; /* arch name */
143 unsigned int len; /* arch string length */
144 enum processor_type type; /* arch type */
145 i386_cpu_flags flags; /* cpu feature flags */
146 unsigned int skip; /* show_arch should skip this. */
150 /* Used to turn off indicated flags. */
153 const char *name; /* arch name */
154 unsigned int len; /* arch string length */
155 i386_cpu_flags flags; /* cpu feature flags */
159 static void update_code_flag (int, int);
160 static void set_code_flag (int);
161 static void set_16bit_gcc_code_flag (int);
162 static void set_intel_syntax (int);
163 static void set_intel_mnemonic (int);
164 static void set_allow_index_reg (int);
165 static void set_check (int);
166 static void set_cpu_arch (int);
168 static void pe_directive_secrel (int);
170 static void signed_cons (int);
171 static char *output_invalid (int c);
172 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
174 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
176 static int i386_att_operand (char *);
177 static int i386_intel_operand (char *, int);
178 static int i386_intel_simplify (expressionS *);
179 static int i386_intel_parse_name (const char *, expressionS *);
180 static const reg_entry *parse_register (char *, char **);
181 static char *parse_insn (char *, char *);
182 static char *parse_operands (char *, const char *);
183 static void swap_operands (void);
184 static void swap_2_operands (int, int);
185 static enum flag_code i386_addressing_mode (void);
186 static void optimize_imm (void);
187 static void optimize_disp (void);
188 static const insn_template *match_template (char);
189 static int check_string (void);
190 static int process_suffix (void);
191 static int check_byte_reg (void);
192 static int check_long_reg (void);
193 static int check_qword_reg (void);
194 static int check_word_reg (void);
195 static int finalize_imm (void);
196 static int process_operands (void);
197 static const seg_entry *build_modrm_byte (void);
198 static void output_insn (void);
199 static void output_imm (fragS *, offsetT);
200 static void output_disp (fragS *, offsetT);
202 static void s_bss (int);
204 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
205 static void handle_large_common (int small ATTRIBUTE_UNUSED);
207 /* GNU_PROPERTY_X86_ISA_1_USED. */
208 static unsigned int x86_isa_1_used;
209 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
210 static unsigned int x86_feature_2_used;
211 /* Generate x86 used ISA and feature properties. */
212 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
215 static const char *default_arch = DEFAULT_ARCH;
217 /* This struct describes rounding control and SAE in the instruction. */
231 static struct RC_Operation rc_op;
233 /* The struct describes masking, applied to OPERAND in the instruction.
234 MASK is a pointer to the corresponding mask register. ZEROING tells
235 whether merging or zeroing mask is used. */
236 struct Mask_Operation
238 const reg_entry *mask;
239 unsigned int zeroing;
240 /* The operand where this operation is associated. */
244 static struct Mask_Operation mask_op;
246 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
248 struct Broadcast_Operation
250 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
253 /* Index of broadcasted operand. */
256 /* Number of bytes to broadcast. */
260 static struct Broadcast_Operation broadcast_op;
265 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
266 unsigned char bytes[4];
268 /* Destination or source register specifier. */
269 const reg_entry *register_specifier;
272 /* 'md_assemble ()' gathers together information and puts it into a
279 const reg_entry *regs;
284 operand_size_mismatch,
285 operand_type_mismatch,
286 register_type_mismatch,
287 number_of_operands_mismatch,
288 invalid_instruction_suffix,
290 unsupported_with_intel_mnemonic,
293 invalid_vsib_address,
294 invalid_vector_register_set,
295 unsupported_vector_index_register,
296 unsupported_broadcast,
299 mask_not_on_destination,
302 rc_sae_operand_not_last_imm,
303 invalid_register_operand,
308 /* TM holds the template for the insn were currently assembling. */
311 /* SUFFIX holds the instruction size suffix for byte, word, dword
312 or qword, if given. */
315 /* OPERANDS gives the number of given operands. */
316 unsigned int operands;
318 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
319 of given register, displacement, memory operands and immediate
321 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
323 /* TYPES [i] is the type (see above #defines) which tells us how to
324 use OP[i] for the corresponding operand. */
325 i386_operand_type types[MAX_OPERANDS];
327 /* Displacement expression, immediate expression, or register for each
329 union i386_op op[MAX_OPERANDS];
331 /* Flags for operands. */
332 unsigned int flags[MAX_OPERANDS];
333 #define Operand_PCrel 1
334 #define Operand_Mem 2
336 /* Relocation type for operand */
337 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
339 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
340 the base index byte below. */
341 const reg_entry *base_reg;
342 const reg_entry *index_reg;
343 unsigned int log2_scale_factor;
345 /* SEG gives the seg_entries of this insn. They are zero unless
346 explicit segment overrides are given. */
347 const seg_entry *seg[2];
349 /* Copied first memory operand string, for re-checking. */
352 /* PREFIX holds all the given prefix opcodes (usually null).
353 PREFIXES is the number of prefix opcodes. */
354 unsigned int prefixes;
355 unsigned char prefix[MAX_PREFIXES];
357 /* The operand to a branch insn indicates an absolute branch. */
358 bfd_boolean jumpabsolute;
360 /* Has MMX register operands. */
361 bfd_boolean has_regmmx;
363 /* Has XMM register operands. */
364 bfd_boolean has_regxmm;
366 /* Has YMM register operands. */
367 bfd_boolean has_regymm;
369 /* Has ZMM register operands. */
370 bfd_boolean has_regzmm;
372 /* Has GOTPC or TLS relocation. */
373 bfd_boolean has_gotpc_tls_reloc;
375 /* RM and SIB are the modrm byte and the sib byte where the
376 addressing modes of this insn are encoded. */
383 /* Masking attributes. */
384 struct Mask_Operation *mask;
386 /* Rounding control and SAE attributes. */
387 struct RC_Operation *rounding;
389 /* Broadcasting attributes. */
390 struct Broadcast_Operation *broadcast;
392 /* Compressed disp8*N attribute. */
393 unsigned int memshift;
395 /* Prefer load or store in encoding. */
398 dir_encoding_default = 0,
404 /* Prefer 8bit or 32bit displacement in encoding. */
407 disp_encoding_default = 0,
412 /* Prefer the REX byte in encoding. */
413 bfd_boolean rex_encoding;
415 /* Disable instruction size optimization. */
416 bfd_boolean no_optimize;
418 /* How to encode vector instructions. */
421 vex_encoding_default = 0,
428 const char *rep_prefix;
431 const char *hle_prefix;
433 /* Have BND prefix. */
434 const char *bnd_prefix;
436 /* Have NOTRACK prefix. */
437 const char *notrack_prefix;
440 enum i386_error error;
443 typedef struct _i386_insn i386_insn;
445 /* Link RC type with corresponding string, that'll be looked for in
454 static const struct RC_name RC_NamesTable[] =
456 { rne, STRING_COMMA_LEN ("rn-sae") },
457 { rd, STRING_COMMA_LEN ("rd-sae") },
458 { ru, STRING_COMMA_LEN ("ru-sae") },
459 { rz, STRING_COMMA_LEN ("rz-sae") },
460 { saeonly, STRING_COMMA_LEN ("sae") },
463 /* List of chars besides those in app.c:symbol_chars that can start an
464 operand. Used to prevent the scrubber eating vital white-space. */
465 const char extra_symbol_chars[] = "*%-([{}"
474 #if (defined (TE_I386AIX) \
475 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
476 && !defined (TE_GNU) \
477 && !defined (TE_LINUX) \
478 && !defined (TE_NACL) \
479 && !defined (TE_FreeBSD) \
480 && !defined (TE_DragonFly) \
481 && !defined (TE_NetBSD)))
482 /* This array holds the chars that always start a comment. If the
483 pre-processor is disabled, these aren't very useful. The option
484 --divide will remove '/' from this list. */
485 const char *i386_comment_chars = "#/";
486 #define SVR4_COMMENT_CHARS 1
487 #define PREFIX_SEPARATOR '\\'
490 const char *i386_comment_chars = "#";
491 #define PREFIX_SEPARATOR '/'
494 /* This array holds the chars that only start a comment at the beginning of
495 a line. If the line seems to have the form '# 123 filename'
496 .line and .file directives will appear in the pre-processed output.
497 Note that input_file.c hand checks for '#' at the beginning of the
498 first line of the input file. This is because the compiler outputs
499 #NO_APP at the beginning of its output.
500 Also note that comments started like this one will always work if
501 '/' isn't otherwise defined. */
502 const char line_comment_chars[] = "#/";
504 const char line_separator_chars[] = ";";
506 /* Chars that can be used to separate mant from exp in floating point
508 const char EXP_CHARS[] = "eE";
510 /* Chars that mean this number is a floating point constant
513 const char FLT_CHARS[] = "fFdDxX";
515 /* Tables for lexical analysis. */
516 static char mnemonic_chars[256];
517 static char register_chars[256];
518 static char operand_chars[256];
519 static char identifier_chars[256];
520 static char digit_chars[256];
522 /* Lexical macros. */
523 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
524 #define is_operand_char(x) (operand_chars[(unsigned char) x])
525 #define is_register_char(x) (register_chars[(unsigned char) x])
526 #define is_space_char(x) ((x) == ' ')
527 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
528 #define is_digit_char(x) (digit_chars[(unsigned char) x])
530 /* All non-digit non-letter characters that may occur in an operand. */
531 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
533 /* md_assemble() always leaves the strings it's passed unaltered. To
534 effect this we maintain a stack of saved characters that we've smashed
535 with '\0's (indicating end of strings for various sub-fields of the
536 assembler instruction). */
537 static char save_stack[32];
538 static char *save_stack_p;
539 #define END_STRING_AND_SAVE(s) \
540 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
541 #define RESTORE_END_STRING(s) \
542 do { *(s) = *--save_stack_p; } while (0)
544 /* The instruction we're assembling. */
547 /* Possible templates for current insn. */
548 static const templates *current_templates;
550 /* Per instruction expressionS buffers: max displacements & immediates. */
551 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
552 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
554 /* Current operand we are working on. */
555 static int this_operand = -1;
557 /* We support four different modes. FLAG_CODE variable is used to distinguish
565 static enum flag_code flag_code;
566 static unsigned int object_64bit;
567 static unsigned int disallow_64bit_reloc;
568 static int use_rela_relocations = 0;
569 /* __tls_get_addr/___tls_get_addr symbol for TLS. */
570 static const char *tls_get_addr;
572 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
573 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
574 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
576 /* The ELF ABI to use. */
584 static enum x86_elf_abi x86_elf_abi = I386_ABI;
587 #if defined (TE_PE) || defined (TE_PEP)
588 /* Use big object file format. */
589 static int use_big_obj = 0;
592 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
593 /* 1 if generating code for a shared library. */
594 static int shared = 0;
597 /* 1 for intel syntax,
599 static int intel_syntax = 0;
601 /* 1 for Intel64 ISA,
605 /* 1 for intel mnemonic,
606 0 if att mnemonic. */
607 static int intel_mnemonic = !SYSV386_COMPAT;
609 /* 1 if pseudo registers are permitted. */
610 static int allow_pseudo_reg = 0;
612 /* 1 if register prefix % not required. */
613 static int allow_naked_reg = 0;
615 /* 1 if the assembler should add BND prefix for all control-transferring
616 instructions supporting it, even if this prefix wasn't specified
618 static int add_bnd_prefix = 0;
620 /* 1 if pseudo index register, eiz/riz, is allowed . */
621 static int allow_index_reg = 0;
623 /* 1 if the assembler should ignore LOCK prefix, even if it was
624 specified explicitly. */
625 static int omit_lock_prefix = 0;
627 /* 1 if the assembler should encode lfence, mfence, and sfence as
628 "lock addl $0, (%{re}sp)". */
629 static int avoid_fence = 0;
631 /* Type of the previous instruction. */
646 /* 1 if the assembler should generate relax relocations. */
648 static int generate_relax_relocations
649 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
651 static enum check_kind
657 sse_check, operand_check = check_warning;
659 /* Non-zero if branches should be aligned within power of 2 boundary. */
660 static int align_branch_power = 0;
662 /* Types of branches to align. */
663 enum align_branch_kind
665 align_branch_none = 0,
666 align_branch_jcc = 1,
667 align_branch_fused = 2,
668 align_branch_jmp = 3,
669 align_branch_call = 4,
670 align_branch_indirect = 5,
674 /* Type bits of branches to align. */
675 enum align_branch_bit
677 align_branch_jcc_bit = 1 << align_branch_jcc,
678 align_branch_fused_bit = 1 << align_branch_fused,
679 align_branch_jmp_bit = 1 << align_branch_jmp,
680 align_branch_call_bit = 1 << align_branch_call,
681 align_branch_indirect_bit = 1 << align_branch_indirect,
682 align_branch_ret_bit = 1 << align_branch_ret
685 static unsigned int align_branch = (align_branch_jcc_bit
686 | align_branch_fused_bit
687 | align_branch_jmp_bit);
689 /* The maximum padding size for fused jcc. CMP like instruction can
690 be 9 bytes and jcc can be 6 bytes. Leave room just in case for
692 #define MAX_FUSED_JCC_PADDING_SIZE 20
694 /* The maximum number of prefixes added for an instruction. */
695 static unsigned int align_branch_prefix_size = 5;
698 1. Clear the REX_W bit with register operand if possible.
699 2. Above plus use 128bit vector instruction to clear the full vector
702 static int optimize = 0;
705 1. Clear the REX_W bit with register operand if possible.
706 2. Above plus use 128bit vector instruction to clear the full vector
708 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
711 static int optimize_for_space = 0;
713 /* Register prefix used for error message. */
714 static const char *register_prefix = "%";
716 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
717 leave, push, and pop instructions so that gcc has the same stack
718 frame as in 32 bit mode. */
719 static char stackop_size = '\0';
721 /* Non-zero to optimize code alignment. */
722 int optimize_align_code = 1;
724 /* Non-zero to quieten some warnings. */
725 static int quiet_warnings = 0;
728 static const char *cpu_arch_name = NULL;
729 static char *cpu_sub_arch_name = NULL;
731 /* CPU feature flags. */
732 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
734 /* If we have selected a cpu we are generating instructions for. */
735 static int cpu_arch_tune_set = 0;
737 /* Cpu we are generating instructions for. */
738 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
740 /* CPU feature flags of cpu we are generating instructions for. */
741 static i386_cpu_flags cpu_arch_tune_flags;
743 /* CPU instruction set architecture used. */
744 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
746 /* CPU feature flags of instruction set architecture used. */
747 i386_cpu_flags cpu_arch_isa_flags;
749 /* If set, conditional jumps are not automatically promoted to handle
750 larger than a byte offset. */
751 static unsigned int no_cond_jump_promotion = 0;
753 /* Encode SSE instructions with VEX prefix. */
754 static unsigned int sse2avx;
756 /* Encode scalar AVX instructions with specific vector length. */
763 /* Encode VEX WIG instructions with specific vex.w. */
770 /* Encode scalar EVEX LIG instructions with specific vector length. */
778 /* Encode EVEX WIG instructions with specific evex.w. */
785 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
786 static enum rc_type evexrcig = rne;
788 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
789 static symbolS *GOT_symbol;
791 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
792 unsigned int x86_dwarf2_return_column;
794 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
795 int x86_cie_data_alignment;
797 /* Interface to relax_segment.
798 There are 3 major relax states for 386 jump insns because the
799 different types of jumps add different sizes to frags when we're
800 figuring out what sort of jump to choose to reach a given label.
802 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
803 branches which are handled by md_estimate_size_before_relax() and
804 i386_generic_table_relax_frag(). */
807 #define UNCOND_JUMP 0
809 #define COND_JUMP86 2
810 #define BRANCH_PADDING 3
811 #define BRANCH_PREFIX 4
812 #define FUSED_JCC_PADDING 5
817 #define SMALL16 (SMALL | CODE16)
819 #define BIG16 (BIG | CODE16)
823 #define INLINE __inline__
829 #define ENCODE_RELAX_STATE(type, size) \
830 ((relax_substateT) (((type) << 2) | (size)))
831 #define TYPE_FROM_RELAX_STATE(s) \
833 #define DISP_SIZE_FROM_RELAX_STATE(s) \
834 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
836 /* This table is used by relax_frag to promote short jumps to long
837 ones where necessary. SMALL (short) jumps may be promoted to BIG
838 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
839 don't allow a short jump in a 32 bit code segment to be promoted to
840 a 16 bit offset jump because it's slower (requires data size
841 prefix), and doesn't work, unless the destination is in the bottom
842 64k of the code segment (The top 16 bits of eip are zeroed). */
844 const relax_typeS md_relax_table[] =
847 1) most positive reach of this state,
848 2) most negative reach of this state,
849 3) how many bytes this mode will have in the variable part of the frag
850 4) which index into the table to try if we can't fit into this one. */
852 /* UNCOND_JUMP states. */
853 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
854 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
855 /* dword jmp adds 4 bytes to frag:
856 0 extra opcode bytes, 4 displacement bytes. */
858 /* word jmp adds 2 byte2 to frag:
859 0 extra opcode bytes, 2 displacement bytes. */
862 /* COND_JUMP states. */
863 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
864 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
865 /* dword conditionals adds 5 bytes to frag:
866 1 extra opcode byte, 4 displacement bytes. */
868 /* word conditionals add 3 bytes to frag:
869 1 extra opcode byte, 2 displacement bytes. */
872 /* COND_JUMP86 states. */
873 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
874 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
875 /* dword conditionals adds 5 bytes to frag:
876 1 extra opcode byte, 4 displacement bytes. */
878 /* word conditionals add 4 bytes to frag:
879 1 displacement byte and a 3 byte long branch insn. */
883 static const arch_entry cpu_arch[] =
885 /* Do not replace the first two entries - i386_target_format()
886 relies on them being there in this order. */
887 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
888 CPU_GENERIC32_FLAGS, 0 },
889 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
890 CPU_GENERIC64_FLAGS, 0 },
891 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
893 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
895 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
897 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
899 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
901 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
903 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
905 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
907 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
908 CPU_PENTIUMPRO_FLAGS, 0 },
909 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
911 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
913 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
915 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
917 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
918 CPU_NOCONA_FLAGS, 0 },
919 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
921 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
923 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
924 CPU_CORE2_FLAGS, 1 },
925 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
926 CPU_CORE2_FLAGS, 0 },
927 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
928 CPU_COREI7_FLAGS, 0 },
929 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
931 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
933 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
934 CPU_IAMCU_FLAGS, 0 },
935 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
937 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
939 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
940 CPU_ATHLON_FLAGS, 0 },
941 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
943 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
945 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
947 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
948 CPU_AMDFAM10_FLAGS, 0 },
949 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
950 CPU_BDVER1_FLAGS, 0 },
951 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
952 CPU_BDVER2_FLAGS, 0 },
953 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
954 CPU_BDVER3_FLAGS, 0 },
955 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
956 CPU_BDVER4_FLAGS, 0 },
957 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
958 CPU_ZNVER1_FLAGS, 0 },
959 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
960 CPU_ZNVER2_FLAGS, 0 },
961 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
962 CPU_BTVER1_FLAGS, 0 },
963 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
964 CPU_BTVER2_FLAGS, 0 },
965 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
967 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
969 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
971 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
973 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
975 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
977 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
979 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
981 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
983 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
985 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
986 CPU_SSSE3_FLAGS, 0 },
987 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
988 CPU_SSE4_1_FLAGS, 0 },
989 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
990 CPU_SSE4_2_FLAGS, 0 },
991 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
992 CPU_SSE4_2_FLAGS, 0 },
993 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
995 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
997 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
998 CPU_AVX512F_FLAGS, 0 },
999 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1000 CPU_AVX512CD_FLAGS, 0 },
1001 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1002 CPU_AVX512ER_FLAGS, 0 },
1003 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1004 CPU_AVX512PF_FLAGS, 0 },
1005 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1006 CPU_AVX512DQ_FLAGS, 0 },
1007 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1008 CPU_AVX512BW_FLAGS, 0 },
1009 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1010 CPU_AVX512VL_FLAGS, 0 },
1011 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1013 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1014 CPU_VMFUNC_FLAGS, 0 },
1015 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1017 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1018 CPU_XSAVE_FLAGS, 0 },
1019 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1020 CPU_XSAVEOPT_FLAGS, 0 },
1021 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1022 CPU_XSAVEC_FLAGS, 0 },
1023 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1024 CPU_XSAVES_FLAGS, 0 },
1025 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1027 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1028 CPU_PCLMUL_FLAGS, 0 },
1029 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1030 CPU_PCLMUL_FLAGS, 1 },
1031 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1032 CPU_FSGSBASE_FLAGS, 0 },
1033 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1034 CPU_RDRND_FLAGS, 0 },
1035 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1036 CPU_F16C_FLAGS, 0 },
1037 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1038 CPU_BMI2_FLAGS, 0 },
1039 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1041 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1042 CPU_FMA4_FLAGS, 0 },
1043 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1045 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1047 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1048 CPU_MOVBE_FLAGS, 0 },
1049 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1050 CPU_CX16_FLAGS, 0 },
1051 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1053 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1054 CPU_LZCNT_FLAGS, 0 },
1055 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1057 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1059 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1060 CPU_INVPCID_FLAGS, 0 },
1061 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1062 CPU_CLFLUSH_FLAGS, 0 },
1063 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1065 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1066 CPU_SYSCALL_FLAGS, 0 },
1067 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1068 CPU_RDTSCP_FLAGS, 0 },
1069 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1070 CPU_3DNOW_FLAGS, 0 },
1071 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1072 CPU_3DNOWA_FLAGS, 0 },
1073 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1074 CPU_PADLOCK_FLAGS, 0 },
1075 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1076 CPU_SVME_FLAGS, 1 },
1077 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1078 CPU_SVME_FLAGS, 0 },
1079 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1080 CPU_SSE4A_FLAGS, 0 },
1081 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1083 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1085 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1087 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1089 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1090 CPU_RDSEED_FLAGS, 0 },
1091 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1092 CPU_PRFCHW_FLAGS, 0 },
1093 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1094 CPU_SMAP_FLAGS, 0 },
1095 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1097 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1099 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1100 CPU_CLFLUSHOPT_FLAGS, 0 },
1101 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1102 CPU_PREFETCHWT1_FLAGS, 0 },
1103 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1105 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1106 CPU_CLWB_FLAGS, 0 },
1107 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1108 CPU_AVX512IFMA_FLAGS, 0 },
1109 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1110 CPU_AVX512VBMI_FLAGS, 0 },
1111 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1112 CPU_AVX512_4FMAPS_FLAGS, 0 },
1113 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1114 CPU_AVX512_4VNNIW_FLAGS, 0 },
1115 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1116 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1117 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1118 CPU_AVX512_VBMI2_FLAGS, 0 },
1119 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1120 CPU_AVX512_VNNI_FLAGS, 0 },
1121 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1122 CPU_AVX512_BITALG_FLAGS, 0 },
1123 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1124 CPU_CLZERO_FLAGS, 0 },
1125 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1126 CPU_MWAITX_FLAGS, 0 },
1127 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1128 CPU_OSPKE_FLAGS, 0 },
1129 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1130 CPU_RDPID_FLAGS, 0 },
1131 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1132 CPU_PTWRITE_FLAGS, 0 },
1133 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1135 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1136 CPU_SHSTK_FLAGS, 0 },
1137 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1138 CPU_GFNI_FLAGS, 0 },
1139 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1140 CPU_VAES_FLAGS, 0 },
1141 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1142 CPU_VPCLMULQDQ_FLAGS, 0 },
1143 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1144 CPU_WBNOINVD_FLAGS, 0 },
1145 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1146 CPU_PCONFIG_FLAGS, 0 },
1147 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1148 CPU_WAITPKG_FLAGS, 0 },
1149 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1150 CPU_CLDEMOTE_FLAGS, 0 },
1151 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1152 CPU_MOVDIRI_FLAGS, 0 },
1153 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1154 CPU_MOVDIR64B_FLAGS, 0 },
1155 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1156 CPU_AVX512_BF16_FLAGS, 0 },
1157 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1158 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1159 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1160 CPU_ENQCMD_FLAGS, 0 },
1161 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1162 CPU_RDPRU_FLAGS, 0 },
1163 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1164 CPU_MCOMMIT_FLAGS, 0 },
1167 static const noarch_entry cpu_noarch[] =
1169 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1170 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1171 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1172 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1173 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1174 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1175 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1176 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1177 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1178 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1179 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1180 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1181 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1182 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1183 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1184 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1185 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1186 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1187 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1188 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1189 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1190 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1191 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1192 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1193 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1194 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1195 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1196 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1197 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1198 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1199 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1200 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1201 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1202 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1203 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1204 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1205 { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_SHSTK_FLAGS },
1206 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1210 /* Like s_lcomm_internal in gas/read.c but the alignment string
1211 is allowed to be optional. */
1214 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1221 && *input_line_pointer == ',')
1223 align = parse_align (needs_align - 1);
1225 if (align == (addressT) -1)
1240 bss_alloc (symbolP, size, align);
1245 pe_lcomm (int needs_align)
1247 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1251 const pseudo_typeS md_pseudo_table[] =
1253 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1254 {"align", s_align_bytes, 0},
1256 {"align", s_align_ptwo, 0},
1258 {"arch", set_cpu_arch, 0},
1262 {"lcomm", pe_lcomm, 1},
1264 {"ffloat", float_cons, 'f'},
1265 {"dfloat", float_cons, 'd'},
1266 {"tfloat", float_cons, 'x'},
1268 {"slong", signed_cons, 4},
1269 {"noopt", s_ignore, 0},
1270 {"optim", s_ignore, 0},
1271 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1272 {"code16", set_code_flag, CODE_16BIT},
1273 {"code32", set_code_flag, CODE_32BIT},
1275 {"code64", set_code_flag, CODE_64BIT},
1277 {"intel_syntax", set_intel_syntax, 1},
1278 {"att_syntax", set_intel_syntax, 0},
1279 {"intel_mnemonic", set_intel_mnemonic, 1},
1280 {"att_mnemonic", set_intel_mnemonic, 0},
1281 {"allow_index_reg", set_allow_index_reg, 1},
1282 {"disallow_index_reg", set_allow_index_reg, 0},
1283 {"sse_check", set_check, 0},
1284 {"operand_check", set_check, 1},
1285 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1286 {"largecomm", handle_large_common, 0},
1288 {"file", dwarf2_directive_file, 0},
1289 {"loc", dwarf2_directive_loc, 0},
1290 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1293 {"secrel32", pe_directive_secrel, 0},
1298 /* For interface with expression (). */
1299 extern char *input_line_pointer;
1301 /* Hash table for instruction mnemonic lookup. */
1302 static struct hash_control *op_hash;
1304 /* Hash table for register lookup. */
1305 static struct hash_control *reg_hash;
1307 /* Various efficient no-op patterns for aligning code labels.
1308 Note: Don't try to assemble the instructions in the comments.
1309 0L and 0w are not legal. */
1310 static const unsigned char f32_1[] =
1312 static const unsigned char f32_2[] =
1313 {0x66,0x90}; /* xchg %ax,%ax */
1314 static const unsigned char f32_3[] =
1315 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1316 static const unsigned char f32_4[] =
1317 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1318 static const unsigned char f32_6[] =
1319 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1320 static const unsigned char f32_7[] =
1321 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1322 static const unsigned char f16_3[] =
1323 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1324 static const unsigned char f16_4[] =
1325 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1326 static const unsigned char jump_disp8[] =
1327 {0xeb}; /* jmp disp8 */
1328 static const unsigned char jump32_disp32[] =
1329 {0xe9}; /* jmp disp32 */
1330 static const unsigned char jump16_disp32[] =
1331 {0x66,0xe9}; /* jmp disp32 */
1332 /* 32-bit NOPs patterns. */
1333 static const unsigned char *const f32_patt[] = {
1334 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1336 /* 16-bit NOPs patterns. */
1337 static const unsigned char *const f16_patt[] = {
1338 f32_1, f32_2, f16_3, f16_4
1340 /* nopl (%[re]ax) */
1341 static const unsigned char alt_3[] =
1343 /* nopl 0(%[re]ax) */
1344 static const unsigned char alt_4[] =
1345 {0x0f,0x1f,0x40,0x00};
1346 /* nopl 0(%[re]ax,%[re]ax,1) */
1347 static const unsigned char alt_5[] =
1348 {0x0f,0x1f,0x44,0x00,0x00};
1349 /* nopw 0(%[re]ax,%[re]ax,1) */
1350 static const unsigned char alt_6[] =
1351 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1352 /* nopl 0L(%[re]ax) */
1353 static const unsigned char alt_7[] =
1354 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1355 /* nopl 0L(%[re]ax,%[re]ax,1) */
1356 static const unsigned char alt_8[] =
1357 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1358 /* nopw 0L(%[re]ax,%[re]ax,1) */
1359 static const unsigned char alt_9[] =
1360 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1361 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1362 static const unsigned char alt_10[] =
1363 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1364 /* data16 nopw %cs:0L(%eax,%eax,1) */
1365 static const unsigned char alt_11[] =
1366 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1367 /* 32-bit and 64-bit NOPs patterns. */
1368 static const unsigned char *const alt_patt[] = {
1369 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1370 alt_9, alt_10, alt_11
1373 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1374 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1377 i386_output_nops (char *where, const unsigned char *const *patt,
1378 int count, int max_single_nop_size)
1381 /* Place the longer NOP first. */
1384 const unsigned char *nops;
1386 if (max_single_nop_size < 1)
1388 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1389 max_single_nop_size);
1393 nops = patt[max_single_nop_size - 1];
1395 /* Use the smaller one if the requsted one isn't available. */
1398 max_single_nop_size--;
1399 nops = patt[max_single_nop_size - 1];
1402 last = count % max_single_nop_size;
1405 for (offset = 0; offset < count; offset += max_single_nop_size)
1406 memcpy (where + offset, nops, max_single_nop_size);
1410 nops = patt[last - 1];
1413 /* Use the smaller one plus one-byte NOP if the needed one
1416 nops = patt[last - 1];
1417 memcpy (where + offset, nops, last);
1418 where[offset + last] = *patt[0];
1421 memcpy (where + offset, nops, last);
1426 fits_in_imm7 (offsetT num)
1428 return (num & 0x7f) == num;
1432 fits_in_imm31 (offsetT num)
1434 return (num & 0x7fffffff) == num;
1437 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1438 single NOP instruction LIMIT. */
1441 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1443 const unsigned char *const *patt = NULL;
1444 int max_single_nop_size;
1445 /* Maximum number of NOPs before switching to jump over NOPs. */
1446 int max_number_of_nops;
1448 switch (fragP->fr_type)
1453 case rs_machine_dependent:
1454 /* Allow NOP padding for jumps and calls. */
1455 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1456 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1463 /* We need to decide which NOP sequence to use for 32bit and
1464 64bit. When -mtune= is used:
1466 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1467 PROCESSOR_GENERIC32, f32_patt will be used.
1468 2. For the rest, alt_patt will be used.
1470 When -mtune= isn't used, alt_patt will be used if
1471 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1474 When -march= or .arch is used, we can't use anything beyond
1475 cpu_arch_isa_flags. */
1477 if (flag_code == CODE_16BIT)
1480 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1481 /* Limit number of NOPs to 2 in 16-bit mode. */
1482 max_number_of_nops = 2;
1486 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1488 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1489 switch (cpu_arch_tune)
1491 case PROCESSOR_UNKNOWN:
1492 /* We use cpu_arch_isa_flags to check if we SHOULD
1493 optimize with nops. */
1494 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1499 case PROCESSOR_PENTIUM4:
1500 case PROCESSOR_NOCONA:
1501 case PROCESSOR_CORE:
1502 case PROCESSOR_CORE2:
1503 case PROCESSOR_COREI7:
1504 case PROCESSOR_L1OM:
1505 case PROCESSOR_K1OM:
1506 case PROCESSOR_GENERIC64:
1508 case PROCESSOR_ATHLON:
1510 case PROCESSOR_AMDFAM10:
1512 case PROCESSOR_ZNVER:
1516 case PROCESSOR_I386:
1517 case PROCESSOR_I486:
1518 case PROCESSOR_PENTIUM:
1519 case PROCESSOR_PENTIUMPRO:
1520 case PROCESSOR_IAMCU:
1521 case PROCESSOR_GENERIC32:
1528 switch (fragP->tc_frag_data.tune)
1530 case PROCESSOR_UNKNOWN:
1531 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1532 PROCESSOR_UNKNOWN. */
1536 case PROCESSOR_I386:
1537 case PROCESSOR_I486:
1538 case PROCESSOR_PENTIUM:
1539 case PROCESSOR_IAMCU:
1541 case PROCESSOR_ATHLON:
1543 case PROCESSOR_AMDFAM10:
1545 case PROCESSOR_ZNVER:
1547 case PROCESSOR_GENERIC32:
1548 /* We use cpu_arch_isa_flags to check if we CAN optimize
1550 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1555 case PROCESSOR_PENTIUMPRO:
1556 case PROCESSOR_PENTIUM4:
1557 case PROCESSOR_NOCONA:
1558 case PROCESSOR_CORE:
1559 case PROCESSOR_CORE2:
1560 case PROCESSOR_COREI7:
1561 case PROCESSOR_L1OM:
1562 case PROCESSOR_K1OM:
1563 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1568 case PROCESSOR_GENERIC64:
1574 if (patt == f32_patt)
1576 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1577 /* Limit number of NOPs to 2 for older processors. */
1578 max_number_of_nops = 2;
1582 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1583 /* Limit number of NOPs to 7 for newer processors. */
1584 max_number_of_nops = 7;
1589 limit = max_single_nop_size;
1591 if (fragP->fr_type == rs_fill_nop)
1593 /* Output NOPs for .nop directive. */
1594 if (limit > max_single_nop_size)
1596 as_bad_where (fragP->fr_file, fragP->fr_line,
1597 _("invalid single nop size: %d "
1598 "(expect within [0, %d])"),
1599 limit, max_single_nop_size);
1603 else if (fragP->fr_type != rs_machine_dependent)
1604 fragP->fr_var = count;
1606 if ((count / max_single_nop_size) > max_number_of_nops)
1608 /* Generate jump over NOPs. */
1609 offsetT disp = count - 2;
1610 if (fits_in_imm7 (disp))
1612 /* Use "jmp disp8" if possible. */
1614 where[0] = jump_disp8[0];
1620 unsigned int size_of_jump;
1622 if (flag_code == CODE_16BIT)
1624 where[0] = jump16_disp32[0];
1625 where[1] = jump16_disp32[1];
1630 where[0] = jump32_disp32[0];
1634 count -= size_of_jump + 4;
1635 if (!fits_in_imm31 (count))
1637 as_bad_where (fragP->fr_file, fragP->fr_line,
1638 _("jump over nop padding out of range"));
1642 md_number_to_chars (where + size_of_jump, count, 4);
1643 where += size_of_jump + 4;
1647 /* Generate multiple NOPs. */
1648 i386_output_nops (where, patt, count, limit);
1652 operand_type_all_zero (const union i386_operand_type *x)
1654 switch (ARRAY_SIZE(x->array))
1665 return !x->array[0];
1672 operand_type_set (union i386_operand_type *x, unsigned int v)
1674 switch (ARRAY_SIZE(x->array))
1690 x->bitfield.class = ClassNone;
1691 x->bitfield.instance = InstanceNone;
1695 operand_type_equal (const union i386_operand_type *x,
1696 const union i386_operand_type *y)
1698 switch (ARRAY_SIZE(x->array))
1701 if (x->array[2] != y->array[2])
1705 if (x->array[1] != y->array[1])
1709 return x->array[0] == y->array[0];
1717 cpu_flags_all_zero (const union i386_cpu_flags *x)
1719 switch (ARRAY_SIZE(x->array))
1734 return !x->array[0];
1741 cpu_flags_equal (const union i386_cpu_flags *x,
1742 const union i386_cpu_flags *y)
1744 switch (ARRAY_SIZE(x->array))
1747 if (x->array[3] != y->array[3])
1751 if (x->array[2] != y->array[2])
1755 if (x->array[1] != y->array[1])
1759 return x->array[0] == y->array[0];
1767 cpu_flags_check_cpu64 (i386_cpu_flags f)
1769 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1770 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1773 static INLINE i386_cpu_flags
1774 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1776 switch (ARRAY_SIZE (x.array))
1779 x.array [3] &= y.array [3];
1782 x.array [2] &= y.array [2];
1785 x.array [1] &= y.array [1];
1788 x.array [0] &= y.array [0];
1796 static INLINE i386_cpu_flags
1797 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1799 switch (ARRAY_SIZE (x.array))
1802 x.array [3] |= y.array [3];
1805 x.array [2] |= y.array [2];
1808 x.array [1] |= y.array [1];
1811 x.array [0] |= y.array [0];
1819 static INLINE i386_cpu_flags
1820 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1822 switch (ARRAY_SIZE (x.array))
1825 x.array [3] &= ~y.array [3];
1828 x.array [2] &= ~y.array [2];
1831 x.array [1] &= ~y.array [1];
1834 x.array [0] &= ~y.array [0];
1842 #define CPU_FLAGS_ARCH_MATCH 0x1
1843 #define CPU_FLAGS_64BIT_MATCH 0x2
1845 #define CPU_FLAGS_PERFECT_MATCH \
1846 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1848 /* Return CPU flags match bits. */
1851 cpu_flags_match (const insn_template *t)
1853 i386_cpu_flags x = t->cpu_flags;
1854 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1856 x.bitfield.cpu64 = 0;
1857 x.bitfield.cpuno64 = 0;
1859 if (cpu_flags_all_zero (&x))
1861 /* This instruction is available on all archs. */
1862 match |= CPU_FLAGS_ARCH_MATCH;
1866 /* This instruction is available only on some archs. */
1867 i386_cpu_flags cpu = cpu_arch_flags;
1869 /* AVX512VL is no standalone feature - match it and then strip it. */
1870 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1872 x.bitfield.cpuavx512vl = 0;
1874 cpu = cpu_flags_and (x, cpu);
1875 if (!cpu_flags_all_zero (&cpu))
1877 if (x.bitfield.cpuavx)
1879 /* We need to check a few extra flags with AVX. */
1880 if (cpu.bitfield.cpuavx
1881 && (!t->opcode_modifier.sse2avx || sse2avx)
1882 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1883 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1884 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1885 match |= CPU_FLAGS_ARCH_MATCH;
1887 else if (x.bitfield.cpuavx512f)
1889 /* We need to check a few extra flags with AVX512F. */
1890 if (cpu.bitfield.cpuavx512f
1891 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1892 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1893 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1894 match |= CPU_FLAGS_ARCH_MATCH;
1897 match |= CPU_FLAGS_ARCH_MATCH;
1903 static INLINE i386_operand_type
1904 operand_type_and (i386_operand_type x, i386_operand_type y)
1906 if (x.bitfield.class != y.bitfield.class)
1907 x.bitfield.class = ClassNone;
1908 if (x.bitfield.instance != y.bitfield.instance)
1909 x.bitfield.instance = InstanceNone;
1911 switch (ARRAY_SIZE (x.array))
1914 x.array [2] &= y.array [2];
1917 x.array [1] &= y.array [1];
1920 x.array [0] &= y.array [0];
1928 static INLINE i386_operand_type
1929 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1931 gas_assert (y.bitfield.class == ClassNone);
1932 gas_assert (y.bitfield.instance == InstanceNone);
1934 switch (ARRAY_SIZE (x.array))
1937 x.array [2] &= ~y.array [2];
1940 x.array [1] &= ~y.array [1];
1943 x.array [0] &= ~y.array [0];
1951 static INLINE i386_operand_type
1952 operand_type_or (i386_operand_type x, i386_operand_type y)
1954 gas_assert (x.bitfield.class == ClassNone ||
1955 y.bitfield.class == ClassNone ||
1956 x.bitfield.class == y.bitfield.class);
1957 gas_assert (x.bitfield.instance == InstanceNone ||
1958 y.bitfield.instance == InstanceNone ||
1959 x.bitfield.instance == y.bitfield.instance);
1961 switch (ARRAY_SIZE (x.array))
1964 x.array [2] |= y.array [2];
1967 x.array [1] |= y.array [1];
1970 x.array [0] |= y.array [0];
1978 static INLINE i386_operand_type
1979 operand_type_xor (i386_operand_type x, i386_operand_type y)
1981 gas_assert (y.bitfield.class == ClassNone);
1982 gas_assert (y.bitfield.instance == InstanceNone);
1984 switch (ARRAY_SIZE (x.array))
1987 x.array [2] ^= y.array [2];
1990 x.array [1] ^= y.array [1];
1993 x.array [0] ^= y.array [0];
2001 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2002 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2003 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2004 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2005 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2006 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2007 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2008 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2009 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2010 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2011 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2012 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2013 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2014 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2015 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2016 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2017 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2028 operand_type_check (i386_operand_type t, enum operand_type c)
2033 return t.bitfield.class == Reg;
2036 return (t.bitfield.imm8
2040 || t.bitfield.imm32s
2041 || t.bitfield.imm64);
2044 return (t.bitfield.disp8
2045 || t.bitfield.disp16
2046 || t.bitfield.disp32
2047 || t.bitfield.disp32s
2048 || t.bitfield.disp64);
2051 return (t.bitfield.disp8
2052 || t.bitfield.disp16
2053 || t.bitfield.disp32
2054 || t.bitfield.disp32s
2055 || t.bitfield.disp64
2056 || t.bitfield.baseindex);
2065 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2066 between operand GIVEN and opeand WANTED for instruction template T. */
2069 match_operand_size (const insn_template *t, unsigned int wanted,
2072 return !((i.types[given].bitfield.byte
2073 && !t->operand_types[wanted].bitfield.byte)
2074 || (i.types[given].bitfield.word
2075 && !t->operand_types[wanted].bitfield.word)
2076 || (i.types[given].bitfield.dword
2077 && !t->operand_types[wanted].bitfield.dword)
2078 || (i.types[given].bitfield.qword
2079 && !t->operand_types[wanted].bitfield.qword)
2080 || (i.types[given].bitfield.tbyte
2081 && !t->operand_types[wanted].bitfield.tbyte));
2084 /* Return 1 if there is no conflict in SIMD register between operand
2085 GIVEN and opeand WANTED for instruction template T. */
2088 match_simd_size (const insn_template *t, unsigned int wanted,
2091 return !((i.types[given].bitfield.xmmword
2092 && !t->operand_types[wanted].bitfield.xmmword)
2093 || (i.types[given].bitfield.ymmword
2094 && !t->operand_types[wanted].bitfield.ymmword)
2095 || (i.types[given].bitfield.zmmword
2096 && !t->operand_types[wanted].bitfield.zmmword));
2099 /* Return 1 if there is no conflict in any size between operand GIVEN
2100 and opeand WANTED for instruction template T. */
2103 match_mem_size (const insn_template *t, unsigned int wanted,
2106 return (match_operand_size (t, wanted, given)
2107 && !((i.types[given].bitfield.unspecified
2109 && !t->operand_types[wanted].bitfield.unspecified)
2110 || (i.types[given].bitfield.fword
2111 && !t->operand_types[wanted].bitfield.fword)
2112 /* For scalar opcode templates to allow register and memory
2113 operands at the same time, some special casing is needed
2114 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2115 down-conversion vpmov*. */
2116 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2117 && !t->opcode_modifier.broadcast
2118 && (t->operand_types[wanted].bitfield.byte
2119 || t->operand_types[wanted].bitfield.word
2120 || t->operand_types[wanted].bitfield.dword
2121 || t->operand_types[wanted].bitfield.qword))
2122 ? (i.types[given].bitfield.xmmword
2123 || i.types[given].bitfield.ymmword
2124 || i.types[given].bitfield.zmmword)
2125 : !match_simd_size(t, wanted, given))));
2128 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2129 operands for instruction template T, and it has MATCH_REVERSE set if there
2130 is no size conflict on any operands for the template with operands reversed
2131 (and the template allows for reversing in the first place). */
2133 #define MATCH_STRAIGHT 1
2134 #define MATCH_REVERSE 2
2136 static INLINE unsigned int
2137 operand_size_match (const insn_template *t)
2139 unsigned int j, match = MATCH_STRAIGHT;
2141 /* Don't check non-absolute jump instructions. */
2142 if (t->opcode_modifier.jump
2143 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2146 /* Check memory and accumulator operand size. */
2147 for (j = 0; j < i.operands; j++)
2149 if (i.types[j].bitfield.class != Reg
2150 && i.types[j].bitfield.class != RegSIMD
2151 && t->opcode_modifier.anysize)
2154 if (t->operand_types[j].bitfield.class == Reg
2155 && !match_operand_size (t, j, j))
2161 if (t->operand_types[j].bitfield.class == RegSIMD
2162 && !match_simd_size (t, j, j))
2168 if (t->operand_types[j].bitfield.instance == Accum
2169 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2175 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2182 if (!t->opcode_modifier.d)
2186 i.error = operand_size_mismatch;
2190 /* Check reverse. */
2191 gas_assert (i.operands >= 2 && i.operands <= 3);
2193 for (j = 0; j < i.operands; j++)
2195 unsigned int given = i.operands - j - 1;
2197 if (t->operand_types[j].bitfield.class == Reg
2198 && !match_operand_size (t, j, given))
2201 if (t->operand_types[j].bitfield.class == RegSIMD
2202 && !match_simd_size (t, j, given))
2205 if (t->operand_types[j].bitfield.instance == Accum
2206 && (!match_operand_size (t, j, given)
2207 || !match_simd_size (t, j, given)))
2210 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2214 return match | MATCH_REVERSE;
2218 operand_type_match (i386_operand_type overlap,
2219 i386_operand_type given)
2221 i386_operand_type temp = overlap;
2223 temp.bitfield.unspecified = 0;
2224 temp.bitfield.byte = 0;
2225 temp.bitfield.word = 0;
2226 temp.bitfield.dword = 0;
2227 temp.bitfield.fword = 0;
2228 temp.bitfield.qword = 0;
2229 temp.bitfield.tbyte = 0;
2230 temp.bitfield.xmmword = 0;
2231 temp.bitfield.ymmword = 0;
2232 temp.bitfield.zmmword = 0;
2233 if (operand_type_all_zero (&temp))
2236 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2240 i.error = operand_type_mismatch;
2244 /* If given types g0 and g1 are registers they must be of the same type
2245 unless the expected operand type register overlap is null.
2246 Memory operand size of certain SIMD instructions is also being checked
2250 operand_type_register_match (i386_operand_type g0,
2251 i386_operand_type t0,
2252 i386_operand_type g1,
2253 i386_operand_type t1)
2255 if (g0.bitfield.class != Reg
2256 && g0.bitfield.class != RegSIMD
2257 && (!operand_type_check (g0, anymem)
2258 || g0.bitfield.unspecified
2259 || t0.bitfield.class != RegSIMD))
2262 if (g1.bitfield.class != Reg
2263 && g1.bitfield.class != RegSIMD
2264 && (!operand_type_check (g1, anymem)
2265 || g1.bitfield.unspecified
2266 || t1.bitfield.class != RegSIMD))
2269 if (g0.bitfield.byte == g1.bitfield.byte
2270 && g0.bitfield.word == g1.bitfield.word
2271 && g0.bitfield.dword == g1.bitfield.dword
2272 && g0.bitfield.qword == g1.bitfield.qword
2273 && g0.bitfield.xmmword == g1.bitfield.xmmword
2274 && g0.bitfield.ymmword == g1.bitfield.ymmword
2275 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2278 if (!(t0.bitfield.byte & t1.bitfield.byte)
2279 && !(t0.bitfield.word & t1.bitfield.word)
2280 && !(t0.bitfield.dword & t1.bitfield.dword)
2281 && !(t0.bitfield.qword & t1.bitfield.qword)
2282 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2283 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2284 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2287 i.error = register_type_mismatch;
2292 static INLINE unsigned int
2293 register_number (const reg_entry *r)
2295 unsigned int nr = r->reg_num;
2297 if (r->reg_flags & RegRex)
2300 if (r->reg_flags & RegVRex)
2306 static INLINE unsigned int
2307 mode_from_disp_size (i386_operand_type t)
2309 if (t.bitfield.disp8)
2311 else if (t.bitfield.disp16
2312 || t.bitfield.disp32
2313 || t.bitfield.disp32s)
2320 fits_in_signed_byte (addressT num)
2322 return num + 0x80 <= 0xff;
2326 fits_in_unsigned_byte (addressT num)
2332 fits_in_unsigned_word (addressT num)
2334 return num <= 0xffff;
2338 fits_in_signed_word (addressT num)
2340 return num + 0x8000 <= 0xffff;
2344 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2349 return num + 0x80000000 <= 0xffffffff;
2351 } /* fits_in_signed_long() */
2354 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2359 return num <= 0xffffffff;
2361 } /* fits_in_unsigned_long() */
2364 fits_in_disp8 (offsetT num)
2366 int shift = i.memshift;
2372 mask = (1 << shift) - 1;
2374 /* Return 0 if NUM isn't properly aligned. */
2378 /* Check if NUM will fit in 8bit after shift. */
2379 return fits_in_signed_byte (num >> shift);
2383 fits_in_imm4 (offsetT num)
2385 return (num & 0xf) == num;
2388 static i386_operand_type
2389 smallest_imm_type (offsetT num)
2391 i386_operand_type t;
2393 operand_type_set (&t, 0);
2394 t.bitfield.imm64 = 1;
2396 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2398 /* This code is disabled on the 486 because all the Imm1 forms
2399 in the opcode table are slower on the i486. They're the
2400 versions with the implicitly specified single-position
2401 displacement, which has another syntax if you really want to
2403 t.bitfield.imm1 = 1;
2404 t.bitfield.imm8 = 1;
2405 t.bitfield.imm8s = 1;
2406 t.bitfield.imm16 = 1;
2407 t.bitfield.imm32 = 1;
2408 t.bitfield.imm32s = 1;
2410 else if (fits_in_signed_byte (num))
2412 t.bitfield.imm8 = 1;
2413 t.bitfield.imm8s = 1;
2414 t.bitfield.imm16 = 1;
2415 t.bitfield.imm32 = 1;
2416 t.bitfield.imm32s = 1;
2418 else if (fits_in_unsigned_byte (num))
2420 t.bitfield.imm8 = 1;
2421 t.bitfield.imm16 = 1;
2422 t.bitfield.imm32 = 1;
2423 t.bitfield.imm32s = 1;
2425 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2427 t.bitfield.imm16 = 1;
2428 t.bitfield.imm32 = 1;
2429 t.bitfield.imm32s = 1;
2431 else if (fits_in_signed_long (num))
2433 t.bitfield.imm32 = 1;
2434 t.bitfield.imm32s = 1;
2436 else if (fits_in_unsigned_long (num))
2437 t.bitfield.imm32 = 1;
2443 offset_in_range (offsetT val, int size)
2449 case 1: mask = ((addressT) 1 << 8) - 1; break;
2450 case 2: mask = ((addressT) 1 << 16) - 1; break;
2451 case 4: mask = ((addressT) 2 << 31) - 1; break;
2453 case 8: mask = ((addressT) 2 << 63) - 1; break;
2459 /* If BFD64, sign extend val for 32bit address mode. */
2460 if (flag_code != CODE_64BIT
2461 || i.prefix[ADDR_PREFIX])
2462 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2463 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2466 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2468 char buf1[40], buf2[40];
2470 sprint_value (buf1, val);
2471 sprint_value (buf2, val & mask);
2472 as_warn (_("%s shortened to %s"), buf1, buf2);
2487 a. PREFIX_EXIST if attempting to add a prefix where one from the
2488 same class already exists.
2489 b. PREFIX_LOCK if lock prefix is added.
2490 c. PREFIX_REP if rep/repne prefix is added.
2491 d. PREFIX_DS if ds prefix is added.
2492 e. PREFIX_OTHER if other prefix is added.
2495 static enum PREFIX_GROUP
2496 add_prefix (unsigned int prefix)
2498 enum PREFIX_GROUP ret = PREFIX_OTHER;
2501 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2502 && flag_code == CODE_64BIT)
2504 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2505 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2506 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2507 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2518 case DS_PREFIX_OPCODE:
2521 case CS_PREFIX_OPCODE:
2522 case ES_PREFIX_OPCODE:
2523 case FS_PREFIX_OPCODE:
2524 case GS_PREFIX_OPCODE:
2525 case SS_PREFIX_OPCODE:
2529 case REPNE_PREFIX_OPCODE:
2530 case REPE_PREFIX_OPCODE:
2535 case LOCK_PREFIX_OPCODE:
2544 case ADDR_PREFIX_OPCODE:
2548 case DATA_PREFIX_OPCODE:
2552 if (i.prefix[q] != 0)
2560 i.prefix[q] |= prefix;
2563 as_bad (_("same type of prefix used twice"));
2569 update_code_flag (int value, int check)
2571 PRINTF_LIKE ((*as_error));
2573 flag_code = (enum flag_code) value;
2574 if (flag_code == CODE_64BIT)
2576 cpu_arch_flags.bitfield.cpu64 = 1;
2577 cpu_arch_flags.bitfield.cpuno64 = 0;
2581 cpu_arch_flags.bitfield.cpu64 = 0;
2582 cpu_arch_flags.bitfield.cpuno64 = 1;
2584 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2587 as_error = as_fatal;
2590 (*as_error) (_("64bit mode not supported on `%s'."),
2591 cpu_arch_name ? cpu_arch_name : default_arch);
2593 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2596 as_error = as_fatal;
2599 (*as_error) (_("32bit mode not supported on `%s'."),
2600 cpu_arch_name ? cpu_arch_name : default_arch);
2602 stackop_size = '\0';
2606 set_code_flag (int value)
2608 update_code_flag (value, 0);
2612 set_16bit_gcc_code_flag (int new_code_flag)
2614 flag_code = (enum flag_code) new_code_flag;
2615 if (flag_code != CODE_16BIT)
2617 cpu_arch_flags.bitfield.cpu64 = 0;
2618 cpu_arch_flags.bitfield.cpuno64 = 1;
2619 stackop_size = LONG_MNEM_SUFFIX;
2623 set_intel_syntax (int syntax_flag)
2625 /* Find out if register prefixing is specified. */
2626 int ask_naked_reg = 0;
2629 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2632 int e = get_symbol_name (&string);
2634 if (strcmp (string, "prefix") == 0)
2636 else if (strcmp (string, "noprefix") == 0)
2639 as_bad (_("bad argument to syntax directive."));
2640 (void) restore_line_pointer (e);
2642 demand_empty_rest_of_line ();
2644 intel_syntax = syntax_flag;
2646 if (ask_naked_reg == 0)
2647 allow_naked_reg = (intel_syntax
2648 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2650 allow_naked_reg = (ask_naked_reg < 0);
2652 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2654 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2655 identifier_chars['$'] = intel_syntax ? '$' : 0;
2656 register_prefix = allow_naked_reg ? "" : "%";
2660 set_intel_mnemonic (int mnemonic_flag)
2662 intel_mnemonic = mnemonic_flag;
2666 set_allow_index_reg (int flag)
2668 allow_index_reg = flag;
2672 set_check (int what)
2674 enum check_kind *kind;
2679 kind = &operand_check;
2690 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2693 int e = get_symbol_name (&string);
2695 if (strcmp (string, "none") == 0)
2697 else if (strcmp (string, "warning") == 0)
2698 *kind = check_warning;
2699 else if (strcmp (string, "error") == 0)
2700 *kind = check_error;
2702 as_bad (_("bad argument to %s_check directive."), str);
2703 (void) restore_line_pointer (e);
2706 as_bad (_("missing argument for %s_check directive"), str);
2708 demand_empty_rest_of_line ();
2712 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2713 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2715 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2716 static const char *arch;
2718 /* Intel LIOM is only supported on ELF. */
2724 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2725 use default_arch. */
2726 arch = cpu_arch_name;
2728 arch = default_arch;
2731 /* If we are targeting Intel MCU, we must enable it. */
2732 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2733 || new_flag.bitfield.cpuiamcu)
2736 /* If we are targeting Intel L1OM, we must enable it. */
2737 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2738 || new_flag.bitfield.cpul1om)
2741 /* If we are targeting Intel K1OM, we must enable it. */
2742 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2743 || new_flag.bitfield.cpuk1om)
2746 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2751 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2755 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2758 int e = get_symbol_name (&string);
2760 i386_cpu_flags flags;
2762 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2764 if (strcmp (string, cpu_arch[j].name) == 0)
2766 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2770 cpu_arch_name = cpu_arch[j].name;
2771 cpu_sub_arch_name = NULL;
2772 cpu_arch_flags = cpu_arch[j].flags;
2773 if (flag_code == CODE_64BIT)
2775 cpu_arch_flags.bitfield.cpu64 = 1;
2776 cpu_arch_flags.bitfield.cpuno64 = 0;
2780 cpu_arch_flags.bitfield.cpu64 = 0;
2781 cpu_arch_flags.bitfield.cpuno64 = 1;
2783 cpu_arch_isa = cpu_arch[j].type;
2784 cpu_arch_isa_flags = cpu_arch[j].flags;
2785 if (!cpu_arch_tune_set)
2787 cpu_arch_tune = cpu_arch_isa;
2788 cpu_arch_tune_flags = cpu_arch_isa_flags;
2793 flags = cpu_flags_or (cpu_arch_flags,
2796 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2798 if (cpu_sub_arch_name)
2800 char *name = cpu_sub_arch_name;
2801 cpu_sub_arch_name = concat (name,
2803 (const char *) NULL);
2807 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2808 cpu_arch_flags = flags;
2809 cpu_arch_isa_flags = flags;
2813 = cpu_flags_or (cpu_arch_isa_flags,
2815 (void) restore_line_pointer (e);
2816 demand_empty_rest_of_line ();
2821 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2823 /* Disable an ISA extension. */
2824 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2825 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2827 flags = cpu_flags_and_not (cpu_arch_flags,
2828 cpu_noarch[j].flags);
2829 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2831 if (cpu_sub_arch_name)
2833 char *name = cpu_sub_arch_name;
2834 cpu_sub_arch_name = concat (name, string,
2835 (const char *) NULL);
2839 cpu_sub_arch_name = xstrdup (string);
2840 cpu_arch_flags = flags;
2841 cpu_arch_isa_flags = flags;
2843 (void) restore_line_pointer (e);
2844 demand_empty_rest_of_line ();
2848 j = ARRAY_SIZE (cpu_arch);
2851 if (j >= ARRAY_SIZE (cpu_arch))
2852 as_bad (_("no such architecture: `%s'"), string);
2854 *input_line_pointer = e;
2857 as_bad (_("missing cpu architecture"));
2859 no_cond_jump_promotion = 0;
2860 if (*input_line_pointer == ','
2861 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2866 ++input_line_pointer;
2867 e = get_symbol_name (&string);
2869 if (strcmp (string, "nojumps") == 0)
2870 no_cond_jump_promotion = 1;
2871 else if (strcmp (string, "jumps") == 0)
2874 as_bad (_("no such architecture modifier: `%s'"), string);
2876 (void) restore_line_pointer (e);
2879 demand_empty_rest_of_line ();
2882 enum bfd_architecture
2885 if (cpu_arch_isa == PROCESSOR_L1OM)
2887 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2888 || flag_code != CODE_64BIT)
2889 as_fatal (_("Intel L1OM is 64bit ELF only"));
2890 return bfd_arch_l1om;
2892 else if (cpu_arch_isa == PROCESSOR_K1OM)
2894 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2895 || flag_code != CODE_64BIT)
2896 as_fatal (_("Intel K1OM is 64bit ELF only"));
2897 return bfd_arch_k1om;
2899 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2901 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2902 || flag_code == CODE_64BIT)
2903 as_fatal (_("Intel MCU is 32bit ELF only"));
2904 return bfd_arch_iamcu;
2907 return bfd_arch_i386;
2913 if (!strncmp (default_arch, "x86_64", 6))
2915 if (cpu_arch_isa == PROCESSOR_L1OM)
2917 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2918 || default_arch[6] != '\0')
2919 as_fatal (_("Intel L1OM is 64bit ELF only"));
2920 return bfd_mach_l1om;
2922 else if (cpu_arch_isa == PROCESSOR_K1OM)
2924 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2925 || default_arch[6] != '\0')
2926 as_fatal (_("Intel K1OM is 64bit ELF only"));
2927 return bfd_mach_k1om;
2929 else if (default_arch[6] == '\0')
2930 return bfd_mach_x86_64;
2932 return bfd_mach_x64_32;
2934 else if (!strcmp (default_arch, "i386")
2935 || !strcmp (default_arch, "iamcu"))
2937 if (cpu_arch_isa == PROCESSOR_IAMCU)
2939 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2940 as_fatal (_("Intel MCU is 32bit ELF only"));
2941 return bfd_mach_i386_iamcu;
2944 return bfd_mach_i386_i386;
2947 as_fatal (_("unknown architecture"));
2953 const char *hash_err;
2955 /* Support pseudo prefixes like {disp32}. */
2956 lex_type ['{'] = LEX_BEGIN_NAME;
2958 /* Initialize op_hash hash table. */
2959 op_hash = hash_new ();
2962 const insn_template *optab;
2963 templates *core_optab;
2965 /* Setup for loop. */
2967 core_optab = XNEW (templates);
2968 core_optab->start = optab;
2973 if (optab->name == NULL
2974 || strcmp (optab->name, (optab - 1)->name) != 0)
2976 /* different name --> ship out current template list;
2977 add to hash table; & begin anew. */
2978 core_optab->end = optab;
2979 hash_err = hash_insert (op_hash,
2981 (void *) core_optab);
2984 as_fatal (_("can't hash %s: %s"),
2988 if (optab->name == NULL)
2990 core_optab = XNEW (templates);
2991 core_optab->start = optab;
2996 /* Initialize reg_hash hash table. */
2997 reg_hash = hash_new ();
2999 const reg_entry *regtab;
3000 unsigned int regtab_size = i386_regtab_size;
3002 for (regtab = i386_regtab; regtab_size--; regtab++)
3004 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3006 as_fatal (_("can't hash %s: %s"),
3012 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3017 for (c = 0; c < 256; c++)
3022 mnemonic_chars[c] = c;
3023 register_chars[c] = c;
3024 operand_chars[c] = c;
3026 else if (ISLOWER (c))
3028 mnemonic_chars[c] = c;
3029 register_chars[c] = c;
3030 operand_chars[c] = c;
3032 else if (ISUPPER (c))
3034 mnemonic_chars[c] = TOLOWER (c);
3035 register_chars[c] = mnemonic_chars[c];
3036 operand_chars[c] = c;
3038 else if (c == '{' || c == '}')
3040 mnemonic_chars[c] = c;
3041 operand_chars[c] = c;
3044 if (ISALPHA (c) || ISDIGIT (c))
3045 identifier_chars[c] = c;
3048 identifier_chars[c] = c;
3049 operand_chars[c] = c;
3054 identifier_chars['@'] = '@';
3057 identifier_chars['?'] = '?';
3058 operand_chars['?'] = '?';
3060 digit_chars['-'] = '-';
3061 mnemonic_chars['_'] = '_';
3062 mnemonic_chars['-'] = '-';
3063 mnemonic_chars['.'] = '.';
3064 identifier_chars['_'] = '_';
3065 identifier_chars['.'] = '.';
3067 for (p = operand_special_chars; *p != '\0'; p++)
3068 operand_chars[(unsigned char) *p] = *p;
3071 if (flag_code == CODE_64BIT)
3073 #if defined (OBJ_COFF) && defined (TE_PE)
3074 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3077 x86_dwarf2_return_column = 16;
3079 x86_cie_data_alignment = -8;
3083 x86_dwarf2_return_column = 8;
3084 x86_cie_data_alignment = -4;
3087 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3088 can be turned into BRANCH_PREFIX frag. */
3089 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3094 i386_print_statistics (FILE *file)
3096 hash_print_statistics (file, "i386 opcode", op_hash);
3097 hash_print_statistics (file, "i386 register", reg_hash);
3102 /* Debugging routines for md_assemble. */
3103 static void pte (insn_template *);
3104 static void pt (i386_operand_type);
3105 static void pe (expressionS *);
3106 static void ps (symbolS *);
3109 pi (const char *line, i386_insn *x)
3113 fprintf (stdout, "%s: template ", line);
3115 fprintf (stdout, " address: base %s index %s scale %x\n",
3116 x->base_reg ? x->base_reg->reg_name : "none",
3117 x->index_reg ? x->index_reg->reg_name : "none",
3118 x->log2_scale_factor);
3119 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3120 x->rm.mode, x->rm.reg, x->rm.regmem);
3121 fprintf (stdout, " sib: base %x index %x scale %x\n",
3122 x->sib.base, x->sib.index, x->sib.scale);
3123 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3124 (x->rex & REX_W) != 0,
3125 (x->rex & REX_R) != 0,
3126 (x->rex & REX_X) != 0,
3127 (x->rex & REX_B) != 0);
3128 for (j = 0; j < x->operands; j++)
3130 fprintf (stdout, " #%d: ", j + 1);
3132 fprintf (stdout, "\n");
3133 if (x->types[j].bitfield.class == Reg
3134 || x->types[j].bitfield.class == RegMMX
3135 || x->types[j].bitfield.class == RegSIMD
3136 || x->types[j].bitfield.class == SReg
3137 || x->types[j].bitfield.class == RegCR
3138 || x->types[j].bitfield.class == RegDR
3139 || x->types[j].bitfield.class == RegTR)
3140 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3141 if (operand_type_check (x->types[j], imm))
3143 if (operand_type_check (x->types[j], disp))
3144 pe (x->op[j].disps);
3149 pte (insn_template *t)
3152 fprintf (stdout, " %d operands ", t->operands);
3153 fprintf (stdout, "opcode %x ", t->base_opcode);
3154 if (t->extension_opcode != None)
3155 fprintf (stdout, "ext %x ", t->extension_opcode);
3156 if (t->opcode_modifier.d)
3157 fprintf (stdout, "D");
3158 if (t->opcode_modifier.w)
3159 fprintf (stdout, "W");
3160 fprintf (stdout, "\n");
3161 for (j = 0; j < t->operands; j++)
3163 fprintf (stdout, " #%d type ", j + 1);
3164 pt (t->operand_types[j]);
3165 fprintf (stdout, "\n");
3172 fprintf (stdout, " operation %d\n", e->X_op);
3173 fprintf (stdout, " add_number %ld (%lx)\n",
3174 (long) e->X_add_number, (long) e->X_add_number);
3175 if (e->X_add_symbol)
3177 fprintf (stdout, " add_symbol ");
3178 ps (e->X_add_symbol);
3179 fprintf (stdout, "\n");
3183 fprintf (stdout, " op_symbol ");
3184 ps (e->X_op_symbol);
3185 fprintf (stdout, "\n");
3192 fprintf (stdout, "%s type %s%s",
3194 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3195 segment_name (S_GET_SEGMENT (s)));
3198 static struct type_name
3200 i386_operand_type mask;
3203 const type_names[] =
3205 { OPERAND_TYPE_REG8, "r8" },
3206 { OPERAND_TYPE_REG16, "r16" },
3207 { OPERAND_TYPE_REG32, "r32" },
3208 { OPERAND_TYPE_REG64, "r64" },
3209 { OPERAND_TYPE_ACC8, "acc8" },
3210 { OPERAND_TYPE_ACC16, "acc16" },
3211 { OPERAND_TYPE_ACC32, "acc32" },
3212 { OPERAND_TYPE_ACC64, "acc64" },
3213 { OPERAND_TYPE_IMM8, "i8" },
3214 { OPERAND_TYPE_IMM8, "i8s" },
3215 { OPERAND_TYPE_IMM16, "i16" },
3216 { OPERAND_TYPE_IMM32, "i32" },
3217 { OPERAND_TYPE_IMM32S, "i32s" },
3218 { OPERAND_TYPE_IMM64, "i64" },
3219 { OPERAND_TYPE_IMM1, "i1" },
3220 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3221 { OPERAND_TYPE_DISP8, "d8" },
3222 { OPERAND_TYPE_DISP16, "d16" },
3223 { OPERAND_TYPE_DISP32, "d32" },
3224 { OPERAND_TYPE_DISP32S, "d32s" },
3225 { OPERAND_TYPE_DISP64, "d64" },
3226 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3227 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3228 { OPERAND_TYPE_CONTROL, "control reg" },
3229 { OPERAND_TYPE_TEST, "test reg" },
3230 { OPERAND_TYPE_DEBUG, "debug reg" },
3231 { OPERAND_TYPE_FLOATREG, "FReg" },
3232 { OPERAND_TYPE_FLOATACC, "FAcc" },
3233 { OPERAND_TYPE_SREG, "SReg" },
3234 { OPERAND_TYPE_REGMMX, "rMMX" },
3235 { OPERAND_TYPE_REGXMM, "rXMM" },
3236 { OPERAND_TYPE_REGYMM, "rYMM" },
3237 { OPERAND_TYPE_REGZMM, "rZMM" },
3238 { OPERAND_TYPE_REGMASK, "Mask reg" },
3242 pt (i386_operand_type t)
3245 i386_operand_type a;
3247 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3249 a = operand_type_and (t, type_names[j].mask);
3250 if (operand_type_equal (&a, &type_names[j].mask))
3251 fprintf (stdout, "%s, ", type_names[j].name);
3256 #endif /* DEBUG386 */
3258 static bfd_reloc_code_real_type
3259 reloc (unsigned int size,
3262 bfd_reloc_code_real_type other)
3264 if (other != NO_RELOC)
3266 reloc_howto_type *rel;
3271 case BFD_RELOC_X86_64_GOT32:
3272 return BFD_RELOC_X86_64_GOT64;
3274 case BFD_RELOC_X86_64_GOTPLT64:
3275 return BFD_RELOC_X86_64_GOTPLT64;
3277 case BFD_RELOC_X86_64_PLTOFF64:
3278 return BFD_RELOC_X86_64_PLTOFF64;
3280 case BFD_RELOC_X86_64_GOTPC32:
3281 other = BFD_RELOC_X86_64_GOTPC64;
3283 case BFD_RELOC_X86_64_GOTPCREL:
3284 other = BFD_RELOC_X86_64_GOTPCREL64;
3286 case BFD_RELOC_X86_64_TPOFF32:
3287 other = BFD_RELOC_X86_64_TPOFF64;
3289 case BFD_RELOC_X86_64_DTPOFF32:
3290 other = BFD_RELOC_X86_64_DTPOFF64;
3296 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3297 if (other == BFD_RELOC_SIZE32)
3300 other = BFD_RELOC_SIZE64;
3303 as_bad (_("there are no pc-relative size relocations"));
3309 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3310 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3313 rel = bfd_reloc_type_lookup (stdoutput, other);
3315 as_bad (_("unknown relocation (%u)"), other);
3316 else if (size != bfd_get_reloc_size (rel))
3317 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3318 bfd_get_reloc_size (rel),
3320 else if (pcrel && !rel->pc_relative)
3321 as_bad (_("non-pc-relative relocation for pc-relative field"));
3322 else if ((rel->complain_on_overflow == complain_overflow_signed
3324 || (rel->complain_on_overflow == complain_overflow_unsigned
3326 as_bad (_("relocated field and relocation type differ in signedness"));
3335 as_bad (_("there are no unsigned pc-relative relocations"));
3338 case 1: return BFD_RELOC_8_PCREL;
3339 case 2: return BFD_RELOC_16_PCREL;
3340 case 4: return BFD_RELOC_32_PCREL;
3341 case 8: return BFD_RELOC_64_PCREL;
3343 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3350 case 4: return BFD_RELOC_X86_64_32S;
3355 case 1: return BFD_RELOC_8;
3356 case 2: return BFD_RELOC_16;
3357 case 4: return BFD_RELOC_32;
3358 case 8: return BFD_RELOC_64;
3360 as_bad (_("cannot do %s %u byte relocation"),
3361 sign > 0 ? "signed" : "unsigned", size);
3367 /* Here we decide which fixups can be adjusted to make them relative to
3368 the beginning of the section instead of the symbol. Basically we need
3369 to make sure that the dynamic relocations are done correctly, so in
3370 some cases we force the original symbol to be used. */
3373 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3375 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3379 /* Don't adjust pc-relative references to merge sections in 64-bit
3381 if (use_rela_relocations
3382 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3386 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3387 and changed later by validate_fix. */
3388 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3389 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3392 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3393 for size relocations. */
3394 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3395 || fixP->fx_r_type == BFD_RELOC_SIZE64
3396 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3397 || fixP->fx_r_type == BFD_RELOC_386_PLT32
3398 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3399 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3400 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3401 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3402 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3403 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3404 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3405 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3406 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3407 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3408 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3409 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3410 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
3411 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3412 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3413 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3414 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3415 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3416 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3417 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3418 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3419 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3420 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3421 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3422 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3423 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3424 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3425 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3426 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3433 intel_float_operand (const char *mnemonic)
3435 /* Note that the value returned is meaningful only for opcodes with (memory)
3436 operands, hence the code here is free to improperly handle opcodes that
3437 have no operands (for better performance and smaller code). */
3439 if (mnemonic[0] != 'f')
3440 return 0; /* non-math */
3442 switch (mnemonic[1])
3444 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3445 the fs segment override prefix not currently handled because no
3446 call path can make opcodes without operands get here */
3448 return 2 /* integer op */;
3450 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3451 return 3; /* fldcw/fldenv */
3454 if (mnemonic[2] != 'o' /* fnop */)
3455 return 3; /* non-waiting control op */
3458 if (mnemonic[2] == 's')
3459 return 3; /* frstor/frstpm */
3462 if (mnemonic[2] == 'a')
3463 return 3; /* fsave */
3464 if (mnemonic[2] == 't')
3466 switch (mnemonic[3])
3468 case 'c': /* fstcw */
3469 case 'd': /* fstdw */
3470 case 'e': /* fstenv */
3471 case 's': /* fsts[gw] */
3477 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3478 return 0; /* fxsave/fxrstor are not really math ops */
3485 /* Build the VEX prefix. */
3488 build_vex_prefix (const insn_template *t)
3490 unsigned int register_specifier;
3491 unsigned int implied_prefix;
3492 unsigned int vector_length;
3495 /* Check register specifier. */
3496 if (i.vex.register_specifier)
3498 register_specifier =
3499 ~register_number (i.vex.register_specifier) & 0xf;
3500 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3503 register_specifier = 0xf;
3505 /* Use 2-byte VEX prefix by swapping destination and source operand
3506 if there are more than 1 register operand. */
3507 if (i.reg_operands > 1
3508 && i.vec_encoding != vex_encoding_vex3
3509 && i.dir_encoding == dir_encoding_default
3510 && i.operands == i.reg_operands
3511 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3512 && i.tm.opcode_modifier.vexopcode == VEX0F
3513 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3516 unsigned int xchg = i.operands - 1;
3517 union i386_op temp_op;
3518 i386_operand_type temp_type;
3520 temp_type = i.types[xchg];
3521 i.types[xchg] = i.types[0];
3522 i.types[0] = temp_type;
3523 temp_op = i.op[xchg];
3524 i.op[xchg] = i.op[0];
3527 gas_assert (i.rm.mode == 3);
3531 i.rm.regmem = i.rm.reg;
3534 if (i.tm.opcode_modifier.d)
3535 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3536 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3537 else /* Use the next insn. */
3541 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3542 are no memory operands and at least 3 register ones. */
3543 if (i.reg_operands >= 3
3544 && i.vec_encoding != vex_encoding_vex3
3545 && i.reg_operands == i.operands - i.imm_operands
3546 && i.tm.opcode_modifier.vex
3547 && i.tm.opcode_modifier.commutative
3548 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3550 && i.vex.register_specifier
3551 && !(i.vex.register_specifier->reg_flags & RegRex))
3553 unsigned int xchg = i.operands - i.reg_operands;
3554 union i386_op temp_op;
3555 i386_operand_type temp_type;
3557 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3558 gas_assert (!i.tm.opcode_modifier.sae);
3559 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3560 &i.types[i.operands - 3]));
3561 gas_assert (i.rm.mode == 3);
3563 temp_type = i.types[xchg];
3564 i.types[xchg] = i.types[xchg + 1];
3565 i.types[xchg + 1] = temp_type;
3566 temp_op = i.op[xchg];
3567 i.op[xchg] = i.op[xchg + 1];
3568 i.op[xchg + 1] = temp_op;
3571 xchg = i.rm.regmem | 8;
3572 i.rm.regmem = ~register_specifier & 0xf;
3573 gas_assert (!(i.rm.regmem & 8));
3574 i.vex.register_specifier += xchg - i.rm.regmem;
3575 register_specifier = ~xchg & 0xf;
3578 if (i.tm.opcode_modifier.vex == VEXScalar)
3579 vector_length = avxscalar;
3580 else if (i.tm.opcode_modifier.vex == VEX256)
3586 /* Determine vector length from the last multi-length vector
3589 for (op = t->operands; op--;)
3590 if (t->operand_types[op].bitfield.xmmword
3591 && t->operand_types[op].bitfield.ymmword
3592 && i.types[op].bitfield.ymmword)
3599 switch ((i.tm.base_opcode >> 8) & 0xff)
3604 case DATA_PREFIX_OPCODE:
3607 case REPE_PREFIX_OPCODE:
3610 case REPNE_PREFIX_OPCODE:
3617 /* Check the REX.W bit and VEXW. */
3618 if (i.tm.opcode_modifier.vexw == VEXWIG)
3619 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3620 else if (i.tm.opcode_modifier.vexw)
3621 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3623 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3625 /* Use 2-byte VEX prefix if possible. */
3627 && i.vec_encoding != vex_encoding_vex3
3628 && i.tm.opcode_modifier.vexopcode == VEX0F
3629 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3631 /* 2-byte VEX prefix. */
3635 i.vex.bytes[0] = 0xc5;
3637 /* Check the REX.R bit. */
3638 r = (i.rex & REX_R) ? 0 : 1;
3639 i.vex.bytes[1] = (r << 7
3640 | register_specifier << 3
3641 | vector_length << 2
3646 /* 3-byte VEX prefix. */
3651 switch (i.tm.opcode_modifier.vexopcode)
3655 i.vex.bytes[0] = 0xc4;
3659 i.vex.bytes[0] = 0xc4;
3663 i.vex.bytes[0] = 0xc4;
3667 i.vex.bytes[0] = 0x8f;
3671 i.vex.bytes[0] = 0x8f;
3675 i.vex.bytes[0] = 0x8f;
3681 /* The high 3 bits of the second VEX byte are 1's compliment
3682 of RXB bits from REX. */
3683 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3685 i.vex.bytes[2] = (w << 7
3686 | register_specifier << 3
3687 | vector_length << 2
3692 static INLINE bfd_boolean
3693 is_evex_encoding (const insn_template *t)
3695 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3696 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3697 || t->opcode_modifier.sae;
3700 static INLINE bfd_boolean
3701 is_any_vex_encoding (const insn_template *t)
3703 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3704 || is_evex_encoding (t);
3707 /* Build the EVEX prefix. */
3710 build_evex_prefix (void)
3712 unsigned int register_specifier;
3713 unsigned int implied_prefix;
3715 rex_byte vrex_used = 0;
3717 /* Check register specifier. */
3718 if (i.vex.register_specifier)
3720 gas_assert ((i.vrex & REX_X) == 0);
3722 register_specifier = i.vex.register_specifier->reg_num;
3723 if ((i.vex.register_specifier->reg_flags & RegRex))
3724 register_specifier += 8;
3725 /* The upper 16 registers are encoded in the fourth byte of the
3727 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3728 i.vex.bytes[3] = 0x8;
3729 register_specifier = ~register_specifier & 0xf;
3733 register_specifier = 0xf;
3735 /* Encode upper 16 vector index register in the fourth byte of
3737 if (!(i.vrex & REX_X))
3738 i.vex.bytes[3] = 0x8;
3743 switch ((i.tm.base_opcode >> 8) & 0xff)
3748 case DATA_PREFIX_OPCODE:
3751 case REPE_PREFIX_OPCODE:
3754 case REPNE_PREFIX_OPCODE:
3761 /* 4 byte EVEX prefix. */
3763 i.vex.bytes[0] = 0x62;
3766 switch (i.tm.opcode_modifier.vexopcode)
3782 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3784 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3786 /* The fifth bit of the second EVEX byte is 1's compliment of the
3787 REX_R bit in VREX. */
3788 if (!(i.vrex & REX_R))
3789 i.vex.bytes[1] |= 0x10;
3793 if ((i.reg_operands + i.imm_operands) == i.operands)
3795 /* When all operands are registers, the REX_X bit in REX is not
3796 used. We reuse it to encode the upper 16 registers, which is
3797 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3798 as 1's compliment. */
3799 if ((i.vrex & REX_B))
3802 i.vex.bytes[1] &= ~0x40;
3806 /* EVEX instructions shouldn't need the REX prefix. */
3807 i.vrex &= ~vrex_used;
3808 gas_assert (i.vrex == 0);
3810 /* Check the REX.W bit and VEXW. */
3811 if (i.tm.opcode_modifier.vexw == VEXWIG)
3812 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3813 else if (i.tm.opcode_modifier.vexw)
3814 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3816 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3818 /* Encode the U bit. */
3819 implied_prefix |= 0x4;
3821 /* The third byte of the EVEX prefix. */
3822 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3824 /* The fourth byte of the EVEX prefix. */
3825 /* The zeroing-masking bit. */
3826 if (i.mask && i.mask->zeroing)
3827 i.vex.bytes[3] |= 0x80;
3829 /* Don't always set the broadcast bit if there is no RC. */
3832 /* Encode the vector length. */
3833 unsigned int vec_length;
3835 if (!i.tm.opcode_modifier.evex
3836 || i.tm.opcode_modifier.evex == EVEXDYN)
3840 /* Determine vector length from the last multi-length vector
3843 for (op = i.operands; op--;)
3844 if (i.tm.operand_types[op].bitfield.xmmword
3845 + i.tm.operand_types[op].bitfield.ymmword
3846 + i.tm.operand_types[op].bitfield.zmmword > 1)
3848 if (i.types[op].bitfield.zmmword)
3850 i.tm.opcode_modifier.evex = EVEX512;
3853 else if (i.types[op].bitfield.ymmword)
3855 i.tm.opcode_modifier.evex = EVEX256;
3858 else if (i.types[op].bitfield.xmmword)
3860 i.tm.opcode_modifier.evex = EVEX128;
3863 else if (i.broadcast && (int) op == i.broadcast->operand)
3865 switch (i.broadcast->bytes)
3868 i.tm.opcode_modifier.evex = EVEX512;
3871 i.tm.opcode_modifier.evex = EVEX256;
3874 i.tm.opcode_modifier.evex = EVEX128;
3883 if (op >= MAX_OPERANDS)
3887 switch (i.tm.opcode_modifier.evex)
3889 case EVEXLIG: /* LL' is ignored */
3890 vec_length = evexlig << 5;
3893 vec_length = 0 << 5;
3896 vec_length = 1 << 5;
3899 vec_length = 2 << 5;
3905 i.vex.bytes[3] |= vec_length;
3906 /* Encode the broadcast bit. */
3908 i.vex.bytes[3] |= 0x10;
3912 if (i.rounding->type != saeonly)
3913 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3915 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3918 if (i.mask && i.mask->mask)
3919 i.vex.bytes[3] |= i.mask->mask->reg_num;
3923 process_immext (void)
3927 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3928 which is coded in the same place as an 8-bit immediate field
3929 would be. Here we fake an 8-bit immediate operand from the
3930 opcode suffix stored in tm.extension_opcode.
3932 AVX instructions also use this encoding, for some of
3933 3 argument instructions. */
3935 gas_assert (i.imm_operands <= 1
3937 || (is_any_vex_encoding (&i.tm)
3938 && i.operands <= 4)));
3940 exp = &im_expressions[i.imm_operands++];
3941 i.op[i.operands].imms = exp;
3942 i.types[i.operands] = imm8;
3944 exp->X_op = O_constant;
3945 exp->X_add_number = i.tm.extension_opcode;
3946 i.tm.extension_opcode = None;
3953 switch (i.tm.opcode_modifier.hleprefixok)
3958 as_bad (_("invalid instruction `%s' after `%s'"),
3959 i.tm.name, i.hle_prefix);
3962 if (i.prefix[LOCK_PREFIX])
3964 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3968 case HLEPrefixRelease:
3969 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3971 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3975 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
3977 as_bad (_("memory destination needed for instruction `%s'"
3978 " after `xrelease'"), i.tm.name);
3985 /* Try the shortest encoding by shortening operand size. */
3988 optimize_encoding (void)
3992 if (optimize_for_space
3993 && i.reg_operands == 1
3994 && i.imm_operands == 1
3995 && !i.types[1].bitfield.byte
3996 && i.op[0].imms->X_op == O_constant
3997 && fits_in_imm7 (i.op[0].imms->X_add_number)
3998 && ((i.tm.base_opcode == 0xa8
3999 && i.tm.extension_opcode == None)
4000 || (i.tm.base_opcode == 0xf6
4001 && i.tm.extension_opcode == 0x0)))
4004 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4006 unsigned int base_regnum = i.op[1].regs->reg_num;
4007 if (flag_code == CODE_64BIT || base_regnum < 4)
4009 i.types[1].bitfield.byte = 1;
4010 /* Ignore the suffix. */
4012 /* Convert to byte registers. */
4013 if (i.types[1].bitfield.word)
4015 else if (i.types[1].bitfield.dword)
4019 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4024 else if (flag_code == CODE_64BIT
4025 && ((i.types[1].bitfield.qword
4026 && i.reg_operands == 1
4027 && i.imm_operands == 1
4028 && i.op[0].imms->X_op == O_constant
4029 && ((i.tm.base_opcode == 0xb8
4030 && i.tm.extension_opcode == None
4031 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4032 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4033 && (((i.tm.base_opcode == 0x24
4034 || i.tm.base_opcode == 0xa8)
4035 && i.tm.extension_opcode == None)
4036 || (i.tm.base_opcode == 0x80
4037 && i.tm.extension_opcode == 0x4)
4038 || ((i.tm.base_opcode == 0xf6
4039 || (i.tm.base_opcode | 1) == 0xc7)
4040 && i.tm.extension_opcode == 0x0)))
4041 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4042 && i.tm.base_opcode == 0x83
4043 && i.tm.extension_opcode == 0x4)))
4044 || (i.types[0].bitfield.qword
4045 && ((i.reg_operands == 2
4046 && i.op[0].regs == i.op[1].regs
4047 && ((i.tm.base_opcode == 0x30
4048 || i.tm.base_opcode == 0x28)
4049 && i.tm.extension_opcode == None))
4050 || (i.reg_operands == 1
4052 && i.tm.base_opcode == 0x30
4053 && i.tm.extension_opcode == None)))))
4056 andq $imm31, %r64 -> andl $imm31, %r32
4057 andq $imm7, %r64 -> andl $imm7, %r32
4058 testq $imm31, %r64 -> testl $imm31, %r32
4059 xorq %r64, %r64 -> xorl %r32, %r32
4060 subq %r64, %r64 -> subl %r32, %r32
4061 movq $imm31, %r64 -> movl $imm31, %r32
4062 movq $imm32, %r64 -> movl $imm32, %r32
4064 i.tm.opcode_modifier.norex64 = 1;
4065 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4068 movq $imm31, %r64 -> movl $imm31, %r32
4069 movq $imm32, %r64 -> movl $imm32, %r32
4071 i.tm.operand_types[0].bitfield.imm32 = 1;
4072 i.tm.operand_types[0].bitfield.imm32s = 0;
4073 i.tm.operand_types[0].bitfield.imm64 = 0;
4074 i.types[0].bitfield.imm32 = 1;
4075 i.types[0].bitfield.imm32s = 0;
4076 i.types[0].bitfield.imm64 = 0;
4077 i.types[1].bitfield.dword = 1;
4078 i.types[1].bitfield.qword = 0;
4079 if ((i.tm.base_opcode | 1) == 0xc7)
4082 movq $imm31, %r64 -> movl $imm31, %r32
4084 i.tm.base_opcode = 0xb8;
4085 i.tm.extension_opcode = None;
4086 i.tm.opcode_modifier.w = 0;
4087 i.tm.opcode_modifier.shortform = 1;
4088 i.tm.opcode_modifier.modrm = 0;
4092 else if (optimize > 1
4093 && !optimize_for_space
4094 && i.reg_operands == 2
4095 && i.op[0].regs == i.op[1].regs
4096 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4097 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4098 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4101 andb %rN, %rN -> testb %rN, %rN
4102 andw %rN, %rN -> testw %rN, %rN
4103 andq %rN, %rN -> testq %rN, %rN
4104 orb %rN, %rN -> testb %rN, %rN
4105 orw %rN, %rN -> testw %rN, %rN
4106 orq %rN, %rN -> testq %rN, %rN
4108 and outside of 64-bit mode
4110 andl %rN, %rN -> testl %rN, %rN
4111 orl %rN, %rN -> testl %rN, %rN
4113 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4115 else if (i.reg_operands == 3
4116 && i.op[0].regs == i.op[1].regs
4117 && !i.types[2].bitfield.xmmword
4118 && (i.tm.opcode_modifier.vex
4119 || ((!i.mask || i.mask->zeroing)
4121 && is_evex_encoding (&i.tm)
4122 && (i.vec_encoding != vex_encoding_evex
4123 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4124 || i.tm.cpu_flags.bitfield.cpuavx512vl
4125 || (i.tm.operand_types[2].bitfield.zmmword
4126 && i.types[2].bitfield.ymmword))))
4127 && ((i.tm.base_opcode == 0x55
4128 || i.tm.base_opcode == 0x6655
4129 || i.tm.base_opcode == 0x66df
4130 || i.tm.base_opcode == 0x57
4131 || i.tm.base_opcode == 0x6657
4132 || i.tm.base_opcode == 0x66ef
4133 || i.tm.base_opcode == 0x66f8
4134 || i.tm.base_opcode == 0x66f9
4135 || i.tm.base_opcode == 0x66fa
4136 || i.tm.base_opcode == 0x66fb
4137 || i.tm.base_opcode == 0x42
4138 || i.tm.base_opcode == 0x6642
4139 || i.tm.base_opcode == 0x47
4140 || i.tm.base_opcode == 0x6647)
4141 && i.tm.extension_opcode == None))
4144 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4146 EVEX VOP %zmmM, %zmmM, %zmmN
4147 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4148 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4149 EVEX VOP %ymmM, %ymmM, %ymmN
4150 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4151 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4152 VEX VOP %ymmM, %ymmM, %ymmN
4153 -> VEX VOP %xmmM, %xmmM, %xmmN
4154 VOP, one of vpandn and vpxor:
4155 VEX VOP %ymmM, %ymmM, %ymmN
4156 -> VEX VOP %xmmM, %xmmM, %xmmN
4157 VOP, one of vpandnd and vpandnq:
4158 EVEX VOP %zmmM, %zmmM, %zmmN
4159 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4160 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4161 EVEX VOP %ymmM, %ymmM, %ymmN
4162 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4163 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4164 VOP, one of vpxord and vpxorq:
4165 EVEX VOP %zmmM, %zmmM, %zmmN
4166 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4167 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4168 EVEX VOP %ymmM, %ymmM, %ymmN
4169 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4170 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4171 VOP, one of kxord and kxorq:
4172 VEX VOP %kM, %kM, %kN
4173 -> VEX kxorw %kM, %kM, %kN
4174 VOP, one of kandnd and kandnq:
4175 VEX VOP %kM, %kM, %kN
4176 -> VEX kandnw %kM, %kM, %kN
4178 if (is_evex_encoding (&i.tm))
4180 if (i.vec_encoding != vex_encoding_evex)
4182 i.tm.opcode_modifier.vex = VEX128;
4183 i.tm.opcode_modifier.vexw = VEXW0;
4184 i.tm.opcode_modifier.evex = 0;
4186 else if (optimize > 1)
4187 i.tm.opcode_modifier.evex = EVEX128;
4191 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4193 i.tm.base_opcode &= 0xff;
4194 i.tm.opcode_modifier.vexw = VEXW0;
4197 i.tm.opcode_modifier.vex = VEX128;
4199 if (i.tm.opcode_modifier.vex)
4200 for (j = 0; j < 3; j++)
4202 i.types[j].bitfield.xmmword = 1;
4203 i.types[j].bitfield.ymmword = 0;
4206 else if (i.vec_encoding != vex_encoding_evex
4207 && !i.types[0].bitfield.zmmword
4208 && !i.types[1].bitfield.zmmword
4211 && is_evex_encoding (&i.tm)
4212 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4213 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4214 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4215 || (i.tm.base_opcode & ~4) == 0x66db
4216 || (i.tm.base_opcode & ~4) == 0x66eb)
4217 && i.tm.extension_opcode == None)
4220 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4221 vmovdqu32 and vmovdqu64:
4222 EVEX VOP %xmmM, %xmmN
4223 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4224 EVEX VOP %ymmM, %ymmN
4225 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4227 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4229 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4231 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4233 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4234 VOP, one of vpand, vpandn, vpor, vpxor:
4235 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4236 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4237 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4238 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4239 EVEX VOP{d,q} mem, %xmmM, %xmmN
4240 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4241 EVEX VOP{d,q} mem, %ymmM, %ymmN
4242 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4244 for (j = 0; j < i.operands; j++)
4245 if (operand_type_check (i.types[j], disp)
4246 && i.op[j].disps->X_op == O_constant)
4248 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4249 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4250 bytes, we choose EVEX Disp8 over VEX Disp32. */
4251 int evex_disp8, vex_disp8;
4252 unsigned int memshift = i.memshift;
4253 offsetT n = i.op[j].disps->X_add_number;
4255 evex_disp8 = fits_in_disp8 (n);
4257 vex_disp8 = fits_in_disp8 (n);
4258 if (evex_disp8 != vex_disp8)
4260 i.memshift = memshift;
4264 i.types[j].bitfield.disp8 = vex_disp8;
4267 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4268 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4269 i.tm.opcode_modifier.vex
4270 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4271 i.tm.opcode_modifier.vexw = VEXW0;
4272 /* VPAND, VPOR, and VPXOR are commutative. */
4273 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4274 i.tm.opcode_modifier.commutative = 1;
4275 i.tm.opcode_modifier.evex = 0;
4276 i.tm.opcode_modifier.masking = 0;
4277 i.tm.opcode_modifier.broadcast = 0;
4278 i.tm.opcode_modifier.disp8memshift = 0;
4281 i.types[j].bitfield.disp8
4282 = fits_in_disp8 (i.op[j].disps->X_add_number);
4286 /* This is the guts of the machine-dependent assembler. LINE points to a
4287 machine dependent instruction. This function is supposed to emit
4288 the frags/bytes it assembles to. */
4291 md_assemble (char *line)
4294 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4295 const insn_template *t;
4297 /* Initialize globals. */
4298 memset (&i, '\0', sizeof (i));
4299 for (j = 0; j < MAX_OPERANDS; j++)
4300 i.reloc[j] = NO_RELOC;
4301 memset (disp_expressions, '\0', sizeof (disp_expressions));
4302 memset (im_expressions, '\0', sizeof (im_expressions));
4303 save_stack_p = save_stack;
4305 /* First parse an instruction mnemonic & call i386_operand for the operands.
4306 We assume that the scrubber has arranged it so that line[0] is the valid
4307 start of a (possibly prefixed) mnemonic. */
4309 line = parse_insn (line, mnemonic);
4312 mnem_suffix = i.suffix;
4314 line = parse_operands (line, mnemonic);
4316 xfree (i.memop1_string);
4317 i.memop1_string = NULL;
4321 /* Now we've parsed the mnemonic into a set of templates, and have the
4322 operands at hand. */
4324 /* All intel opcodes have reversed operands except for "bound" and
4325 "enter". We also don't reverse intersegment "jmp" and "call"
4326 instructions with 2 immediate operands so that the immediate segment
4327 precedes the offset, as it does when in AT&T mode. */
4330 && (strcmp (mnemonic, "bound") != 0)
4331 && (strcmp (mnemonic, "invlpga") != 0)
4332 && !(operand_type_check (i.types[0], imm)
4333 && operand_type_check (i.types[1], imm)))
4336 /* The order of the immediates should be reversed
4337 for 2 immediates extrq and insertq instructions */
4338 if (i.imm_operands == 2
4339 && (strcmp (mnemonic, "extrq") == 0
4340 || strcmp (mnemonic, "insertq") == 0))
4341 swap_2_operands (0, 1);
4346 /* Don't optimize displacement for movabs since it only takes 64bit
4349 && i.disp_encoding != disp_encoding_32bit
4350 && (flag_code != CODE_64BIT
4351 || strcmp (mnemonic, "movabs") != 0))
4354 /* Next, we find a template that matches the given insn,
4355 making sure the overlap of the given operands types is consistent
4356 with the template operand types. */
4358 if (!(t = match_template (mnem_suffix)))
4361 if (sse_check != check_none
4362 && !i.tm.opcode_modifier.noavx
4363 && !i.tm.cpu_flags.bitfield.cpuavx
4364 && !i.tm.cpu_flags.bitfield.cpuavx512f
4365 && (i.tm.cpu_flags.bitfield.cpusse
4366 || i.tm.cpu_flags.bitfield.cpusse2
4367 || i.tm.cpu_flags.bitfield.cpusse3
4368 || i.tm.cpu_flags.bitfield.cpussse3
4369 || i.tm.cpu_flags.bitfield.cpusse4_1
4370 || i.tm.cpu_flags.bitfield.cpusse4_2
4371 || i.tm.cpu_flags.bitfield.cpusse4a
4372 || i.tm.cpu_flags.bitfield.cpupclmul
4373 || i.tm.cpu_flags.bitfield.cpuaes
4374 || i.tm.cpu_flags.bitfield.cpusha
4375 || i.tm.cpu_flags.bitfield.cpugfni))
4377 (sse_check == check_warning
4379 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4382 /* Zap movzx and movsx suffix. The suffix has been set from
4383 "word ptr" or "byte ptr" on the source operand in Intel syntax
4384 or extracted from mnemonic in AT&T syntax. But we'll use
4385 the destination register to choose the suffix for encoding. */
4386 if ((i.tm.base_opcode & ~9) == 0x0fb6)
4388 /* In Intel syntax, there must be a suffix. In AT&T syntax, if
4389 there is no suffix, the default will be byte extension. */
4390 if (i.reg_operands != 2
4393 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4398 if (i.tm.opcode_modifier.fwait)
4399 if (!add_prefix (FWAIT_OPCODE))
4402 /* Check if REP prefix is OK. */
4403 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4405 as_bad (_("invalid instruction `%s' after `%s'"),
4406 i.tm.name, i.rep_prefix);
4410 /* Check for lock without a lockable instruction. Destination operand
4411 must be memory unless it is xchg (0x86). */
4412 if (i.prefix[LOCK_PREFIX]
4413 && (!i.tm.opcode_modifier.islockable
4414 || i.mem_operands == 0
4415 || (i.tm.base_opcode != 0x86
4416 && !(i.flags[i.operands - 1] & Operand_Mem))))
4418 as_bad (_("expecting lockable instruction after `lock'"));
4422 /* Check for data size prefix on VEX/XOP/EVEX encoded insns. */
4423 if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4425 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4429 /* Check if HLE prefix is OK. */
4430 if (i.hle_prefix && !check_hle ())
4433 /* Check BND prefix. */
4434 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4435 as_bad (_("expecting valid branch instruction after `bnd'"));
4437 /* Check NOTRACK prefix. */
4438 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4439 as_bad (_("expecting indirect branch instruction after `notrack'"));
4441 if (i.tm.cpu_flags.bitfield.cpumpx)
4443 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4444 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4445 else if (flag_code != CODE_16BIT
4446 ? i.prefix[ADDR_PREFIX]
4447 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4448 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4451 /* Insert BND prefix. */
4452 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4454 if (!i.prefix[BND_PREFIX])
4455 add_prefix (BND_PREFIX_OPCODE);
4456 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4458 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4459 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4463 /* Check string instruction segment overrides. */
4464 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4466 gas_assert (i.mem_operands);
4467 if (!check_string ())
4469 i.disp_operands = 0;
4472 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4473 optimize_encoding ();
4475 if (!process_suffix ())
4478 /* Update operand types. */
4479 for (j = 0; j < i.operands; j++)
4480 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4482 /* Make still unresolved immediate matches conform to size of immediate
4483 given in i.suffix. */
4484 if (!finalize_imm ())
4487 if (i.types[0].bitfield.imm1)
4488 i.imm_operands = 0; /* kludge for shift insns. */
4490 /* We only need to check those implicit registers for instructions
4491 with 3 operands or less. */
4492 if (i.operands <= 3)
4493 for (j = 0; j < i.operands; j++)
4494 if (i.types[j].bitfield.instance != InstanceNone
4495 && !i.types[j].bitfield.xmmword)
4498 /* ImmExt should be processed after SSE2AVX. */
4499 if (!i.tm.opcode_modifier.sse2avx
4500 && i.tm.opcode_modifier.immext)
4503 /* For insns with operands there are more diddles to do to the opcode. */
4506 if (!process_operands ())
4509 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4511 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4512 as_warn (_("translating to `%sp'"), i.tm.name);
4515 if (is_any_vex_encoding (&i.tm))
4517 if (!cpu_arch_flags.bitfield.cpui286)
4519 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4524 if (i.tm.opcode_modifier.vex)
4525 build_vex_prefix (t);
4527 build_evex_prefix ();
4530 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4531 instructions may define INT_OPCODE as well, so avoid this corner
4532 case for those instructions that use MODRM. */
4533 if (i.tm.base_opcode == INT_OPCODE
4534 && !i.tm.opcode_modifier.modrm
4535 && i.op[0].imms->X_add_number == 3)
4537 i.tm.base_opcode = INT3_OPCODE;
4541 if ((i.tm.opcode_modifier.jump == JUMP
4542 || i.tm.opcode_modifier.jump == JUMP_BYTE
4543 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4544 && i.op[0].disps->X_op == O_constant)
4546 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4547 the absolute address given by the constant. Since ix86 jumps and
4548 calls are pc relative, we need to generate a reloc. */
4549 i.op[0].disps->X_add_symbol = &abs_symbol;
4550 i.op[0].disps->X_op = O_symbol;
4553 if (i.tm.opcode_modifier.rex64)
4556 /* For 8 bit registers we need an empty rex prefix. Also if the
4557 instruction already has a prefix, we need to convert old
4558 registers to new ones. */
4560 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4561 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4562 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4563 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4564 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4565 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4570 i.rex |= REX_OPCODE;
4571 for (x = 0; x < 2; x++)
4573 /* Look for 8 bit operand that uses old registers. */
4574 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4575 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4577 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4578 /* In case it is "hi" register, give up. */
4579 if (i.op[x].regs->reg_num > 3)
4580 as_bad (_("can't encode register '%s%s' in an "
4581 "instruction requiring REX prefix."),
4582 register_prefix, i.op[x].regs->reg_name);
4584 /* Otherwise it is equivalent to the extended register.
4585 Since the encoding doesn't change this is merely
4586 cosmetic cleanup for debug output. */
4588 i.op[x].regs = i.op[x].regs + 8;
4593 if (i.rex == 0 && i.rex_encoding)
4595 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4596 that uses legacy register. If it is "hi" register, don't add
4597 the REX_OPCODE byte. */
4599 for (x = 0; x < 2; x++)
4600 if (i.types[x].bitfield.class == Reg
4601 && i.types[x].bitfield.byte
4602 && (i.op[x].regs->reg_flags & RegRex64) == 0
4603 && i.op[x].regs->reg_num > 3)
4605 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4606 i.rex_encoding = FALSE;
4615 add_prefix (REX_OPCODE | i.rex);
4617 /* We are ready to output the insn. */
4620 last_insn.seg = now_seg;
4622 if (i.tm.opcode_modifier.isprefix)
4624 last_insn.kind = last_insn_prefix;
4625 last_insn.name = i.tm.name;
4626 last_insn.file = as_where (&last_insn.line);
4629 last_insn.kind = last_insn_other;
4633 parse_insn (char *line, char *mnemonic)
4636 char *token_start = l;
4639 const insn_template *t;
4645 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4650 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4652 as_bad (_("no such instruction: `%s'"), token_start);
4657 if (!is_space_char (*l)
4658 && *l != END_OF_INSN
4660 || (*l != PREFIX_SEPARATOR
4663 as_bad (_("invalid character %s in mnemonic"),
4664 output_invalid (*l));
4667 if (token_start == l)
4669 if (!intel_syntax && *l == PREFIX_SEPARATOR)
4670 as_bad (_("expecting prefix; got nothing"));
4672 as_bad (_("expecting mnemonic; got nothing"));
4676 /* Look up instruction (or prefix) via hash table. */
4677 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4679 if (*l != END_OF_INSN
4680 && (!is_space_char (*l) || l[1] != END_OF_INSN)
4681 && current_templates
4682 && current_templates->start->opcode_modifier.isprefix)
4684 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4686 as_bad ((flag_code != CODE_64BIT
4687 ? _("`%s' is only supported in 64-bit mode")
4688 : _("`%s' is not supported in 64-bit mode")),
4689 current_templates->start->name);
4692 /* If we are in 16-bit mode, do not allow addr16 or data16.
4693 Similarly, in 32-bit mode, do not allow addr32 or data32. */
4694 if ((current_templates->start->opcode_modifier.size == SIZE16
4695 || current_templates->start->opcode_modifier.size == SIZE32)
4696 && flag_code != CODE_64BIT
4697 && ((current_templates->start->opcode_modifier.size == SIZE32)
4698 ^ (flag_code == CODE_16BIT)))
4700 as_bad (_("redundant %s prefix"),
4701 current_templates->start->name);
4704 if (current_templates->start->opcode_length == 0)
4706 /* Handle pseudo prefixes. */
4707 switch (current_templates->start->base_opcode)
4711 i.disp_encoding = disp_encoding_8bit;
4715 i.disp_encoding = disp_encoding_32bit;
4719 i.dir_encoding = dir_encoding_load;
4723 i.dir_encoding = dir_encoding_store;
4727 i.vec_encoding = vex_encoding_vex2;
4731 i.vec_encoding = vex_encoding_vex3;
4735 i.vec_encoding = vex_encoding_evex;
4739 i.rex_encoding = TRUE;
4743 i.no_optimize = TRUE;
4751 /* Add prefix, checking for repeated prefixes. */
4752 switch (add_prefix (current_templates->start->base_opcode))
4757 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4758 i.notrack_prefix = current_templates->start->name;
4761 if (current_templates->start->cpu_flags.bitfield.cpuhle)
4762 i.hle_prefix = current_templates->start->name;
4763 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4764 i.bnd_prefix = current_templates->start->name;
4766 i.rep_prefix = current_templates->start->name;
4772 /* Skip past PREFIX_SEPARATOR and reset token_start. */
4779 if (!current_templates)
4781 /* Deprecated functionality (new code should use pseudo-prefixes instead):
4782 Check if we should swap operand or force 32bit displacement in
4784 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4785 i.dir_encoding = dir_encoding_swap;
4786 else if (mnem_p - 3 == dot_p
4789 i.disp_encoding = disp_encoding_8bit;
4790 else if (mnem_p - 4 == dot_p
4794 i.disp_encoding = disp_encoding_32bit;
4799 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4802 if (!current_templates)
4805 if (mnem_p > mnemonic)
4807 /* See if we can get a match by trimming off a suffix. */
4810 case WORD_MNEM_SUFFIX:
4811 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4812 i.suffix = SHORT_MNEM_SUFFIX;
4815 case BYTE_MNEM_SUFFIX:
4816 case QWORD_MNEM_SUFFIX:
4817 i.suffix = mnem_p[-1];
4819 current_templates = (const templates *) hash_find (op_hash,
4822 case SHORT_MNEM_SUFFIX:
4823 case LONG_MNEM_SUFFIX:
4826 i.suffix = mnem_p[-1];
4828 current_templates = (const templates *) hash_find (op_hash,
4837 if (intel_float_operand (mnemonic) == 1)
4838 i.suffix = SHORT_MNEM_SUFFIX;
4840 i.suffix = LONG_MNEM_SUFFIX;
4842 current_templates = (const templates *) hash_find (op_hash,
4849 if (!current_templates)
4851 as_bad (_("no such instruction: `%s'"), token_start);
4856 if (current_templates->start->opcode_modifier.jump == JUMP
4857 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
4859 /* Check for a branch hint. We allow ",pt" and ",pn" for
4860 predict taken and predict not taken respectively.
4861 I'm not sure that branch hints actually do anything on loop
4862 and jcxz insns (JumpByte) for current Pentium4 chips. They
4863 may work in the future and it doesn't hurt to accept them
4865 if (l[0] == ',' && l[1] == 'p')
4869 if (!add_prefix (DS_PREFIX_OPCODE))
4873 else if (l[2] == 'n')
4875 if (!add_prefix (CS_PREFIX_OPCODE))
4881 /* Any other comma loses. */
4884 as_bad (_("invalid character %s in mnemonic"),
4885 output_invalid (*l));
4889 /* Check if instruction is supported on specified architecture. */
4891 for (t = current_templates->start; t < current_templates->end; ++t)
4893 supported |= cpu_flags_match (t);
4894 if (supported == CPU_FLAGS_PERFECT_MATCH)
4896 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4897 as_warn (_("use .code16 to ensure correct addressing mode"));
4903 if (!(supported & CPU_FLAGS_64BIT_MATCH))
4904 as_bad (flag_code == CODE_64BIT
4905 ? _("`%s' is not supported in 64-bit mode")
4906 : _("`%s' is only supported in 64-bit mode"),
4907 current_templates->start->name);
4909 as_bad (_("`%s' is not supported on `%s%s'"),
4910 current_templates->start->name,
4911 cpu_arch_name ? cpu_arch_name : default_arch,
4912 cpu_sub_arch_name ? cpu_sub_arch_name : "");
4918 parse_operands (char *l, const char *mnemonic)
4922 /* 1 if operand is pending after ','. */
4923 unsigned int expecting_operand = 0;
4925 /* Non-zero if operand parens not balanced. */
4926 unsigned int paren_not_balanced;
4928 while (*l != END_OF_INSN)
4930 /* Skip optional white space before operand. */
4931 if (is_space_char (*l))
4933 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4935 as_bad (_("invalid character %s before operand %d"),
4936 output_invalid (*l),
4940 token_start = l; /* After white space. */
4941 paren_not_balanced = 0;
4942 while (paren_not_balanced || *l != ',')
4944 if (*l == END_OF_INSN)
4946 if (paren_not_balanced)
4949 as_bad (_("unbalanced parenthesis in operand %d."),
4952 as_bad (_("unbalanced brackets in operand %d."),
4957 break; /* we are done */
4959 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4961 as_bad (_("invalid character %s in operand %d"),
4962 output_invalid (*l),
4969 ++paren_not_balanced;
4971 --paren_not_balanced;
4976 ++paren_not_balanced;
4978 --paren_not_balanced;
4982 if (l != token_start)
4983 { /* Yes, we've read in another operand. */
4984 unsigned int operand_ok;
4985 this_operand = i.operands++;
4986 if (i.operands > MAX_OPERANDS)
4988 as_bad (_("spurious operands; (%d operands/instruction max)"),
4992 i.types[this_operand].bitfield.unspecified = 1;
4993 /* Now parse operand adding info to 'i' as we go along. */
4994 END_STRING_AND_SAVE (l);
4996 if (i.mem_operands > 1)
4998 as_bad (_("too many memory references for `%s'"),
5005 i386_intel_operand (token_start,
5006 intel_float_operand (mnemonic));
5008 operand_ok = i386_att_operand (token_start);
5010 RESTORE_END_STRING (l);
5016 if (expecting_operand)
5018 expecting_operand_after_comma:
5019 as_bad (_("expecting operand after ','; got nothing"));
5024 as_bad (_("expecting operand before ','; got nothing"));
5029 /* Now *l must be either ',' or END_OF_INSN. */
5032 if (*++l == END_OF_INSN)
5034 /* Just skip it, if it's \n complain. */
5035 goto expecting_operand_after_comma;
5037 expecting_operand = 1;
5044 swap_2_operands (int xchg1, int xchg2)
5046 union i386_op temp_op;
5047 i386_operand_type temp_type;
5048 unsigned int temp_flags;
5049 enum bfd_reloc_code_real temp_reloc;
5051 temp_type = i.types[xchg2];
5052 i.types[xchg2] = i.types[xchg1];
5053 i.types[xchg1] = temp_type;
5055 temp_flags = i.flags[xchg2];
5056 i.flags[xchg2] = i.flags[xchg1];
5057 i.flags[xchg1] = temp_flags;
5059 temp_op = i.op[xchg2];
5060 i.op[xchg2] = i.op[xchg1];
5061 i.op[xchg1] = temp_op;
5063 temp_reloc = i.reloc[xchg2];
5064 i.reloc[xchg2] = i.reloc[xchg1];
5065 i.reloc[xchg1] = temp_reloc;
5069 if (i.mask->operand == xchg1)
5070 i.mask->operand = xchg2;
5071 else if (i.mask->operand == xchg2)
5072 i.mask->operand = xchg1;
5076 if (i.broadcast->operand == xchg1)
5077 i.broadcast->operand = xchg2;
5078 else if (i.broadcast->operand == xchg2)
5079 i.broadcast->operand = xchg1;
5083 if (i.rounding->operand == xchg1)
5084 i.rounding->operand = xchg2;
5085 else if (i.rounding->operand == xchg2)
5086 i.rounding->operand = xchg1;
5091 swap_operands (void)
5097 swap_2_operands (1, i.operands - 2);
5101 swap_2_operands (0, i.operands - 1);
5107 if (i.mem_operands == 2)
5109 const seg_entry *temp_seg;
5110 temp_seg = i.seg[0];
5111 i.seg[0] = i.seg[1];
5112 i.seg[1] = temp_seg;
5116 /* Try to ensure constant immediates are represented in the smallest
5121 char guess_suffix = 0;
5125 guess_suffix = i.suffix;
5126 else if (i.reg_operands)
5128 /* Figure out a suffix from the last register operand specified.
5129 We can't do this properly yet, i.e. excluding special register
5130 instances, but the following works for instructions with
5131 immediates. In any case, we can't set i.suffix yet. */
5132 for (op = i.operands; --op >= 0;)
5133 if (i.types[op].bitfield.class != Reg)
5135 else if (i.types[op].bitfield.byte)
5137 guess_suffix = BYTE_MNEM_SUFFIX;
5140 else if (i.types[op].bitfield.word)
5142 guess_suffix = WORD_MNEM_SUFFIX;
5145 else if (i.types[op].bitfield.dword)
5147 guess_suffix = LONG_MNEM_SUFFIX;
5150 else if (i.types[op].bitfield.qword)
5152 guess_suffix = QWORD_MNEM_SUFFIX;
5156 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5157 guess_suffix = WORD_MNEM_SUFFIX;
5159 for (op = i.operands; --op >= 0;)
5160 if (operand_type_check (i.types[op], imm))
5162 switch (i.op[op].imms->X_op)
5165 /* If a suffix is given, this operand may be shortened. */
5166 switch (guess_suffix)
5168 case LONG_MNEM_SUFFIX:
5169 i.types[op].bitfield.imm32 = 1;
5170 i.types[op].bitfield.imm64 = 1;
5172 case WORD_MNEM_SUFFIX:
5173 i.types[op].bitfield.imm16 = 1;
5174 i.types[op].bitfield.imm32 = 1;
5175 i.types[op].bitfield.imm32s = 1;
5176 i.types[op].bitfield.imm64 = 1;
5178 case BYTE_MNEM_SUFFIX:
5179 i.types[op].bitfield.imm8 = 1;
5180 i.types[op].bitfield.imm8s = 1;
5181 i.types[op].bitfield.imm16 = 1;
5182 i.types[op].bitfield.imm32 = 1;
5183 i.types[op].bitfield.imm32s = 1;
5184 i.types[op].bitfield.imm64 = 1;
5188 /* If this operand is at most 16 bits, convert it
5189 to a signed 16 bit number before trying to see
5190 whether it will fit in an even smaller size.
5191 This allows a 16-bit operand such as $0xffe0 to
5192 be recognised as within Imm8S range. */
5193 if ((i.types[op].bitfield.imm16)
5194 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5196 i.op[op].imms->X_add_number =
5197 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5200 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5201 if ((i.types[op].bitfield.imm32)
5202 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5205 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5206 ^ ((offsetT) 1 << 31))
5207 - ((offsetT) 1 << 31));
5211 = operand_type_or (i.types[op],
5212 smallest_imm_type (i.op[op].imms->X_add_number));
5214 /* We must avoid matching of Imm32 templates when 64bit
5215 only immediate is available. */
5216 if (guess_suffix == QWORD_MNEM_SUFFIX)
5217 i.types[op].bitfield.imm32 = 0;
5224 /* Symbols and expressions. */
5226 /* Convert symbolic operand to proper sizes for matching, but don't
5227 prevent matching a set of insns that only supports sizes other
5228 than those matching the insn suffix. */
5230 i386_operand_type mask, allowed;
5231 const insn_template *t;
5233 operand_type_set (&mask, 0);
5234 operand_type_set (&allowed, 0);
5236 for (t = current_templates->start;
5237 t < current_templates->end;
5240 allowed = operand_type_or (allowed, t->operand_types[op]);
5241 allowed = operand_type_and (allowed, anyimm);
5243 switch (guess_suffix)
5245 case QWORD_MNEM_SUFFIX:
5246 mask.bitfield.imm64 = 1;
5247 mask.bitfield.imm32s = 1;
5249 case LONG_MNEM_SUFFIX:
5250 mask.bitfield.imm32 = 1;
5252 case WORD_MNEM_SUFFIX:
5253 mask.bitfield.imm16 = 1;
5255 case BYTE_MNEM_SUFFIX:
5256 mask.bitfield.imm8 = 1;
5261 allowed = operand_type_and (mask, allowed);
5262 if (!operand_type_all_zero (&allowed))
5263 i.types[op] = operand_type_and (i.types[op], mask);
5270 /* Try to use the smallest displacement type too. */
5272 optimize_disp (void)
5276 for (op = i.operands; --op >= 0;)
5277 if (operand_type_check (i.types[op], disp))
5279 if (i.op[op].disps->X_op == O_constant)
5281 offsetT op_disp = i.op[op].disps->X_add_number;
5283 if (i.types[op].bitfield.disp16
5284 && (op_disp & ~(offsetT) 0xffff) == 0)
5286 /* If this operand is at most 16 bits, convert
5287 to a signed 16 bit number and don't use 64bit
5289 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5290 i.types[op].bitfield.disp64 = 0;
5293 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5294 if (i.types[op].bitfield.disp32
5295 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5297 /* If this operand is at most 32 bits, convert
5298 to a signed 32 bit number and don't use 64bit
5300 op_disp &= (((offsetT) 2 << 31) - 1);
5301 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5302 i.types[op].bitfield.disp64 = 0;
5305 if (!op_disp && i.types[op].bitfield.baseindex)
5307 i.types[op].bitfield.disp8 = 0;
5308 i.types[op].bitfield.disp16 = 0;
5309 i.types[op].bitfield.disp32 = 0;
5310 i.types[op].bitfield.disp32s = 0;
5311 i.types[op].bitfield.disp64 = 0;
5315 else if (flag_code == CODE_64BIT)
5317 if (fits_in_signed_long (op_disp))
5319 i.types[op].bitfield.disp64 = 0;
5320 i.types[op].bitfield.disp32s = 1;
5322 if (i.prefix[ADDR_PREFIX]
5323 && fits_in_unsigned_long (op_disp))
5324 i.types[op].bitfield.disp32 = 1;
5326 if ((i.types[op].bitfield.disp32
5327 || i.types[op].bitfield.disp32s
5328 || i.types[op].bitfield.disp16)
5329 && fits_in_disp8 (op_disp))
5330 i.types[op].bitfield.disp8 = 1;
5332 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5333 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5335 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5336 i.op[op].disps, 0, i.reloc[op]);
5337 i.types[op].bitfield.disp8 = 0;
5338 i.types[op].bitfield.disp16 = 0;
5339 i.types[op].bitfield.disp32 = 0;
5340 i.types[op].bitfield.disp32s = 0;
5341 i.types[op].bitfield.disp64 = 0;
5344 /* We only support 64bit displacement on constants. */
5345 i.types[op].bitfield.disp64 = 0;
5349 /* Return 1 if there is a match in broadcast bytes between operand
5350 GIVEN and instruction template T. */
5353 match_broadcast_size (const insn_template *t, unsigned int given)
5355 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5356 && i.types[given].bitfield.byte)
5357 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5358 && i.types[given].bitfield.word)
5359 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5360 && i.types[given].bitfield.dword)
5361 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5362 && i.types[given].bitfield.qword));
5365 /* Check if operands are valid for the instruction. */
5368 check_VecOperands (const insn_template *t)
5372 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
5374 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5375 any one operand are implicity requiring AVX512VL support if the actual
5376 operand size is YMMword or XMMword. Since this function runs after
5377 template matching, there's no need to check for YMMword/XMMword in
5379 cpu = cpu_flags_and (t->cpu_flags, avx512);
5380 if (!cpu_flags_all_zero (&cpu)
5381 && !t->cpu_flags.bitfield.cpuavx512vl
5382 && !cpu_arch_flags.bitfield.cpuavx512vl)
5384 for (op = 0; op < t->operands; ++op)
5386 if (t->operand_types[op].bitfield.zmmword
5387 && (i.types[op].bitfield.ymmword
5388 || i.types[op].bitfield.xmmword))
5390 i.error = unsupported;
5396 /* Without VSIB byte, we can't have a vector register for index. */
5397 if (!t->opcode_modifier.vecsib
5399 && (i.index_reg->reg_type.bitfield.xmmword
5400 || i.index_reg->reg_type.bitfield.ymmword
5401 || i.index_reg->reg_type.bitfield.zmmword))
5403 i.error = unsupported_vector_index_register;
5407 /* Check if default mask is allowed. */
5408 if (t->opcode_modifier.nodefmask
5409 && (!i.mask || i.mask->mask->reg_num == 0))
5411 i.error = no_default_mask;
5415 /* For VSIB byte, we need a vector register for index, and all vector
5416 registers must be distinct. */
5417 if (t->opcode_modifier.vecsib)
5420 || !((t->opcode_modifier.vecsib == VecSIB128
5421 && i.index_reg->reg_type.bitfield.xmmword)
5422 || (t->opcode_modifier.vecsib == VecSIB256
5423 && i.index_reg->reg_type.bitfield.ymmword)
5424 || (t->opcode_modifier.vecsib == VecSIB512
5425 && i.index_reg->reg_type.bitfield.zmmword)))
5427 i.error = invalid_vsib_address;
5431 gas_assert (i.reg_operands == 2 || i.mask);
5432 if (i.reg_operands == 2 && !i.mask)
5434 gas_assert (i.types[0].bitfield.class == RegSIMD);
5435 gas_assert (i.types[0].bitfield.xmmword
5436 || i.types[0].bitfield.ymmword);
5437 gas_assert (i.types[2].bitfield.class == RegSIMD);
5438 gas_assert (i.types[2].bitfield.xmmword
5439 || i.types[2].bitfield.ymmword);
5440 if (operand_check == check_none)
5442 if (register_number (i.op[0].regs)
5443 != register_number (i.index_reg)
5444 && register_number (i.op[2].regs)
5445 != register_number (i.index_reg)
5446 && register_number (i.op[0].regs)
5447 != register_number (i.op[2].regs))
5449 if (operand_check == check_error)
5451 i.error = invalid_vector_register_set;
5454 as_warn (_("mask, index, and destination registers should be distinct"));
5456 else if (i.reg_operands == 1 && i.mask)
5458 if (i.types[1].bitfield.class == RegSIMD
5459 && (i.types[1].bitfield.xmmword
5460 || i.types[1].bitfield.ymmword
5461 || i.types[1].bitfield.zmmword)
5462 && (register_number (i.op[1].regs)
5463 == register_number (i.index_reg)))
5465 if (operand_check == check_error)
5467 i.error = invalid_vector_register_set;
5470 if (operand_check != check_none)
5471 as_warn (_("index and destination registers should be distinct"));
5476 /* Check if broadcast is supported by the instruction and is applied
5477 to the memory operand. */
5480 i386_operand_type type, overlap;
5482 /* Check if specified broadcast is supported in this instruction,
5483 and its broadcast bytes match the memory operand. */
5484 op = i.broadcast->operand;
5485 if (!t->opcode_modifier.broadcast
5486 || !(i.flags[op] & Operand_Mem)
5487 || (!i.types[op].bitfield.unspecified
5488 && !match_broadcast_size (t, op)))
5491 i.error = unsupported_broadcast;
5495 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5496 * i.broadcast->type);
5497 operand_type_set (&type, 0);
5498 switch (i.broadcast->bytes)
5501 type.bitfield.word = 1;
5504 type.bitfield.dword = 1;
5507 type.bitfield.qword = 1;
5510 type.bitfield.xmmword = 1;
5513 type.bitfield.ymmword = 1;
5516 type.bitfield.zmmword = 1;
5522 overlap = operand_type_and (type, t->operand_types[op]);
5523 if (operand_type_all_zero (&overlap))
5526 if (t->opcode_modifier.checkregsize)
5530 type.bitfield.baseindex = 1;
5531 for (j = 0; j < i.operands; ++j)
5534 && !operand_type_register_match(i.types[j],
5535 t->operand_types[j],
5537 t->operand_types[op]))
5542 /* If broadcast is supported in this instruction, we need to check if
5543 operand of one-element size isn't specified without broadcast. */
5544 else if (t->opcode_modifier.broadcast && i.mem_operands)
5546 /* Find memory operand. */
5547 for (op = 0; op < i.operands; op++)
5548 if (i.flags[op] & Operand_Mem)
5550 gas_assert (op < i.operands);
5551 /* Check size of the memory operand. */
5552 if (match_broadcast_size (t, op))
5554 i.error = broadcast_needed;
5559 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5561 /* Check if requested masking is supported. */
5564 switch (t->opcode_modifier.masking)
5568 case MERGING_MASKING:
5569 if (i.mask->zeroing)
5572 i.error = unsupported_masking;
5576 case DYNAMIC_MASKING:
5577 /* Memory destinations allow only merging masking. */
5578 if (i.mask->zeroing && i.mem_operands)
5580 /* Find memory operand. */
5581 for (op = 0; op < i.operands; op++)
5582 if (i.flags[op] & Operand_Mem)
5584 gas_assert (op < i.operands);
5585 if (op == i.operands - 1)
5587 i.error = unsupported_masking;
5597 /* Check if masking is applied to dest operand. */
5598 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5600 i.error = mask_not_on_destination;
5607 if (!t->opcode_modifier.sae
5608 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5610 i.error = unsupported_rc_sae;
5613 /* If the instruction has several immediate operands and one of
5614 them is rounding, the rounding operand should be the last
5615 immediate operand. */
5616 if (i.imm_operands > 1
5617 && i.rounding->operand != (int) (i.imm_operands - 1))
5619 i.error = rc_sae_operand_not_last_imm;
5624 /* Check vector Disp8 operand. */
5625 if (t->opcode_modifier.disp8memshift
5626 && i.disp_encoding != disp_encoding_32bit)
5629 i.memshift = t->opcode_modifier.broadcast - 1;
5630 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5631 i.memshift = t->opcode_modifier.disp8memshift;
5634 const i386_operand_type *type = NULL;
5637 for (op = 0; op < i.operands; op++)
5638 if (i.flags[op] & Operand_Mem)
5640 if (t->opcode_modifier.evex == EVEXLIG)
5641 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5642 else if (t->operand_types[op].bitfield.xmmword
5643 + t->operand_types[op].bitfield.ymmword
5644 + t->operand_types[op].bitfield.zmmword <= 1)
5645 type = &t->operand_types[op];
5646 else if (!i.types[op].bitfield.unspecified)
5647 type = &i.types[op];
5649 else if (i.types[op].bitfield.class == RegSIMD
5650 && t->opcode_modifier.evex != EVEXLIG)
5652 if (i.types[op].bitfield.zmmword)
5654 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5656 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5662 if (type->bitfield.zmmword)
5664 else if (type->bitfield.ymmword)
5666 else if (type->bitfield.xmmword)
5670 /* For the check in fits_in_disp8(). */
5671 if (i.memshift == 0)
5675 for (op = 0; op < i.operands; op++)
5676 if (operand_type_check (i.types[op], disp)
5677 && i.op[op].disps->X_op == O_constant)
5679 if (fits_in_disp8 (i.op[op].disps->X_add_number))
5681 i.types[op].bitfield.disp8 = 1;
5684 i.types[op].bitfield.disp8 = 0;
5693 /* Check if operands are valid for the instruction. Update VEX
5697 VEX_check_operands (const insn_template *t)
5699 if (i.vec_encoding == vex_encoding_evex)
5701 /* This instruction must be encoded with EVEX prefix. */
5702 if (!is_evex_encoding (t))
5704 i.error = unsupported;
5710 if (!t->opcode_modifier.vex)
5712 /* This instruction template doesn't have VEX prefix. */
5713 if (i.vec_encoding != vex_encoding_default)
5715 i.error = unsupported;
5721 /* Check the special Imm4 cases; must be the first operand. */
5722 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
5724 if (i.op[0].imms->X_op != O_constant
5725 || !fits_in_imm4 (i.op[0].imms->X_add_number))
5731 /* Turn off Imm<N> so that update_imm won't complain. */
5732 operand_type_set (&i.types[0], 0);
5738 static const insn_template *
5739 match_template (char mnem_suffix)
5741 /* Points to template once we've found it. */
5742 const insn_template *t;
5743 i386_operand_type overlap0, overlap1, overlap2, overlap3;
5744 i386_operand_type overlap4;
5745 unsigned int found_reverse_match;
5746 i386_opcode_modifier suffix_check;
5747 i386_operand_type operand_types [MAX_OPERANDS];
5748 int addr_prefix_disp;
5750 unsigned int found_cpu_match, size_match;
5751 unsigned int check_register;
5752 enum i386_error specific_error = 0;
5754 #if MAX_OPERANDS != 5
5755 # error "MAX_OPERANDS must be 5."
5758 found_reverse_match = 0;
5759 addr_prefix_disp = -1;
5761 /* Prepare for mnemonic suffix check. */
5762 memset (&suffix_check, 0, sizeof (suffix_check));
5763 switch (mnem_suffix)
5765 case BYTE_MNEM_SUFFIX:
5766 suffix_check.no_bsuf = 1;
5768 case WORD_MNEM_SUFFIX:
5769 suffix_check.no_wsuf = 1;
5771 case SHORT_MNEM_SUFFIX:
5772 suffix_check.no_ssuf = 1;
5774 case LONG_MNEM_SUFFIX:
5775 suffix_check.no_lsuf = 1;
5777 case QWORD_MNEM_SUFFIX:
5778 suffix_check.no_qsuf = 1;
5781 /* NB: In Intel syntax, normally we can check for memory operand
5782 size when there is no mnemonic suffix. But jmp and call have
5783 2 different encodings with Dword memory operand size, one with
5784 No_ldSuf and the other without. i.suffix is set to
5785 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
5786 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5787 suffix_check.no_ldsuf = 1;
5790 /* Must have right number of operands. */
5791 i.error = number_of_operands_mismatch;
5793 for (t = current_templates->start; t < current_templates->end; t++)
5795 addr_prefix_disp = -1;
5796 found_reverse_match = 0;
5798 if (i.operands != t->operands)
5801 /* Check processor support. */
5802 i.error = unsupported;
5803 found_cpu_match = (cpu_flags_match (t)
5804 == CPU_FLAGS_PERFECT_MATCH);
5805 if (!found_cpu_match)
5808 /* Check AT&T mnemonic. */
5809 i.error = unsupported_with_intel_mnemonic;
5810 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5813 /* Check AT&T/Intel syntax and Intel64/AMD64 ISA. */
5814 i.error = unsupported_syntax;
5815 if ((intel_syntax && t->opcode_modifier.attsyntax)
5816 || (!intel_syntax && t->opcode_modifier.intelsyntax)
5817 || (intel64 && t->opcode_modifier.amd64)
5818 || (!intel64 && t->opcode_modifier.intel64))
5821 /* Check the suffix. */
5822 i.error = invalid_instruction_suffix;
5823 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5824 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5825 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5826 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5827 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5828 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
5831 size_match = operand_size_match (t);
5835 /* This is intentionally not
5837 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
5839 as the case of a missing * on the operand is accepted (perhaps with
5840 a warning, issued further down). */
5841 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5843 i.error = operand_type_mismatch;
5847 for (j = 0; j < MAX_OPERANDS; j++)
5848 operand_types[j] = t->operand_types[j];
5850 /* In general, don't allow 64-bit operands in 32-bit mode. */
5851 if (i.suffix == QWORD_MNEM_SUFFIX
5852 && flag_code != CODE_64BIT
5854 ? (!t->opcode_modifier.ignoresize
5855 && !t->opcode_modifier.broadcast
5856 && !intel_float_operand (t->name))
5857 : intel_float_operand (t->name) != 2)
5858 && ((operand_types[0].bitfield.class != RegMMX
5859 && operand_types[0].bitfield.class != RegSIMD)
5860 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5861 && operand_types[t->operands > 1].bitfield.class != RegSIMD))
5862 && (t->base_opcode != 0x0fc7
5863 || t->extension_opcode != 1 /* cmpxchg8b */))
5866 /* In general, don't allow 32-bit operands on pre-386. */
5867 else if (i.suffix == LONG_MNEM_SUFFIX
5868 && !cpu_arch_flags.bitfield.cpui386
5870 ? (!t->opcode_modifier.ignoresize
5871 && !intel_float_operand (t->name))
5872 : intel_float_operand (t->name) != 2)
5873 && ((operand_types[0].bitfield.class != RegMMX
5874 && operand_types[0].bitfield.class != RegSIMD)
5875 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5876 && operand_types[t->operands > 1].bitfield.class
5880 /* Do not verify operands when there are none. */
5884 /* We've found a match; break out of loop. */
5888 if (!t->opcode_modifier.jump
5889 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
5891 /* There should be only one Disp operand. */
5892 for (j = 0; j < MAX_OPERANDS; j++)
5893 if (operand_type_check (operand_types[j], disp))
5895 if (j < MAX_OPERANDS)
5897 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
5899 addr_prefix_disp = j;
5901 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
5902 operand into Disp32/Disp32/Disp16/Disp32 operand. */
5906 override = !override;
5909 if (operand_types[j].bitfield.disp32
5910 && operand_types[j].bitfield.disp16)
5912 operand_types[j].bitfield.disp16 = override;
5913 operand_types[j].bitfield.disp32 = !override;
5915 operand_types[j].bitfield.disp32s = 0;
5916 operand_types[j].bitfield.disp64 = 0;
5920 if (operand_types[j].bitfield.disp32s
5921 || operand_types[j].bitfield.disp64)
5923 operand_types[j].bitfield.disp64 &= !override;
5924 operand_types[j].bitfield.disp32s &= !override;
5925 operand_types[j].bitfield.disp32 = override;
5927 operand_types[j].bitfield.disp16 = 0;
5933 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
5934 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5937 /* We check register size if needed. */
5938 if (t->opcode_modifier.checkregsize)
5940 check_register = (1 << t->operands) - 1;
5942 check_register &= ~(1 << i.broadcast->operand);
5947 overlap0 = operand_type_and (i.types[0], operand_types[0]);
5948 switch (t->operands)
5951 if (!operand_type_match (overlap0, i.types[0]))
5955 /* xchg %eax, %eax is a special case. It is an alias for nop
5956 only in 32bit mode and we can use opcode 0x90. In 64bit
5957 mode, we can't use 0x90 for xchg %eax, %eax since it should
5958 zero-extend %eax to %rax. */
5959 if (flag_code == CODE_64BIT
5960 && t->base_opcode == 0x90
5961 && i.types[0].bitfield.instance == Accum
5962 && i.types[0].bitfield.dword
5963 && i.types[1].bitfield.instance == Accum
5964 && i.types[1].bitfield.dword)
5966 /* xrelease mov %eax, <disp> is another special case. It must not
5967 match the accumulator-only encoding of mov. */
5968 if (flag_code != CODE_64BIT
5970 && t->base_opcode == 0xa0
5971 && i.types[0].bitfield.instance == Accum
5972 && (i.flags[1] & Operand_Mem))
5977 if (!(size_match & MATCH_STRAIGHT))
5979 /* Reverse direction of operands if swapping is possible in the first
5980 place (operands need to be symmetric) and
5981 - the load form is requested, and the template is a store form,
5982 - the store form is requested, and the template is a load form,
5983 - the non-default (swapped) form is requested. */
5984 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5985 if (t->opcode_modifier.d && i.reg_operands == i.operands
5986 && !operand_type_all_zero (&overlap1))
5987 switch (i.dir_encoding)
5989 case dir_encoding_load:
5990 if (operand_type_check (operand_types[i.operands - 1], anymem)
5991 || t->opcode_modifier.regmem)
5995 case dir_encoding_store:
5996 if (!operand_type_check (operand_types[i.operands - 1], anymem)
5997 && !t->opcode_modifier.regmem)
6001 case dir_encoding_swap:
6004 case dir_encoding_default:
6007 /* If we want store form, we skip the current load. */
6008 if ((i.dir_encoding == dir_encoding_store
6009 || i.dir_encoding == dir_encoding_swap)
6010 && i.mem_operands == 0
6011 && t->opcode_modifier.load)
6016 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6017 if (!operand_type_match (overlap0, i.types[0])
6018 || !operand_type_match (overlap1, i.types[1])
6019 || ((check_register & 3) == 3
6020 && !operand_type_register_match (i.types[0],
6025 /* Check if other direction is valid ... */
6026 if (!t->opcode_modifier.d)
6030 if (!(size_match & MATCH_REVERSE))
6032 /* Try reversing direction of operands. */
6033 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6034 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6035 if (!operand_type_match (overlap0, i.types[0])
6036 || !operand_type_match (overlap1, i.types[i.operands - 1])
6038 && !operand_type_register_match (i.types[0],
6039 operand_types[i.operands - 1],
6040 i.types[i.operands - 1],
6043 /* Does not match either direction. */
6046 /* found_reverse_match holds which of D or FloatR
6048 if (!t->opcode_modifier.d)
6049 found_reverse_match = 0;
6050 else if (operand_types[0].bitfield.tbyte)
6051 found_reverse_match = Opcode_FloatD;
6052 else if (operand_types[0].bitfield.xmmword
6053 || operand_types[i.operands - 1].bitfield.xmmword
6054 || operand_types[0].bitfield.class == RegMMX
6055 || operand_types[i.operands - 1].bitfield.class == RegMMX
6056 || is_any_vex_encoding(t))
6057 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6058 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6060 found_reverse_match = Opcode_D;
6061 if (t->opcode_modifier.floatr)
6062 found_reverse_match |= Opcode_FloatR;
6066 /* Found a forward 2 operand match here. */
6067 switch (t->operands)
6070 overlap4 = operand_type_and (i.types[4],
6074 overlap3 = operand_type_and (i.types[3],
6078 overlap2 = operand_type_and (i.types[2],
6083 switch (t->operands)
6086 if (!operand_type_match (overlap4, i.types[4])
6087 || !operand_type_register_match (i.types[3],
6094 if (!operand_type_match (overlap3, i.types[3])
6095 || ((check_register & 0xa) == 0xa
6096 && !operand_type_register_match (i.types[1],
6100 || ((check_register & 0xc) == 0xc
6101 && !operand_type_register_match (i.types[2],
6108 /* Here we make use of the fact that there are no
6109 reverse match 3 operand instructions. */
6110 if (!operand_type_match (overlap2, i.types[2])
6111 || ((check_register & 5) == 5
6112 && !operand_type_register_match (i.types[0],
6116 || ((check_register & 6) == 6
6117 && !operand_type_register_match (i.types[1],
6125 /* Found either forward/reverse 2, 3 or 4 operand match here:
6126 slip through to break. */
6128 if (!found_cpu_match)
6131 /* Check if vector and VEX operands are valid. */
6132 if (check_VecOperands (t) || VEX_check_operands (t))
6134 specific_error = i.error;
6138 /* We've found a match; break out of loop. */
6142 if (t == current_templates->end)
6144 /* We found no match. */
6145 const char *err_msg;
6146 switch (specific_error ? specific_error : i.error)
6150 case operand_size_mismatch:
6151 err_msg = _("operand size mismatch");
6153 case operand_type_mismatch:
6154 err_msg = _("operand type mismatch");
6156 case register_type_mismatch:
6157 err_msg = _("register type mismatch");
6159 case number_of_operands_mismatch:
6160 err_msg = _("number of operands mismatch");
6162 case invalid_instruction_suffix:
6163 err_msg = _("invalid instruction suffix");
6166 err_msg = _("constant doesn't fit in 4 bits");
6168 case unsupported_with_intel_mnemonic:
6169 err_msg = _("unsupported with Intel mnemonic");
6171 case unsupported_syntax:
6172 err_msg = _("unsupported syntax");
6175 as_bad (_("unsupported instruction `%s'"),
6176 current_templates->start->name);
6178 case invalid_vsib_address:
6179 err_msg = _("invalid VSIB address");
6181 case invalid_vector_register_set:
6182 err_msg = _("mask, index, and destination registers must be distinct");
6184 case unsupported_vector_index_register:
6185 err_msg = _("unsupported vector index register");
6187 case unsupported_broadcast:
6188 err_msg = _("unsupported broadcast");
6190 case broadcast_needed:
6191 err_msg = _("broadcast is needed for operand of such type");
6193 case unsupported_masking:
6194 err_msg = _("unsupported masking");
6196 case mask_not_on_destination:
6197 err_msg = _("mask not on destination operand");
6199 case no_default_mask:
6200 err_msg = _("default mask isn't allowed");
6202 case unsupported_rc_sae:
6203 err_msg = _("unsupported static rounding/sae");
6205 case rc_sae_operand_not_last_imm:
6207 err_msg = _("RC/SAE operand must precede immediate operands");
6209 err_msg = _("RC/SAE operand must follow immediate operands");
6211 case invalid_register_operand:
6212 err_msg = _("invalid register operand");
6215 as_bad (_("%s for `%s'"), err_msg,
6216 current_templates->start->name);
6220 if (!quiet_warnings)
6223 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6224 as_warn (_("indirect %s without `*'"), t->name);
6226 if (t->opcode_modifier.isprefix
6227 && t->opcode_modifier.ignoresize)
6229 /* Warn them that a data or address size prefix doesn't
6230 affect assembly of the next line of code. */
6231 as_warn (_("stand-alone `%s' prefix"), t->name);
6235 /* Copy the template we found. */
6238 if (addr_prefix_disp != -1)
6239 i.tm.operand_types[addr_prefix_disp]
6240 = operand_types[addr_prefix_disp];
6242 if (found_reverse_match)
6244 /* If we found a reverse match we must alter the opcode direction
6245 bit and clear/flip the regmem modifier one. found_reverse_match
6246 holds bits to change (different for int & float insns). */
6248 i.tm.base_opcode ^= found_reverse_match;
6250 i.tm.operand_types[0] = operand_types[i.operands - 1];
6251 i.tm.operand_types[i.operands - 1] = operand_types[0];
6253 /* Certain SIMD insns have their load forms specified in the opcode
6254 table, and hence we need to _set_ RegMem instead of clearing it.
6255 We need to avoid setting the bit though on insns like KMOVW. */
6256 i.tm.opcode_modifier.regmem
6257 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6258 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6259 && !i.tm.opcode_modifier.regmem;
6268 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6269 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6271 if (i.seg[op] != NULL && i.seg[op] != &es)
6273 as_bad (_("`%s' operand %u must use `%ses' segment"),
6275 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6280 /* There's only ever one segment override allowed per instruction.
6281 This instruction possibly has a legal segment override on the
6282 second operand, so copy the segment to where non-string
6283 instructions store it, allowing common code. */
6284 i.seg[op] = i.seg[1];
6290 process_suffix (void)
6292 /* If matched instruction specifies an explicit instruction mnemonic
6294 if (i.tm.opcode_modifier.size == SIZE16)
6295 i.suffix = WORD_MNEM_SUFFIX;
6296 else if (i.tm.opcode_modifier.size == SIZE32)
6297 i.suffix = LONG_MNEM_SUFFIX;
6298 else if (i.tm.opcode_modifier.size == SIZE64)
6299 i.suffix = QWORD_MNEM_SUFFIX;
6300 else if (i.reg_operands
6301 && (i.operands > 1 || i.types[0].bitfield.class == Reg))
6303 /* If there's no instruction mnemonic suffix we try to invent one
6304 based on GPR operands. */
6307 /* We take i.suffix from the last register operand specified,
6308 Destination register type is more significant than source
6309 register type. crc32 in SSE4.2 prefers source register
6311 if (i.tm.base_opcode == 0xf20f38f0
6312 && i.types[0].bitfield.class == Reg)
6314 if (i.types[0].bitfield.byte)
6315 i.suffix = BYTE_MNEM_SUFFIX;
6316 else if (i.types[0].bitfield.word)
6317 i.suffix = WORD_MNEM_SUFFIX;
6318 else if (i.types[0].bitfield.dword)
6319 i.suffix = LONG_MNEM_SUFFIX;
6320 else if (i.types[0].bitfield.qword)
6321 i.suffix = QWORD_MNEM_SUFFIX;
6328 if (i.tm.base_opcode == 0xf20f38f0)
6330 /* We have to know the operand size for crc32. */
6331 as_bad (_("ambiguous memory operand size for `%s`"),
6336 for (op = i.operands; --op >= 0;)
6337 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6338 || i.tm.operand_types[op].bitfield.instance == Accum)
6340 if (i.types[op].bitfield.class != Reg)
6342 if (i.types[op].bitfield.byte)
6343 i.suffix = BYTE_MNEM_SUFFIX;
6344 else if (i.types[op].bitfield.word)
6345 i.suffix = WORD_MNEM_SUFFIX;
6346 else if (i.types[op].bitfield.dword)
6347 i.suffix = LONG_MNEM_SUFFIX;
6348 else if (i.types[op].bitfield.qword)
6349 i.suffix = QWORD_MNEM_SUFFIX;
6356 else if (i.suffix == BYTE_MNEM_SUFFIX)
6359 && i.tm.opcode_modifier.ignoresize
6360 && i.tm.opcode_modifier.no_bsuf)
6362 else if (!check_byte_reg ())
6365 else if (i.suffix == LONG_MNEM_SUFFIX)
6368 && i.tm.opcode_modifier.ignoresize
6369 && i.tm.opcode_modifier.no_lsuf
6370 && !i.tm.opcode_modifier.todword
6371 && !i.tm.opcode_modifier.toqword)
6373 else if (!check_long_reg ())
6376 else if (i.suffix == QWORD_MNEM_SUFFIX)
6379 && i.tm.opcode_modifier.ignoresize
6380 && i.tm.opcode_modifier.no_qsuf
6381 && !i.tm.opcode_modifier.todword
6382 && !i.tm.opcode_modifier.toqword)
6384 else if (!check_qword_reg ())
6387 else if (i.suffix == WORD_MNEM_SUFFIX)
6390 && i.tm.opcode_modifier.ignoresize
6391 && i.tm.opcode_modifier.no_wsuf)
6393 else if (!check_word_reg ())
6396 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6397 /* Do nothing if the instruction is going to ignore the prefix. */
6402 else if (i.tm.opcode_modifier.defaultsize
6404 /* exclude fldenv/frstor/fsave/fstenv */
6405 && i.tm.opcode_modifier.no_ssuf
6406 /* exclude sysret */
6407 && i.tm.base_opcode != 0x0f07)
6409 i.suffix = stackop_size;
6410 if (stackop_size == LONG_MNEM_SUFFIX)
6412 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6413 .code16gcc directive to support 16-bit mode with
6414 32-bit address. For IRET without a suffix, generate
6415 16-bit IRET (opcode 0xcf) to return from an interrupt
6417 if (i.tm.base_opcode == 0xcf)
6419 i.suffix = WORD_MNEM_SUFFIX;
6420 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6422 /* Warn about changed behavior for segment register push/pop. */
6423 else if ((i.tm.base_opcode | 1) == 0x07)
6424 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6428 else if (intel_syntax
6430 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6431 || i.tm.opcode_modifier.jump == JUMP_BYTE
6432 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6433 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6434 && i.tm.extension_opcode <= 3)))
6439 if (!i.tm.opcode_modifier.no_qsuf)
6441 i.suffix = QWORD_MNEM_SUFFIX;
6446 if (!i.tm.opcode_modifier.no_lsuf)
6447 i.suffix = LONG_MNEM_SUFFIX;
6450 if (!i.tm.opcode_modifier.no_wsuf)
6451 i.suffix = WORD_MNEM_SUFFIX;
6460 if (i.tm.opcode_modifier.w)
6462 as_bad (_("no instruction mnemonic suffix given and "
6463 "no register operands; can't size instruction"));
6469 unsigned int suffixes;
6471 suffixes = !i.tm.opcode_modifier.no_bsuf;
6472 if (!i.tm.opcode_modifier.no_wsuf)
6474 if (!i.tm.opcode_modifier.no_lsuf)
6476 if (!i.tm.opcode_modifier.no_ldsuf)
6478 if (!i.tm.opcode_modifier.no_ssuf)
6480 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6483 /* There are more than suffix matches. */
6484 if (i.tm.opcode_modifier.w
6485 || ((suffixes & (suffixes - 1))
6486 && !i.tm.opcode_modifier.defaultsize
6487 && !i.tm.opcode_modifier.ignoresize))
6489 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6495 /* Change the opcode based on the operand size given by i.suffix. */
6498 /* Size floating point instruction. */
6499 case LONG_MNEM_SUFFIX:
6500 if (i.tm.opcode_modifier.floatmf)
6502 i.tm.base_opcode ^= 4;
6506 case WORD_MNEM_SUFFIX:
6507 case QWORD_MNEM_SUFFIX:
6508 /* It's not a byte, select word/dword operation. */
6509 if (i.tm.opcode_modifier.w)
6511 if (i.tm.opcode_modifier.shortform)
6512 i.tm.base_opcode |= 8;
6514 i.tm.base_opcode |= 1;
6517 case SHORT_MNEM_SUFFIX:
6518 /* Now select between word & dword operations via the operand
6519 size prefix, except for instructions that will ignore this
6521 if (i.reg_operands > 0
6522 && i.types[0].bitfield.class == Reg
6523 && i.tm.opcode_modifier.addrprefixopreg
6524 && (i.tm.operand_types[0].bitfield.instance == Accum
6525 || i.operands == 1))
6527 /* The address size override prefix changes the size of the
6529 if ((flag_code == CODE_32BIT
6530 && i.op[0].regs->reg_type.bitfield.word)
6531 || (flag_code != CODE_32BIT
6532 && i.op[0].regs->reg_type.bitfield.dword))
6533 if (!add_prefix (ADDR_PREFIX_OPCODE))
6536 else if (i.suffix != QWORD_MNEM_SUFFIX
6537 && !i.tm.opcode_modifier.ignoresize
6538 && !i.tm.opcode_modifier.floatmf
6539 && !is_any_vex_encoding (&i.tm)
6540 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6541 || (flag_code == CODE_64BIT
6542 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
6544 unsigned int prefix = DATA_PREFIX_OPCODE;
6546 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
6547 prefix = ADDR_PREFIX_OPCODE;
6549 if (!add_prefix (prefix))
6553 /* Set mode64 for an operand. */
6554 if (i.suffix == QWORD_MNEM_SUFFIX
6555 && flag_code == CODE_64BIT
6556 && !i.tm.opcode_modifier.norex64
6557 /* Special case for xchg %rax,%rax. It is NOP and doesn't
6559 && ! (i.operands == 2
6560 && i.tm.base_opcode == 0x90
6561 && i.tm.extension_opcode == None
6562 && i.types[0].bitfield.instance == Accum
6563 && i.types[0].bitfield.qword
6564 && i.types[1].bitfield.instance == Accum
6565 && i.types[1].bitfield.qword))
6571 if (i.reg_operands != 0
6573 && i.tm.opcode_modifier.addrprefixopreg
6574 && i.tm.operand_types[0].bitfield.instance != Accum)
6576 /* Check invalid register operand when the address size override
6577 prefix changes the size of register operands. */
6579 enum { need_word, need_dword, need_qword } need;
6581 if (flag_code == CODE_32BIT)
6582 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6585 if (i.prefix[ADDR_PREFIX])
6588 need = flag_code == CODE_64BIT ? need_qword : need_word;
6591 for (op = 0; op < i.operands; op++)
6592 if (i.types[op].bitfield.class == Reg
6593 && ((need == need_word
6594 && !i.op[op].regs->reg_type.bitfield.word)
6595 || (need == need_dword
6596 && !i.op[op].regs->reg_type.bitfield.dword)
6597 || (need == need_qword
6598 && !i.op[op].regs->reg_type.bitfield.qword)))
6600 as_bad (_("invalid register operand size for `%s'"),
6610 check_byte_reg (void)
6614 for (op = i.operands; --op >= 0;)
6616 /* Skip non-register operands. */
6617 if (i.types[op].bitfield.class != Reg)
6620 /* If this is an eight bit register, it's OK. If it's the 16 or
6621 32 bit version of an eight bit register, we will just use the
6622 low portion, and that's OK too. */
6623 if (i.types[op].bitfield.byte)
6626 /* I/O port address operands are OK too. */
6627 if (i.tm.operand_types[op].bitfield.instance == RegD
6628 && i.tm.operand_types[op].bitfield.word)
6631 /* crc32 doesn't generate this warning. */
6632 if (i.tm.base_opcode == 0xf20f38f0)
6635 if ((i.types[op].bitfield.word
6636 || i.types[op].bitfield.dword
6637 || i.types[op].bitfield.qword)
6638 && i.op[op].regs->reg_num < 4
6639 /* Prohibit these changes in 64bit mode, since the lowering
6640 would be more complicated. */
6641 && flag_code != CODE_64BIT)
6643 #if REGISTER_WARNINGS
6644 if (!quiet_warnings)
6645 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6647 (i.op[op].regs + (i.types[op].bitfield.word
6648 ? REGNAM_AL - REGNAM_AX
6649 : REGNAM_AL - REGNAM_EAX))->reg_name,
6651 i.op[op].regs->reg_name,
6656 /* Any other register is bad. */
6657 if (i.types[op].bitfield.class == Reg
6658 || i.types[op].bitfield.class == RegMMX
6659 || i.types[op].bitfield.class == RegSIMD
6660 || i.types[op].bitfield.class == SReg
6661 || i.types[op].bitfield.class == RegCR
6662 || i.types[op].bitfield.class == RegDR
6663 || i.types[op].bitfield.class == RegTR)
6665 as_bad (_("`%s%s' not allowed with `%s%c'"),
6667 i.op[op].regs->reg_name,
6677 check_long_reg (void)
6681 for (op = i.operands; --op >= 0;)
6682 /* Skip non-register operands. */
6683 if (i.types[op].bitfield.class != Reg)
6685 /* Reject eight bit registers, except where the template requires
6686 them. (eg. movzb) */
6687 else if (i.types[op].bitfield.byte
6688 && (i.tm.operand_types[op].bitfield.class == Reg
6689 || i.tm.operand_types[op].bitfield.instance == Accum)
6690 && (i.tm.operand_types[op].bitfield.word
6691 || i.tm.operand_types[op].bitfield.dword))
6693 as_bad (_("`%s%s' not allowed with `%s%c'"),
6695 i.op[op].regs->reg_name,
6700 /* Warn if the e prefix on a general reg is missing. */
6701 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6702 && i.types[op].bitfield.word
6703 && (i.tm.operand_types[op].bitfield.class == Reg
6704 || i.tm.operand_types[op].bitfield.instance == Accum)
6705 && i.tm.operand_types[op].bitfield.dword)
6707 /* Prohibit these changes in the 64bit mode, since the
6708 lowering is more complicated. */
6709 if (flag_code == CODE_64BIT)
6711 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6712 register_prefix, i.op[op].regs->reg_name,
6716 #if REGISTER_WARNINGS
6717 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6719 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
6720 register_prefix, i.op[op].regs->reg_name, i.suffix);
6723 /* Warn if the r prefix on a general reg is present. */
6724 else if (i.types[op].bitfield.qword
6725 && (i.tm.operand_types[op].bitfield.class == Reg
6726 || i.tm.operand_types[op].bitfield.instance == Accum)
6727 && i.tm.operand_types[op].bitfield.dword)
6730 && i.tm.opcode_modifier.toqword
6731 && i.types[0].bitfield.class != RegSIMD)
6733 /* Convert to QWORD. We want REX byte. */
6734 i.suffix = QWORD_MNEM_SUFFIX;
6738 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6739 register_prefix, i.op[op].regs->reg_name,
6748 check_qword_reg (void)
6752 for (op = i.operands; --op >= 0; )
6753 /* Skip non-register operands. */
6754 if (i.types[op].bitfield.class != Reg)
6756 /* Reject eight bit registers, except where the template requires
6757 them. (eg. movzb) */
6758 else if (i.types[op].bitfield.byte
6759 && (i.tm.operand_types[op].bitfield.class == Reg
6760 || i.tm.operand_types[op].bitfield.instance == Accum)
6761 && (i.tm.operand_types[op].bitfield.word
6762 || i.tm.operand_types[op].bitfield.dword))
6764 as_bad (_("`%s%s' not allowed with `%s%c'"),
6766 i.op[op].regs->reg_name,
6771 /* Warn if the r prefix on a general reg is missing. */
6772 else if ((i.types[op].bitfield.word
6773 || i.types[op].bitfield.dword)
6774 && (i.tm.operand_types[op].bitfield.class == Reg
6775 || i.tm.operand_types[op].bitfield.instance == Accum)
6776 && i.tm.operand_types[op].bitfield.qword)
6778 /* Prohibit these changes in the 64bit mode, since the
6779 lowering is more complicated. */
6781 && i.tm.opcode_modifier.todword
6782 && i.types[0].bitfield.class != RegSIMD)
6784 /* Convert to DWORD. We don't want REX byte. */
6785 i.suffix = LONG_MNEM_SUFFIX;
6789 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6790 register_prefix, i.op[op].regs->reg_name,
6799 check_word_reg (void)
6802 for (op = i.operands; --op >= 0;)
6803 /* Skip non-register operands. */
6804 if (i.types[op].bitfield.class != Reg)
6806 /* Reject eight bit registers, except where the template requires
6807 them. (eg. movzb) */
6808 else if (i.types[op].bitfield.byte
6809 && (i.tm.operand_types[op].bitfield.class == Reg
6810 || i.tm.operand_types[op].bitfield.instance == Accum)
6811 && (i.tm.operand_types[op].bitfield.word
6812 || i.tm.operand_types[op].bitfield.dword))
6814 as_bad (_("`%s%s' not allowed with `%s%c'"),
6816 i.op[op].regs->reg_name,
6821 /* Warn if the e or r prefix on a general reg is present. */
6822 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6823 && (i.types[op].bitfield.dword
6824 || i.types[op].bitfield.qword)
6825 && (i.tm.operand_types[op].bitfield.class == Reg
6826 || i.tm.operand_types[op].bitfield.instance == Accum)
6827 && i.tm.operand_types[op].bitfield.word)
6829 /* Prohibit these changes in the 64bit mode, since the
6830 lowering is more complicated. */
6831 if (flag_code == CODE_64BIT)
6833 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6834 register_prefix, i.op[op].regs->reg_name,
6838 #if REGISTER_WARNINGS
6839 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6841 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
6842 register_prefix, i.op[op].regs->reg_name, i.suffix);
6849 update_imm (unsigned int j)
6851 i386_operand_type overlap = i.types[j];
6852 if ((overlap.bitfield.imm8
6853 || overlap.bitfield.imm8s
6854 || overlap.bitfield.imm16
6855 || overlap.bitfield.imm32
6856 || overlap.bitfield.imm32s
6857 || overlap.bitfield.imm64)
6858 && !operand_type_equal (&overlap, &imm8)
6859 && !operand_type_equal (&overlap, &imm8s)
6860 && !operand_type_equal (&overlap, &imm16)
6861 && !operand_type_equal (&overlap, &imm32)
6862 && !operand_type_equal (&overlap, &imm32s)
6863 && !operand_type_equal (&overlap, &imm64))
6867 i386_operand_type temp;
6869 operand_type_set (&temp, 0);
6870 if (i.suffix == BYTE_MNEM_SUFFIX)
6872 temp.bitfield.imm8 = overlap.bitfield.imm8;
6873 temp.bitfield.imm8s = overlap.bitfield.imm8s;
6875 else if (i.suffix == WORD_MNEM_SUFFIX)
6876 temp.bitfield.imm16 = overlap.bitfield.imm16;
6877 else if (i.suffix == QWORD_MNEM_SUFFIX)
6879 temp.bitfield.imm64 = overlap.bitfield.imm64;
6880 temp.bitfield.imm32s = overlap.bitfield.imm32s;
6883 temp.bitfield.imm32 = overlap.bitfield.imm32;
6886 else if (operand_type_equal (&overlap, &imm16_32_32s)
6887 || operand_type_equal (&overlap, &imm16_32)
6888 || operand_type_equal (&overlap, &imm16_32s))
6890 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6895 if (!operand_type_equal (&overlap, &imm8)
6896 && !operand_type_equal (&overlap, &imm8s)
6897 && !operand_type_equal (&overlap, &imm16)
6898 && !operand_type_equal (&overlap, &imm32)
6899 && !operand_type_equal (&overlap, &imm32s)
6900 && !operand_type_equal (&overlap, &imm64))
6902 as_bad (_("no instruction mnemonic suffix given; "
6903 "can't determine immediate size"));
6907 i.types[j] = overlap;
6917 /* Update the first 2 immediate operands. */
6918 n = i.operands > 2 ? 2 : i.operands;
6921 for (j = 0; j < n; j++)
6922 if (update_imm (j) == 0)
6925 /* The 3rd operand can't be immediate operand. */
6926 gas_assert (operand_type_check (i.types[2], imm) == 0);
6933 process_operands (void)
6935 /* Default segment register this instruction will use for memory
6936 accesses. 0 means unknown. This is only for optimizing out
6937 unnecessary segment overrides. */
6938 const seg_entry *default_seg = 0;
6940 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
6942 unsigned int dupl = i.operands;
6943 unsigned int dest = dupl - 1;
6946 /* The destination must be an xmm register. */
6947 gas_assert (i.reg_operands
6948 && MAX_OPERANDS > dupl
6949 && operand_type_equal (&i.types[dest], ®xmm));
6951 if (i.tm.operand_types[0].bitfield.instance == Accum
6952 && i.tm.operand_types[0].bitfield.xmmword)
6954 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
6956 /* Keep xmm0 for instructions with VEX prefix and 3
6958 i.tm.operand_types[0].bitfield.instance = InstanceNone;
6959 i.tm.operand_types[0].bitfield.class = RegSIMD;
6964 /* We remove the first xmm0 and keep the number of
6965 operands unchanged, which in fact duplicates the
6967 for (j = 1; j < i.operands; j++)
6969 i.op[j - 1] = i.op[j];
6970 i.types[j - 1] = i.types[j];
6971 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
6972 i.flags[j - 1] = i.flags[j];
6976 else if (i.tm.opcode_modifier.implicit1stxmm0)
6978 gas_assert ((MAX_OPERANDS - 1) > dupl
6979 && (i.tm.opcode_modifier.vexsources
6982 /* Add the implicit xmm0 for instructions with VEX prefix
6984 for (j = i.operands; j > 0; j--)
6986 i.op[j] = i.op[j - 1];
6987 i.types[j] = i.types[j - 1];
6988 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
6989 i.flags[j] = i.flags[j - 1];
6992 = (const reg_entry *) hash_find (reg_hash, "xmm0");
6993 i.types[0] = regxmm;
6994 i.tm.operand_types[0] = regxmm;
6997 i.reg_operands += 2;
7002 i.op[dupl] = i.op[dest];
7003 i.types[dupl] = i.types[dest];
7004 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7005 i.flags[dupl] = i.flags[dest];
7014 i.op[dupl] = i.op[dest];
7015 i.types[dupl] = i.types[dest];
7016 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7017 i.flags[dupl] = i.flags[dest];
7020 if (i.tm.opcode_modifier.immext)
7023 else if (i.tm.operand_types[0].bitfield.instance == Accum
7024 && i.tm.operand_types[0].bitfield.xmmword)
7028 for (j = 1; j < i.operands; j++)
7030 i.op[j - 1] = i.op[j];
7031 i.types[j - 1] = i.types[j];
7033 /* We need to adjust fields in i.tm since they are used by
7034 build_modrm_byte. */
7035 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7037 i.flags[j - 1] = i.flags[j];
7044 else if (i.tm.opcode_modifier.implicitquadgroup)
7046 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7048 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7049 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7050 regnum = register_number (i.op[1].regs);
7051 first_reg_in_group = regnum & ~3;
7052 last_reg_in_group = first_reg_in_group + 3;
7053 if (regnum != first_reg_in_group)
7054 as_warn (_("source register `%s%s' implicitly denotes"
7055 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7056 register_prefix, i.op[1].regs->reg_name,
7057 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7058 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7061 else if (i.tm.opcode_modifier.regkludge)
7063 /* The imul $imm, %reg instruction is converted into
7064 imul $imm, %reg, %reg, and the clr %reg instruction
7065 is converted into xor %reg, %reg. */
7067 unsigned int first_reg_op;
7069 if (operand_type_check (i.types[0], reg))
7073 /* Pretend we saw the extra register operand. */
7074 gas_assert (i.reg_operands == 1
7075 && i.op[first_reg_op + 1].regs == 0);
7076 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7077 i.types[first_reg_op + 1] = i.types[first_reg_op];
7082 if (i.tm.opcode_modifier.modrm)
7084 /* The opcode is completed (modulo i.tm.extension_opcode which
7085 must be put into the modrm byte). Now, we make the modrm and
7086 index base bytes based on all the info we've collected. */
7088 default_seg = build_modrm_byte ();
7090 else if (i.types[0].bitfield.class == SReg)
7092 if (flag_code != CODE_64BIT
7093 ? i.tm.base_opcode == POP_SEG_SHORT
7094 && i.op[0].regs->reg_num == 1
7095 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7096 && i.op[0].regs->reg_num < 4)
7098 as_bad (_("you can't `%s %s%s'"),
7099 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7102 if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7104 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7105 i.tm.opcode_length = 2;
7107 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7109 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7113 else if (i.tm.opcode_modifier.isstring)
7115 /* For the string instructions that allow a segment override
7116 on one of their operands, the default segment is ds. */
7119 else if (i.tm.opcode_modifier.shortform)
7121 /* The register or float register operand is in operand
7123 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7125 /* Register goes in low 3 bits of opcode. */
7126 i.tm.base_opcode |= i.op[op].regs->reg_num;
7127 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7129 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7131 /* Warn about some common errors, but press on regardless.
7132 The first case can be generated by gcc (<= 2.8.1). */
7133 if (i.operands == 2)
7135 /* Reversed arguments on faddp, fsubp, etc. */
7136 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7137 register_prefix, i.op[!intel_syntax].regs->reg_name,
7138 register_prefix, i.op[intel_syntax].regs->reg_name);
7142 /* Extraneous `l' suffix on fp insn. */
7143 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7144 register_prefix, i.op[0].regs->reg_name);
7149 if (i.tm.base_opcode == 0x8d /* lea */
7152 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7154 /* If a segment was explicitly specified, and the specified segment
7155 is not the default, use an opcode prefix to select it. If we
7156 never figured out what the default segment is, then default_seg
7157 will be zero at this point, and the specified segment prefix will
7159 if ((i.seg[0]) && (i.seg[0] != default_seg))
7161 if (!add_prefix (i.seg[0]->seg_prefix))
7167 static const seg_entry *
7168 build_modrm_byte (void)
7170 const seg_entry *default_seg = 0;
7171 unsigned int source, dest;
7174 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7177 unsigned int nds, reg_slot;
7180 dest = i.operands - 1;
7183 /* There are 2 kinds of instructions:
7184 1. 5 operands: 4 register operands or 3 register operands
7185 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7186 VexW0 or VexW1. The destination must be either XMM, YMM or
7188 2. 4 operands: 4 register operands or 3 register operands
7189 plus 1 memory operand, with VexXDS. */
7190 gas_assert ((i.reg_operands == 4
7191 || (i.reg_operands == 3 && i.mem_operands == 1))
7192 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7193 && i.tm.opcode_modifier.vexw
7194 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7196 /* If VexW1 is set, the first non-immediate operand is the source and
7197 the second non-immediate one is encoded in the immediate operand. */
7198 if (i.tm.opcode_modifier.vexw == VEXW1)
7200 source = i.imm_operands;
7201 reg_slot = i.imm_operands + 1;
7205 source = i.imm_operands + 1;
7206 reg_slot = i.imm_operands;
7209 if (i.imm_operands == 0)
7211 /* When there is no immediate operand, generate an 8bit
7212 immediate operand to encode the first operand. */
7213 exp = &im_expressions[i.imm_operands++];
7214 i.op[i.operands].imms = exp;
7215 i.types[i.operands] = imm8;
7218 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7219 exp->X_op = O_constant;
7220 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7221 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7225 gas_assert (i.imm_operands == 1);
7226 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7227 gas_assert (!i.tm.opcode_modifier.immext);
7229 /* Turn on Imm8 again so that output_imm will generate it. */
7230 i.types[0].bitfield.imm8 = 1;
7232 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7233 i.op[0].imms->X_add_number
7234 |= register_number (i.op[reg_slot].regs) << 4;
7235 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7238 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7239 i.vex.register_specifier = i.op[nds].regs;
7244 /* i.reg_operands MUST be the number of real register operands;
7245 implicit registers do not count. If there are 3 register
7246 operands, it must be a instruction with VexNDS. For a
7247 instruction with VexNDD, the destination register is encoded
7248 in VEX prefix. If there are 4 register operands, it must be
7249 a instruction with VEX prefix and 3 sources. */
7250 if (i.mem_operands == 0
7251 && ((i.reg_operands == 2
7252 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7253 || (i.reg_operands == 3
7254 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7255 || (i.reg_operands == 4 && vex_3_sources)))
7263 /* When there are 3 operands, one of them may be immediate,
7264 which may be the first or the last operand. Otherwise,
7265 the first operand must be shift count register (cl) or it
7266 is an instruction with VexNDS. */
7267 gas_assert (i.imm_operands == 1
7268 || (i.imm_operands == 0
7269 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7270 || (i.types[0].bitfield.instance == RegC
7271 && i.types[0].bitfield.byte))));
7272 if (operand_type_check (i.types[0], imm)
7273 || (i.types[0].bitfield.instance == RegC
7274 && i.types[0].bitfield.byte))
7280 /* When there are 4 operands, the first two must be 8bit
7281 immediate operands. The source operand will be the 3rd
7284 For instructions with VexNDS, if the first operand
7285 an imm8, the source operand is the 2nd one. If the last
7286 operand is imm8, the source operand is the first one. */
7287 gas_assert ((i.imm_operands == 2
7288 && i.types[0].bitfield.imm8
7289 && i.types[1].bitfield.imm8)
7290 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7291 && i.imm_operands == 1
7292 && (i.types[0].bitfield.imm8
7293 || i.types[i.operands - 1].bitfield.imm8
7295 if (i.imm_operands == 2)
7299 if (i.types[0].bitfield.imm8)
7306 if (is_evex_encoding (&i.tm))
7308 /* For EVEX instructions, when there are 5 operands, the
7309 first one must be immediate operand. If the second one
7310 is immediate operand, the source operand is the 3th
7311 one. If the last one is immediate operand, the source
7312 operand is the 2nd one. */
7313 gas_assert (i.imm_operands == 2
7314 && i.tm.opcode_modifier.sae
7315 && operand_type_check (i.types[0], imm));
7316 if (operand_type_check (i.types[1], imm))
7318 else if (operand_type_check (i.types[4], imm))
7332 /* RC/SAE operand could be between DEST and SRC. That happens
7333 when one operand is GPR and the other one is XMM/YMM/ZMM
7335 if (i.rounding && i.rounding->operand == (int) dest)
7338 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7340 /* For instructions with VexNDS, the register-only source
7341 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7342 register. It is encoded in VEX prefix. */
7344 i386_operand_type op;
7347 /* Check register-only source operand when two source
7348 operands are swapped. */
7349 if (!i.tm.operand_types[source].bitfield.baseindex
7350 && i.tm.operand_types[dest].bitfield.baseindex)
7358 op = i.tm.operand_types[vvvv];
7359 if ((dest + 1) >= i.operands
7360 || ((op.bitfield.class != Reg
7361 || (!op.bitfield.dword && !op.bitfield.qword))
7362 && op.bitfield.class != RegSIMD
7363 && !operand_type_equal (&op, ®mask)))
7365 i.vex.register_specifier = i.op[vvvv].regs;
7371 /* One of the register operands will be encoded in the i.rm.reg
7372 field, the other in the combined i.rm.mode and i.rm.regmem
7373 fields. If no form of this instruction supports a memory
7374 destination operand, then we assume the source operand may
7375 sometimes be a memory operand and so we need to store the
7376 destination in the i.rm.reg field. */
7377 if (!i.tm.opcode_modifier.regmem
7378 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7380 i.rm.reg = i.op[dest].regs->reg_num;
7381 i.rm.regmem = i.op[source].regs->reg_num;
7382 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7383 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7384 i.has_regmmx = TRUE;
7385 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7386 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7388 if (i.types[dest].bitfield.zmmword
7389 || i.types[source].bitfield.zmmword)
7390 i.has_regzmm = TRUE;
7391 else if (i.types[dest].bitfield.ymmword
7392 || i.types[source].bitfield.ymmword)
7393 i.has_regymm = TRUE;
7395 i.has_regxmm = TRUE;
7397 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7399 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7401 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7403 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7408 i.rm.reg = i.op[source].regs->reg_num;
7409 i.rm.regmem = i.op[dest].regs->reg_num;
7410 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7412 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7414 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7416 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7419 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7421 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7424 add_prefix (LOCK_PREFIX_OPCODE);
7428 { /* If it's not 2 reg operands... */
7433 unsigned int fake_zero_displacement = 0;
7436 for (op = 0; op < i.operands; op++)
7437 if (i.flags[op] & Operand_Mem)
7439 gas_assert (op < i.operands);
7441 if (i.tm.opcode_modifier.vecsib)
7443 if (i.index_reg->reg_num == RegIZ)
7446 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7449 i.sib.base = NO_BASE_REGISTER;
7450 i.sib.scale = i.log2_scale_factor;
7451 i.types[op].bitfield.disp8 = 0;
7452 i.types[op].bitfield.disp16 = 0;
7453 i.types[op].bitfield.disp64 = 0;
7454 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7456 /* Must be 32 bit */
7457 i.types[op].bitfield.disp32 = 1;
7458 i.types[op].bitfield.disp32s = 0;
7462 i.types[op].bitfield.disp32 = 0;
7463 i.types[op].bitfield.disp32s = 1;
7466 i.sib.index = i.index_reg->reg_num;
7467 if ((i.index_reg->reg_flags & RegRex) != 0)
7469 if ((i.index_reg->reg_flags & RegVRex) != 0)
7475 if (i.base_reg == 0)
7478 if (!i.disp_operands)
7479 fake_zero_displacement = 1;
7480 if (i.index_reg == 0)
7482 i386_operand_type newdisp;
7484 gas_assert (!i.tm.opcode_modifier.vecsib);
7485 /* Operand is just <disp> */
7486 if (flag_code == CODE_64BIT)
7488 /* 64bit mode overwrites the 32bit absolute
7489 addressing by RIP relative addressing and
7490 absolute addressing is encoded by one of the
7491 redundant SIB forms. */
7492 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7493 i.sib.base = NO_BASE_REGISTER;
7494 i.sib.index = NO_INDEX_REGISTER;
7495 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7497 else if ((flag_code == CODE_16BIT)
7498 ^ (i.prefix[ADDR_PREFIX] != 0))
7500 i.rm.regmem = NO_BASE_REGISTER_16;
7505 i.rm.regmem = NO_BASE_REGISTER;
7508 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7509 i.types[op] = operand_type_or (i.types[op], newdisp);
7511 else if (!i.tm.opcode_modifier.vecsib)
7513 /* !i.base_reg && i.index_reg */
7514 if (i.index_reg->reg_num == RegIZ)
7515 i.sib.index = NO_INDEX_REGISTER;
7517 i.sib.index = i.index_reg->reg_num;
7518 i.sib.base = NO_BASE_REGISTER;
7519 i.sib.scale = i.log2_scale_factor;
7520 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7521 i.types[op].bitfield.disp8 = 0;
7522 i.types[op].bitfield.disp16 = 0;
7523 i.types[op].bitfield.disp64 = 0;
7524 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7526 /* Must be 32 bit */
7527 i.types[op].bitfield.disp32 = 1;
7528 i.types[op].bitfield.disp32s = 0;
7532 i.types[op].bitfield.disp32 = 0;
7533 i.types[op].bitfield.disp32s = 1;
7535 if ((i.index_reg->reg_flags & RegRex) != 0)
7539 /* RIP addressing for 64bit mode. */
7540 else if (i.base_reg->reg_num == RegIP)
7542 gas_assert (!i.tm.opcode_modifier.vecsib);
7543 i.rm.regmem = NO_BASE_REGISTER;
7544 i.types[op].bitfield.disp8 = 0;
7545 i.types[op].bitfield.disp16 = 0;
7546 i.types[op].bitfield.disp32 = 0;
7547 i.types[op].bitfield.disp32s = 1;
7548 i.types[op].bitfield.disp64 = 0;
7549 i.flags[op] |= Operand_PCrel;
7550 if (! i.disp_operands)
7551 fake_zero_displacement = 1;
7553 else if (i.base_reg->reg_type.bitfield.word)
7555 gas_assert (!i.tm.opcode_modifier.vecsib);
7556 switch (i.base_reg->reg_num)
7559 if (i.index_reg == 0)
7561 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
7562 i.rm.regmem = i.index_reg->reg_num - 6;
7566 if (i.index_reg == 0)
7569 if (operand_type_check (i.types[op], disp) == 0)
7571 /* fake (%bp) into 0(%bp) */
7572 i.types[op].bitfield.disp8 = 1;
7573 fake_zero_displacement = 1;
7576 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
7577 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7579 default: /* (%si) -> 4 or (%di) -> 5 */
7580 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7582 i.rm.mode = mode_from_disp_size (i.types[op]);
7584 else /* i.base_reg and 32/64 bit mode */
7586 if (flag_code == CODE_64BIT
7587 && operand_type_check (i.types[op], disp))
7589 i.types[op].bitfield.disp16 = 0;
7590 i.types[op].bitfield.disp64 = 0;
7591 if (i.prefix[ADDR_PREFIX] == 0)
7593 i.types[op].bitfield.disp32 = 0;
7594 i.types[op].bitfield.disp32s = 1;
7598 i.types[op].bitfield.disp32 = 1;
7599 i.types[op].bitfield.disp32s = 0;
7603 if (!i.tm.opcode_modifier.vecsib)
7604 i.rm.regmem = i.base_reg->reg_num;
7605 if ((i.base_reg->reg_flags & RegRex) != 0)
7607 i.sib.base = i.base_reg->reg_num;
7608 /* x86-64 ignores REX prefix bit here to avoid decoder
7610 if (!(i.base_reg->reg_flags & RegRex)
7611 && (i.base_reg->reg_num == EBP_REG_NUM
7612 || i.base_reg->reg_num == ESP_REG_NUM))
7614 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7616 fake_zero_displacement = 1;
7617 i.types[op].bitfield.disp8 = 1;
7619 i.sib.scale = i.log2_scale_factor;
7620 if (i.index_reg == 0)
7622 gas_assert (!i.tm.opcode_modifier.vecsib);
7623 /* <disp>(%esp) becomes two byte modrm with no index
7624 register. We've already stored the code for esp
7625 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7626 Any base register besides %esp will not use the
7627 extra modrm byte. */
7628 i.sib.index = NO_INDEX_REGISTER;
7630 else if (!i.tm.opcode_modifier.vecsib)
7632 if (i.index_reg->reg_num == RegIZ)
7633 i.sib.index = NO_INDEX_REGISTER;
7635 i.sib.index = i.index_reg->reg_num;
7636 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7637 if ((i.index_reg->reg_flags & RegRex) != 0)
7642 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7643 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7647 if (!fake_zero_displacement
7651 fake_zero_displacement = 1;
7652 if (i.disp_encoding == disp_encoding_8bit)
7653 i.types[op].bitfield.disp8 = 1;
7655 i.types[op].bitfield.disp32 = 1;
7657 i.rm.mode = mode_from_disp_size (i.types[op]);
7661 if (fake_zero_displacement)
7663 /* Fakes a zero displacement assuming that i.types[op]
7664 holds the correct displacement size. */
7667 gas_assert (i.op[op].disps == 0);
7668 exp = &disp_expressions[i.disp_operands++];
7669 i.op[op].disps = exp;
7670 exp->X_op = O_constant;
7671 exp->X_add_number = 0;
7672 exp->X_add_symbol = (symbolS *) 0;
7673 exp->X_op_symbol = (symbolS *) 0;
7681 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7683 if (operand_type_check (i.types[0], imm))
7684 i.vex.register_specifier = NULL;
7687 /* VEX.vvvv encodes one of the sources when the first
7688 operand is not an immediate. */
7689 if (i.tm.opcode_modifier.vexw == VEXW0)
7690 i.vex.register_specifier = i.op[0].regs;
7692 i.vex.register_specifier = i.op[1].regs;
7695 /* Destination is a XMM register encoded in the ModRM.reg
7697 i.rm.reg = i.op[2].regs->reg_num;
7698 if ((i.op[2].regs->reg_flags & RegRex) != 0)
7701 /* ModRM.rm and VEX.B encodes the other source. */
7702 if (!i.mem_operands)
7706 if (i.tm.opcode_modifier.vexw == VEXW0)
7707 i.rm.regmem = i.op[1].regs->reg_num;
7709 i.rm.regmem = i.op[0].regs->reg_num;
7711 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7715 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7717 i.vex.register_specifier = i.op[2].regs;
7718 if (!i.mem_operands)
7721 i.rm.regmem = i.op[1].regs->reg_num;
7722 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7726 /* Fill in i.rm.reg or i.rm.regmem field with register operand
7727 (if any) based on i.tm.extension_opcode. Again, we must be
7728 careful to make sure that segment/control/debug/test/MMX
7729 registers are coded into the i.rm.reg field. */
7730 else if (i.reg_operands)
7733 unsigned int vex_reg = ~0;
7735 for (op = 0; op < i.operands; op++)
7737 if (i.types[op].bitfield.class == Reg
7738 || i.types[op].bitfield.class == RegBND
7739 || i.types[op].bitfield.class == RegMask
7740 || i.types[op].bitfield.class == SReg
7741 || i.types[op].bitfield.class == RegCR
7742 || i.types[op].bitfield.class == RegDR
7743 || i.types[op].bitfield.class == RegTR)
7745 if (i.types[op].bitfield.class == RegSIMD)
7747 if (i.types[op].bitfield.zmmword)
7748 i.has_regzmm = TRUE;
7749 else if (i.types[op].bitfield.ymmword)
7750 i.has_regymm = TRUE;
7752 i.has_regxmm = TRUE;
7755 if (i.types[op].bitfield.class == RegMMX)
7757 i.has_regmmx = TRUE;
7764 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7766 /* For instructions with VexNDS, the register-only
7767 source operand is encoded in VEX prefix. */
7768 gas_assert (mem != (unsigned int) ~0);
7773 gas_assert (op < i.operands);
7777 /* Check register-only source operand when two source
7778 operands are swapped. */
7779 if (!i.tm.operand_types[op].bitfield.baseindex
7780 && i.tm.operand_types[op + 1].bitfield.baseindex)
7784 gas_assert (mem == (vex_reg + 1)
7785 && op < i.operands);
7790 gas_assert (vex_reg < i.operands);
7794 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7796 /* For instructions with VexNDD, the register destination
7797 is encoded in VEX prefix. */
7798 if (i.mem_operands == 0)
7800 /* There is no memory operand. */
7801 gas_assert ((op + 2) == i.operands);
7806 /* There are only 2 non-immediate operands. */
7807 gas_assert (op < i.imm_operands + 2
7808 && i.operands == i.imm_operands + 2);
7809 vex_reg = i.imm_operands + 1;
7813 gas_assert (op < i.operands);
7815 if (vex_reg != (unsigned int) ~0)
7817 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7819 if ((type->bitfield.class != Reg
7820 || (!type->bitfield.dword && !type->bitfield.qword))
7821 && type->bitfield.class != RegSIMD
7822 && !operand_type_equal (type, ®mask))
7825 i.vex.register_specifier = i.op[vex_reg].regs;
7828 /* Don't set OP operand twice. */
7831 /* If there is an extension opcode to put here, the
7832 register number must be put into the regmem field. */
7833 if (i.tm.extension_opcode != None)
7835 i.rm.regmem = i.op[op].regs->reg_num;
7836 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7838 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7843 i.rm.reg = i.op[op].regs->reg_num;
7844 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7846 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7851 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7852 must set it to 3 to indicate this is a register operand
7853 in the regmem field. */
7854 if (!i.mem_operands)
7858 /* Fill in i.rm.reg field with extension opcode (if any). */
7859 if (i.tm.extension_opcode != None)
7860 i.rm.reg = i.tm.extension_opcode;
7866 flip_code16 (unsigned int code16)
7868 gas_assert (i.tm.operands == 1);
7870 return !(i.prefix[REX_PREFIX] & REX_W)
7871 && (code16 ? i.tm.operand_types[0].bitfield.disp32
7872 || i.tm.operand_types[0].bitfield.disp32s
7873 : i.tm.operand_types[0].bitfield.disp16)
7878 output_branch (void)
7884 relax_substateT subtype;
7888 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7889 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7892 if (i.prefix[DATA_PREFIX] != 0)
7896 code16 ^= flip_code16(code16);
7898 /* Pentium4 branch hints. */
7899 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7900 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7905 if (i.prefix[REX_PREFIX] != 0)
7911 /* BND prefixed jump. */
7912 if (i.prefix[BND_PREFIX] != 0)
7918 if (i.prefixes != 0)
7919 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
7921 /* It's always a symbol; End frag & setup for relax.
7922 Make sure there is enough room in this frag for the largest
7923 instruction we may generate in md_convert_frag. This is 2
7924 bytes for the opcode and room for the prefix and largest
7926 frag_grow (prefix + 2 + 4);
7927 /* Prefix and 1 opcode byte go in fr_fix. */
7928 p = frag_more (prefix + 1);
7929 if (i.prefix[DATA_PREFIX] != 0)
7930 *p++ = DATA_PREFIX_OPCODE;
7931 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7932 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7933 *p++ = i.prefix[SEG_PREFIX];
7934 if (i.prefix[BND_PREFIX] != 0)
7935 *p++ = BND_PREFIX_OPCODE;
7936 if (i.prefix[REX_PREFIX] != 0)
7937 *p++ = i.prefix[REX_PREFIX];
7938 *p = i.tm.base_opcode;
7940 if ((unsigned char) *p == JUMP_PC_RELATIVE)
7941 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7942 else if (cpu_arch_flags.bitfield.cpui386)
7943 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7945 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7948 sym = i.op[0].disps->X_add_symbol;
7949 off = i.op[0].disps->X_add_number;
7951 if (i.op[0].disps->X_op != O_constant
7952 && i.op[0].disps->X_op != O_symbol)
7954 /* Handle complex expressions. */
7955 sym = make_expr_symbol (i.op[0].disps);
7959 /* 1 possible extra opcode + 4 byte displacement go in var part.
7960 Pass reloc in fr_var. */
7961 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
7964 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7965 /* Return TRUE iff PLT32 relocation should be used for branching to
7969 need_plt32_p (symbolS *s)
7971 /* PLT32 relocation is ELF only. */
7976 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
7977 krtld support it. */
7981 /* Since there is no need to prepare for PLT branch on x86-64, we
7982 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
7983 be used as a marker for 32-bit PC-relative branches. */
7987 /* Weak or undefined symbol need PLT32 relocation. */
7988 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
7991 /* Non-global symbol doesn't need PLT32 relocation. */
7992 if (! S_IS_EXTERNAL (s))
7995 /* Other global symbols need PLT32 relocation. NB: Symbol with
7996 non-default visibilities are treated as normal global symbol
7997 so that PLT32 relocation can be used as a marker for 32-bit
7998 PC-relative branches. It is useful for linker relaxation. */
8009 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8011 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8013 /* This is a loop or jecxz type instruction. */
8015 if (i.prefix[ADDR_PREFIX] != 0)
8017 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8020 /* Pentium4 branch hints. */
8021 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8022 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8024 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8033 if (flag_code == CODE_16BIT)
8036 if (i.prefix[DATA_PREFIX] != 0)
8038 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8040 code16 ^= flip_code16(code16);
8048 /* BND prefixed jump. */
8049 if (i.prefix[BND_PREFIX] != 0)
8051 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8055 if (i.prefix[REX_PREFIX] != 0)
8057 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8061 if (i.prefixes != 0)
8062 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8064 p = frag_more (i.tm.opcode_length + size);
8065 switch (i.tm.opcode_length)
8068 *p++ = i.tm.base_opcode >> 8;
8071 *p++ = i.tm.base_opcode;
8077 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8079 && jump_reloc == NO_RELOC
8080 && need_plt32_p (i.op[0].disps->X_add_symbol))
8081 jump_reloc = BFD_RELOC_X86_64_PLT32;
8084 jump_reloc = reloc (size, 1, 1, jump_reloc);
8086 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8087 i.op[0].disps, 1, jump_reloc);
8089 /* All jumps handled here are signed, but don't use a signed limit
8090 check for 32 and 16 bit jumps as we want to allow wrap around at
8091 4G and 64k respectively. */
8093 fixP->fx_signed = 1;
8097 output_interseg_jump (void)
8105 if (flag_code == CODE_16BIT)
8109 if (i.prefix[DATA_PREFIX] != 0)
8116 gas_assert (!i.prefix[REX_PREFIX]);
8122 if (i.prefixes != 0)
8123 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8125 /* 1 opcode; 2 segment; offset */
8126 p = frag_more (prefix + 1 + 2 + size);
8128 if (i.prefix[DATA_PREFIX] != 0)
8129 *p++ = DATA_PREFIX_OPCODE;
8131 if (i.prefix[REX_PREFIX] != 0)
8132 *p++ = i.prefix[REX_PREFIX];
8134 *p++ = i.tm.base_opcode;
8135 if (i.op[1].imms->X_op == O_constant)
8137 offsetT n = i.op[1].imms->X_add_number;
8140 && !fits_in_unsigned_word (n)
8141 && !fits_in_signed_word (n))
8143 as_bad (_("16-bit jump out of range"));
8146 md_number_to_chars (p, n, size);
8149 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8150 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8151 if (i.op[0].imms->X_op != O_constant)
8152 as_bad (_("can't handle non absolute segment in `%s'"),
8154 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8157 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8162 asection *seg = now_seg;
8163 subsegT subseg = now_subseg;
8165 unsigned int alignment, align_size_1;
8166 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8167 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8168 unsigned int padding;
8170 if (!IS_ELF || !x86_used_note)
8173 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8175 /* The .note.gnu.property section layout:
8177 Field Length Contents
8180 n_descsz 4 The note descriptor size
8181 n_type 4 NT_GNU_PROPERTY_TYPE_0
8183 n_desc n_descsz The program property array
8187 /* Create the .note.gnu.property section. */
8188 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8189 bfd_set_section_flags (sec,
8196 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8207 bfd_set_section_alignment (sec, alignment);
8208 elf_section_type (sec) = SHT_NOTE;
8210 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8212 isa_1_descsz_raw = 4 + 4 + 4;
8213 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8214 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8216 feature_2_descsz_raw = isa_1_descsz;
8217 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8219 feature_2_descsz_raw += 4 + 4 + 4;
8220 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8221 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8224 descsz = feature_2_descsz;
8225 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8226 p = frag_more (4 + 4 + 4 + 4 + descsz);
8228 /* Write n_namsz. */
8229 md_number_to_chars (p, (valueT) 4, 4);
8231 /* Write n_descsz. */
8232 md_number_to_chars (p + 4, (valueT) descsz, 4);
8235 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8238 memcpy (p + 4 * 3, "GNU", 4);
8240 /* Write 4-byte type. */
8241 md_number_to_chars (p + 4 * 4,
8242 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8244 /* Write 4-byte data size. */
8245 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8247 /* Write 4-byte data. */
8248 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8250 /* Zero out paddings. */
8251 padding = isa_1_descsz - isa_1_descsz_raw;
8253 memset (p + 4 * 7, 0, padding);
8255 /* Write 4-byte type. */
8256 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8257 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8259 /* Write 4-byte data size. */
8260 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8262 /* Write 4-byte data. */
8263 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8264 (valueT) x86_feature_2_used, 4);
8266 /* Zero out paddings. */
8267 padding = feature_2_descsz - feature_2_descsz_raw;
8269 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8271 /* We probably can't restore the current segment, for there likely
8274 subseg_set (seg, subseg);
8279 encoding_length (const fragS *start_frag, offsetT start_off,
8280 const char *frag_now_ptr)
8282 unsigned int len = 0;
8284 if (start_frag != frag_now)
8286 const fragS *fr = start_frag;
8291 } while (fr && fr != frag_now);
8294 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8297 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8298 be macro-fused with conditional jumps. */
8301 maybe_fused_with_jcc_p (void)
8303 /* No RIP address. */
8304 if (i.base_reg && i.base_reg->reg_num == RegIP)
8307 /* No VEX/EVEX encoding. */
8308 if (is_any_vex_encoding (&i.tm))
8311 /* and, add, sub with destination register. */
8312 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8313 || i.tm.base_opcode <= 5
8314 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8315 || ((i.tm.base_opcode | 3) == 0x83
8316 && ((i.tm.extension_opcode | 1) == 0x5
8317 || i.tm.extension_opcode == 0x0)))
8318 return (i.types[1].bitfield.class == Reg
8319 || i.types[1].bitfield.instance == Accum);
8321 /* test, cmp with any register. */
8322 if ((i.tm.base_opcode | 1) == 0x85
8323 || (i.tm.base_opcode | 1) == 0xa9
8324 || ((i.tm.base_opcode | 1) == 0xf7
8325 && i.tm.extension_opcode == 0)
8326 || (i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8327 || ((i.tm.base_opcode | 3) == 0x83
8328 && (i.tm.extension_opcode == 0x7)))
8329 return (i.types[0].bitfield.class == Reg
8330 || i.types[0].bitfield.instance == Accum
8331 || i.types[1].bitfield.class == Reg
8332 || i.types[1].bitfield.instance == Accum);
8334 /* inc, dec with any register. */
8335 if ((i.tm.cpu_flags.bitfield.cpuno64
8336 && (i.tm.base_opcode | 0xf) == 0x4f)
8337 || ((i.tm.base_opcode | 1) == 0xff
8338 && i.tm.extension_opcode <= 0x1))
8339 return (i.types[0].bitfield.class == Reg
8340 || i.types[0].bitfield.instance == Accum);
8345 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8348 add_fused_jcc_padding_frag_p (void)
8350 /* NB: Don't work with COND_JUMP86 without i386. */
8351 if (!align_branch_power
8352 || now_seg == absolute_section
8353 || !cpu_arch_flags.bitfield.cpui386
8354 || !(align_branch & align_branch_fused_bit))
8357 if (maybe_fused_with_jcc_p ())
8359 if (last_insn.kind == last_insn_other
8360 || last_insn.seg != now_seg)
8363 as_warn_where (last_insn.file, last_insn.line,
8364 _("`%s` skips -malign-branch-boundary on `%s`"),
8365 last_insn.name, i.tm.name);
8371 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
8374 add_branch_prefix_frag_p (void)
8376 /* NB: Don't work with COND_JUMP86 without i386. Don't add prefix
8377 to PadLock instructions since they include prefixes in opcode. */
8378 if (!align_branch_power
8379 || !align_branch_prefix_size
8380 || now_seg == absolute_section
8381 || i.tm.cpu_flags.bitfield.cpupadlock
8382 || !cpu_arch_flags.bitfield.cpui386)
8385 /* Don't add prefix if it is a prefix or there is no operand in case
8386 that segment prefix is special. */
8387 if (!i.operands || i.tm.opcode_modifier.isprefix)
8390 if (last_insn.kind == last_insn_other
8391 || last_insn.seg != now_seg)
8395 as_warn_where (last_insn.file, last_insn.line,
8396 _("`%s` skips -malign-branch-boundary on `%s`"),
8397 last_insn.name, i.tm.name);
8402 /* Return 1 if a BRANCH_PADDING frag should be generated. */
8405 add_branch_padding_frag_p (enum align_branch_kind *branch_p)
8409 /* NB: Don't work with COND_JUMP86 without i386. */
8410 if (!align_branch_power
8411 || now_seg == absolute_section
8412 || !cpu_arch_flags.bitfield.cpui386)
8417 /* Check for jcc and direct jmp. */
8418 if (i.tm.opcode_modifier.jump == JUMP)
8420 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8422 *branch_p = align_branch_jmp;
8423 add_padding = align_branch & align_branch_jmp_bit;
8427 *branch_p = align_branch_jcc;
8428 if ((align_branch & align_branch_jcc_bit))
8432 else if (is_any_vex_encoding (&i.tm))
8434 else if ((i.tm.base_opcode | 1) == 0xc3)
8437 *branch_p = align_branch_ret;
8438 if ((align_branch & align_branch_ret_bit))
8443 /* Check for indirect jmp, direct and indirect calls. */
8444 if (i.tm.base_opcode == 0xe8)
8447 *branch_p = align_branch_call;
8448 if ((align_branch & align_branch_call_bit))
8451 else if (i.tm.base_opcode == 0xff
8452 && (i.tm.extension_opcode == 2
8453 || i.tm.extension_opcode == 4))
8455 /* Indirect call and jmp. */
8456 *branch_p = align_branch_indirect;
8457 if ((align_branch & align_branch_indirect_bit))
8464 && (i.op[0].disps->X_op == O_symbol
8465 || (i.op[0].disps->X_op == O_subtract
8466 && i.op[0].disps->X_op_symbol == GOT_symbol)))
8468 symbolS *s = i.op[0].disps->X_add_symbol;
8469 /* No padding to call to global or undefined tls_get_addr. */
8470 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
8471 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
8477 && last_insn.kind != last_insn_other
8478 && last_insn.seg == now_seg)
8481 as_warn_where (last_insn.file, last_insn.line,
8482 _("`%s` skips -malign-branch-boundary on `%s`"),
8483 last_insn.name, i.tm.name);
8493 fragS *insn_start_frag;
8494 offsetT insn_start_off;
8495 fragS *fragP = NULL;
8496 enum align_branch_kind branch = align_branch_none;
8498 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8499 if (IS_ELF && x86_used_note)
8501 if (i.tm.cpu_flags.bitfield.cpucmov)
8502 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8503 if (i.tm.cpu_flags.bitfield.cpusse)
8504 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8505 if (i.tm.cpu_flags.bitfield.cpusse2)
8506 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8507 if (i.tm.cpu_flags.bitfield.cpusse3)
8508 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
8509 if (i.tm.cpu_flags.bitfield.cpussse3)
8510 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
8511 if (i.tm.cpu_flags.bitfield.cpusse4_1)
8512 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
8513 if (i.tm.cpu_flags.bitfield.cpusse4_2)
8514 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
8515 if (i.tm.cpu_flags.bitfield.cpuavx)
8516 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
8517 if (i.tm.cpu_flags.bitfield.cpuavx2)
8518 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
8519 if (i.tm.cpu_flags.bitfield.cpufma)
8520 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
8521 if (i.tm.cpu_flags.bitfield.cpuavx512f)
8522 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
8523 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
8524 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
8525 if (i.tm.cpu_flags.bitfield.cpuavx512er)
8526 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
8527 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
8528 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
8529 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
8530 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
8531 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
8532 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
8533 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
8534 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
8535 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
8536 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
8537 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
8538 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
8539 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
8540 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
8541 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
8542 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
8543 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
8544 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
8545 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
8546 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
8547 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
8548 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
8549 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
8550 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
8552 if (i.tm.cpu_flags.bitfield.cpu8087
8553 || i.tm.cpu_flags.bitfield.cpu287
8554 || i.tm.cpu_flags.bitfield.cpu387
8555 || i.tm.cpu_flags.bitfield.cpu687
8556 || i.tm.cpu_flags.bitfield.cpufisttp)
8557 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
8559 || i.tm.base_opcode == 0xf77 /* emms */
8560 || i.tm.base_opcode == 0xf0e /* femms */)
8561 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
8563 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
8565 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
8567 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
8568 if (i.tm.cpu_flags.bitfield.cpufxsr)
8569 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
8570 if (i.tm.cpu_flags.bitfield.cpuxsave)
8571 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
8572 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
8573 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
8574 if (i.tm.cpu_flags.bitfield.cpuxsavec)
8575 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
8579 /* Tie dwarf2 debug info to the address at the start of the insn.
8580 We can't do this after the insn has been output as the current
8581 frag may have been closed off. eg. by frag_var. */
8582 dwarf2_emit_insn (0);
8584 insn_start_frag = frag_now;
8585 insn_start_off = frag_now_fix ();
8587 if (add_branch_padding_frag_p (&branch))
8590 /* Branch can be 8 bytes. Leave some room for prefixes. */
8591 unsigned int max_branch_padding_size = 14;
8593 /* Align section to boundary. */
8594 record_alignment (now_seg, align_branch_power);
8596 /* Make room for padding. */
8597 frag_grow (max_branch_padding_size);
8599 /* Start of the padding. */
8604 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
8605 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
8608 fragP->tc_frag_data.branch_type = branch;
8609 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
8613 if (i.tm.opcode_modifier.jump == JUMP)
8615 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
8616 || i.tm.opcode_modifier.jump == JUMP_DWORD)
8618 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
8619 output_interseg_jump ();
8622 /* Output normal instructions here. */
8626 unsigned int prefix;
8629 && (i.tm.base_opcode == 0xfaee8
8630 || i.tm.base_opcode == 0xfaef0
8631 || i.tm.base_opcode == 0xfaef8))
8633 /* Encode lfence, mfence, and sfence as
8634 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
8635 offsetT val = 0x240483f0ULL;
8637 md_number_to_chars (p, val, 5);
8641 /* Some processors fail on LOCK prefix. This options makes
8642 assembler ignore LOCK prefix and serves as a workaround. */
8643 if (omit_lock_prefix)
8645 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
8647 i.prefix[LOCK_PREFIX] = 0;
8651 /* Skip if this is a branch. */
8653 else if (add_fused_jcc_padding_frag_p ())
8655 /* Make room for padding. */
8656 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
8661 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
8662 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
8665 fragP->tc_frag_data.branch_type = align_branch_fused;
8666 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
8668 else if (add_branch_prefix_frag_p ())
8670 unsigned int max_prefix_size = align_branch_prefix_size;
8672 /* Make room for padding. */
8673 frag_grow (max_prefix_size);
8678 frag_var (rs_machine_dependent, max_prefix_size, 0,
8679 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
8682 fragP->tc_frag_data.max_bytes = max_prefix_size;
8685 /* Since the VEX/EVEX prefix contains the implicit prefix, we
8686 don't need the explicit prefix. */
8687 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
8689 switch (i.tm.opcode_length)
8692 if (i.tm.base_opcode & 0xff000000)
8694 prefix = (i.tm.base_opcode >> 24) & 0xff;
8695 if (!i.tm.cpu_flags.bitfield.cpupadlock
8696 || prefix != REPE_PREFIX_OPCODE
8697 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
8698 add_prefix (prefix);
8702 if ((i.tm.base_opcode & 0xff0000) != 0)
8704 prefix = (i.tm.base_opcode >> 16) & 0xff;
8705 add_prefix (prefix);
8711 /* Check for pseudo prefixes. */
8712 as_bad_where (insn_start_frag->fr_file,
8713 insn_start_frag->fr_line,
8714 _("pseudo prefix without instruction"));
8720 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8721 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
8722 R_X86_64_GOTTPOFF relocation so that linker can safely
8723 perform IE->LE optimization. */
8724 if (x86_elf_abi == X86_64_X32_ABI
8726 && i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
8727 && i.prefix[REX_PREFIX] == 0)
8728 add_prefix (REX_OPCODE);
8731 /* The prefix bytes. */
8732 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
8734 FRAG_APPEND_1_CHAR (*q);
8738 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
8743 /* REX byte is encoded in VEX prefix. */
8747 FRAG_APPEND_1_CHAR (*q);
8750 /* There should be no other prefixes for instructions
8755 /* For EVEX instructions i.vrex should become 0 after
8756 build_evex_prefix. For VEX instructions upper 16 registers
8757 aren't available, so VREX should be 0. */
8760 /* Now the VEX prefix. */
8761 p = frag_more (i.vex.length);
8762 for (j = 0; j < i.vex.length; j++)
8763 p[j] = i.vex.bytes[j];
8766 /* Now the opcode; be careful about word order here! */
8767 if (i.tm.opcode_length == 1)
8769 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
8773 switch (i.tm.opcode_length)
8777 *p++ = (i.tm.base_opcode >> 24) & 0xff;
8778 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8782 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8792 /* Put out high byte first: can't use md_number_to_chars! */
8793 *p++ = (i.tm.base_opcode >> 8) & 0xff;
8794 *p = i.tm.base_opcode & 0xff;
8797 /* Now the modrm byte and sib byte (if present). */
8798 if (i.tm.opcode_modifier.modrm)
8800 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
8803 /* If i.rm.regmem == ESP (4)
8804 && i.rm.mode != (Register mode)
8806 ==> need second modrm byte. */
8807 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
8809 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
8810 FRAG_APPEND_1_CHAR ((i.sib.base << 0
8812 | i.sib.scale << 6));
8815 if (i.disp_operands)
8816 output_disp (insn_start_frag, insn_start_off);
8819 output_imm (insn_start_frag, insn_start_off);
8822 * frag_now_fix () returning plain abs_section_offset when we're in the
8823 * absolute section, and abs_section_offset not getting updated as data
8824 * gets added to the frag breaks the logic below.
8826 if (now_seg != absolute_section)
8828 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
8830 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
8834 /* NB: Don't add prefix with GOTPC relocation since
8835 output_disp() above depends on the fixed encoding
8836 length. Can't add prefix with TLS relocation since
8837 it breaks TLS linker optimization. */
8838 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
8839 /* Prefix count on the current instruction. */
8840 unsigned int count = i.vex.length;
8842 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
8843 /* REX byte is encoded in VEX/EVEX prefix. */
8844 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
8847 /* Count prefixes for extended opcode maps. */
8849 switch (i.tm.opcode_length)
8852 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
8855 switch ((i.tm.base_opcode >> 8) & 0xff)
8867 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
8876 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
8879 /* Set the maximum prefix size in BRANCH_PREFIX
8881 if (fragP->tc_frag_data.max_bytes > max)
8882 fragP->tc_frag_data.max_bytes = max;
8883 if (fragP->tc_frag_data.max_bytes > count)
8884 fragP->tc_frag_data.max_bytes -= count;
8886 fragP->tc_frag_data.max_bytes = 0;
8890 /* Remember the maximum prefix size in FUSED_JCC_PADDING
8892 unsigned int max_prefix_size;
8893 if (align_branch_prefix_size > max)
8894 max_prefix_size = max;
8896 max_prefix_size = align_branch_prefix_size;
8897 if (max_prefix_size > count)
8898 fragP->tc_frag_data.max_prefix_length
8899 = max_prefix_size - count;
8902 /* Use existing segment prefix if possible. Use CS
8903 segment prefix in 64-bit mode. In 32-bit mode, use SS
8904 segment prefix with ESP/EBP base register and use DS
8905 segment prefix without ESP/EBP base register. */
8906 if (i.prefix[SEG_PREFIX])
8907 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
8908 else if (flag_code == CODE_64BIT)
8909 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
8911 && (i.base_reg->reg_num == 4
8912 || i.base_reg->reg_num == 5))
8913 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
8915 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
8920 /* NB: Don't work with COND_JUMP86 without i386. */
8921 if (align_branch_power
8922 && now_seg != absolute_section
8923 && cpu_arch_flags.bitfield.cpui386)
8925 /* Terminate each frag so that we can add prefix and check for
8927 frag_wane (frag_now);
8934 pi ("" /*line*/, &i);
8936 #endif /* DEBUG386 */
8939 /* Return the size of the displacement operand N. */
8942 disp_size (unsigned int n)
8946 if (i.types[n].bitfield.disp64)
8948 else if (i.types[n].bitfield.disp8)
8950 else if (i.types[n].bitfield.disp16)
8955 /* Return the size of the immediate operand N. */
8958 imm_size (unsigned int n)
8961 if (i.types[n].bitfield.imm64)
8963 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
8965 else if (i.types[n].bitfield.imm16)
8971 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
8976 for (n = 0; n < i.operands; n++)
8978 if (operand_type_check (i.types[n], disp))
8980 if (i.op[n].disps->X_op == O_constant)
8982 int size = disp_size (n);
8983 offsetT val = i.op[n].disps->X_add_number;
8985 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
8987 p = frag_more (size);
8988 md_number_to_chars (p, val, size);
8992 enum bfd_reloc_code_real reloc_type;
8993 int size = disp_size (n);
8994 int sign = i.types[n].bitfield.disp32s;
8995 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
8998 /* We can't have 8 bit displacement here. */
8999 gas_assert (!i.types[n].bitfield.disp8);
9001 /* The PC relative address is computed relative
9002 to the instruction boundary, so in case immediate
9003 fields follows, we need to adjust the value. */
9004 if (pcrel && i.imm_operands)
9009 for (n1 = 0; n1 < i.operands; n1++)
9010 if (operand_type_check (i.types[n1], imm))
9012 /* Only one immediate is allowed for PC
9013 relative address. */
9014 gas_assert (sz == 0);
9016 i.op[n].disps->X_add_number -= sz;
9018 /* We should find the immediate. */
9019 gas_assert (sz != 0);
9022 p = frag_more (size);
9023 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9025 && GOT_symbol == i.op[n].disps->X_add_symbol
9026 && (((reloc_type == BFD_RELOC_32
9027 || reloc_type == BFD_RELOC_X86_64_32S
9028 || (reloc_type == BFD_RELOC_64
9030 && (i.op[n].disps->X_op == O_symbol
9031 || (i.op[n].disps->X_op == O_add
9032 && ((symbol_get_value_expression
9033 (i.op[n].disps->X_op_symbol)->X_op)
9035 || reloc_type == BFD_RELOC_32_PCREL))
9039 reloc_type = BFD_RELOC_386_GOTPC;
9040 i.has_gotpc_tls_reloc = TRUE;
9041 i.op[n].imms->X_add_number +=
9042 encoding_length (insn_start_frag, insn_start_off, p);
9044 else if (reloc_type == BFD_RELOC_64)
9045 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9047 /* Don't do the adjustment for x86-64, as there
9048 the pcrel addressing is relative to the _next_
9049 insn, and that is taken care of in other code. */
9050 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9052 else if (align_branch_power)
9056 case BFD_RELOC_386_TLS_GD:
9057 case BFD_RELOC_386_TLS_LDM:
9058 case BFD_RELOC_386_TLS_IE:
9059 case BFD_RELOC_386_TLS_IE_32:
9060 case BFD_RELOC_386_TLS_GOTIE:
9061 case BFD_RELOC_386_TLS_GOTDESC:
9062 case BFD_RELOC_386_TLS_DESC_CALL:
9063 case BFD_RELOC_X86_64_TLSGD:
9064 case BFD_RELOC_X86_64_TLSLD:
9065 case BFD_RELOC_X86_64_GOTTPOFF:
9066 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9067 case BFD_RELOC_X86_64_TLSDESC_CALL:
9068 i.has_gotpc_tls_reloc = TRUE;
9073 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9074 size, i.op[n].disps, pcrel,
9076 /* Check for "call/jmp *mem", "mov mem, %reg",
9077 "test %reg, mem" and "binop mem, %reg" where binop
9078 is one of adc, add, and, cmp, or, sbb, sub, xor
9079 instructions without data prefix. Always generate
9080 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9081 if (i.prefix[DATA_PREFIX] == 0
9082 && (generate_relax_relocations
9085 && i.rm.regmem == 5))
9087 || (i.rm.mode == 0 && i.rm.regmem == 5))
9088 && ((i.operands == 1
9089 && i.tm.base_opcode == 0xff
9090 && (i.rm.reg == 2 || i.rm.reg == 4))
9092 && (i.tm.base_opcode == 0x8b
9093 || i.tm.base_opcode == 0x85
9094 || (i.tm.base_opcode & 0xc7) == 0x03))))
9098 fixP->fx_tcbit = i.rex != 0;
9100 && (i.base_reg->reg_num == RegIP))
9101 fixP->fx_tcbit2 = 1;
9104 fixP->fx_tcbit2 = 1;
9112 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9117 for (n = 0; n < i.operands; n++)
9119 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
9120 if (i.rounding && (int) n == i.rounding->operand)
9123 if (operand_type_check (i.types[n], imm))
9125 if (i.op[n].imms->X_op == O_constant)
9127 int size = imm_size (n);
9130 val = offset_in_range (i.op[n].imms->X_add_number,
9132 p = frag_more (size);
9133 md_number_to_chars (p, val, size);
9137 /* Not absolute_section.
9138 Need a 32-bit fixup (don't support 8bit
9139 non-absolute imms). Try to support other
9141 enum bfd_reloc_code_real reloc_type;
9142 int size = imm_size (n);
9145 if (i.types[n].bitfield.imm32s
9146 && (i.suffix == QWORD_MNEM_SUFFIX
9147 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9152 p = frag_more (size);
9153 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9155 /* This is tough to explain. We end up with this one if we
9156 * have operands that look like
9157 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9158 * obtain the absolute address of the GOT, and it is strongly
9159 * preferable from a performance point of view to avoid using
9160 * a runtime relocation for this. The actual sequence of
9161 * instructions often look something like:
9166 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9168 * The call and pop essentially return the absolute address
9169 * of the label .L66 and store it in %ebx. The linker itself
9170 * will ultimately change the first operand of the addl so
9171 * that %ebx points to the GOT, but to keep things simple, the
9172 * .o file must have this operand set so that it generates not
9173 * the absolute address of .L66, but the absolute address of
9174 * itself. This allows the linker itself simply treat a GOTPC
9175 * relocation as asking for a pcrel offset to the GOT to be
9176 * added in, and the addend of the relocation is stored in the
9177 * operand field for the instruction itself.
9179 * Our job here is to fix the operand so that it would add
9180 * the correct offset so that %ebx would point to itself. The
9181 * thing that is tricky is that .-.L66 will point to the
9182 * beginning of the instruction, so we need to further modify
9183 * the operand so that it will point to itself. There are
9184 * other cases where you have something like:
9186 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9188 * and here no correction would be required. Internally in
9189 * the assembler we treat operands of this form as not being
9190 * pcrel since the '.' is explicitly mentioned, and I wonder
9191 * whether it would simplify matters to do it this way. Who
9192 * knows. In earlier versions of the PIC patches, the
9193 * pcrel_adjust field was used to store the correction, but
9194 * since the expression is not pcrel, I felt it would be
9195 * confusing to do it this way. */
9197 if ((reloc_type == BFD_RELOC_32
9198 || reloc_type == BFD_RELOC_X86_64_32S
9199 || reloc_type == BFD_RELOC_64)
9201 && GOT_symbol == i.op[n].imms->X_add_symbol
9202 && (i.op[n].imms->X_op == O_symbol
9203 || (i.op[n].imms->X_op == O_add
9204 && ((symbol_get_value_expression
9205 (i.op[n].imms->X_op_symbol)->X_op)
9209 reloc_type = BFD_RELOC_386_GOTPC;
9211 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9213 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9214 i.has_gotpc_tls_reloc = TRUE;
9215 i.op[n].imms->X_add_number +=
9216 encoding_length (insn_start_frag, insn_start_off, p);
9218 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9219 i.op[n].imms, 0, reloc_type);
9225 /* x86_cons_fix_new is called via the expression parsing code when a
9226 reloc is needed. We use this hook to get the correct .got reloc. */
9227 static int cons_sign = -1;
9230 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9231 expressionS *exp, bfd_reloc_code_real_type r)
9233 r = reloc (len, 0, cons_sign, r);
9236 if (exp->X_op == O_secrel)
9238 exp->X_op = O_symbol;
9239 r = BFD_RELOC_32_SECREL;
9243 fix_new_exp (frag, off, len, exp, 0, r);
9246 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9247 purpose of the `.dc.a' internal pseudo-op. */
9250 x86_address_bytes (void)
9252 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9254 return stdoutput->arch_info->bits_per_address / 8;
9257 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9259 # define lex_got(reloc, adjust, types) NULL
9261 /* Parse operands of the form
9262 <symbol>@GOTOFF+<nnn>
9263 and similar .plt or .got references.
9265 If we find one, set up the correct relocation in RELOC and copy the
9266 input string, minus the `@GOTOFF' into a malloc'd buffer for
9267 parsing by the calling routine. Return this buffer, and if ADJUST
9268 is non-null set it to the length of the string we removed from the
9269 input line. Otherwise return NULL. */
9271 lex_got (enum bfd_reloc_code_real *rel,
9273 i386_operand_type *types)
9275 /* Some of the relocations depend on the size of what field is to
9276 be relocated. But in our callers i386_immediate and i386_displacement
9277 we don't yet know the operand size (this will be set by insn
9278 matching). Hence we record the word32 relocation here,
9279 and adjust the reloc according to the real size in reloc(). */
9280 static const struct {
9283 const enum bfd_reloc_code_real rel[2];
9284 const i386_operand_type types64;
9286 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9287 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9289 OPERAND_TYPE_IMM32_64 },
9291 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9292 BFD_RELOC_X86_64_PLTOFF64 },
9293 OPERAND_TYPE_IMM64 },
9294 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9295 BFD_RELOC_X86_64_PLT32 },
9296 OPERAND_TYPE_IMM32_32S_DISP32 },
9297 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9298 BFD_RELOC_X86_64_GOTPLT64 },
9299 OPERAND_TYPE_IMM64_DISP64 },
9300 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9301 BFD_RELOC_X86_64_GOTOFF64 },
9302 OPERAND_TYPE_IMM64_DISP64 },
9303 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9304 BFD_RELOC_X86_64_GOTPCREL },
9305 OPERAND_TYPE_IMM32_32S_DISP32 },
9306 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9307 BFD_RELOC_X86_64_TLSGD },
9308 OPERAND_TYPE_IMM32_32S_DISP32 },
9309 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9310 _dummy_first_bfd_reloc_code_real },
9311 OPERAND_TYPE_NONE },
9312 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9313 BFD_RELOC_X86_64_TLSLD },
9314 OPERAND_TYPE_IMM32_32S_DISP32 },
9315 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9316 BFD_RELOC_X86_64_GOTTPOFF },
9317 OPERAND_TYPE_IMM32_32S_DISP32 },
9318 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9319 BFD_RELOC_X86_64_TPOFF32 },
9320 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9321 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9322 _dummy_first_bfd_reloc_code_real },
9323 OPERAND_TYPE_NONE },
9324 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9325 BFD_RELOC_X86_64_DTPOFF32 },
9326 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9327 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9328 _dummy_first_bfd_reloc_code_real },
9329 OPERAND_TYPE_NONE },
9330 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9331 _dummy_first_bfd_reloc_code_real },
9332 OPERAND_TYPE_NONE },
9333 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9334 BFD_RELOC_X86_64_GOT32 },
9335 OPERAND_TYPE_IMM32_32S_64_DISP32 },
9336 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9337 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9338 OPERAND_TYPE_IMM32_32S_DISP32 },
9339 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9340 BFD_RELOC_X86_64_TLSDESC_CALL },
9341 OPERAND_TYPE_IMM32_32S_DISP32 },
9346 #if defined (OBJ_MAYBE_ELF)
9351 for (cp = input_line_pointer; *cp != '@'; cp++)
9352 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9355 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9357 int len = gotrel[j].len;
9358 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9360 if (gotrel[j].rel[object_64bit] != 0)
9363 char *tmpbuf, *past_reloc;
9365 *rel = gotrel[j].rel[object_64bit];
9369 if (flag_code != CODE_64BIT)
9371 types->bitfield.imm32 = 1;
9372 types->bitfield.disp32 = 1;
9375 *types = gotrel[j].types64;
9378 if (j != 0 && GOT_symbol == NULL)
9379 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9381 /* The length of the first part of our input line. */
9382 first = cp - input_line_pointer;
9384 /* The second part goes from after the reloc token until
9385 (and including) an end_of_line char or comma. */
9386 past_reloc = cp + 1 + len;
9388 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9390 second = cp + 1 - past_reloc;
9392 /* Allocate and copy string. The trailing NUL shouldn't
9393 be necessary, but be safe. */
9394 tmpbuf = XNEWVEC (char, first + second + 2);
9395 memcpy (tmpbuf, input_line_pointer, first);
9396 if (second != 0 && *past_reloc != ' ')
9397 /* Replace the relocation token with ' ', so that
9398 errors like foo@GOTOFF1 will be detected. */
9399 tmpbuf[first++] = ' ';
9401 /* Increment length by 1 if the relocation token is
9406 memcpy (tmpbuf + first, past_reloc, second);
9407 tmpbuf[first + second] = '\0';
9411 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9412 gotrel[j].str, 1 << (5 + object_64bit));
9417 /* Might be a symbol version string. Don't as_bad here. */
9426 /* Parse operands of the form
9427 <symbol>@SECREL32+<nnn>
9429 If we find one, set up the correct relocation in RELOC and copy the
9430 input string, minus the `@SECREL32' into a malloc'd buffer for
9431 parsing by the calling routine. Return this buffer, and if ADJUST
9432 is non-null set it to the length of the string we removed from the
9433 input line. Otherwise return NULL.
9435 This function is copied from the ELF version above adjusted for PE targets. */
9438 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
9439 int *adjust ATTRIBUTE_UNUSED,
9440 i386_operand_type *types)
9446 const enum bfd_reloc_code_real rel[2];
9447 const i386_operand_type types64;
9451 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
9452 BFD_RELOC_32_SECREL },
9453 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9459 for (cp = input_line_pointer; *cp != '@'; cp++)
9460 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9463 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9465 int len = gotrel[j].len;
9467 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9469 if (gotrel[j].rel[object_64bit] != 0)
9472 char *tmpbuf, *past_reloc;
9474 *rel = gotrel[j].rel[object_64bit];
9480 if (flag_code != CODE_64BIT)
9482 types->bitfield.imm32 = 1;
9483 types->bitfield.disp32 = 1;
9486 *types = gotrel[j].types64;
9489 /* The length of the first part of our input line. */
9490 first = cp - input_line_pointer;
9492 /* The second part goes from after the reloc token until
9493 (and including) an end_of_line char or comma. */
9494 past_reloc = cp + 1 + len;
9496 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9498 second = cp + 1 - past_reloc;
9500 /* Allocate and copy string. The trailing NUL shouldn't
9501 be necessary, but be safe. */
9502 tmpbuf = XNEWVEC (char, first + second + 2);
9503 memcpy (tmpbuf, input_line_pointer, first);
9504 if (second != 0 && *past_reloc != ' ')
9505 /* Replace the relocation token with ' ', so that
9506 errors like foo@SECLREL321 will be detected. */
9507 tmpbuf[first++] = ' ';
9508 memcpy (tmpbuf + first, past_reloc, second);
9509 tmpbuf[first + second] = '\0';
9513 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9514 gotrel[j].str, 1 << (5 + object_64bit));
9519 /* Might be a symbol version string. Don't as_bad here. */
9525 bfd_reloc_code_real_type
9526 x86_cons (expressionS *exp, int size)
9528 bfd_reloc_code_real_type got_reloc = NO_RELOC;
9530 intel_syntax = -intel_syntax;
9533 if (size == 4 || (object_64bit && size == 8))
9535 /* Handle @GOTOFF and the like in an expression. */
9537 char *gotfree_input_line;
9540 save = input_line_pointer;
9541 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9542 if (gotfree_input_line)
9543 input_line_pointer = gotfree_input_line;
9547 if (gotfree_input_line)
9549 /* expression () has merrily parsed up to the end of line,
9550 or a comma - in the wrong buffer. Transfer how far
9551 input_line_pointer has moved to the right buffer. */
9552 input_line_pointer = (save
9553 + (input_line_pointer - gotfree_input_line)
9555 free (gotfree_input_line);
9556 if (exp->X_op == O_constant
9557 || exp->X_op == O_absent
9558 || exp->X_op == O_illegal
9559 || exp->X_op == O_register
9560 || exp->X_op == O_big)
9562 char c = *input_line_pointer;
9563 *input_line_pointer = 0;
9564 as_bad (_("missing or invalid expression `%s'"), save);
9565 *input_line_pointer = c;
9567 else if ((got_reloc == BFD_RELOC_386_PLT32
9568 || got_reloc == BFD_RELOC_X86_64_PLT32)
9569 && exp->X_op != O_symbol)
9571 char c = *input_line_pointer;
9572 *input_line_pointer = 0;
9573 as_bad (_("invalid PLT expression `%s'"), save);
9574 *input_line_pointer = c;
9581 intel_syntax = -intel_syntax;
9584 i386_intel_simplify (exp);
9590 signed_cons (int size)
9592 if (flag_code == CODE_64BIT)
9600 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
9607 if (exp.X_op == O_symbol)
9608 exp.X_op = O_secrel;
9610 emit_expr (&exp, 4);
9612 while (*input_line_pointer++ == ',');
9614 input_line_pointer--;
9615 demand_empty_rest_of_line ();
9619 /* Handle Vector operations. */
9622 check_VecOperations (char *op_string, char *op_end)
9624 const reg_entry *mask;
9629 && (op_end == NULL || op_string < op_end))
9632 if (*op_string == '{')
9636 /* Check broadcasts. */
9637 if (strncmp (op_string, "1to", 3) == 0)
9642 goto duplicated_vec_op;
9645 if (*op_string == '8')
9647 else if (*op_string == '4')
9649 else if (*op_string == '2')
9651 else if (*op_string == '1'
9652 && *(op_string+1) == '6')
9659 as_bad (_("Unsupported broadcast: `%s'"), saved);
9664 broadcast_op.type = bcst_type;
9665 broadcast_op.operand = this_operand;
9666 broadcast_op.bytes = 0;
9667 i.broadcast = &broadcast_op;
9669 /* Check masking operation. */
9670 else if ((mask = parse_register (op_string, &end_op)) != NULL)
9672 /* k0 can't be used for write mask. */
9673 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
9675 as_bad (_("`%s%s' can't be used for write mask"),
9676 register_prefix, mask->reg_name);
9682 mask_op.mask = mask;
9683 mask_op.zeroing = 0;
9684 mask_op.operand = this_operand;
9690 goto duplicated_vec_op;
9692 i.mask->mask = mask;
9694 /* Only "{z}" is allowed here. No need to check
9695 zeroing mask explicitly. */
9696 if (i.mask->operand != this_operand)
9698 as_bad (_("invalid write mask `%s'"), saved);
9705 /* Check zeroing-flag for masking operation. */
9706 else if (*op_string == 'z')
9710 mask_op.mask = NULL;
9711 mask_op.zeroing = 1;
9712 mask_op.operand = this_operand;
9717 if (i.mask->zeroing)
9720 as_bad (_("duplicated `%s'"), saved);
9724 i.mask->zeroing = 1;
9726 /* Only "{%k}" is allowed here. No need to check mask
9727 register explicitly. */
9728 if (i.mask->operand != this_operand)
9730 as_bad (_("invalid zeroing-masking `%s'"),
9739 goto unknown_vec_op;
9741 if (*op_string != '}')
9743 as_bad (_("missing `}' in `%s'"), saved);
9748 /* Strip whitespace since the addition of pseudo prefixes
9749 changed how the scrubber treats '{'. */
9750 if (is_space_char (*op_string))
9756 /* We don't know this one. */
9757 as_bad (_("unknown vector operation: `%s'"), saved);
9761 if (i.mask && i.mask->zeroing && !i.mask->mask)
9763 as_bad (_("zeroing-masking only allowed with write mask"));
9771 i386_immediate (char *imm_start)
9773 char *save_input_line_pointer;
9774 char *gotfree_input_line;
9777 i386_operand_type types;
9779 operand_type_set (&types, ~0);
9781 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9783 as_bad (_("at most %d immediate operands are allowed"),
9784 MAX_IMMEDIATE_OPERANDS);
9788 exp = &im_expressions[i.imm_operands++];
9789 i.op[this_operand].imms = exp;
9791 if (is_space_char (*imm_start))
9794 save_input_line_pointer = input_line_pointer;
9795 input_line_pointer = imm_start;
9797 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9798 if (gotfree_input_line)
9799 input_line_pointer = gotfree_input_line;
9801 exp_seg = expression (exp);
9805 /* Handle vector operations. */
9806 if (*input_line_pointer == '{')
9808 input_line_pointer = check_VecOperations (input_line_pointer,
9810 if (input_line_pointer == NULL)
9814 if (*input_line_pointer)
9815 as_bad (_("junk `%s' after expression"), input_line_pointer);
9817 input_line_pointer = save_input_line_pointer;
9818 if (gotfree_input_line)
9820 free (gotfree_input_line);
9822 if (exp->X_op == O_constant || exp->X_op == O_register)
9823 exp->X_op = O_illegal;
9826 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9830 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9831 i386_operand_type types, const char *imm_start)
9833 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9836 as_bad (_("missing or invalid immediate expression `%s'"),
9840 else if (exp->X_op == O_constant)
9842 /* Size it properly later. */
9843 i.types[this_operand].bitfield.imm64 = 1;
9844 /* If not 64bit, sign extend val. */
9845 if (flag_code != CODE_64BIT
9846 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9848 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
9850 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9851 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9852 && exp_seg != absolute_section
9853 && exp_seg != text_section
9854 && exp_seg != data_section
9855 && exp_seg != bss_section
9856 && exp_seg != undefined_section
9857 && !bfd_is_com_section (exp_seg))
9859 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9863 else if (!intel_syntax && exp_seg == reg_section)
9866 as_bad (_("illegal immediate register operand %s"), imm_start);
9871 /* This is an address. The size of the address will be
9872 determined later, depending on destination register,
9873 suffix, or the default for the section. */
9874 i.types[this_operand].bitfield.imm8 = 1;
9875 i.types[this_operand].bitfield.imm16 = 1;
9876 i.types[this_operand].bitfield.imm32 = 1;
9877 i.types[this_operand].bitfield.imm32s = 1;
9878 i.types[this_operand].bitfield.imm64 = 1;
9879 i.types[this_operand] = operand_type_and (i.types[this_operand],
9887 i386_scale (char *scale)
9890 char *save = input_line_pointer;
9892 input_line_pointer = scale;
9893 val = get_absolute_expression ();
9898 i.log2_scale_factor = 0;
9901 i.log2_scale_factor = 1;
9904 i.log2_scale_factor = 2;
9907 i.log2_scale_factor = 3;
9911 char sep = *input_line_pointer;
9913 *input_line_pointer = '\0';
9914 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
9916 *input_line_pointer = sep;
9917 input_line_pointer = save;
9921 if (i.log2_scale_factor != 0 && i.index_reg == 0)
9923 as_warn (_("scale factor of %d without an index register"),
9924 1 << i.log2_scale_factor);
9925 i.log2_scale_factor = 0;
9927 scale = input_line_pointer;
9928 input_line_pointer = save;
9933 i386_displacement (char *disp_start, char *disp_end)
9937 char *save_input_line_pointer;
9938 char *gotfree_input_line;
9940 i386_operand_type bigdisp, types = anydisp;
9943 if (i.disp_operands == MAX_MEMORY_OPERANDS)
9945 as_bad (_("at most %d displacement operands are allowed"),
9946 MAX_MEMORY_OPERANDS);
9950 operand_type_set (&bigdisp, 0);
9952 || i.types[this_operand].bitfield.baseindex
9953 || (current_templates->start->opcode_modifier.jump != JUMP
9954 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
9956 i386_addressing_mode ();
9957 override = (i.prefix[ADDR_PREFIX] != 0);
9958 if (flag_code == CODE_64BIT)
9962 bigdisp.bitfield.disp32s = 1;
9963 bigdisp.bitfield.disp64 = 1;
9966 bigdisp.bitfield.disp32 = 1;
9968 else if ((flag_code == CODE_16BIT) ^ override)
9969 bigdisp.bitfield.disp16 = 1;
9971 bigdisp.bitfield.disp32 = 1;
9975 /* For PC-relative branches, the width of the displacement may be
9976 dependent upon data size, but is never dependent upon address size.
9977 Also make sure to not unintentionally match against a non-PC-relative
9979 static templates aux_templates;
9980 const insn_template *t = current_templates->start;
9981 bfd_boolean has_intel64 = FALSE;
9983 aux_templates.start = t;
9984 while (++t < current_templates->end)
9986 if (t->opcode_modifier.jump
9987 != current_templates->start->opcode_modifier.jump)
9989 if (t->opcode_modifier.intel64)
9992 if (t < current_templates->end)
9994 aux_templates.end = t;
9995 current_templates = &aux_templates;
9998 override = (i.prefix[DATA_PREFIX] != 0);
9999 if (flag_code == CODE_64BIT)
10001 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10002 && (!intel64 || !has_intel64))
10003 bigdisp.bitfield.disp16 = 1;
10005 bigdisp.bitfield.disp32s = 1;
10010 override = (i.suffix == (flag_code != CODE_16BIT
10012 : LONG_MNEM_SUFFIX));
10013 bigdisp.bitfield.disp32 = 1;
10014 if ((flag_code == CODE_16BIT) ^ override)
10016 bigdisp.bitfield.disp32 = 0;
10017 bigdisp.bitfield.disp16 = 1;
10021 i.types[this_operand] = operand_type_or (i.types[this_operand],
10024 exp = &disp_expressions[i.disp_operands];
10025 i.op[this_operand].disps = exp;
10027 save_input_line_pointer = input_line_pointer;
10028 input_line_pointer = disp_start;
10029 END_STRING_AND_SAVE (disp_end);
10031 #ifndef GCC_ASM_O_HACK
10032 #define GCC_ASM_O_HACK 0
10035 END_STRING_AND_SAVE (disp_end + 1);
10036 if (i.types[this_operand].bitfield.baseIndex
10037 && displacement_string_end[-1] == '+')
10039 /* This hack is to avoid a warning when using the "o"
10040 constraint within gcc asm statements.
10043 #define _set_tssldt_desc(n,addr,limit,type) \
10044 __asm__ __volatile__ ( \
10045 "movw %w2,%0\n\t" \
10046 "movw %w1,2+%0\n\t" \
10047 "rorl $16,%1\n\t" \
10048 "movb %b1,4+%0\n\t" \
10049 "movb %4,5+%0\n\t" \
10050 "movb $0,6+%0\n\t" \
10051 "movb %h1,7+%0\n\t" \
10053 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10055 This works great except that the output assembler ends
10056 up looking a bit weird if it turns out that there is
10057 no offset. You end up producing code that looks like:
10070 So here we provide the missing zero. */
10072 *displacement_string_end = '0';
10075 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10076 if (gotfree_input_line)
10077 input_line_pointer = gotfree_input_line;
10079 exp_seg = expression (exp);
10081 SKIP_WHITESPACE ();
10082 if (*input_line_pointer)
10083 as_bad (_("junk `%s' after expression"), input_line_pointer);
10085 RESTORE_END_STRING (disp_end + 1);
10087 input_line_pointer = save_input_line_pointer;
10088 if (gotfree_input_line)
10090 free (gotfree_input_line);
10092 if (exp->X_op == O_constant || exp->X_op == O_register)
10093 exp->X_op = O_illegal;
10096 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10098 RESTORE_END_STRING (disp_end);
10104 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10105 i386_operand_type types, const char *disp_start)
10107 i386_operand_type bigdisp;
10110 /* We do this to make sure that the section symbol is in
10111 the symbol table. We will ultimately change the relocation
10112 to be relative to the beginning of the section. */
10113 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10114 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10115 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10117 if (exp->X_op != O_symbol)
10120 if (S_IS_LOCAL (exp->X_add_symbol)
10121 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10122 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10123 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10124 exp->X_op = O_subtract;
10125 exp->X_op_symbol = GOT_symbol;
10126 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10127 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10128 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10129 i.reloc[this_operand] = BFD_RELOC_64;
10131 i.reloc[this_operand] = BFD_RELOC_32;
10134 else if (exp->X_op == O_absent
10135 || exp->X_op == O_illegal
10136 || exp->X_op == O_big)
10139 as_bad (_("missing or invalid displacement expression `%s'"),
10144 else if (flag_code == CODE_64BIT
10145 && !i.prefix[ADDR_PREFIX]
10146 && exp->X_op == O_constant)
10148 /* Since displacement is signed extended to 64bit, don't allow
10149 disp32 and turn off disp32s if they are out of range. */
10150 i.types[this_operand].bitfield.disp32 = 0;
10151 if (!fits_in_signed_long (exp->X_add_number))
10153 i.types[this_operand].bitfield.disp32s = 0;
10154 if (i.types[this_operand].bitfield.baseindex)
10156 as_bad (_("0x%lx out range of signed 32bit displacement"),
10157 (long) exp->X_add_number);
10163 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10164 else if (exp->X_op != O_constant
10165 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10166 && exp_seg != absolute_section
10167 && exp_seg != text_section
10168 && exp_seg != data_section
10169 && exp_seg != bss_section
10170 && exp_seg != undefined_section
10171 && !bfd_is_com_section (exp_seg))
10173 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10178 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10179 /* Constants get taken care of by optimize_disp(). */
10180 && exp->X_op != O_constant)
10181 i.types[this_operand].bitfield.disp8 = 1;
10183 /* Check if this is a displacement only operand. */
10184 bigdisp = i.types[this_operand];
10185 bigdisp.bitfield.disp8 = 0;
10186 bigdisp.bitfield.disp16 = 0;
10187 bigdisp.bitfield.disp32 = 0;
10188 bigdisp.bitfield.disp32s = 0;
10189 bigdisp.bitfield.disp64 = 0;
10190 if (operand_type_all_zero (&bigdisp))
10191 i.types[this_operand] = operand_type_and (i.types[this_operand],
10197 /* Return the active addressing mode, taking address override and
10198 registers forming the address into consideration. Update the
10199 address override prefix if necessary. */
10201 static enum flag_code
10202 i386_addressing_mode (void)
10204 enum flag_code addr_mode;
10206 if (i.prefix[ADDR_PREFIX])
10207 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10210 addr_mode = flag_code;
10212 #if INFER_ADDR_PREFIX
10213 if (i.mem_operands == 0)
10215 /* Infer address prefix from the first memory operand. */
10216 const reg_entry *addr_reg = i.base_reg;
10218 if (addr_reg == NULL)
10219 addr_reg = i.index_reg;
10223 if (addr_reg->reg_type.bitfield.dword)
10224 addr_mode = CODE_32BIT;
10225 else if (flag_code != CODE_64BIT
10226 && addr_reg->reg_type.bitfield.word)
10227 addr_mode = CODE_16BIT;
10229 if (addr_mode != flag_code)
10231 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10233 /* Change the size of any displacement too. At most one
10234 of Disp16 or Disp32 is set.
10235 FIXME. There doesn't seem to be any real need for
10236 separate Disp16 and Disp32 flags. The same goes for
10237 Imm16 and Imm32. Removing them would probably clean
10238 up the code quite a lot. */
10239 if (flag_code != CODE_64BIT
10240 && (i.types[this_operand].bitfield.disp16
10241 || i.types[this_operand].bitfield.disp32))
10242 i.types[this_operand]
10243 = operand_type_xor (i.types[this_operand], disp16_32);
10253 /* Make sure the memory operand we've been dealt is valid.
10254 Return 1 on success, 0 on a failure. */
10257 i386_index_check (const char *operand_string)
10259 const char *kind = "base/index";
10260 enum flag_code addr_mode = i386_addressing_mode ();
10262 if (current_templates->start->opcode_modifier.isstring
10263 && !current_templates->start->cpu_flags.bitfield.cpupadlock
10264 && (current_templates->end[-1].opcode_modifier.isstring
10265 || i.mem_operands))
10267 /* Memory operands of string insns are special in that they only allow
10268 a single register (rDI, rSI, or rBX) as their memory address. */
10269 const reg_entry *expected_reg;
10270 static const char *di_si[][2] =
10276 static const char *bx[] = { "ebx", "bx", "rbx" };
10278 kind = "string address";
10280 if (current_templates->start->opcode_modifier.repprefixok)
10282 int es_op = current_templates->end[-1].opcode_modifier.isstring
10283 - IS_STRING_ES_OP0;
10286 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10287 || ((!i.mem_operands != !intel_syntax)
10288 && current_templates->end[-1].operand_types[1]
10289 .bitfield.baseindex))
10291 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10294 expected_reg = hash_find (reg_hash, bx[addr_mode]);
10296 if (i.base_reg != expected_reg
10298 || operand_type_check (i.types[this_operand], disp))
10300 /* The second memory operand must have the same size as
10304 && !((addr_mode == CODE_64BIT
10305 && i.base_reg->reg_type.bitfield.qword)
10306 || (addr_mode == CODE_32BIT
10307 ? i.base_reg->reg_type.bitfield.dword
10308 : i.base_reg->reg_type.bitfield.word)))
10311 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10313 intel_syntax ? '[' : '(',
10315 expected_reg->reg_name,
10316 intel_syntax ? ']' : ')');
10323 as_bad (_("`%s' is not a valid %s expression"),
10324 operand_string, kind);
10329 if (addr_mode != CODE_16BIT)
10331 /* 32-bit/64-bit checks. */
10333 && ((addr_mode == CODE_64BIT
10334 ? !i.base_reg->reg_type.bitfield.qword
10335 : !i.base_reg->reg_type.bitfield.dword)
10336 || (i.index_reg && i.base_reg->reg_num == RegIP)
10337 || i.base_reg->reg_num == RegIZ))
10339 && !i.index_reg->reg_type.bitfield.xmmword
10340 && !i.index_reg->reg_type.bitfield.ymmword
10341 && !i.index_reg->reg_type.bitfield.zmmword
10342 && ((addr_mode == CODE_64BIT
10343 ? !i.index_reg->reg_type.bitfield.qword
10344 : !i.index_reg->reg_type.bitfield.dword)
10345 || !i.index_reg->reg_type.bitfield.baseindex)))
10348 /* bndmk, bndldx, and bndstx have special restrictions. */
10349 if (current_templates->start->base_opcode == 0xf30f1b
10350 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10352 /* They cannot use RIP-relative addressing. */
10353 if (i.base_reg && i.base_reg->reg_num == RegIP)
10355 as_bad (_("`%s' cannot be used here"), operand_string);
10359 /* bndldx and bndstx ignore their scale factor. */
10360 if (current_templates->start->base_opcode != 0xf30f1b
10361 && i.log2_scale_factor)
10362 as_warn (_("register scaling is being ignored here"));
10367 /* 16-bit checks. */
10369 && (!i.base_reg->reg_type.bitfield.word
10370 || !i.base_reg->reg_type.bitfield.baseindex))
10372 && (!i.index_reg->reg_type.bitfield.word
10373 || !i.index_reg->reg_type.bitfield.baseindex
10375 && i.base_reg->reg_num < 6
10376 && i.index_reg->reg_num >= 6
10377 && i.log2_scale_factor == 0))))
10384 /* Handle vector immediates. */
10387 RC_SAE_immediate (const char *imm_start)
10389 unsigned int match_found, j;
10390 const char *pstr = imm_start;
10398 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10400 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10404 rc_op.type = RC_NamesTable[j].type;
10405 rc_op.operand = this_operand;
10406 i.rounding = &rc_op;
10410 as_bad (_("duplicated `%s'"), imm_start);
10413 pstr += RC_NamesTable[j].len;
10421 if (*pstr++ != '}')
10423 as_bad (_("Missing '}': '%s'"), imm_start);
10426 /* RC/SAE immediate string should contain nothing more. */;
10429 as_bad (_("Junk after '}': '%s'"), imm_start);
10433 exp = &im_expressions[i.imm_operands++];
10434 i.op[this_operand].imms = exp;
10436 exp->X_op = O_constant;
10437 exp->X_add_number = 0;
10438 exp->X_add_symbol = (symbolS *) 0;
10439 exp->X_op_symbol = (symbolS *) 0;
10441 i.types[this_operand].bitfield.imm8 = 1;
10445 /* Only string instructions can have a second memory operand, so
10446 reduce current_templates to just those if it contains any. */
10448 maybe_adjust_templates (void)
10450 const insn_template *t;
10452 gas_assert (i.mem_operands == 1);
10454 for (t = current_templates->start; t < current_templates->end; ++t)
10455 if (t->opcode_modifier.isstring)
10458 if (t < current_templates->end)
10460 static templates aux_templates;
10461 bfd_boolean recheck;
10463 aux_templates.start = t;
10464 for (; t < current_templates->end; ++t)
10465 if (!t->opcode_modifier.isstring)
10467 aux_templates.end = t;
10469 /* Determine whether to re-check the first memory operand. */
10470 recheck = (aux_templates.start != current_templates->start
10471 || t != current_templates->end);
10473 current_templates = &aux_templates;
10477 i.mem_operands = 0;
10478 if (i.memop1_string != NULL
10479 && i386_index_check (i.memop1_string) == 0)
10481 i.mem_operands = 1;
10488 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
10492 i386_att_operand (char *operand_string)
10494 const reg_entry *r;
10496 char *op_string = operand_string;
10498 if (is_space_char (*op_string))
10501 /* We check for an absolute prefix (differentiating,
10502 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
10503 if (*op_string == ABSOLUTE_PREFIX)
10506 if (is_space_char (*op_string))
10508 i.jumpabsolute = TRUE;
10511 /* Check if operand is a register. */
10512 if ((r = parse_register (op_string, &end_op)) != NULL)
10514 i386_operand_type temp;
10516 /* Check for a segment override by searching for ':' after a
10517 segment register. */
10518 op_string = end_op;
10519 if (is_space_char (*op_string))
10521 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
10523 switch (r->reg_num)
10526 i.seg[i.mem_operands] = &es;
10529 i.seg[i.mem_operands] = &cs;
10532 i.seg[i.mem_operands] = &ss;
10535 i.seg[i.mem_operands] = &ds;
10538 i.seg[i.mem_operands] = &fs;
10541 i.seg[i.mem_operands] = &gs;
10545 /* Skip the ':' and whitespace. */
10547 if (is_space_char (*op_string))
10550 if (!is_digit_char (*op_string)
10551 && !is_identifier_char (*op_string)
10552 && *op_string != '('
10553 && *op_string != ABSOLUTE_PREFIX)
10555 as_bad (_("bad memory operand `%s'"), op_string);
10558 /* Handle case of %es:*foo. */
10559 if (*op_string == ABSOLUTE_PREFIX)
10562 if (is_space_char (*op_string))
10564 i.jumpabsolute = TRUE;
10566 goto do_memory_reference;
10569 /* Handle vector operations. */
10570 if (*op_string == '{')
10572 op_string = check_VecOperations (op_string, NULL);
10573 if (op_string == NULL)
10579 as_bad (_("junk `%s' after register"), op_string);
10582 temp = r->reg_type;
10583 temp.bitfield.baseindex = 0;
10584 i.types[this_operand] = operand_type_or (i.types[this_operand],
10586 i.types[this_operand].bitfield.unspecified = 0;
10587 i.op[this_operand].regs = r;
10590 else if (*op_string == REGISTER_PREFIX)
10592 as_bad (_("bad register name `%s'"), op_string);
10595 else if (*op_string == IMMEDIATE_PREFIX)
10598 if (i.jumpabsolute)
10600 as_bad (_("immediate operand illegal with absolute jump"));
10603 if (!i386_immediate (op_string))
10606 else if (RC_SAE_immediate (operand_string))
10608 /* If it is a RC or SAE immediate, do nothing. */
10611 else if (is_digit_char (*op_string)
10612 || is_identifier_char (*op_string)
10613 || *op_string == '"'
10614 || *op_string == '(')
10616 /* This is a memory reference of some sort. */
10619 /* Start and end of displacement string expression (if found). */
10620 char *displacement_string_start;
10621 char *displacement_string_end;
10624 do_memory_reference:
10625 if (i.mem_operands == 1 && !maybe_adjust_templates ())
10627 if ((i.mem_operands == 1
10628 && !current_templates->start->opcode_modifier.isstring)
10629 || i.mem_operands == 2)
10631 as_bad (_("too many memory references for `%s'"),
10632 current_templates->start->name);
10636 /* Check for base index form. We detect the base index form by
10637 looking for an ')' at the end of the operand, searching
10638 for the '(' matching it, and finding a REGISTER_PREFIX or ','
10640 base_string = op_string + strlen (op_string);
10642 /* Handle vector operations. */
10643 vop_start = strchr (op_string, '{');
10644 if (vop_start && vop_start < base_string)
10646 if (check_VecOperations (vop_start, base_string) == NULL)
10648 base_string = vop_start;
10652 if (is_space_char (*base_string))
10655 /* If we only have a displacement, set-up for it to be parsed later. */
10656 displacement_string_start = op_string;
10657 displacement_string_end = base_string + 1;
10659 if (*base_string == ')')
10662 unsigned int parens_balanced = 1;
10663 /* We've already checked that the number of left & right ()'s are
10664 equal, so this loop will not be infinite. */
10668 if (*base_string == ')')
10670 if (*base_string == '(')
10673 while (parens_balanced);
10675 temp_string = base_string;
10677 /* Skip past '(' and whitespace. */
10679 if (is_space_char (*base_string))
10682 if (*base_string == ','
10683 || ((i.base_reg = parse_register (base_string, &end_op))
10686 displacement_string_end = temp_string;
10688 i.types[this_operand].bitfield.baseindex = 1;
10692 base_string = end_op;
10693 if (is_space_char (*base_string))
10697 /* There may be an index reg or scale factor here. */
10698 if (*base_string == ',')
10701 if (is_space_char (*base_string))
10704 if ((i.index_reg = parse_register (base_string, &end_op))
10707 base_string = end_op;
10708 if (is_space_char (*base_string))
10710 if (*base_string == ',')
10713 if (is_space_char (*base_string))
10716 else if (*base_string != ')')
10718 as_bad (_("expecting `,' or `)' "
10719 "after index register in `%s'"),
10724 else if (*base_string == REGISTER_PREFIX)
10726 end_op = strchr (base_string, ',');
10729 as_bad (_("bad register name `%s'"), base_string);
10733 /* Check for scale factor. */
10734 if (*base_string != ')')
10736 char *end_scale = i386_scale (base_string);
10741 base_string = end_scale;
10742 if (is_space_char (*base_string))
10744 if (*base_string != ')')
10746 as_bad (_("expecting `)' "
10747 "after scale factor in `%s'"),
10752 else if (!i.index_reg)
10754 as_bad (_("expecting index register or scale factor "
10755 "after `,'; got '%c'"),
10760 else if (*base_string != ')')
10762 as_bad (_("expecting `,' or `)' "
10763 "after base register in `%s'"),
10768 else if (*base_string == REGISTER_PREFIX)
10770 end_op = strchr (base_string, ',');
10773 as_bad (_("bad register name `%s'"), base_string);
10778 /* If there's an expression beginning the operand, parse it,
10779 assuming displacement_string_start and
10780 displacement_string_end are meaningful. */
10781 if (displacement_string_start != displacement_string_end)
10783 if (!i386_displacement (displacement_string_start,
10784 displacement_string_end))
10788 /* Special case for (%dx) while doing input/output op. */
10790 && i.base_reg->reg_type.bitfield.instance == RegD
10791 && i.base_reg->reg_type.bitfield.word
10792 && i.index_reg == 0
10793 && i.log2_scale_factor == 0
10794 && i.seg[i.mem_operands] == 0
10795 && !operand_type_check (i.types[this_operand], disp))
10797 i.types[this_operand] = i.base_reg->reg_type;
10801 if (i386_index_check (operand_string) == 0)
10803 i.flags[this_operand] |= Operand_Mem;
10804 if (i.mem_operands == 0)
10805 i.memop1_string = xstrdup (operand_string);
10810 /* It's not a memory operand; argh! */
10811 as_bad (_("invalid char %s beginning operand %d `%s'"),
10812 output_invalid (*op_string),
10817 return 1; /* Normal return. */
10820 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10821 that an rs_machine_dependent frag may reach. */
10824 i386_frag_max_var (fragS *frag)
10826 /* The only relaxable frags are for jumps.
10827 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
10828 gas_assert (frag->fr_type == rs_machine_dependent);
10829 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
10832 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10834 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
10836 /* STT_GNU_IFUNC symbol must go through PLT. */
10837 if ((symbol_get_bfdsym (fr_symbol)->flags
10838 & BSF_GNU_INDIRECT_FUNCTION) != 0)
10841 if (!S_IS_EXTERNAL (fr_symbol))
10842 /* Symbol may be weak or local. */
10843 return !S_IS_WEAK (fr_symbol);
10845 /* Global symbols with non-default visibility can't be preempted. */
10846 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
10849 if (fr_var != NO_RELOC)
10850 switch ((enum bfd_reloc_code_real) fr_var)
10852 case BFD_RELOC_386_PLT32:
10853 case BFD_RELOC_X86_64_PLT32:
10854 /* Symbol with PLT relocation may be preempted. */
10860 /* Global symbols with default visibility in a shared library may be
10861 preempted by another definition. */
10866 /* Return the next non-empty frag. */
10869 i386_next_non_empty_frag (fragS *fragP)
10871 /* There may be a frag with a ".fill 0" when there is no room in
10872 the current frag for frag_grow in output_insn. */
10873 for (fragP = fragP->fr_next;
10875 && fragP->fr_type == rs_fill
10876 && fragP->fr_fix == 0);
10877 fragP = fragP->fr_next)
10882 /* Return the next jcc frag after BRANCH_PADDING. */
10885 i386_next_jcc_frag (fragS *fragP)
10890 if (fragP->fr_type == rs_machine_dependent
10891 && (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10892 == BRANCH_PADDING))
10894 fragP = i386_next_non_empty_frag (fragP);
10895 if (fragP->fr_type != rs_machine_dependent)
10897 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == COND_JUMP)
10904 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
10907 i386_classify_machine_dependent_frag (fragS *fragP)
10911 fragS *branch_fragP;
10913 unsigned int max_prefix_length;
10915 if (fragP->tc_frag_data.classified)
10918 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
10919 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
10920 for (next_fragP = fragP;
10921 next_fragP != NULL;
10922 next_fragP = next_fragP->fr_next)
10924 next_fragP->tc_frag_data.classified = 1;
10925 if (next_fragP->fr_type == rs_machine_dependent)
10926 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
10928 case BRANCH_PADDING:
10929 /* The BRANCH_PADDING frag must be followed by a branch
10931 branch_fragP = i386_next_non_empty_frag (next_fragP);
10932 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10934 case FUSED_JCC_PADDING:
10935 /* Check if this is a fused jcc:
10937 CMP like instruction
10941 cmp_fragP = i386_next_non_empty_frag (next_fragP);
10942 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
10943 branch_fragP = i386_next_jcc_frag (pad_fragP);
10946 /* The BRANCH_PADDING frag is merged with the
10947 FUSED_JCC_PADDING frag. */
10948 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10949 /* CMP like instruction size. */
10950 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
10951 frag_wane (pad_fragP);
10952 /* Skip to branch_fragP. */
10953 next_fragP = branch_fragP;
10955 else if (next_fragP->tc_frag_data.max_prefix_length)
10957 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
10959 next_fragP->fr_subtype
10960 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
10961 next_fragP->tc_frag_data.max_bytes
10962 = next_fragP->tc_frag_data.max_prefix_length;
10963 /* This will be updated in the BRANCH_PREFIX scan. */
10964 next_fragP->tc_frag_data.max_prefix_length = 0;
10967 frag_wane (next_fragP);
10972 /* Stop if there is no BRANCH_PREFIX. */
10973 if (!align_branch_prefix_size)
10976 /* Scan for BRANCH_PREFIX. */
10977 for (; fragP != NULL; fragP = fragP->fr_next)
10979 if (fragP->fr_type != rs_machine_dependent
10980 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10984 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
10985 COND_JUMP_PREFIX. */
10986 max_prefix_length = 0;
10987 for (next_fragP = fragP;
10988 next_fragP != NULL;
10989 next_fragP = next_fragP->fr_next)
10991 if (next_fragP->fr_type == rs_fill)
10992 /* Skip rs_fill frags. */
10994 else if (next_fragP->fr_type != rs_machine_dependent)
10995 /* Stop for all other frags. */
10998 /* rs_machine_dependent frags. */
10999 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11002 /* Count BRANCH_PREFIX frags. */
11003 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11005 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11006 frag_wane (next_fragP);
11010 += next_fragP->tc_frag_data.max_bytes;
11012 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11014 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11015 == FUSED_JCC_PADDING))
11017 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11018 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11022 /* Stop for other rs_machine_dependent frags. */
11026 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11028 /* Skip to the next frag. */
11029 fragP = next_fragP;
11033 /* Compute padding size for
11036 CMP like instruction
11038 COND_JUMP/UNCOND_JUMP
11043 COND_JUMP/UNCOND_JUMP
11047 i386_branch_padding_size (fragS *fragP, offsetT address)
11049 unsigned int offset, size, padding_size;
11050 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11052 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11054 address = fragP->fr_address;
11055 address += fragP->fr_fix;
11057 /* CMP like instrunction size. */
11058 size = fragP->tc_frag_data.cmp_size;
11060 /* The base size of the branch frag. */
11061 size += branch_fragP->fr_fix;
11063 /* Add opcode and displacement bytes for the rs_machine_dependent
11065 if (branch_fragP->fr_type == rs_machine_dependent)
11066 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11068 /* Check if branch is within boundary and doesn't end at the last
11070 offset = address & ((1U << align_branch_power) - 1);
11071 if ((offset + size) >= (1U << align_branch_power))
11072 /* Padding needed to avoid crossing boundary. */
11073 padding_size = (1U << align_branch_power) - offset;
11075 /* No padding needed. */
11078 /* The return value may be saved in tc_frag_data.length which is
11080 if (!fits_in_unsigned_byte (padding_size))
11083 return padding_size;
11086 /* i386_generic_table_relax_frag()
11088 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11089 grow/shrink padding to align branch frags. Hand others to
11093 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11095 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11096 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11098 long padding_size = i386_branch_padding_size (fragP, 0);
11099 long grow = padding_size - fragP->tc_frag_data.length;
11101 /* When the BRANCH_PREFIX frag is used, the computed address
11102 must match the actual address and there should be no padding. */
11103 if (fragP->tc_frag_data.padding_address
11104 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11108 /* Update the padding size. */
11110 fragP->tc_frag_data.length = padding_size;
11114 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11116 fragS *padding_fragP, *next_fragP;
11117 long padding_size, left_size, last_size;
11119 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11120 if (!padding_fragP)
11121 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11122 return (fragP->tc_frag_data.length
11123 - fragP->tc_frag_data.last_length);
11125 /* Compute the relative address of the padding frag in the very
11126 first time where the BRANCH_PREFIX frag sizes are zero. */
11127 if (!fragP->tc_frag_data.padding_address)
11128 fragP->tc_frag_data.padding_address
11129 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11131 /* First update the last length from the previous interation. */
11132 left_size = fragP->tc_frag_data.prefix_length;
11133 for (next_fragP = fragP;
11134 next_fragP != padding_fragP;
11135 next_fragP = next_fragP->fr_next)
11136 if (next_fragP->fr_type == rs_machine_dependent
11137 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11142 int max = next_fragP->tc_frag_data.max_bytes;
11146 if (max > left_size)
11151 next_fragP->tc_frag_data.last_length = size;
11155 next_fragP->tc_frag_data.last_length = 0;
11158 /* Check the padding size for the padding frag. */
11159 padding_size = i386_branch_padding_size
11160 (padding_fragP, (fragP->fr_address
11161 + fragP->tc_frag_data.padding_address));
11163 last_size = fragP->tc_frag_data.prefix_length;
11164 /* Check if there is change from the last interation. */
11165 if (padding_size == last_size)
11167 /* Update the expected address of the padding frag. */
11168 padding_fragP->tc_frag_data.padding_address
11169 = (fragP->fr_address + padding_size
11170 + fragP->tc_frag_data.padding_address);
11174 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11176 /* No padding if there is no sufficient room. Clear the
11177 expected address of the padding frag. */
11178 padding_fragP->tc_frag_data.padding_address = 0;
11182 /* Store the expected address of the padding frag. */
11183 padding_fragP->tc_frag_data.padding_address
11184 = (fragP->fr_address + padding_size
11185 + fragP->tc_frag_data.padding_address);
11187 fragP->tc_frag_data.prefix_length = padding_size;
11189 /* Update the length for the current interation. */
11190 left_size = padding_size;
11191 for (next_fragP = fragP;
11192 next_fragP != padding_fragP;
11193 next_fragP = next_fragP->fr_next)
11194 if (next_fragP->fr_type == rs_machine_dependent
11195 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11200 int max = next_fragP->tc_frag_data.max_bytes;
11204 if (max > left_size)
11209 next_fragP->tc_frag_data.length = size;
11213 next_fragP->tc_frag_data.length = 0;
11216 return (fragP->tc_frag_data.length
11217 - fragP->tc_frag_data.last_length);
11219 return relax_frag (segment, fragP, stretch);
11222 /* md_estimate_size_before_relax()
11224 Called just before relax() for rs_machine_dependent frags. The x86
11225 assembler uses these frags to handle variable size jump
11228 Any symbol that is now undefined will not become defined.
11229 Return the correct fr_subtype in the frag.
11230 Return the initial "guess for variable size of frag" to caller.
11231 The guess is actually the growth beyond the fixed part. Whatever
11232 we do to grow the fixed or variable part contributes to our
11236 md_estimate_size_before_relax (fragS *fragP, segT segment)
11238 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11239 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11240 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11242 i386_classify_machine_dependent_frag (fragP);
11243 return fragP->tc_frag_data.length;
11246 /* We've already got fragP->fr_subtype right; all we have to do is
11247 check for un-relaxable symbols. On an ELF system, we can't relax
11248 an externally visible symbol, because it may be overridden by a
11250 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11251 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11253 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11256 #if defined (OBJ_COFF) && defined (TE_PE)
11257 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11258 && S_IS_WEAK (fragP->fr_symbol))
11262 /* Symbol is undefined in this segment, or we need to keep a
11263 reloc so that weak symbols can be overridden. */
11264 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11265 enum bfd_reloc_code_real reloc_type;
11266 unsigned char *opcode;
11269 if (fragP->fr_var != NO_RELOC)
11270 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11271 else if (size == 2)
11272 reloc_type = BFD_RELOC_16_PCREL;
11273 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11274 else if (need_plt32_p (fragP->fr_symbol))
11275 reloc_type = BFD_RELOC_X86_64_PLT32;
11278 reloc_type = BFD_RELOC_32_PCREL;
11280 old_fr_fix = fragP->fr_fix;
11281 opcode = (unsigned char *) fragP->fr_opcode;
11283 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11286 /* Make jmp (0xeb) a (d)word displacement jump. */
11288 fragP->fr_fix += size;
11289 fix_new (fragP, old_fr_fix, size,
11291 fragP->fr_offset, 1,
11297 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11299 /* Negate the condition, and branch past an
11300 unconditional jump. */
11303 /* Insert an unconditional jump. */
11305 /* We added two extra opcode bytes, and have a two byte
11307 fragP->fr_fix += 2 + 2;
11308 fix_new (fragP, old_fr_fix + 2, 2,
11310 fragP->fr_offset, 1,
11314 /* Fall through. */
11317 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11321 fragP->fr_fix += 1;
11322 fixP = fix_new (fragP, old_fr_fix, 1,
11324 fragP->fr_offset, 1,
11325 BFD_RELOC_8_PCREL);
11326 fixP->fx_signed = 1;
11330 /* This changes the byte-displacement jump 0x7N
11331 to the (d)word-displacement jump 0x0f,0x8N. */
11332 opcode[1] = opcode[0] + 0x10;
11333 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11334 /* We've added an opcode byte. */
11335 fragP->fr_fix += 1 + size;
11336 fix_new (fragP, old_fr_fix + 1, size,
11338 fragP->fr_offset, 1,
11343 BAD_CASE (fragP->fr_subtype);
11347 return fragP->fr_fix - old_fr_fix;
11350 /* Guess size depending on current relax state. Initially the relax
11351 state will correspond to a short jump and we return 1, because
11352 the variable part of the frag (the branch offset) is one byte
11353 long. However, we can relax a section more than once and in that
11354 case we must either set fr_subtype back to the unrelaxed state,
11355 or return the value for the appropriate branch. */
11356 return md_relax_table[fragP->fr_subtype].rlx_length;
11359 /* Called after relax() is finished.
11361 In: Address of frag.
11362 fr_type == rs_machine_dependent.
11363 fr_subtype is what the address relaxed to.
11365 Out: Any fixSs and constants are set up.
11366 Caller will turn frag into a ".space 0". */
11369 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
11372 unsigned char *opcode;
11373 unsigned char *where_to_put_displacement = NULL;
11374 offsetT target_address;
11375 offsetT opcode_address;
11376 unsigned int extension = 0;
11377 offsetT displacement_from_opcode_start;
11379 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11380 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
11381 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11383 /* Generate nop padding. */
11384 unsigned int size = fragP->tc_frag_data.length;
11387 if (size > fragP->tc_frag_data.max_bytes)
11393 const char *branch = "branch";
11394 const char *prefix = "";
11395 fragS *padding_fragP;
11396 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11399 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11400 switch (fragP->tc_frag_data.default_prefix)
11405 case CS_PREFIX_OPCODE:
11408 case DS_PREFIX_OPCODE:
11411 case ES_PREFIX_OPCODE:
11414 case FS_PREFIX_OPCODE:
11417 case GS_PREFIX_OPCODE:
11420 case SS_PREFIX_OPCODE:
11425 msg = _("%s:%u: add %d%s at 0x%llx to align "
11426 "%s within %d-byte boundary\n");
11428 msg = _("%s:%u: add additional %d%s at 0x%llx to "
11429 "align %s within %d-byte boundary\n");
11433 padding_fragP = fragP;
11434 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
11435 "%s within %d-byte boundary\n");
11439 switch (padding_fragP->tc_frag_data.branch_type)
11441 case align_branch_jcc:
11444 case align_branch_fused:
11445 branch = "fused jcc";
11447 case align_branch_jmp:
11450 case align_branch_call:
11453 case align_branch_indirect:
11454 branch = "indiret branch";
11456 case align_branch_ret:
11463 fprintf (stdout, msg,
11464 fragP->fr_file, fragP->fr_line, size, prefix,
11465 (long long) fragP->fr_address, branch,
11466 1 << align_branch_power);
11468 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11469 memset (fragP->fr_opcode,
11470 fragP->tc_frag_data.default_prefix, size);
11472 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
11474 fragP->fr_fix += size;
11479 opcode = (unsigned char *) fragP->fr_opcode;
11481 /* Address we want to reach in file space. */
11482 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
11484 /* Address opcode resides at in file space. */
11485 opcode_address = fragP->fr_address + fragP->fr_fix;
11487 /* Displacement from opcode start to fill into instruction. */
11488 displacement_from_opcode_start = target_address - opcode_address;
11490 if ((fragP->fr_subtype & BIG) == 0)
11492 /* Don't have to change opcode. */
11493 extension = 1; /* 1 opcode + 1 displacement */
11494 where_to_put_displacement = &opcode[1];
11498 if (no_cond_jump_promotion
11499 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
11500 as_warn_where (fragP->fr_file, fragP->fr_line,
11501 _("long jump required"));
11503 switch (fragP->fr_subtype)
11505 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
11506 extension = 4; /* 1 opcode + 4 displacement */
11508 where_to_put_displacement = &opcode[1];
11511 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
11512 extension = 2; /* 1 opcode + 2 displacement */
11514 where_to_put_displacement = &opcode[1];
11517 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
11518 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
11519 extension = 5; /* 2 opcode + 4 displacement */
11520 opcode[1] = opcode[0] + 0x10;
11521 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11522 where_to_put_displacement = &opcode[2];
11525 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
11526 extension = 3; /* 2 opcode + 2 displacement */
11527 opcode[1] = opcode[0] + 0x10;
11528 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11529 where_to_put_displacement = &opcode[2];
11532 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
11537 where_to_put_displacement = &opcode[3];
11541 BAD_CASE (fragP->fr_subtype);
11546 /* If size if less then four we are sure that the operand fits,
11547 but if it's 4, then it could be that the displacement is larger
11549 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
11551 && ((addressT) (displacement_from_opcode_start - extension
11552 + ((addressT) 1 << 31))
11553 > (((addressT) 2 << 31) - 1)))
11555 as_bad_where (fragP->fr_file, fragP->fr_line,
11556 _("jump target out of range"));
11557 /* Make us emit 0. */
11558 displacement_from_opcode_start = extension;
11560 /* Now put displacement after opcode. */
11561 md_number_to_chars ((char *) where_to_put_displacement,
11562 (valueT) (displacement_from_opcode_start - extension),
11563 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
11564 fragP->fr_fix += extension;
11567 /* Apply a fixup (fixP) to segment data, once it has been determined
11568 by our caller that we have all the info we need to fix it up.
11570 Parameter valP is the pointer to the value of the bits.
11572 On the 386, immediates, displacements, and data pointers are all in
11573 the same (little-endian) format, so we don't need to care about which
11574 we are handling. */
11577 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
11579 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
11580 valueT value = *valP;
11582 #if !defined (TE_Mach)
11583 if (fixP->fx_pcrel)
11585 switch (fixP->fx_r_type)
11591 fixP->fx_r_type = BFD_RELOC_64_PCREL;
11594 case BFD_RELOC_X86_64_32S:
11595 fixP->fx_r_type = BFD_RELOC_32_PCREL;
11598 fixP->fx_r_type = BFD_RELOC_16_PCREL;
11601 fixP->fx_r_type = BFD_RELOC_8_PCREL;
11606 if (fixP->fx_addsy != NULL
11607 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
11608 || fixP->fx_r_type == BFD_RELOC_64_PCREL
11609 || fixP->fx_r_type == BFD_RELOC_16_PCREL
11610 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
11611 && !use_rela_relocations)
11613 /* This is a hack. There should be a better way to handle this.
11614 This covers for the fact that bfd_install_relocation will
11615 subtract the current location (for partial_inplace, PC relative
11616 relocations); see more below. */
11620 || OUTPUT_FLAVOR == bfd_target_coff_flavour
11623 value += fixP->fx_where + fixP->fx_frag->fr_address;
11625 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11628 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
11630 if ((sym_seg == seg
11631 || (symbol_section_p (fixP->fx_addsy)
11632 && sym_seg != absolute_section))
11633 && !generic_force_reloc (fixP))
11635 /* Yes, we add the values in twice. This is because
11636 bfd_install_relocation subtracts them out again. I think
11637 bfd_install_relocation is broken, but I don't dare change
11639 value += fixP->fx_where + fixP->fx_frag->fr_address;
11643 #if defined (OBJ_COFF) && defined (TE_PE)
11644 /* For some reason, the PE format does not store a
11645 section address offset for a PC relative symbol. */
11646 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
11647 || S_IS_WEAK (fixP->fx_addsy))
11648 value += md_pcrel_from (fixP);
11651 #if defined (OBJ_COFF) && defined (TE_PE)
11652 if (fixP->fx_addsy != NULL
11653 && S_IS_WEAK (fixP->fx_addsy)
11654 /* PR 16858: Do not modify weak function references. */
11655 && ! fixP->fx_pcrel)
11657 #if !defined (TE_PEP)
11658 /* For x86 PE weak function symbols are neither PC-relative
11659 nor do they set S_IS_FUNCTION. So the only reliable way
11660 to detect them is to check the flags of their containing
11662 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
11663 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
11667 value -= S_GET_VALUE (fixP->fx_addsy);
11671 /* Fix a few things - the dynamic linker expects certain values here,
11672 and we must not disappoint it. */
11673 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11674 if (IS_ELF && fixP->fx_addsy)
11675 switch (fixP->fx_r_type)
11677 case BFD_RELOC_386_PLT32:
11678 case BFD_RELOC_X86_64_PLT32:
11679 /* Make the jump instruction point to the address of the operand.
11680 At runtime we merely add the offset to the actual PLT entry.
11681 NB: Subtract the offset size only for jump instructions. */
11682 if (fixP->fx_pcrel)
11686 case BFD_RELOC_386_TLS_GD:
11687 case BFD_RELOC_386_TLS_LDM:
11688 case BFD_RELOC_386_TLS_IE_32:
11689 case BFD_RELOC_386_TLS_IE:
11690 case BFD_RELOC_386_TLS_GOTIE:
11691 case BFD_RELOC_386_TLS_GOTDESC:
11692 case BFD_RELOC_X86_64_TLSGD:
11693 case BFD_RELOC_X86_64_TLSLD:
11694 case BFD_RELOC_X86_64_GOTTPOFF:
11695 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11696 value = 0; /* Fully resolved at runtime. No addend. */
11698 case BFD_RELOC_386_TLS_LE:
11699 case BFD_RELOC_386_TLS_LDO_32:
11700 case BFD_RELOC_386_TLS_LE_32:
11701 case BFD_RELOC_X86_64_DTPOFF32:
11702 case BFD_RELOC_X86_64_DTPOFF64:
11703 case BFD_RELOC_X86_64_TPOFF32:
11704 case BFD_RELOC_X86_64_TPOFF64:
11705 S_SET_THREAD_LOCAL (fixP->fx_addsy);
11708 case BFD_RELOC_386_TLS_DESC_CALL:
11709 case BFD_RELOC_X86_64_TLSDESC_CALL:
11710 value = 0; /* Fully resolved at runtime. No addend. */
11711 S_SET_THREAD_LOCAL (fixP->fx_addsy);
11715 case BFD_RELOC_VTABLE_INHERIT:
11716 case BFD_RELOC_VTABLE_ENTRY:
11723 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
11725 #endif /* !defined (TE_Mach) */
11727 /* Are we finished with this relocation now? */
11728 if (fixP->fx_addsy == NULL)
11730 #if defined (OBJ_COFF) && defined (TE_PE)
11731 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
11734 /* Remember value for tc_gen_reloc. */
11735 fixP->fx_addnumber = value;
11736 /* Clear out the frag for now. */
11740 else if (use_rela_relocations)
11742 fixP->fx_no_overflow = 1;
11743 /* Remember value for tc_gen_reloc. */
11744 fixP->fx_addnumber = value;
11748 md_number_to_chars (p, value, fixP->fx_size);
11752 md_atof (int type, char *litP, int *sizeP)
11754 /* This outputs the LITTLENUMs in REVERSE order;
11755 in accord with the bigendian 386. */
11756 return ieee_md_atof (type, litP, sizeP, FALSE);
11759 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
11762 output_invalid (int c)
11765 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11768 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11769 "(0x%x)", (unsigned char) c);
11770 return output_invalid_buf;
11773 /* REG_STRING starts *before* REGISTER_PREFIX. */
11775 static const reg_entry *
11776 parse_real_register (char *reg_string, char **end_op)
11778 char *s = reg_string;
11780 char reg_name_given[MAX_REG_NAME_SIZE + 1];
11781 const reg_entry *r;
11783 /* Skip possible REGISTER_PREFIX and possible whitespace. */
11784 if (*s == REGISTER_PREFIX)
11787 if (is_space_char (*s))
11790 p = reg_name_given;
11791 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
11793 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
11794 return (const reg_entry *) NULL;
11798 /* For naked regs, make sure that we are not dealing with an identifier.
11799 This prevents confusing an identifier like `eax_var' with register
11801 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
11802 return (const reg_entry *) NULL;
11806 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
11808 /* Handle floating point regs, allowing spaces in the (i) part. */
11809 if (r == i386_regtab /* %st is first entry of table */)
11811 if (!cpu_arch_flags.bitfield.cpu8087
11812 && !cpu_arch_flags.bitfield.cpu287
11813 && !cpu_arch_flags.bitfield.cpu387)
11814 return (const reg_entry *) NULL;
11816 if (is_space_char (*s))
11821 if (is_space_char (*s))
11823 if (*s >= '0' && *s <= '7')
11825 int fpr = *s - '0';
11827 if (is_space_char (*s))
11832 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
11837 /* We have "%st(" then garbage. */
11838 return (const reg_entry *) NULL;
11842 if (r == NULL || allow_pseudo_reg)
11845 if (operand_type_all_zero (&r->reg_type))
11846 return (const reg_entry *) NULL;
11848 if ((r->reg_type.bitfield.dword
11849 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
11850 || r->reg_type.bitfield.class == RegCR
11851 || r->reg_type.bitfield.class == RegDR
11852 || r->reg_type.bitfield.class == RegTR)
11853 && !cpu_arch_flags.bitfield.cpui386)
11854 return (const reg_entry *) NULL;
11856 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
11857 return (const reg_entry *) NULL;
11859 if (!cpu_arch_flags.bitfield.cpuavx512f)
11861 if (r->reg_type.bitfield.zmmword
11862 || r->reg_type.bitfield.class == RegMask)
11863 return (const reg_entry *) NULL;
11865 if (!cpu_arch_flags.bitfield.cpuavx)
11867 if (r->reg_type.bitfield.ymmword)
11868 return (const reg_entry *) NULL;
11870 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
11871 return (const reg_entry *) NULL;
11875 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
11876 return (const reg_entry *) NULL;
11878 /* Don't allow fake index register unless allow_index_reg isn't 0. */
11879 if (!allow_index_reg && r->reg_num == RegIZ)
11880 return (const reg_entry *) NULL;
11882 /* Upper 16 vector registers are only available with VREX in 64bit
11883 mode, and require EVEX encoding. */
11884 if (r->reg_flags & RegVRex)
11886 if (!cpu_arch_flags.bitfield.cpuavx512f
11887 || flag_code != CODE_64BIT)
11888 return (const reg_entry *) NULL;
11890 i.vec_encoding = vex_encoding_evex;
11893 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
11894 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
11895 && flag_code != CODE_64BIT)
11896 return (const reg_entry *) NULL;
11898 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
11900 return (const reg_entry *) NULL;
11905 /* REG_STRING starts *before* REGISTER_PREFIX. */
11907 static const reg_entry *
11908 parse_register (char *reg_string, char **end_op)
11910 const reg_entry *r;
11912 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
11913 r = parse_real_register (reg_string, end_op);
11918 char *save = input_line_pointer;
11922 input_line_pointer = reg_string;
11923 c = get_symbol_name (®_string);
11924 symbolP = symbol_find (reg_string);
11925 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
11927 const expressionS *e = symbol_get_value_expression (symbolP);
11929 know (e->X_op == O_register);
11930 know (e->X_add_number >= 0
11931 && (valueT) e->X_add_number < i386_regtab_size);
11932 r = i386_regtab + e->X_add_number;
11933 if ((r->reg_flags & RegVRex))
11934 i.vec_encoding = vex_encoding_evex;
11935 *end_op = input_line_pointer;
11937 *input_line_pointer = c;
11938 input_line_pointer = save;
11944 i386_parse_name (char *name, expressionS *e, char *nextcharP)
11946 const reg_entry *r;
11947 char *end = input_line_pointer;
11950 r = parse_register (name, &input_line_pointer);
11951 if (r && end <= input_line_pointer)
11953 *nextcharP = *input_line_pointer;
11954 *input_line_pointer = 0;
11955 e->X_op = O_register;
11956 e->X_add_number = r - i386_regtab;
11959 input_line_pointer = end;
11961 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
11965 md_operand (expressionS *e)
11968 const reg_entry *r;
11970 switch (*input_line_pointer)
11972 case REGISTER_PREFIX:
11973 r = parse_real_register (input_line_pointer, &end);
11976 e->X_op = O_register;
11977 e->X_add_number = r - i386_regtab;
11978 input_line_pointer = end;
11983 gas_assert (intel_syntax);
11984 end = input_line_pointer++;
11986 if (*input_line_pointer == ']')
11988 ++input_line_pointer;
11989 e->X_op_symbol = make_expr_symbol (e);
11990 e->X_add_symbol = NULL;
11991 e->X_add_number = 0;
11996 e->X_op = O_absent;
11997 input_line_pointer = end;
12004 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12005 const char *md_shortopts = "kVQ:sqnO::";
12007 const char *md_shortopts = "qnO::";
12010 #define OPTION_32 (OPTION_MD_BASE + 0)
12011 #define OPTION_64 (OPTION_MD_BASE + 1)
12012 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12013 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12014 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12015 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12016 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12017 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12018 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12019 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12020 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12021 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12022 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12023 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12024 #define OPTION_X32 (OPTION_MD_BASE + 14)
12025 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12026 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12027 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12028 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12029 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12030 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12031 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12032 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12033 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12034 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12035 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12036 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12037 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12038 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12039 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12040 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12042 struct option md_longopts[] =
12044 {"32", no_argument, NULL, OPTION_32},
12045 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12046 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12047 {"64", no_argument, NULL, OPTION_64},
12049 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12050 {"x32", no_argument, NULL, OPTION_X32},
12051 {"mshared", no_argument, NULL, OPTION_MSHARED},
12052 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12054 {"divide", no_argument, NULL, OPTION_DIVIDE},
12055 {"march", required_argument, NULL, OPTION_MARCH},
12056 {"mtune", required_argument, NULL, OPTION_MTUNE},
12057 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12058 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12059 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12060 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12061 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12062 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12063 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12064 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12065 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12066 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12067 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12068 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12069 # if defined (TE_PE) || defined (TE_PEP)
12070 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12072 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12073 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12074 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12075 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12076 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12077 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12078 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12079 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12080 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12081 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12082 {NULL, no_argument, NULL, 0}
12084 size_t md_longopts_size = sizeof (md_longopts);
12087 md_parse_option (int c, const char *arg)
12090 char *arch, *next, *saved, *type;
12095 optimize_align_code = 0;
12099 quiet_warnings = 1;
12102 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12103 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12104 should be emitted or not. FIXME: Not implemented. */
12106 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12110 /* -V: SVR4 argument to print version ID. */
12112 print_version_id ();
12115 /* -k: Ignore for FreeBSD compatibility. */
12120 /* -s: On i386 Solaris, this tells the native assembler to use
12121 .stab instead of .stab.excl. We always use .stab anyhow. */
12124 case OPTION_MSHARED:
12128 case OPTION_X86_USED_NOTE:
12129 if (strcasecmp (arg, "yes") == 0)
12131 else if (strcasecmp (arg, "no") == 0)
12134 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12139 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12140 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12143 const char **list, **l;
12145 list = bfd_target_list ();
12146 for (l = list; *l != NULL; l++)
12147 if (CONST_STRNEQ (*l, "elf64-x86-64")
12148 || strcmp (*l, "coff-x86-64") == 0
12149 || strcmp (*l, "pe-x86-64") == 0
12150 || strcmp (*l, "pei-x86-64") == 0
12151 || strcmp (*l, "mach-o-x86-64") == 0)
12153 default_arch = "x86_64";
12157 as_fatal (_("no compiled in support for x86_64"));
12163 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12167 const char **list, **l;
12169 list = bfd_target_list ();
12170 for (l = list; *l != NULL; l++)
12171 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12173 default_arch = "x86_64:32";
12177 as_fatal (_("no compiled in support for 32bit x86_64"));
12181 as_fatal (_("32bit x86_64 is only supported for ELF"));
12186 default_arch = "i386";
12189 case OPTION_DIVIDE:
12190 #ifdef SVR4_COMMENT_CHARS
12195 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12197 for (s = i386_comment_chars; *s != '\0'; s++)
12201 i386_comment_chars = n;
12207 saved = xstrdup (arg);
12209 /* Allow -march=+nosse. */
12215 as_fatal (_("invalid -march= option: `%s'"), arg);
12216 next = strchr (arch, '+');
12219 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12221 if (strcmp (arch, cpu_arch [j].name) == 0)
12224 if (! cpu_arch[j].flags.bitfield.cpui386)
12227 cpu_arch_name = cpu_arch[j].name;
12228 cpu_sub_arch_name = NULL;
12229 cpu_arch_flags = cpu_arch[j].flags;
12230 cpu_arch_isa = cpu_arch[j].type;
12231 cpu_arch_isa_flags = cpu_arch[j].flags;
12232 if (!cpu_arch_tune_set)
12234 cpu_arch_tune = cpu_arch_isa;
12235 cpu_arch_tune_flags = cpu_arch_isa_flags;
12239 else if (*cpu_arch [j].name == '.'
12240 && strcmp (arch, cpu_arch [j].name + 1) == 0)
12242 /* ISA extension. */
12243 i386_cpu_flags flags;
12245 flags = cpu_flags_or (cpu_arch_flags,
12246 cpu_arch[j].flags);
12248 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12250 if (cpu_sub_arch_name)
12252 char *name = cpu_sub_arch_name;
12253 cpu_sub_arch_name = concat (name,
12255 (const char *) NULL);
12259 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12260 cpu_arch_flags = flags;
12261 cpu_arch_isa_flags = flags;
12265 = cpu_flags_or (cpu_arch_isa_flags,
12266 cpu_arch[j].flags);
12271 if (j >= ARRAY_SIZE (cpu_arch))
12273 /* Disable an ISA extension. */
12274 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12275 if (strcmp (arch, cpu_noarch [j].name) == 0)
12277 i386_cpu_flags flags;
12279 flags = cpu_flags_and_not (cpu_arch_flags,
12280 cpu_noarch[j].flags);
12281 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12283 if (cpu_sub_arch_name)
12285 char *name = cpu_sub_arch_name;
12286 cpu_sub_arch_name = concat (arch,
12287 (const char *) NULL);
12291 cpu_sub_arch_name = xstrdup (arch);
12292 cpu_arch_flags = flags;
12293 cpu_arch_isa_flags = flags;
12298 if (j >= ARRAY_SIZE (cpu_noarch))
12299 j = ARRAY_SIZE (cpu_arch);
12302 if (j >= ARRAY_SIZE (cpu_arch))
12303 as_fatal (_("invalid -march= option: `%s'"), arg);
12307 while (next != NULL);
12313 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12314 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12316 if (strcmp (arg, cpu_arch [j].name) == 0)
12318 cpu_arch_tune_set = 1;
12319 cpu_arch_tune = cpu_arch [j].type;
12320 cpu_arch_tune_flags = cpu_arch[j].flags;
12324 if (j >= ARRAY_SIZE (cpu_arch))
12325 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12328 case OPTION_MMNEMONIC:
12329 if (strcasecmp (arg, "att") == 0)
12330 intel_mnemonic = 0;
12331 else if (strcasecmp (arg, "intel") == 0)
12332 intel_mnemonic = 1;
12334 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
12337 case OPTION_MSYNTAX:
12338 if (strcasecmp (arg, "att") == 0)
12340 else if (strcasecmp (arg, "intel") == 0)
12343 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
12346 case OPTION_MINDEX_REG:
12347 allow_index_reg = 1;
12350 case OPTION_MNAKED_REG:
12351 allow_naked_reg = 1;
12354 case OPTION_MSSE2AVX:
12358 case OPTION_MSSE_CHECK:
12359 if (strcasecmp (arg, "error") == 0)
12360 sse_check = check_error;
12361 else if (strcasecmp (arg, "warning") == 0)
12362 sse_check = check_warning;
12363 else if (strcasecmp (arg, "none") == 0)
12364 sse_check = check_none;
12366 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
12369 case OPTION_MOPERAND_CHECK:
12370 if (strcasecmp (arg, "error") == 0)
12371 operand_check = check_error;
12372 else if (strcasecmp (arg, "warning") == 0)
12373 operand_check = check_warning;
12374 else if (strcasecmp (arg, "none") == 0)
12375 operand_check = check_none;
12377 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
12380 case OPTION_MAVXSCALAR:
12381 if (strcasecmp (arg, "128") == 0)
12382 avxscalar = vex128;
12383 else if (strcasecmp (arg, "256") == 0)
12384 avxscalar = vex256;
12386 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
12389 case OPTION_MVEXWIG:
12390 if (strcmp (arg, "0") == 0)
12392 else if (strcmp (arg, "1") == 0)
12395 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
12398 case OPTION_MADD_BND_PREFIX:
12399 add_bnd_prefix = 1;
12402 case OPTION_MEVEXLIG:
12403 if (strcmp (arg, "128") == 0)
12404 evexlig = evexl128;
12405 else if (strcmp (arg, "256") == 0)
12406 evexlig = evexl256;
12407 else if (strcmp (arg, "512") == 0)
12408 evexlig = evexl512;
12410 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
12413 case OPTION_MEVEXRCIG:
12414 if (strcmp (arg, "rne") == 0)
12416 else if (strcmp (arg, "rd") == 0)
12418 else if (strcmp (arg, "ru") == 0)
12420 else if (strcmp (arg, "rz") == 0)
12423 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
12426 case OPTION_MEVEXWIG:
12427 if (strcmp (arg, "0") == 0)
12429 else if (strcmp (arg, "1") == 0)
12432 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
12435 # if defined (TE_PE) || defined (TE_PEP)
12436 case OPTION_MBIG_OBJ:
12441 case OPTION_MOMIT_LOCK_PREFIX:
12442 if (strcasecmp (arg, "yes") == 0)
12443 omit_lock_prefix = 1;
12444 else if (strcasecmp (arg, "no") == 0)
12445 omit_lock_prefix = 0;
12447 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
12450 case OPTION_MFENCE_AS_LOCK_ADD:
12451 if (strcasecmp (arg, "yes") == 0)
12453 else if (strcasecmp (arg, "no") == 0)
12456 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
12459 case OPTION_MRELAX_RELOCATIONS:
12460 if (strcasecmp (arg, "yes") == 0)
12461 generate_relax_relocations = 1;
12462 else if (strcasecmp (arg, "no") == 0)
12463 generate_relax_relocations = 0;
12465 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
12468 case OPTION_MALIGN_BRANCH_BOUNDARY:
12471 long int align = strtoul (arg, &end, 0);
12476 align_branch_power = 0;
12479 else if (align >= 16)
12482 for (align_power = 0;
12484 align >>= 1, align_power++)
12486 /* Limit alignment power to 31. */
12487 if (align == 1 && align_power < 32)
12489 align_branch_power = align_power;
12494 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
12498 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
12501 int align = strtoul (arg, &end, 0);
12502 /* Some processors only support 5 prefixes. */
12503 if (*end == '\0' && align >= 0 && align < 6)
12505 align_branch_prefix_size = align;
12508 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
12513 case OPTION_MALIGN_BRANCH:
12515 saved = xstrdup (arg);
12519 next = strchr (type, '+');
12522 if (strcasecmp (type, "jcc") == 0)
12523 align_branch |= align_branch_jcc_bit;
12524 else if (strcasecmp (type, "fused") == 0)
12525 align_branch |= align_branch_fused_bit;
12526 else if (strcasecmp (type, "jmp") == 0)
12527 align_branch |= align_branch_jmp_bit;
12528 else if (strcasecmp (type, "call") == 0)
12529 align_branch |= align_branch_call_bit;
12530 else if (strcasecmp (type, "ret") == 0)
12531 align_branch |= align_branch_ret_bit;
12532 else if (strcasecmp (type, "indirect") == 0)
12533 align_branch |= align_branch_indirect_bit;
12535 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
12538 while (next != NULL);
12542 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
12543 align_branch_power = 5;
12544 align_branch_prefix_size = 5;
12545 align_branch = (align_branch_jcc_bit
12546 | align_branch_fused_bit
12547 | align_branch_jmp_bit);
12550 case OPTION_MAMD64:
12554 case OPTION_MINTEL64:
12562 /* Turn off -Os. */
12563 optimize_for_space = 0;
12565 else if (*arg == 's')
12567 optimize_for_space = 1;
12568 /* Turn on all encoding optimizations. */
12569 optimize = INT_MAX;
12573 optimize = atoi (arg);
12574 /* Turn off -Os. */
12575 optimize_for_space = 0;
12585 #define MESSAGE_TEMPLATE \
12589 output_message (FILE *stream, char *p, char *message, char *start,
12590 int *left_p, const char *name, int len)
12592 int size = sizeof (MESSAGE_TEMPLATE);
12593 int left = *left_p;
12595 /* Reserve 2 spaces for ", " or ",\0" */
12598 /* Check if there is any room. */
12606 p = mempcpy (p, name, len);
12610 /* Output the current message now and start a new one. */
12613 fprintf (stream, "%s\n", message);
12615 left = size - (start - message) - len - 2;
12617 gas_assert (left >= 0);
12619 p = mempcpy (p, name, len);
12627 show_arch (FILE *stream, int ext, int check)
12629 static char message[] = MESSAGE_TEMPLATE;
12630 char *start = message + 27;
12632 int size = sizeof (MESSAGE_TEMPLATE);
12639 left = size - (start - message);
12640 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12642 /* Should it be skipped? */
12643 if (cpu_arch [j].skip)
12646 name = cpu_arch [j].name;
12647 len = cpu_arch [j].len;
12650 /* It is an extension. Skip if we aren't asked to show it. */
12661 /* It is an processor. Skip if we show only extension. */
12664 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
12666 /* It is an impossible processor - skip. */
12670 p = output_message (stream, p, message, start, &left, name, len);
12673 /* Display disabled extensions. */
12675 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12677 name = cpu_noarch [j].name;
12678 len = cpu_noarch [j].len;
12679 p = output_message (stream, p, message, start, &left, name,
12684 fprintf (stream, "%s\n", message);
12688 md_show_usage (FILE *stream)
12690 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12691 fprintf (stream, _("\
12692 -Qy, -Qn ignored\n\
12693 -V print assembler version number\n\
12696 fprintf (stream, _("\
12697 -n Do not optimize code alignment\n\
12698 -q quieten some warnings\n"));
12699 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12700 fprintf (stream, _("\
12703 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12704 || defined (TE_PE) || defined (TE_PEP))
12705 fprintf (stream, _("\
12706 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
12708 #ifdef SVR4_COMMENT_CHARS
12709 fprintf (stream, _("\
12710 --divide do not treat `/' as a comment character\n"));
12712 fprintf (stream, _("\
12713 --divide ignored\n"));
12715 fprintf (stream, _("\
12716 -march=CPU[,+EXTENSION...]\n\
12717 generate code for CPU and EXTENSION, CPU is one of:\n"));
12718 show_arch (stream, 0, 1);
12719 fprintf (stream, _("\
12720 EXTENSION is combination of:\n"));
12721 show_arch (stream, 1, 0);
12722 fprintf (stream, _("\
12723 -mtune=CPU optimize for CPU, CPU is one of:\n"));
12724 show_arch (stream, 0, 0);
12725 fprintf (stream, _("\
12726 -msse2avx encode SSE instructions with VEX prefix\n"));
12727 fprintf (stream, _("\
12728 -msse-check=[none|error|warning] (default: warning)\n\
12729 check SSE instructions\n"));
12730 fprintf (stream, _("\
12731 -moperand-check=[none|error|warning] (default: warning)\n\
12732 check operand combinations for validity\n"));
12733 fprintf (stream, _("\
12734 -mavxscalar=[128|256] (default: 128)\n\
12735 encode scalar AVX instructions with specific vector\n\
12737 fprintf (stream, _("\
12738 -mvexwig=[0|1] (default: 0)\n\
12739 encode VEX instructions with specific VEX.W value\n\
12740 for VEX.W bit ignored instructions\n"));
12741 fprintf (stream, _("\
12742 -mevexlig=[128|256|512] (default: 128)\n\
12743 encode scalar EVEX instructions with specific vector\n\
12745 fprintf (stream, _("\
12746 -mevexwig=[0|1] (default: 0)\n\
12747 encode EVEX instructions with specific EVEX.W value\n\
12748 for EVEX.W bit ignored instructions\n"));
12749 fprintf (stream, _("\
12750 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
12751 encode EVEX instructions with specific EVEX.RC value\n\
12752 for SAE-only ignored instructions\n"));
12753 fprintf (stream, _("\
12754 -mmnemonic=[att|intel] "));
12755 if (SYSV386_COMPAT)
12756 fprintf (stream, _("(default: att)\n"));
12758 fprintf (stream, _("(default: intel)\n"));
12759 fprintf (stream, _("\
12760 use AT&T/Intel mnemonic\n"));
12761 fprintf (stream, _("\
12762 -msyntax=[att|intel] (default: att)\n\
12763 use AT&T/Intel syntax\n"));
12764 fprintf (stream, _("\
12765 -mindex-reg support pseudo index registers\n"));
12766 fprintf (stream, _("\
12767 -mnaked-reg don't require `%%' prefix for registers\n"));
12768 fprintf (stream, _("\
12769 -madd-bnd-prefix add BND prefix for all valid branches\n"));
12770 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12771 fprintf (stream, _("\
12772 -mshared disable branch optimization for shared code\n"));
12773 fprintf (stream, _("\
12774 -mx86-used-note=[no|yes] "));
12775 if (DEFAULT_X86_USED_NOTE)
12776 fprintf (stream, _("(default: yes)\n"));
12778 fprintf (stream, _("(default: no)\n"));
12779 fprintf (stream, _("\
12780 generate x86 used ISA and feature properties\n"));
12782 #if defined (TE_PE) || defined (TE_PEP)
12783 fprintf (stream, _("\
12784 -mbig-obj generate big object files\n"));
12786 fprintf (stream, _("\
12787 -momit-lock-prefix=[no|yes] (default: no)\n\
12788 strip all lock prefixes\n"));
12789 fprintf (stream, _("\
12790 -mfence-as-lock-add=[no|yes] (default: no)\n\
12791 encode lfence, mfence and sfence as\n\
12792 lock addl $0x0, (%%{re}sp)\n"));
12793 fprintf (stream, _("\
12794 -mrelax-relocations=[no|yes] "));
12795 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
12796 fprintf (stream, _("(default: yes)\n"));
12798 fprintf (stream, _("(default: no)\n"));
12799 fprintf (stream, _("\
12800 generate relax relocations\n"));
12801 fprintf (stream, _("\
12802 -malign-branch-boundary=NUM (default: 0)\n\
12803 align branches within NUM byte boundary\n"));
12804 fprintf (stream, _("\
12805 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
12806 TYPE is combination of jcc, fused, jmp, call, ret,\n\
12808 specify types of branches to align\n"));
12809 fprintf (stream, _("\
12810 -malign-branch-prefix-size=NUM (default: 5)\n\
12811 align branches with NUM prefixes per instruction\n"));
12812 fprintf (stream, _("\
12813 -mbranches-within-32B-boundaries\n\
12814 align branches within 32 byte boundary\n"));
12815 fprintf (stream, _("\
12816 -mamd64 accept only AMD64 ISA [default]\n"));
12817 fprintf (stream, _("\
12818 -mintel64 accept only Intel64 ISA\n"));
12821 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
12822 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12823 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12825 /* Pick the target format to use. */
12828 i386_target_format (void)
12830 if (!strncmp (default_arch, "x86_64", 6))
12832 update_code_flag (CODE_64BIT, 1);
12833 if (default_arch[6] == '\0')
12834 x86_elf_abi = X86_64_ABI;
12836 x86_elf_abi = X86_64_X32_ABI;
12838 else if (!strcmp (default_arch, "i386"))
12839 update_code_flag (CODE_32BIT, 1);
12840 else if (!strcmp (default_arch, "iamcu"))
12842 update_code_flag (CODE_32BIT, 1);
12843 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
12845 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
12846 cpu_arch_name = "iamcu";
12847 cpu_sub_arch_name = NULL;
12848 cpu_arch_flags = iamcu_flags;
12849 cpu_arch_isa = PROCESSOR_IAMCU;
12850 cpu_arch_isa_flags = iamcu_flags;
12851 if (!cpu_arch_tune_set)
12853 cpu_arch_tune = cpu_arch_isa;
12854 cpu_arch_tune_flags = cpu_arch_isa_flags;
12857 else if (cpu_arch_isa != PROCESSOR_IAMCU)
12858 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
12862 as_fatal (_("unknown architecture"));
12864 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
12865 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12866 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
12867 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12869 switch (OUTPUT_FLAVOR)
12871 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
12872 case bfd_target_aout_flavour:
12873 return AOUT_TARGET_FORMAT;
12875 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
12876 # if defined (TE_PE) || defined (TE_PEP)
12877 case bfd_target_coff_flavour:
12878 if (flag_code == CODE_64BIT)
12879 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
12882 # elif defined (TE_GO32)
12883 case bfd_target_coff_flavour:
12884 return "coff-go32";
12886 case bfd_target_coff_flavour:
12887 return "coff-i386";
12890 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12891 case bfd_target_elf_flavour:
12893 const char *format;
12895 switch (x86_elf_abi)
12898 format = ELF_TARGET_FORMAT;
12900 tls_get_addr = "___tls_get_addr";
12904 use_rela_relocations = 1;
12907 tls_get_addr = "__tls_get_addr";
12909 format = ELF_TARGET_FORMAT64;
12911 case X86_64_X32_ABI:
12912 use_rela_relocations = 1;
12915 tls_get_addr = "__tls_get_addr";
12917 disallow_64bit_reloc = 1;
12918 format = ELF_TARGET_FORMAT32;
12921 if (cpu_arch_isa == PROCESSOR_L1OM)
12923 if (x86_elf_abi != X86_64_ABI)
12924 as_fatal (_("Intel L1OM is 64bit only"));
12925 return ELF_TARGET_L1OM_FORMAT;
12927 else if (cpu_arch_isa == PROCESSOR_K1OM)
12929 if (x86_elf_abi != X86_64_ABI)
12930 as_fatal (_("Intel K1OM is 64bit only"));
12931 return ELF_TARGET_K1OM_FORMAT;
12933 else if (cpu_arch_isa == PROCESSOR_IAMCU)
12935 if (x86_elf_abi != I386_ABI)
12936 as_fatal (_("Intel MCU is 32bit only"));
12937 return ELF_TARGET_IAMCU_FORMAT;
12943 #if defined (OBJ_MACH_O)
12944 case bfd_target_mach_o_flavour:
12945 if (flag_code == CODE_64BIT)
12947 use_rela_relocations = 1;
12949 return "mach-o-x86-64";
12952 return "mach-o-i386";
12960 #endif /* OBJ_MAYBE_ more than one */
12963 md_undefined_symbol (char *name)
12965 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
12966 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
12967 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
12968 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
12972 if (symbol_find (name))
12973 as_bad (_("GOT already in symbol table"));
12974 GOT_symbol = symbol_new (name, undefined_section,
12975 (valueT) 0, &zero_address_frag);
12982 /* Round up a section size to the appropriate boundary. */
12985 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
12987 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
12988 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
12990 /* For a.out, force the section size to be aligned. If we don't do
12991 this, BFD will align it for us, but it will not write out the
12992 final bytes of the section. This may be a bug in BFD, but it is
12993 easier to fix it here since that is how the other a.out targets
12997 align = bfd_section_alignment (segment);
12998 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13005 /* On the i386, PC-relative offsets are relative to the start of the
13006 next instruction. That is, the address of the offset, plus its
13007 size, since the offset is always the last part of the insn. */
13010 md_pcrel_from (fixS *fixP)
13012 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13018 s_bss (int ignore ATTRIBUTE_UNUSED)
13022 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13024 obj_elf_section_change_hook ();
13026 temp = get_absolute_expression ();
13027 subseg_set (bss_section, (subsegT) temp);
13028 demand_empty_rest_of_line ();
13033 /* Remember constant directive. */
13036 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13038 if (last_insn.kind != last_insn_directive
13039 && (bfd_section_flags (now_seg) & SEC_CODE))
13041 last_insn.seg = now_seg;
13042 last_insn.kind = last_insn_directive;
13043 last_insn.name = "constant directive";
13044 last_insn.file = as_where (&last_insn.line);
13049 i386_validate_fix (fixS *fixp)
13051 if (fixp->fx_subsy)
13053 if (fixp->fx_subsy == GOT_symbol)
13055 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13059 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13060 if (fixp->fx_tcbit2)
13061 fixp->fx_r_type = (fixp->fx_tcbit
13062 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13063 : BFD_RELOC_X86_64_GOTPCRELX);
13066 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13071 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13073 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13075 fixp->fx_subsy = 0;
13078 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13079 else if (!object_64bit)
13081 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13082 && fixp->fx_tcbit2)
13083 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13089 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13092 bfd_reloc_code_real_type code;
13094 switch (fixp->fx_r_type)
13096 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13097 case BFD_RELOC_SIZE32:
13098 case BFD_RELOC_SIZE64:
13099 if (S_IS_DEFINED (fixp->fx_addsy)
13100 && !S_IS_EXTERNAL (fixp->fx_addsy))
13102 /* Resolve size relocation against local symbol to size of
13103 the symbol plus addend. */
13104 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13105 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13106 && !fits_in_unsigned_long (value))
13107 as_bad_where (fixp->fx_file, fixp->fx_line,
13108 _("symbol size computation overflow"));
13109 fixp->fx_addsy = NULL;
13110 fixp->fx_subsy = NULL;
13111 md_apply_fix (fixp, (valueT *) &value, NULL);
13115 /* Fall through. */
13117 case BFD_RELOC_X86_64_PLT32:
13118 case BFD_RELOC_X86_64_GOT32:
13119 case BFD_RELOC_X86_64_GOTPCREL:
13120 case BFD_RELOC_X86_64_GOTPCRELX:
13121 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13122 case BFD_RELOC_386_PLT32:
13123 case BFD_RELOC_386_GOT32:
13124 case BFD_RELOC_386_GOT32X:
13125 case BFD_RELOC_386_GOTOFF:
13126 case BFD_RELOC_386_GOTPC:
13127 case BFD_RELOC_386_TLS_GD:
13128 case BFD_RELOC_386_TLS_LDM:
13129 case BFD_RELOC_386_TLS_LDO_32:
13130 case BFD_RELOC_386_TLS_IE_32:
13131 case BFD_RELOC_386_TLS_IE:
13132 case BFD_RELOC_386_TLS_GOTIE:
13133 case BFD_RELOC_386_TLS_LE_32:
13134 case BFD_RELOC_386_TLS_LE:
13135 case BFD_RELOC_386_TLS_GOTDESC:
13136 case BFD_RELOC_386_TLS_DESC_CALL:
13137 case BFD_RELOC_X86_64_TLSGD:
13138 case BFD_RELOC_X86_64_TLSLD:
13139 case BFD_RELOC_X86_64_DTPOFF32:
13140 case BFD_RELOC_X86_64_DTPOFF64:
13141 case BFD_RELOC_X86_64_GOTTPOFF:
13142 case BFD_RELOC_X86_64_TPOFF32:
13143 case BFD_RELOC_X86_64_TPOFF64:
13144 case BFD_RELOC_X86_64_GOTOFF64:
13145 case BFD_RELOC_X86_64_GOTPC32:
13146 case BFD_RELOC_X86_64_GOT64:
13147 case BFD_RELOC_X86_64_GOTPCREL64:
13148 case BFD_RELOC_X86_64_GOTPC64:
13149 case BFD_RELOC_X86_64_GOTPLT64:
13150 case BFD_RELOC_X86_64_PLTOFF64:
13151 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13152 case BFD_RELOC_X86_64_TLSDESC_CALL:
13153 case BFD_RELOC_RVA:
13154 case BFD_RELOC_VTABLE_ENTRY:
13155 case BFD_RELOC_VTABLE_INHERIT:
13157 case BFD_RELOC_32_SECREL:
13159 code = fixp->fx_r_type;
13161 case BFD_RELOC_X86_64_32S:
13162 if (!fixp->fx_pcrel)
13164 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
13165 code = fixp->fx_r_type;
13168 /* Fall through. */
13170 if (fixp->fx_pcrel)
13172 switch (fixp->fx_size)
13175 as_bad_where (fixp->fx_file, fixp->fx_line,
13176 _("can not do %d byte pc-relative relocation"),
13178 code = BFD_RELOC_32_PCREL;
13180 case 1: code = BFD_RELOC_8_PCREL; break;
13181 case 2: code = BFD_RELOC_16_PCREL; break;
13182 case 4: code = BFD_RELOC_32_PCREL; break;
13184 case 8: code = BFD_RELOC_64_PCREL; break;
13190 switch (fixp->fx_size)
13193 as_bad_where (fixp->fx_file, fixp->fx_line,
13194 _("can not do %d byte relocation"),
13196 code = BFD_RELOC_32;
13198 case 1: code = BFD_RELOC_8; break;
13199 case 2: code = BFD_RELOC_16; break;
13200 case 4: code = BFD_RELOC_32; break;
13202 case 8: code = BFD_RELOC_64; break;
13209 if ((code == BFD_RELOC_32
13210 || code == BFD_RELOC_32_PCREL
13211 || code == BFD_RELOC_X86_64_32S)
13213 && fixp->fx_addsy == GOT_symbol)
13216 code = BFD_RELOC_386_GOTPC;
13218 code = BFD_RELOC_X86_64_GOTPC32;
13220 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13222 && fixp->fx_addsy == GOT_symbol)
13224 code = BFD_RELOC_X86_64_GOTPC64;
13227 rel = XNEW (arelent);
13228 rel->sym_ptr_ptr = XNEW (asymbol *);
13229 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13231 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13233 if (!use_rela_relocations)
13235 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13236 vtable entry to be used in the relocation's section offset. */
13237 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13238 rel->address = fixp->fx_offset;
13239 #if defined (OBJ_COFF) && defined (TE_PE)
13240 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13241 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13246 /* Use the rela in 64bit mode. */
13249 if (disallow_64bit_reloc)
13252 case BFD_RELOC_X86_64_DTPOFF64:
13253 case BFD_RELOC_X86_64_TPOFF64:
13254 case BFD_RELOC_64_PCREL:
13255 case BFD_RELOC_X86_64_GOTOFF64:
13256 case BFD_RELOC_X86_64_GOT64:
13257 case BFD_RELOC_X86_64_GOTPCREL64:
13258 case BFD_RELOC_X86_64_GOTPC64:
13259 case BFD_RELOC_X86_64_GOTPLT64:
13260 case BFD_RELOC_X86_64_PLTOFF64:
13261 as_bad_where (fixp->fx_file, fixp->fx_line,
13262 _("cannot represent relocation type %s in x32 mode"),
13263 bfd_get_reloc_code_name (code));
13269 if (!fixp->fx_pcrel)
13270 rel->addend = fixp->fx_offset;
13274 case BFD_RELOC_X86_64_PLT32:
13275 case BFD_RELOC_X86_64_GOT32:
13276 case BFD_RELOC_X86_64_GOTPCREL:
13277 case BFD_RELOC_X86_64_GOTPCRELX:
13278 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13279 case BFD_RELOC_X86_64_TLSGD:
13280 case BFD_RELOC_X86_64_TLSLD:
13281 case BFD_RELOC_X86_64_GOTTPOFF:
13282 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13283 case BFD_RELOC_X86_64_TLSDESC_CALL:
13284 rel->addend = fixp->fx_offset - fixp->fx_size;
13287 rel->addend = (section->vma
13289 + fixp->fx_addnumber
13290 + md_pcrel_from (fixp));
13295 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
13296 if (rel->howto == NULL)
13298 as_bad_where (fixp->fx_file, fixp->fx_line,
13299 _("cannot represent relocation type %s"),
13300 bfd_get_reloc_code_name (code));
13301 /* Set howto to a garbage value so that we can keep going. */
13302 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
13303 gas_assert (rel->howto != NULL);
13309 #include "tc-i386-intel.c"
13312 tc_x86_parse_to_dw2regnum (expressionS *exp)
13314 int saved_naked_reg;
13315 char saved_register_dot;
13317 saved_naked_reg = allow_naked_reg;
13318 allow_naked_reg = 1;
13319 saved_register_dot = register_chars['.'];
13320 register_chars['.'] = '.';
13321 allow_pseudo_reg = 1;
13322 expression_and_evaluate (exp);
13323 allow_pseudo_reg = 0;
13324 register_chars['.'] = saved_register_dot;
13325 allow_naked_reg = saved_naked_reg;
13327 if (exp->X_op == O_register && exp->X_add_number >= 0)
13329 if ((addressT) exp->X_add_number < i386_regtab_size)
13331 exp->X_op = O_constant;
13332 exp->X_add_number = i386_regtab[exp->X_add_number]
13333 .dw2_regnum[flag_code >> 1];
13336 exp->X_op = O_illegal;
13341 tc_x86_frame_initial_instructions (void)
13343 static unsigned int sp_regno[2];
13345 if (!sp_regno[flag_code >> 1])
13347 char *saved_input = input_line_pointer;
13348 char sp[][4] = {"esp", "rsp"};
13351 input_line_pointer = sp[flag_code >> 1];
13352 tc_x86_parse_to_dw2regnum (&exp);
13353 gas_assert (exp.X_op == O_constant);
13354 sp_regno[flag_code >> 1] = exp.X_add_number;
13355 input_line_pointer = saved_input;
13358 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
13359 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
13363 x86_dwarf2_addr_size (void)
13365 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13366 if (x86_elf_abi == X86_64_X32_ABI)
13369 return bfd_arch_bits_per_address (stdoutput) / 8;
13373 i386_elf_section_type (const char *str, size_t len)
13375 if (flag_code == CODE_64BIT
13376 && len == sizeof ("unwind") - 1
13377 && strncmp (str, "unwind", 6) == 0)
13378 return SHT_X86_64_UNWIND;
13385 i386_solaris_fix_up_eh_frame (segT sec)
13387 if (flag_code == CODE_64BIT)
13388 elf_section_type (sec) = SHT_X86_64_UNWIND;
13394 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
13398 exp.X_op = O_secrel;
13399 exp.X_add_symbol = symbol;
13400 exp.X_add_number = 0;
13401 emit_expr (&exp, size);
13405 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13406 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
13409 x86_64_section_letter (int letter, const char **ptr_msg)
13411 if (flag_code == CODE_64BIT)
13414 return SHF_X86_64_LARGE;
13416 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
13419 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
13424 x86_64_section_word (char *str, size_t len)
13426 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
13427 return SHF_X86_64_LARGE;
13433 handle_large_common (int small ATTRIBUTE_UNUSED)
13435 if (flag_code != CODE_64BIT)
13437 s_comm_internal (0, elf_common_parse);
13438 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
13442 static segT lbss_section;
13443 asection *saved_com_section_ptr = elf_com_section_ptr;
13444 asection *saved_bss_section = bss_section;
13446 if (lbss_section == NULL)
13448 flagword applicable;
13449 segT seg = now_seg;
13450 subsegT subseg = now_subseg;
13452 /* The .lbss section is for local .largecomm symbols. */
13453 lbss_section = subseg_new (".lbss", 0);
13454 applicable = bfd_applicable_section_flags (stdoutput);
13455 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
13456 seg_info (lbss_section)->bss = 1;
13458 subseg_set (seg, subseg);
13461 elf_com_section_ptr = &_bfd_elf_large_com_section;
13462 bss_section = lbss_section;
13464 s_comm_internal (0, elf_common_parse);
13466 elf_com_section_ptr = saved_com_section_ptr;
13467 bss_section = saved_bss_section;
13470 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */