[PATCH 22/57][Arm][GAS] Add support for MVE instructions: vmlaldav, vmlalv, vmlsldav...
[binutils-gdb.git] / gas / config / tc-i386.c
blob08dd9963e1c089dea70d358bdad9b17137d81a0a
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2019 Free Software Foundation, Inc.
4 This file is part of GAS, the GNU Assembler.
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
/* Build-time defaults.  Each macro below is only defined here when it
   has not already been defined, so an earlier definition wins.  */

#ifndef REGISTER_WARNINGS
#define REGISTER_WARNINGS 1
#endif

#ifndef INFER_ADDR_PREFIX
#define INFER_ADDR_PREFIX 1
#endif

/* Initial value of default_arch.  */
#ifndef DEFAULT_ARCH
#define DEFAULT_ARCH "i386"
#endif

/* INLINE expands to the GNU inline keyword for GCC 2 or newer and to
   nothing otherwise.  __GNUC__ is tested with defined() first so the
   check does not rely on an undefined macro evaluating to 0.  */
#ifndef INLINE
#if defined (__GNUC__) && __GNUC__ >= 2
#define INLINE __inline__
#else
#define INLINE
#endif
#endif
/* Prefixes will be emitted in the order defined below.
   WAIT_PREFIX must be the first prefix since FWAIT is really an
   instruction, and so must come before any prefixes.
   The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
   REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
#define WAIT_PREFIX	0
#define SEG_PREFIX	1
#define ADDR_PREFIX	2
#define DATA_PREFIX	3
#define REP_PREFIX	4
#define HLE_PREFIX	REP_PREFIX	/* same slot as REP_PREFIX */
#define BND_PREFIX	REP_PREFIX	/* same slot as REP_PREFIX */
#define LOCK_PREFIX	5
#define REX_PREFIX	6	/* must come last.  */
#define MAX_PREFIXES	7	/* max prefixes per opcode */
/* We define the syntax here (modulo base,index,scale syntax).  */
#define REGISTER_PREFIX '%'
#define IMMEDIATE_PREFIX '$'
#define ABSOLUTE_PREFIX '*'

/* These are the instruction mnemonic suffixes in AT&T syntax or
   memory operand size in Intel syntax.  */
#define WORD_MNEM_SUFFIX  'w'
#define BYTE_MNEM_SUFFIX  'b'
#define SHORT_MNEM_SUFFIX 's'
#define LONG_MNEM_SUFFIX  'l'
#define QWORD_MNEM_SUFFIX  'q'
/* Intel Syntax.  Use a non-printable character since it never appears
   in instructions.  */
#define LONG_DOUBLE_MNEM_SUFFIX '\1'

/* Character that terminates an instruction string.  */
#define END_OF_INSN '\0'
102 'templates' is for grouping together 'template' structures for opcodes
103 of the same name. This is only used for storing the insns in the grand
104 ole hash table of insns.
105 The templates themselves start at START and range up to (but not including)
106 END.
108 typedef struct
110 const insn_template *start;
111 const insn_template *end;
113 templates;
/* 386 operand encoding bytes:  see 386 book for details of this.
   The three fields are kept unpacked, one unsigned int each.  */
typedef struct
{
  unsigned int regmem;	/* codes register or memory operand */
  unsigned int reg;	/* codes register operand (or extended opcode) */
  unsigned int mode;	/* how to interpret regmem & reg */
}
modrm_byte;
/* x86-64 extension prefix.  Held in a plain int.  */
typedef int rex_byte;
/* 386 opcode byte to code indirect addressing.  The three fields are
   kept unpacked, one unsigned each.  */
typedef struct
{
  unsigned base;
  unsigned index;
  unsigned scale;
}
sib_byte;
136 /* x86 arch names, types and features */
137 typedef struct
139 const char *name; /* arch name */
140 unsigned int len; /* arch string length */
141 enum processor_type type; /* arch type */
142 i386_cpu_flags flags; /* cpu feature flags */
143 unsigned int skip; /* show_arch should skip this. */
145 arch_entry;
147 /* Used to turn off indicated flags. */
148 typedef struct
150 const char *name; /* arch name */
151 unsigned int len; /* arch string length */
152 i386_cpu_flags flags; /* cpu feature flags */
154 noarch_entry;
156 static void update_code_flag (int, int);
157 static void set_code_flag (int);
158 static void set_16bit_gcc_code_flag (int);
159 static void set_intel_syntax (int);
160 static void set_intel_mnemonic (int);
161 static void set_allow_index_reg (int);
162 static void set_check (int);
163 static void set_cpu_arch (int);
164 #ifdef TE_PE
165 static void pe_directive_secrel (int);
166 #endif
167 static void signed_cons (int);
168 static char *output_invalid (int c);
169 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
170 const char *);
171 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
172 const char *);
173 static int i386_att_operand (char *);
174 static int i386_intel_operand (char *, int);
175 static int i386_intel_simplify (expressionS *);
176 static int i386_intel_parse_name (const char *, expressionS *);
177 static const reg_entry *parse_register (char *, char **);
178 static char *parse_insn (char *, char *);
179 static char *parse_operands (char *, const char *);
180 static void swap_operands (void);
181 static void swap_2_operands (int, int);
182 static void optimize_imm (void);
183 static void optimize_disp (void);
184 static const insn_template *match_template (char);
185 static int check_string (void);
186 static int process_suffix (void);
187 static int check_byte_reg (void);
188 static int check_long_reg (void);
189 static int check_qword_reg (void);
190 static int check_word_reg (void);
191 static int finalize_imm (void);
192 static int process_operands (void);
193 static const seg_entry *build_modrm_byte (void);
194 static void output_insn (void);
195 static void output_imm (fragS *, offsetT);
196 static void output_disp (fragS *, offsetT);
197 #ifndef I386COFF
198 static void s_bss (int);
199 #endif
/* Declarations that only exist when ELF output is (or may be)
   configured.  */
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
static void handle_large_common (int small ATTRIBUTE_UNUSED);

/* GNU_PROPERTY_X86_ISA_1_USED.  */
static unsigned int x86_isa_1_used;
/* GNU_PROPERTY_X86_FEATURE_2_USED.  */
static unsigned int x86_feature_2_used;
/* Generate x86 used ISA and feature properties.  */
static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
#endif
211 static const char *default_arch = DEFAULT_ARCH;
/* This struct describes rounding control and SAE in the instruction.
   The enumerators are the values referenced by RC_NamesTable; rd, ru
   and rz sit between rne and saeonly.  OPERAND is an operand index.  */
struct RC_Operation
{
  enum rc_type
    {
      rne = 0,
      rd,
      ru,
      rz,
      saeonly
    } type;
  int operand;
};

/* File-wide instance of the above.  */
static struct RC_Operation rc_op;
229 /* The struct describes masking, applied to OPERAND in the instruction.
230 MASK is a pointer to the corresponding mask register. ZEROING tells
231 whether merging or zeroing mask is used. */
232 struct Mask_Operation
234 const reg_entry *mask;
235 unsigned int zeroing;
236 /* The operand where this operation is associated. */
237 int operand;
240 static struct Mask_Operation mask_op;
/* The struct describes broadcasting, applied to OPERAND.  FACTOR is
   broadcast factor.  */
struct Broadcast_Operation
{
  /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
  int type;

  /* Index of broadcasted operand.  */
  int operand;

  /* Number of bytes to broadcast.  */
  int bytes;
};

/* File-wide instance of the above.  */
static struct Broadcast_Operation broadcast_op;
258 /* VEX prefix. */
259 typedef struct
261 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
262 unsigned char bytes[4];
263 unsigned int length;
264 /* Destination or source register specifier. */
265 const reg_entry *register_specifier;
266 } vex_prefix;
268 /* 'md_assemble ()' gathers together information and puts it into a
269 i386_insn. */
271 union i386_op
273 expressionS *disps;
274 expressionS *imms;
275 const reg_entry *regs;
/* Error codes stored in the ERROR member of struct _i386_insn.  */
enum i386_error
  {
    operand_size_mismatch,
    operand_type_mismatch,
    register_type_mismatch,
    number_of_operands_mismatch,
    invalid_instruction_suffix,
    bad_imm4,
    unsupported_with_intel_mnemonic,
    unsupported_syntax,
    unsupported,
    invalid_vsib_address,
    invalid_vector_register_set,
    unsupported_vector_index_register,
    unsupported_broadcast,
    broadcast_needed,
    unsupported_masking,
    mask_not_on_destination,
    no_default_mask,
    unsupported_rc_sae,
    rc_sae_operand_not_last_imm,
    invalid_register_operand,
  };
302 struct _i386_insn
304 /* TM holds the template for the insn were currently assembling. */
305 insn_template tm;
307 /* SUFFIX holds the instruction size suffix for byte, word, dword
308 or qword, if given. */
309 char suffix;
311 /* OPERANDS gives the number of given operands. */
312 unsigned int operands;
314 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
315 of given register, displacement, memory operands and immediate
316 operands. */
317 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
319 /* TYPES [i] is the type (see above #defines) which tells us how to
320 use OP[i] for the corresponding operand. */
321 i386_operand_type types[MAX_OPERANDS];
323 /* Displacement expression, immediate expression, or register for each
324 operand. */
325 union i386_op op[MAX_OPERANDS];
327 /* Flags for operands. */
328 unsigned int flags[MAX_OPERANDS];
329 #define Operand_PCrel 1
330 #define Operand_Mem 2
332 /* Relocation type for operand */
333 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
335 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
336 the base index byte below. */
337 const reg_entry *base_reg;
338 const reg_entry *index_reg;
339 unsigned int log2_scale_factor;
341 /* SEG gives the seg_entries of this insn. They are zero unless
342 explicit segment overrides are given. */
343 const seg_entry *seg[2];
345 /* Copied first memory operand string, for re-checking. */
346 char *memop1_string;
348 /* PREFIX holds all the given prefix opcodes (usually null).
349 PREFIXES is the number of prefix opcodes. */
350 unsigned int prefixes;
351 unsigned char prefix[MAX_PREFIXES];
353 /* Has MMX register operands. */
354 bfd_boolean has_regmmx;
356 /* Has XMM register operands. */
357 bfd_boolean has_regxmm;
359 /* Has YMM register operands. */
360 bfd_boolean has_regymm;
362 /* Has ZMM register operands. */
363 bfd_boolean has_regzmm;
365 /* RM and SIB are the modrm byte and the sib byte where the
366 addressing modes of this insn are encoded. */
367 modrm_byte rm;
368 rex_byte rex;
369 rex_byte vrex;
370 sib_byte sib;
371 vex_prefix vex;
373 /* Masking attributes. */
374 struct Mask_Operation *mask;
376 /* Rounding control and SAE attributes. */
377 struct RC_Operation *rounding;
379 /* Broadcasting attributes. */
380 struct Broadcast_Operation *broadcast;
382 /* Compressed disp8*N attribute. */
383 unsigned int memshift;
385 /* Prefer load or store in encoding. */
386 enum
388 dir_encoding_default = 0,
389 dir_encoding_load,
390 dir_encoding_store,
391 dir_encoding_swap
392 } dir_encoding;
394 /* Prefer 8bit or 32bit displacement in encoding. */
395 enum
397 disp_encoding_default = 0,
398 disp_encoding_8bit,
399 disp_encoding_32bit
400 } disp_encoding;
402 /* Prefer the REX byte in encoding. */
403 bfd_boolean rex_encoding;
405 /* Disable instruction size optimization. */
406 bfd_boolean no_optimize;
408 /* How to encode vector instructions. */
409 enum
411 vex_encoding_default = 0,
412 vex_encoding_vex2,
413 vex_encoding_vex3,
414 vex_encoding_evex
415 } vec_encoding;
417 /* REP prefix. */
418 const char *rep_prefix;
420 /* HLE prefix. */
421 const char *hle_prefix;
423 /* Have BND prefix. */
424 const char *bnd_prefix;
426 /* Have NOTRACK prefix. */
427 const char *notrack_prefix;
429 /* Error message. */
430 enum i386_error error;
433 typedef struct _i386_insn i386_insn;
435 /* Link RC type with corresponding string, that'll be looked for in
436 asm. */
437 struct RC_name
439 enum rc_type type;
440 const char *name;
441 unsigned int len;
444 static const struct RC_name RC_NamesTable[] =
446 { rne, STRING_COMMA_LEN ("rn-sae") },
447 { rd, STRING_COMMA_LEN ("rd-sae") },
448 { ru, STRING_COMMA_LEN ("ru-sae") },
449 { rz, STRING_COMMA_LEN ("rz-sae") },
450 { saeonly, STRING_COMMA_LEN ("sae") },
/* List of chars besides those in app.c:symbol_chars that can start an
   operand.  Used to prevent the scrubber eating vital white-space.
   '@' and '?' are appended only when LEX_AT / LEX_QM are defined.  */
const char extra_symbol_chars[] = "*%-([{}"
#ifdef LEX_AT
	"@"
#endif
#ifdef LEX_QM
	"?"
#endif
	;
/* Pick the comment-start characters and the prefix separator for the
   configured target.  */
#if (defined (TE_I386AIX)				\
     || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))	\
	 && !defined (TE_GNU)				\
	 && !defined (TE_LINUX)				\
	 && !defined (TE_NACL)				\
	 && !defined (TE_FreeBSD)			\
	 && !defined (TE_DragonFly)			\
	 && !defined (TE_NetBSD)))
/* This array holds the chars that always start a comment.  If the
   pre-processor is disabled, these aren't very useful.  The option
   --divide will remove '/' from this list.  */
const char *i386_comment_chars = "#/";
#define SVR4_COMMENT_CHARS 1
#define PREFIX_SEPARATOR '\\'

#else
const char *i386_comment_chars = "#";
#define PREFIX_SEPARATOR '/'
#endif
/* This array holds the chars that only start a comment at the beginning of
   a line.  If the line seems to have the form '# 123 filename'
   .line and .file directives will appear in the pre-processed output.
   Note that input_file.c hand checks for '#' at the beginning of the
   first line of the input file.  This is because the compiler outputs
   #NO_APP at the beginning of its output.
   Also note that comments started like this one will always work if
   '/' isn't otherwise defined.  */
const char line_comment_chars[] = "#/";

/* Chars that separate statements on one line.  */
const char line_separator_chars[] = ";";

/* Chars that can be used to separate mant from exp in floating point
   nums.  */
const char EXP_CHARS[] = "eE";

/* Chars that mean this number is a floating point constant
   As in 0f12.456
   or    0d1.2345e12.  */
const char FLT_CHARS[] = "fFdDxX";
/* Tables for lexical analysis.  Each table has one entry per unsigned
   char value and is read through the matching is_*_char macro below.  */
static char mnemonic_chars[256];
static char register_chars[256];
static char operand_chars[256];
static char identifier_chars[256];
static char digit_chars[256];

/* Lexical macros.  The argument is parenthesized before the cast to
   unsigned char so that the whole expression, not just its first
   operand, is converted and the index always stays within 0..255.  */
#define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) (x)])
#define is_operand_char(x) (operand_chars[(unsigned char) (x)])
#define is_register_char(x) (register_chars[(unsigned char) (x)])
#define is_space_char(x) ((x) == ' ')
#define is_identifier_char(x) (identifier_chars[(unsigned char) (x)])
#define is_digit_char(x) (digit_chars[(unsigned char) (x)])
/* All non-digit non-letter characters that may occur in an operand.  */
static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
/* md_assemble() always leaves the strings it's passed unaltered.  To
   effect this we maintain a stack of saved characters that we've smashed
   with '\0's (indicating end of strings for various sub-fields of the
   assembler instruction).

   END_STRING_AND_SAVE (s) pushes *s and overwrites it with '\0';
   RESTORE_END_STRING (s) pops the saved character back into *s.  Calls
   must therefore be paired in last-in, first-out order.  Neither macro
   checks the 32-entry bound, and save_stack_p must point into
   save_stack before first use.  */
static char save_stack[32];
static char *save_stack_p;
#define END_STRING_AND_SAVE(s) \
	do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
#define RESTORE_END_STRING(s) \
	do { *(s) = *--save_stack_p; } while (0)
534 /* The instruction we're assembling. */
535 static i386_insn i;
537 /* Possible templates for current insn. */
538 static const templates *current_templates;
540 /* Per instruction expressionS buffers: max displacements & immediates. */
541 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
542 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
544 /* Current operand we are working on. */
545 static int this_operand = -1;
/* We support three different code modes.  The FLAG_CODE variable is
   used to distinguish these.  */

enum flag_code {
	CODE_32BIT,
	CODE_16BIT,
	CODE_64BIT };

static enum flag_code flag_code;
static unsigned int object_64bit;
static unsigned int disallow_64bit_reloc;
static int use_rela_relocations = 0;
#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT))	\
     || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)		\
     || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))

/* The ELF ABI to use.  */
enum x86_elf_abi
{
  I386_ABI,
  X86_64_ABI,
  X86_64_X32_ABI
};

static enum x86_elf_abi x86_elf_abi = I386_ABI;
#endif

#if defined (TE_PE) || defined (TE_PEP)
/* Use big object file format.  */
static int use_big_obj = 0;
#endif

#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* 1 if generating code for a shared library.  */
static int shared = 0;
#endif
585 /* 1 for intel syntax,
586 0 if att syntax. */
587 static int intel_syntax = 0;
589 /* 1 for Intel64 ISA,
590 0 if AMD64 ISA. */
591 static int intel64;
593 /* 1 for intel mnemonic,
594 0 if att mnemonic. */
595 static int intel_mnemonic = !SYSV386_COMPAT;
597 /* 1 if pseudo registers are permitted. */
598 static int allow_pseudo_reg = 0;
600 /* 1 if register prefix % not required. */
601 static int allow_naked_reg = 0;
603 /* 1 if the assembler should add BND prefix for all control-transferring
604 instructions supporting it, even if this prefix wasn't specified
605 explicitly. */
606 static int add_bnd_prefix = 0;
608 /* 1 if pseudo index register, eiz/riz, is allowed . */
609 static int allow_index_reg = 0;
611 /* 1 if the assembler should ignore LOCK prefix, even if it was
612 specified explicitly. */
613 static int omit_lock_prefix = 0;
615 /* 1 if the assembler should encode lfence, mfence, and sfence as
616 "lock addl $0, (%{re}sp)". */
617 static int avoid_fence = 0;
619 /* 1 if the assembler should generate relax relocations. */
621 static int generate_relax_relocations
622 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
/* Severity levels for optional checks.  sse_check has no initializer
   and so starts as check_none; operand_check starts as check_warning.  */
static enum check_kind
  {
    check_none = 0,
    check_warning,
    check_error
  }
sse_check, operand_check = check_warning;
/* Optimization:
   1. Clear the REX_W bit with register operand if possible.
   2. Above plus use 128bit vector instruction to clear the full vector
      register.
 */
static int optimize = 0;

/* Optimization:
   1. Clear the REX_W bit with register operand if possible.
   2. Above plus use 128bit vector instruction to clear the full vector
      register.
   3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
      "testb $imm7,%r8".
 */
static int optimize_for_space = 0;
/* Register prefix used for error message.  */
static const char *register_prefix = "%";

/* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
   leave, push, and pop instructions so that gcc has the same stack
   frame as in 32 bit mode.  */
static char stackop_size = '\0';

/* Non-zero to optimize code alignment.  */
int optimize_align_code = 1;

/* Non-zero to quieten some warnings.  */
static int quiet_warnings = 0;

/* CPU name.  */
static const char *cpu_arch_name = NULL;
static char *cpu_sub_arch_name = NULL;
666 /* CPU feature flags. */
667 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
669 /* If we have selected a cpu we are generating instructions for. */
670 static int cpu_arch_tune_set = 0;
672 /* Cpu we are generating instructions for. */
673 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
675 /* CPU feature flags of cpu we are generating instructions for. */
676 static i386_cpu_flags cpu_arch_tune_flags;
678 /* CPU instruction set architecture used. */
679 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
681 /* CPU feature flags of instruction set architecture used. */
682 i386_cpu_flags cpu_arch_isa_flags;
/* If set, conditional jumps are not automatically promoted to handle
   larger than a byte offset.  */
static unsigned int no_cond_jump_promotion = 0;

/* Encode SSE instructions with VEX prefix.  */
static unsigned int sse2avx;

/* Encode scalar AVX instructions with specific vector length.  */
static enum
  {
    vex128 = 0,
    vex256
  } avxscalar;

/* Encode VEX WIG instructions with specific vex.w.  */
static enum
  {
    vexw0 = 0,
    vexw1
  } vexwig;

/* Encode scalar EVEX LIG instructions with specific vector length.  */
static enum
  {
    evexl128 = 0,
    evexl256,
    evexl512
  } evexlig;

/* Encode EVEX WIG instructions with specific evex.w.  */
static enum
  {
    evexw0 = 0,
    evexw1
  } evexwig;
720 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
721 static enum rc_type evexrcig = rne;
723 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
724 static symbolS *GOT_symbol;
726 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
727 unsigned int x86_dwarf2_return_column;
729 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
730 int x86_cie_data_alignment;
/* Interface to relax_segment.
   There are 3 major relax states for 386 jump insns because the
   different types of jumps add different sizes to frags when we're
   figuring out what sort of jump to choose to reach a given label.  */

/* Types.  */
#define UNCOND_JUMP 0
#define COND_JUMP 1
#define COND_JUMP86 2

/* Sizes.  */
#define CODE16	1
#define SMALL	0
#define SMALL16 (SMALL | CODE16)
#define BIG	2
#define BIG16	(BIG | CODE16)

/* Fallback only; has no effect when INLINE is already defined.  */
#ifndef INLINE
#ifdef __GNUC__
#define INLINE __inline__
#else
#define INLINE
#endif
#endif

/* A relax state keeps the size in its low two bits and the jump type
   in the bits above them.  */
#define ENCODE_RELAX_STATE(type, size) \
  ((relax_substateT) (((type) << 2) | (size)))
#define TYPE_FROM_RELAX_STATE(s) \
  ((s) >> 2)
/* Displacement width in bytes: 4 for BIG, 2 for BIG16, otherwise 1.  */
#define DISP_SIZE_FROM_RELAX_STATE(s) \
    ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
764 /* This table is used by relax_frag to promote short jumps to long
765 ones where necessary. SMALL (short) jumps may be promoted to BIG
766 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
767 don't allow a short jump in a 32 bit code segment to be promoted to
768 a 16 bit offset jump because it's slower (requires data size
769 prefix), and doesn't work, unless the destination is in the bottom
770 64k of the code segment (The top 16 bits of eip are zeroed). */
772 const relax_typeS md_relax_table[] =
774 /* The fields are:
775 1) most positive reach of this state,
776 2) most negative reach of this state,
777 3) how many bytes this mode will have in the variable part of the frag
778 4) which index into the table to try if we can't fit into this one. */
780 /* UNCOND_JUMP states. */
781 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
782 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
783 /* dword jmp adds 4 bytes to frag:
784 0 extra opcode bytes, 4 displacement bytes. */
785 {0, 0, 4, 0},
786 /* word jmp adds 2 byte2 to frag:
787 0 extra opcode bytes, 2 displacement bytes. */
788 {0, 0, 2, 0},
790 /* COND_JUMP states. */
791 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
792 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
793 /* dword conditionals adds 5 bytes to frag:
794 1 extra opcode byte, 4 displacement bytes. */
795 {0, 0, 5, 0},
796 /* word conditionals add 3 bytes to frag:
797 1 extra opcode byte, 2 displacement bytes. */
798 {0, 0, 3, 0},
800 /* COND_JUMP86 states. */
801 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
802 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
803 /* dword conditionals adds 5 bytes to frag:
804 1 extra opcode byte, 4 displacement bytes. */
805 {0, 0, 5, 0},
806 /* word conditionals add 4 bytes to frag:
807 1 displacement byte and a 3 byte long branch insn. */
808 {0, 0, 4, 0}
811 static const arch_entry cpu_arch[] =
813 /* Do not replace the first two entries - i386_target_format()
814 relies on them being there in this order. */
815 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
816 CPU_GENERIC32_FLAGS, 0 },
817 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
818 CPU_GENERIC64_FLAGS, 0 },
819 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
820 CPU_NONE_FLAGS, 0 },
821 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
822 CPU_I186_FLAGS, 0 },
823 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
824 CPU_I286_FLAGS, 0 },
825 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
826 CPU_I386_FLAGS, 0 },
827 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
828 CPU_I486_FLAGS, 0 },
829 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
830 CPU_I586_FLAGS, 0 },
831 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
832 CPU_I686_FLAGS, 0 },
833 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
834 CPU_I586_FLAGS, 0 },
835 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
836 CPU_PENTIUMPRO_FLAGS, 0 },
837 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
838 CPU_P2_FLAGS, 0 },
839 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
840 CPU_P3_FLAGS, 0 },
841 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
842 CPU_P4_FLAGS, 0 },
843 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
844 CPU_CORE_FLAGS, 0 },
845 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
846 CPU_NOCONA_FLAGS, 0 },
847 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
848 CPU_CORE_FLAGS, 1 },
849 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
850 CPU_CORE_FLAGS, 0 },
851 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
852 CPU_CORE2_FLAGS, 1 },
853 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
854 CPU_CORE2_FLAGS, 0 },
855 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
856 CPU_COREI7_FLAGS, 0 },
857 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
858 CPU_L1OM_FLAGS, 0 },
859 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
860 CPU_K1OM_FLAGS, 0 },
861 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
862 CPU_IAMCU_FLAGS, 0 },
863 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
864 CPU_K6_FLAGS, 0 },
865 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
866 CPU_K6_2_FLAGS, 0 },
867 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
868 CPU_ATHLON_FLAGS, 0 },
869 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
870 CPU_K8_FLAGS, 1 },
871 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
872 CPU_K8_FLAGS, 0 },
873 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
874 CPU_K8_FLAGS, 0 },
875 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
876 CPU_AMDFAM10_FLAGS, 0 },
877 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
878 CPU_BDVER1_FLAGS, 0 },
879 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
880 CPU_BDVER2_FLAGS, 0 },
881 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
882 CPU_BDVER3_FLAGS, 0 },
883 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
884 CPU_BDVER4_FLAGS, 0 },
885 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
886 CPU_ZNVER1_FLAGS, 0 },
887 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
888 CPU_ZNVER2_FLAGS, 0 },
889 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
890 CPU_BTVER1_FLAGS, 0 },
891 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
892 CPU_BTVER2_FLAGS, 0 },
893 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
894 CPU_8087_FLAGS, 0 },
895 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
896 CPU_287_FLAGS, 0 },
897 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
898 CPU_387_FLAGS, 0 },
899 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
900 CPU_687_FLAGS, 0 },
901 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
902 CPU_CMOV_FLAGS, 0 },
903 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
904 CPU_FXSR_FLAGS, 0 },
905 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
906 CPU_MMX_FLAGS, 0 },
907 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
908 CPU_SSE_FLAGS, 0 },
909 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
910 CPU_SSE2_FLAGS, 0 },
911 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
912 CPU_SSE3_FLAGS, 0 },
913 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
914 CPU_SSSE3_FLAGS, 0 },
915 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
916 CPU_SSE4_1_FLAGS, 0 },
917 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
918 CPU_SSE4_2_FLAGS, 0 },
919 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
920 CPU_SSE4_2_FLAGS, 0 },
921 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
922 CPU_AVX_FLAGS, 0 },
923 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
924 CPU_AVX2_FLAGS, 0 },
925 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
926 CPU_AVX512F_FLAGS, 0 },
927 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
928 CPU_AVX512CD_FLAGS, 0 },
929 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
930 CPU_AVX512ER_FLAGS, 0 },
931 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
932 CPU_AVX512PF_FLAGS, 0 },
933 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
934 CPU_AVX512DQ_FLAGS, 0 },
935 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
936 CPU_AVX512BW_FLAGS, 0 },
937 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
938 CPU_AVX512VL_FLAGS, 0 },
939 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
940 CPU_VMX_FLAGS, 0 },
941 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
942 CPU_VMFUNC_FLAGS, 0 },
943 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
944 CPU_SMX_FLAGS, 0 },
945 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
946 CPU_XSAVE_FLAGS, 0 },
947 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
948 CPU_XSAVEOPT_FLAGS, 0 },
949 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
950 CPU_XSAVEC_FLAGS, 0 },
951 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
952 CPU_XSAVES_FLAGS, 0 },
953 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
954 CPU_AES_FLAGS, 0 },
955 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
956 CPU_PCLMUL_FLAGS, 0 },
957 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
958 CPU_PCLMUL_FLAGS, 1 },
959 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
960 CPU_FSGSBASE_FLAGS, 0 },
961 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
962 CPU_RDRND_FLAGS, 0 },
963 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
964 CPU_F16C_FLAGS, 0 },
965 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
966 CPU_BMI2_FLAGS, 0 },
967 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
968 CPU_FMA_FLAGS, 0 },
969 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
970 CPU_FMA4_FLAGS, 0 },
971 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
972 CPU_XOP_FLAGS, 0 },
973 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
974 CPU_LWP_FLAGS, 0 },
975 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
976 CPU_MOVBE_FLAGS, 0 },
977 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
978 CPU_CX16_FLAGS, 0 },
979 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
980 CPU_EPT_FLAGS, 0 },
981 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
982 CPU_LZCNT_FLAGS, 0 },
983 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
984 CPU_HLE_FLAGS, 0 },
985 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
986 CPU_RTM_FLAGS, 0 },
987 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
988 CPU_INVPCID_FLAGS, 0 },
989 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
990 CPU_CLFLUSH_FLAGS, 0 },
991 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
992 CPU_NOP_FLAGS, 0 },
993 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
994 CPU_SYSCALL_FLAGS, 0 },
995 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
996 CPU_RDTSCP_FLAGS, 0 },
997 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
998 CPU_3DNOW_FLAGS, 0 },
999 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1000 CPU_3DNOWA_FLAGS, 0 },
1001 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1002 CPU_PADLOCK_FLAGS, 0 },
1003 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1004 CPU_SVME_FLAGS, 1 },
1005 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1006 CPU_SVME_FLAGS, 0 },
1007 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1008 CPU_SSE4A_FLAGS, 0 },
1009 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1010 CPU_ABM_FLAGS, 0 },
1011 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1012 CPU_BMI_FLAGS, 0 },
1013 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1014 CPU_TBM_FLAGS, 0 },
1015 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1016 CPU_ADX_FLAGS, 0 },
1017 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1018 CPU_RDSEED_FLAGS, 0 },
1019 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1020 CPU_PRFCHW_FLAGS, 0 },
1021 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1022 CPU_SMAP_FLAGS, 0 },
1023 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1024 CPU_MPX_FLAGS, 0 },
1025 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1026 CPU_SHA_FLAGS, 0 },
1027 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1028 CPU_CLFLUSHOPT_FLAGS, 0 },
1029 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1030 CPU_PREFETCHWT1_FLAGS, 0 },
1031 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1032 CPU_SE1_FLAGS, 0 },
1033 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1034 CPU_CLWB_FLAGS, 0 },
1035 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1036 CPU_AVX512IFMA_FLAGS, 0 },
1037 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1038 CPU_AVX512VBMI_FLAGS, 0 },
1039 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1040 CPU_AVX512_4FMAPS_FLAGS, 0 },
1041 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1042 CPU_AVX512_4VNNIW_FLAGS, 0 },
1043 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1044 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1045 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1046 CPU_AVX512_VBMI2_FLAGS, 0 },
1047 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1048 CPU_AVX512_VNNI_FLAGS, 0 },
1049 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1050 CPU_AVX512_BITALG_FLAGS, 0 },
1051 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1052 CPU_CLZERO_FLAGS, 0 },
1053 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1054 CPU_MWAITX_FLAGS, 0 },
1055 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1056 CPU_OSPKE_FLAGS, 0 },
1057 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1058 CPU_RDPID_FLAGS, 0 },
1059 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1060 CPU_PTWRITE_FLAGS, 0 },
1061 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1062 CPU_IBT_FLAGS, 0 },
1063 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1064 CPU_SHSTK_FLAGS, 0 },
1065 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1066 CPU_GFNI_FLAGS, 0 },
1067 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1068 CPU_VAES_FLAGS, 0 },
1069 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1070 CPU_VPCLMULQDQ_FLAGS, 0 },
1071 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1072 CPU_WBNOINVD_FLAGS, 0 },
1073 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1074 CPU_PCONFIG_FLAGS, 0 },
1075 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1076 CPU_WAITPKG_FLAGS, 0 },
1077 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1078 CPU_CLDEMOTE_FLAGS, 0 },
1079 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1080 CPU_MOVDIRI_FLAGS, 0 },
1081 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1082 CPU_MOVDIR64B_FLAGS, 0 },
1083 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1084 CPU_AVX512_BF16_FLAGS, 0 },
1087 static const noarch_entry cpu_noarch[] =
1089 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1090 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1091 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1092 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1093 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1094 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1095 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1096 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1097 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1098 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1099 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1100 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1101 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1102 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1103 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1104 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1105 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1106 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1107 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1108 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1109 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1110 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1111 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1112 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1113 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1114 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1115 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1116 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1117 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1118 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1119 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1120 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1121 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1122 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1123 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1124 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1127 #ifdef I386COFF
1128 /* Like s_lcomm_internal in gas/read.c but the alignment string
1129 is allowed to be optional. */
1131 static symbolS *
1132 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1134 addressT align = 0;
1136 SKIP_WHITESPACE ();
1138 if (needs_align
1139 && *input_line_pointer == ',')
1141 align = parse_align (needs_align - 1);
1143 if (align == (addressT) -1)
1144 return NULL;
1146 else
1148 if (size >= 8)
1149 align = 3;
1150 else if (size >= 4)
1151 align = 2;
1152 else if (size >= 2)
1153 align = 1;
1154 else
1155 align = 0;
1158 bss_alloc (symbolP, size, align);
1159 return symbolP;
1162 static void
1163 pe_lcomm (int needs_align)
1165 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1167 #endif
1169 const pseudo_typeS md_pseudo_table[] =
1171 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1172 {"align", s_align_bytes, 0},
1173 #else
1174 {"align", s_align_ptwo, 0},
1175 #endif
1176 {"arch", set_cpu_arch, 0},
1177 #ifndef I386COFF
1178 {"bss", s_bss, 0},
1179 #else
1180 {"lcomm", pe_lcomm, 1},
1181 #endif
1182 {"ffloat", float_cons, 'f'},
1183 {"dfloat", float_cons, 'd'},
1184 {"tfloat", float_cons, 'x'},
1185 {"value", cons, 2},
1186 {"slong", signed_cons, 4},
1187 {"noopt", s_ignore, 0},
1188 {"optim", s_ignore, 0},
1189 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1190 {"code16", set_code_flag, CODE_16BIT},
1191 {"code32", set_code_flag, CODE_32BIT},
1192 #ifdef BFD64
1193 {"code64", set_code_flag, CODE_64BIT},
1194 #endif
1195 {"intel_syntax", set_intel_syntax, 1},
1196 {"att_syntax", set_intel_syntax, 0},
1197 {"intel_mnemonic", set_intel_mnemonic, 1},
1198 {"att_mnemonic", set_intel_mnemonic, 0},
1199 {"allow_index_reg", set_allow_index_reg, 1},
1200 {"disallow_index_reg", set_allow_index_reg, 0},
1201 {"sse_check", set_check, 0},
1202 {"operand_check", set_check, 1},
1203 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1204 {"largecomm", handle_large_common, 0},
1205 #else
1206 {"file", dwarf2_directive_file, 0},
1207 {"loc", dwarf2_directive_loc, 0},
1208 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1209 #endif
1210 #ifdef TE_PE
1211 {"secrel32", pe_directive_secrel, 0},
1212 #endif
1213 {0, 0, 0}
/* Current position in the input line; needed to interface with
   expression ().  */
extern char *input_line_pointer;

/* Instruction mnemonic lookup table.  */
static struct hash_control *op_hash;

/* Register name lookup table.  */
static struct hash_control *reg_hash;

/* Various efficient no-op patterns for aligning code labels.
   Note: Don't try to assemble the instructions in the comments.
   0L and 0w are not legal.  */

/* nop */
static const unsigned char f32_1[] = { 0x90 };
/* xchg %ax,%ax */
static const unsigned char f32_2[] = { 0x66, 0x90 };
/* leal 0(%esi),%esi */
static const unsigned char f32_3[] = { 0x8d, 0x76, 0x00 };
/* leal 0(%esi,1),%esi */
static const unsigned char f32_4[] = { 0x8d, 0x74, 0x26, 0x00 };
/* leal 0L(%esi),%esi */
static const unsigned char f32_6[] =
  { 0x8d, 0xb6, 0x00, 0x00, 0x00, 0x00 };
/* leal 0L(%esi,1),%esi */
static const unsigned char f32_7[] =
  { 0x8d, 0xb4, 0x26, 0x00, 0x00, 0x00, 0x00 };
/* lea 0(%si),%si */
static const unsigned char f16_3[] = { 0x8d, 0x74, 0x00 };
/* lea 0W(%si),%si */
static const unsigned char f16_4[] = { 0x8d, 0xb4, 0x00, 0x00 };
/* jmp disp8 */
static const unsigned char jump_disp8[] = { 0xeb };
/* jmp disp32 */
static const unsigned char jump32_disp32[] = { 0xe9 };
/* jmp disp32 */
static const unsigned char jump16_disp32[] = { 0x66, 0xe9 };

/* 32-bit NOP patterns.  Entry N - 1 is the N-byte pattern; the NULL
   entry marks a size (5 bytes) for which no pattern is provided.  */
static const unsigned char *const f32_patt[] =
{
  f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
};

/* 16-bit NOP patterns, indexed the same way.  */
static const unsigned char *const f16_patt[] =
{
  f32_1, f32_2, f16_3, f16_4
};

/* nopl (%[re]ax) */
static const unsigned char alt_3[] = { 0x0f, 0x1f, 0x00 };
/* nopl 0(%[re]ax) */
static const unsigned char alt_4[] = { 0x0f, 0x1f, 0x40, 0x00 };
/* nopl 0(%[re]ax,%[re]ax,1) */
static const unsigned char alt_5[] = { 0x0f, 0x1f, 0x44, 0x00, 0x00 };
/* nopw 0(%[re]ax,%[re]ax,1) */
static const unsigned char alt_6[] =
  { 0x66, 0x0f, 0x1f, 0x44, 0x00, 0x00 };
/* nopl 0L(%[re]ax) */
static const unsigned char alt_7[] =
  { 0x0f, 0x1f, 0x80, 0x00, 0x00, 0x00, 0x00 };
/* nopl 0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_8[] =
  { 0x0f, 0x1f, 0x84, 0x00, 0x00, 0x00, 0x00, 0x00 };
/* nopw 0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_9[] =
  { 0x66, 0x0f, 0x1f, 0x84, 0x00, 0x00, 0x00, 0x00, 0x00 };
/* nopw %cs:0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_10[] =
  { 0x66, 0x2e, 0x0f, 0x1f, 0x84, 0x00, 0x00, 0x00, 0x00, 0x00 };
/* data16 nopw %cs:0L(%eax,%eax,1) */
static const unsigned char alt_11[] =
  { 0x66, 0x66, 0x2e, 0x0f, 0x1f, 0x84, 0x00, 0x00, 0x00, 0x00, 0x00 };

/* 32-bit and 64-bit NOP patterns, indexed by size minus one.  */
static const unsigned char *const alt_patt[] =
{
  f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
  alt_9, alt_10, alt_11
};

/* Generate COUNT bytes of NOPs at WHERE, taking the byte sequences from
   PATT and using single NOP instructions of at most
   MAX_SINGLE_NOP_SIZE bytes.  PATT[N - 1] is the N-byte NOP; a NULL
   entry means that size is unavailable and the next smaller one is
   used instead.  The longer NOPs are placed first.  */

static void
i386_output_nops (char *where, const unsigned char *const *patt,
                  int count, int max_single_nop_size)
{
  const unsigned char *nops;
  int tail;
  int pos = 0;

  if (max_single_nop_size < 1)
    {
      as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
                max_single_nop_size);
      return;
    }

  nops = patt[max_single_nop_size - 1];
  if (nops == NULL)
    {
      /* Use the smaller one if the requested one isn't available.  */
      max_single_nop_size--;
      nops = patt[max_single_nop_size - 1];
    }

  /* Emit as many full-size NOPs as fit; TAIL bytes are left over.  */
  tail = count % max_single_nop_size;
  for (count -= tail; pos < count; pos += max_single_nop_size)
    memcpy (where + pos, nops, max_single_nop_size);

  if (tail == 0)
    return;

  nops = patt[tail - 1];
  if (nops != NULL)
    memcpy (where + pos, nops, tail);
  else
    {
      /* No pattern of exactly TAIL bytes: use the next smaller one
         followed by a one-byte NOP.  */
      tail--;
      memcpy (where + pos, patt[tail - 1], tail);
      where[pos + tail] = *patt[0];
    }
}

1343 static INLINE int
1344 fits_in_imm7 (offsetT num)
1346 return (num & 0x7f) == num;
1349 static INLINE int
1350 fits_in_imm31 (offsetT num)
1352 return (num & 0x7fffffff) == num;
1355 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1356 single NOP instruction LIMIT. */
1358 void
1359 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1361 const unsigned char *const *patt = NULL;
1362 int max_single_nop_size;
1363 /* Maximum number of NOPs before switching to jump over NOPs. */
1364 int max_number_of_nops;
1366 switch (fragP->fr_type)
1368 case rs_fill_nop:
1369 case rs_align_code:
1370 break;
1371 default:
1372 return;
1375 /* We need to decide which NOP sequence to use for 32bit and
1376 64bit. When -mtune= is used:
1378 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1379 PROCESSOR_GENERIC32, f32_patt will be used.
1380 2. For the rest, alt_patt will be used.
1382 When -mtune= isn't used, alt_patt will be used if
1383 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1384 be used.
1386 When -march= or .arch is used, we can't use anything beyond
1387 cpu_arch_isa_flags. */
1389 if (flag_code == CODE_16BIT)
1391 patt = f16_patt;
1392 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1393 /* Limit number of NOPs to 2 in 16-bit mode. */
1394 max_number_of_nops = 2;
1396 else
1398 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1400 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1401 switch (cpu_arch_tune)
1403 case PROCESSOR_UNKNOWN:
1404 /* We use cpu_arch_isa_flags to check if we SHOULD
1405 optimize with nops. */
1406 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1407 patt = alt_patt;
1408 else
1409 patt = f32_patt;
1410 break;
1411 case PROCESSOR_PENTIUM4:
1412 case PROCESSOR_NOCONA:
1413 case PROCESSOR_CORE:
1414 case PROCESSOR_CORE2:
1415 case PROCESSOR_COREI7:
1416 case PROCESSOR_L1OM:
1417 case PROCESSOR_K1OM:
1418 case PROCESSOR_GENERIC64:
1419 case PROCESSOR_K6:
1420 case PROCESSOR_ATHLON:
1421 case PROCESSOR_K8:
1422 case PROCESSOR_AMDFAM10:
1423 case PROCESSOR_BD:
1424 case PROCESSOR_ZNVER:
1425 case PROCESSOR_BT:
1426 patt = alt_patt;
1427 break;
1428 case PROCESSOR_I386:
1429 case PROCESSOR_I486:
1430 case PROCESSOR_PENTIUM:
1431 case PROCESSOR_PENTIUMPRO:
1432 case PROCESSOR_IAMCU:
1433 case PROCESSOR_GENERIC32:
1434 patt = f32_patt;
1435 break;
1438 else
1440 switch (fragP->tc_frag_data.tune)
1442 case PROCESSOR_UNKNOWN:
1443 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1444 PROCESSOR_UNKNOWN. */
1445 abort ();
1446 break;
1448 case PROCESSOR_I386:
1449 case PROCESSOR_I486:
1450 case PROCESSOR_PENTIUM:
1451 case PROCESSOR_IAMCU:
1452 case PROCESSOR_K6:
1453 case PROCESSOR_ATHLON:
1454 case PROCESSOR_K8:
1455 case PROCESSOR_AMDFAM10:
1456 case PROCESSOR_BD:
1457 case PROCESSOR_ZNVER:
1458 case PROCESSOR_BT:
1459 case PROCESSOR_GENERIC32:
1460 /* We use cpu_arch_isa_flags to check if we CAN optimize
1461 with nops. */
1462 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1463 patt = alt_patt;
1464 else
1465 patt = f32_patt;
1466 break;
1467 case PROCESSOR_PENTIUMPRO:
1468 case PROCESSOR_PENTIUM4:
1469 case PROCESSOR_NOCONA:
1470 case PROCESSOR_CORE:
1471 case PROCESSOR_CORE2:
1472 case PROCESSOR_COREI7:
1473 case PROCESSOR_L1OM:
1474 case PROCESSOR_K1OM:
1475 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1476 patt = alt_patt;
1477 else
1478 patt = f32_patt;
1479 break;
1480 case PROCESSOR_GENERIC64:
1481 patt = alt_patt;
1482 break;
1486 if (patt == f32_patt)
1488 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1489 /* Limit number of NOPs to 2 for older processors. */
1490 max_number_of_nops = 2;
1492 else
1494 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1495 /* Limit number of NOPs to 7 for newer processors. */
1496 max_number_of_nops = 7;
1500 if (limit == 0)
1501 limit = max_single_nop_size;
1503 if (fragP->fr_type == rs_fill_nop)
1505 /* Output NOPs for .nop directive. */
1506 if (limit > max_single_nop_size)
1508 as_bad_where (fragP->fr_file, fragP->fr_line,
1509 _("invalid single nop size: %d "
1510 "(expect within [0, %d])"),
1511 limit, max_single_nop_size);
1512 return;
1515 else
1516 fragP->fr_var = count;
1518 if ((count / max_single_nop_size) > max_number_of_nops)
1520 /* Generate jump over NOPs. */
1521 offsetT disp = count - 2;
1522 if (fits_in_imm7 (disp))
1524 /* Use "jmp disp8" if possible. */
1525 count = disp;
1526 where[0] = jump_disp8[0];
1527 where[1] = count;
1528 where += 2;
1530 else
1532 unsigned int size_of_jump;
1534 if (flag_code == CODE_16BIT)
1536 where[0] = jump16_disp32[0];
1537 where[1] = jump16_disp32[1];
1538 size_of_jump = 2;
1540 else
1542 where[0] = jump32_disp32[0];
1543 size_of_jump = 1;
1546 count -= size_of_jump + 4;
1547 if (!fits_in_imm31 (count))
1549 as_bad_where (fragP->fr_file, fragP->fr_line,
1550 _("jump over nop padding out of range"));
1551 return;
1554 md_number_to_chars (where + size_of_jump, count, 4);
1555 where += size_of_jump + 4;
1559 /* Generate multiple NOPs. */
1560 i386_output_nops (where, patt, count, limit);
1563 static INLINE int
1564 operand_type_all_zero (const union i386_operand_type *x)
1566 switch (ARRAY_SIZE(x->array))
1568 case 3:
1569 if (x->array[2])
1570 return 0;
1571 /* Fall through. */
1572 case 2:
1573 if (x->array[1])
1574 return 0;
1575 /* Fall through. */
1576 case 1:
1577 return !x->array[0];
1578 default:
1579 abort ();
1583 static INLINE void
1584 operand_type_set (union i386_operand_type *x, unsigned int v)
1586 switch (ARRAY_SIZE(x->array))
1588 case 3:
1589 x->array[2] = v;
1590 /* Fall through. */
1591 case 2:
1592 x->array[1] = v;
1593 /* Fall through. */
1594 case 1:
1595 x->array[0] = v;
1596 /* Fall through. */
1597 break;
1598 default:
1599 abort ();
1603 static INLINE int
1604 operand_type_equal (const union i386_operand_type *x,
1605 const union i386_operand_type *y)
1607 switch (ARRAY_SIZE(x->array))
1609 case 3:
1610 if (x->array[2] != y->array[2])
1611 return 0;
1612 /* Fall through. */
1613 case 2:
1614 if (x->array[1] != y->array[1])
1615 return 0;
1616 /* Fall through. */
1617 case 1:
1618 return x->array[0] == y->array[0];
1619 break;
1620 default:
1621 abort ();
1625 static INLINE int
1626 cpu_flags_all_zero (const union i386_cpu_flags *x)
1628 switch (ARRAY_SIZE(x->array))
1630 case 4:
1631 if (x->array[3])
1632 return 0;
1633 /* Fall through. */
1634 case 3:
1635 if (x->array[2])
1636 return 0;
1637 /* Fall through. */
1638 case 2:
1639 if (x->array[1])
1640 return 0;
1641 /* Fall through. */
1642 case 1:
1643 return !x->array[0];
1644 default:
1645 abort ();
1649 static INLINE int
1650 cpu_flags_equal (const union i386_cpu_flags *x,
1651 const union i386_cpu_flags *y)
1653 switch (ARRAY_SIZE(x->array))
1655 case 4:
1656 if (x->array[3] != y->array[3])
1657 return 0;
1658 /* Fall through. */
1659 case 3:
1660 if (x->array[2] != y->array[2])
1661 return 0;
1662 /* Fall through. */
1663 case 2:
1664 if (x->array[1] != y->array[1])
1665 return 0;
1666 /* Fall through. */
1667 case 1:
1668 return x->array[0] == y->array[0];
1669 break;
1670 default:
1671 abort ();
1675 static INLINE int
1676 cpu_flags_check_cpu64 (i386_cpu_flags f)
1678 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1679 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1682 static INLINE i386_cpu_flags
1683 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1685 switch (ARRAY_SIZE (x.array))
1687 case 4:
1688 x.array [3] &= y.array [3];
1689 /* Fall through. */
1690 case 3:
1691 x.array [2] &= y.array [2];
1692 /* Fall through. */
1693 case 2:
1694 x.array [1] &= y.array [1];
1695 /* Fall through. */
1696 case 1:
1697 x.array [0] &= y.array [0];
1698 break;
1699 default:
1700 abort ();
1702 return x;
1705 static INLINE i386_cpu_flags
1706 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1708 switch (ARRAY_SIZE (x.array))
1710 case 4:
1711 x.array [3] |= y.array [3];
1712 /* Fall through. */
1713 case 3:
1714 x.array [2] |= y.array [2];
1715 /* Fall through. */
1716 case 2:
1717 x.array [1] |= y.array [1];
1718 /* Fall through. */
1719 case 1:
1720 x.array [0] |= y.array [0];
1721 break;
1722 default:
1723 abort ();
1725 return x;
1728 static INLINE i386_cpu_flags
1729 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1731 switch (ARRAY_SIZE (x.array))
1733 case 4:
1734 x.array [3] &= ~y.array [3];
1735 /* Fall through. */
1736 case 3:
1737 x.array [2] &= ~y.array [2];
1738 /* Fall through. */
1739 case 2:
1740 x.array [1] &= ~y.array [1];
1741 /* Fall through. */
1742 case 1:
1743 x.array [0] &= ~y.array [0];
1744 break;
1745 default:
1746 abort ();
1748 return x;
1751 #define CPU_FLAGS_ARCH_MATCH 0x1
1752 #define CPU_FLAGS_64BIT_MATCH 0x2
1754 #define CPU_FLAGS_PERFECT_MATCH \
1755 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1757 /* Return CPU flags match bits. */
1759 static int
1760 cpu_flags_match (const insn_template *t)
1762 i386_cpu_flags x = t->cpu_flags;
1763 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1765 x.bitfield.cpu64 = 0;
1766 x.bitfield.cpuno64 = 0;
1768 if (cpu_flags_all_zero (&x))
1770 /* This instruction is available on all archs. */
1771 match |= CPU_FLAGS_ARCH_MATCH;
1773 else
1775 /* This instruction is available only on some archs. */
1776 i386_cpu_flags cpu = cpu_arch_flags;
1778 /* AVX512VL is no standalone feature - match it and then strip it. */
1779 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1780 return match;
1781 x.bitfield.cpuavx512vl = 0;
1783 cpu = cpu_flags_and (x, cpu);
1784 if (!cpu_flags_all_zero (&cpu))
1786 if (x.bitfield.cpuavx)
1788 /* We need to check a few extra flags with AVX. */
1789 if (cpu.bitfield.cpuavx
1790 && (!t->opcode_modifier.sse2avx || sse2avx)
1791 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1792 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1793 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1794 match |= CPU_FLAGS_ARCH_MATCH;
1796 else if (x.bitfield.cpuavx512f)
1798 /* We need to check a few extra flags with AVX512F. */
1799 if (cpu.bitfield.cpuavx512f
1800 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1801 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1802 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1803 match |= CPU_FLAGS_ARCH_MATCH;
1805 else
1806 match |= CPU_FLAGS_ARCH_MATCH;
1809 return match;
1812 static INLINE i386_operand_type
1813 operand_type_and (i386_operand_type x, i386_operand_type y)
1815 switch (ARRAY_SIZE (x.array))
1817 case 3:
1818 x.array [2] &= y.array [2];
1819 /* Fall through. */
1820 case 2:
1821 x.array [1] &= y.array [1];
1822 /* Fall through. */
1823 case 1:
1824 x.array [0] &= y.array [0];
1825 break;
1826 default:
1827 abort ();
1829 return x;
1832 static INLINE i386_operand_type
1833 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1835 switch (ARRAY_SIZE (x.array))
1837 case 3:
1838 x.array [2] &= ~y.array [2];
1839 /* Fall through. */
1840 case 2:
1841 x.array [1] &= ~y.array [1];
1842 /* Fall through. */
1843 case 1:
1844 x.array [0] &= ~y.array [0];
1845 break;
1846 default:
1847 abort ();
1849 return x;
1852 static INLINE i386_operand_type
1853 operand_type_or (i386_operand_type x, i386_operand_type y)
1855 switch (ARRAY_SIZE (x.array))
1857 case 3:
1858 x.array [2] |= y.array [2];
1859 /* Fall through. */
1860 case 2:
1861 x.array [1] |= y.array [1];
1862 /* Fall through. */
1863 case 1:
1864 x.array [0] |= y.array [0];
1865 break;
1866 default:
1867 abort ();
1869 return x;
1872 static INLINE i386_operand_type
1873 operand_type_xor (i386_operand_type x, i386_operand_type y)
1875 switch (ARRAY_SIZE (x.array))
1877 case 3:
1878 x.array [2] ^= y.array [2];
1879 /* Fall through. */
1880 case 2:
1881 x.array [1] ^= y.array [1];
1882 /* Fall through. */
1883 case 1:
1884 x.array [0] ^= y.array [0];
1885 break;
1886 default:
1887 abort ();
1889 return x;
1892 static const i386_operand_type acc32 = OPERAND_TYPE_ACC32;
1893 static const i386_operand_type acc64 = OPERAND_TYPE_ACC64;
1894 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
1895 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
1896 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
1897 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
1898 static const i386_operand_type anydisp
1899 = OPERAND_TYPE_ANYDISP;
1900 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
1901 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
1902 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
1903 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
1904 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
1905 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
1906 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
1907 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
1908 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
1909 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
1910 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
1911 static const i386_operand_type vec_imm4 = OPERAND_TYPE_VEC_IMM4;
/* Operand classes that operand_type_check can test for.  */
enum operand_type
{
  reg,		/* The reg bit.  */
  imm,		/* Any immediate size.  */
  disp,		/* Any displacement size.  */
  anymem	/* Any displacement size or baseindex.  */
};

1921 static INLINE int
1922 operand_type_check (i386_operand_type t, enum operand_type c)
1924 switch (c)
1926 case reg:
1927 return t.bitfield.reg;
1929 case imm:
1930 return (t.bitfield.imm8
1931 || t.bitfield.imm8s
1932 || t.bitfield.imm16
1933 || t.bitfield.imm32
1934 || t.bitfield.imm32s
1935 || t.bitfield.imm64);
1937 case disp:
1938 return (t.bitfield.disp8
1939 || t.bitfield.disp16
1940 || t.bitfield.disp32
1941 || t.bitfield.disp32s
1942 || t.bitfield.disp64);
1944 case anymem:
1945 return (t.bitfield.disp8
1946 || t.bitfield.disp16
1947 || t.bitfield.disp32
1948 || t.bitfield.disp32s
1949 || t.bitfield.disp64
1950 || t.bitfield.baseindex);
1952 default:
1953 abort ();
1956 return 0;
1959 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
1960 between operand GIVEN and opeand WANTED for instruction template T. */
1962 static INLINE int
1963 match_operand_size (const insn_template *t, unsigned int wanted,
1964 unsigned int given)
1966 return !((i.types[given].bitfield.byte
1967 && !t->operand_types[wanted].bitfield.byte)
1968 || (i.types[given].bitfield.word
1969 && !t->operand_types[wanted].bitfield.word)
1970 || (i.types[given].bitfield.dword
1971 && !t->operand_types[wanted].bitfield.dword)
1972 || (i.types[given].bitfield.qword
1973 && !t->operand_types[wanted].bitfield.qword)
1974 || (i.types[given].bitfield.tbyte
1975 && !t->operand_types[wanted].bitfield.tbyte));
1978 /* Return 1 if there is no conflict in SIMD register between operand
1979 GIVEN and opeand WANTED for instruction template T. */
1981 static INLINE int
1982 match_simd_size (const insn_template *t, unsigned int wanted,
1983 unsigned int given)
1985 return !((i.types[given].bitfield.xmmword
1986 && !t->operand_types[wanted].bitfield.xmmword)
1987 || (i.types[given].bitfield.ymmword
1988 && !t->operand_types[wanted].bitfield.ymmword)
1989 || (i.types[given].bitfield.zmmword
1990 && !t->operand_types[wanted].bitfield.zmmword));
1993 /* Return 1 if there is no conflict in any size between operand GIVEN
1994 and opeand WANTED for instruction template T. */
1996 static INLINE int
1997 match_mem_size (const insn_template *t, unsigned int wanted,
1998 unsigned int given)
2000 return (match_operand_size (t, wanted, given)
2001 && !((i.types[given].bitfield.unspecified
2002 && !i.broadcast
2003 && !t->operand_types[wanted].bitfield.unspecified)
2004 || (i.types[given].bitfield.fword
2005 && !t->operand_types[wanted].bitfield.fword)
2006 /* For scalar opcode templates to allow register and memory
2007 operands at the same time, some special casing is needed
2008 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2009 down-conversion vpmov*. */
2010 || ((t->operand_types[wanted].bitfield.regsimd
2011 && !t->opcode_modifier.broadcast
2012 && (t->operand_types[wanted].bitfield.byte
2013 || t->operand_types[wanted].bitfield.word
2014 || t->operand_types[wanted].bitfield.dword
2015 || t->operand_types[wanted].bitfield.qword))
2016 ? (i.types[given].bitfield.xmmword
2017 || i.types[given].bitfield.ymmword
2018 || i.types[given].bitfield.zmmword)
2019 : !match_simd_size(t, wanted, given))));
2022 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2023 operands for instruction template T, and it has MATCH_REVERSE set if there
2024 is no size conflict on any operands for the template with operands reversed
2025 (and the template allows for reversing in the first place). */
2027 #define MATCH_STRAIGHT 1
2028 #define MATCH_REVERSE 2
2030 static INLINE unsigned int
2031 operand_size_match (const insn_template *t)
2033 unsigned int j, match = MATCH_STRAIGHT;
2035 /* Don't check jump instructions. */
2036 if (t->opcode_modifier.jump
2037 || t->opcode_modifier.jumpbyte
2038 || t->opcode_modifier.jumpdword
2039 || t->opcode_modifier.jumpintersegment)
2040 return match;
2042 /* Check memory and accumulator operand size. */
2043 for (j = 0; j < i.operands; j++)
2045 if (!i.types[j].bitfield.reg && !i.types[j].bitfield.regsimd
2046 && t->operand_types[j].bitfield.anysize)
2047 continue;
2049 if (t->operand_types[j].bitfield.reg
2050 && !match_operand_size (t, j, j))
2052 match = 0;
2053 break;
2056 if (t->operand_types[j].bitfield.regsimd
2057 && !match_simd_size (t, j, j))
2059 match = 0;
2060 break;
2063 if (t->operand_types[j].bitfield.acc
2064 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2066 match = 0;
2067 break;
2070 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2072 match = 0;
2073 break;
2077 if (!t->opcode_modifier.d)
2079 mismatch:
2080 if (!match)
2081 i.error = operand_size_mismatch;
2082 return match;
2085 /* Check reverse. */
2086 gas_assert (i.operands >= 2 && i.operands <= 3);
2088 for (j = 0; j < i.operands; j++)
2090 unsigned int given = i.operands - j - 1;
2092 if (t->operand_types[j].bitfield.reg
2093 && !match_operand_size (t, j, given))
2094 goto mismatch;
2096 if (t->operand_types[j].bitfield.regsimd
2097 && !match_simd_size (t, j, given))
2098 goto mismatch;
2100 if (t->operand_types[j].bitfield.acc
2101 && (!match_operand_size (t, j, given)
2102 || !match_simd_size (t, j, given)))
2103 goto mismatch;
2105 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2106 goto mismatch;
2109 return match | MATCH_REVERSE;
2112 static INLINE int
2113 operand_type_match (i386_operand_type overlap,
2114 i386_operand_type given)
2116 i386_operand_type temp = overlap;
2118 temp.bitfield.jumpabsolute = 0;
2119 temp.bitfield.unspecified = 0;
2120 temp.bitfield.byte = 0;
2121 temp.bitfield.word = 0;
2122 temp.bitfield.dword = 0;
2123 temp.bitfield.fword = 0;
2124 temp.bitfield.qword = 0;
2125 temp.bitfield.tbyte = 0;
2126 temp.bitfield.xmmword = 0;
2127 temp.bitfield.ymmword = 0;
2128 temp.bitfield.zmmword = 0;
2129 if (operand_type_all_zero (&temp))
2130 goto mismatch;
2132 if (given.bitfield.baseindex == overlap.bitfield.baseindex
2133 && given.bitfield.jumpabsolute == overlap.bitfield.jumpabsolute)
2134 return 1;
2136 mismatch:
2137 i.error = operand_type_mismatch;
2138 return 0;
2141 /* If given types g0 and g1 are registers they must be of the same type
2142 unless the expected operand type register overlap is null.
2143 Memory operand size of certain SIMD instructions is also being checked
2144 here. */
2146 static INLINE int
2147 operand_type_register_match (i386_operand_type g0,
2148 i386_operand_type t0,
2149 i386_operand_type g1,
2150 i386_operand_type t1)
2152 if (!g0.bitfield.reg
2153 && !g0.bitfield.regsimd
2154 && (!operand_type_check (g0, anymem)
2155 || g0.bitfield.unspecified
2156 || !t0.bitfield.regsimd))
2157 return 1;
2159 if (!g1.bitfield.reg
2160 && !g1.bitfield.regsimd
2161 && (!operand_type_check (g1, anymem)
2162 || g1.bitfield.unspecified
2163 || !t1.bitfield.regsimd))
2164 return 1;
2166 if (g0.bitfield.byte == g1.bitfield.byte
2167 && g0.bitfield.word == g1.bitfield.word
2168 && g0.bitfield.dword == g1.bitfield.dword
2169 && g0.bitfield.qword == g1.bitfield.qword
2170 && g0.bitfield.xmmword == g1.bitfield.xmmword
2171 && g0.bitfield.ymmword == g1.bitfield.ymmword
2172 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2173 return 1;
2175 if (!(t0.bitfield.byte & t1.bitfield.byte)
2176 && !(t0.bitfield.word & t1.bitfield.word)
2177 && !(t0.bitfield.dword & t1.bitfield.dword)
2178 && !(t0.bitfield.qword & t1.bitfield.qword)
2179 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2180 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2181 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2182 return 1;
2184 i.error = register_type_mismatch;
2186 return 0;
2189 static INLINE unsigned int
2190 register_number (const reg_entry *r)
2192 unsigned int nr = r->reg_num;
2194 if (r->reg_flags & RegRex)
2195 nr += 8;
2197 if (r->reg_flags & RegVRex)
2198 nr += 16;
2200 return nr;
2203 static INLINE unsigned int
2204 mode_from_disp_size (i386_operand_type t)
2206 if (t.bitfield.disp8)
2207 return 1;
2208 else if (t.bitfield.disp16
2209 || t.bitfield.disp32
2210 || t.bitfield.disp32s)
2211 return 2;
2212 else
2213 return 0;
2216 static INLINE int
2217 fits_in_signed_byte (addressT num)
2219 return num + 0x80 <= 0xff;
2222 static INLINE int
2223 fits_in_unsigned_byte (addressT num)
2225 return num <= 0xff;
2228 static INLINE int
2229 fits_in_unsigned_word (addressT num)
2231 return num <= 0xffff;
2234 static INLINE int
2235 fits_in_signed_word (addressT num)
2237 return num + 0x8000 <= 0xffff;
2240 static INLINE int
2241 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2243 #ifndef BFD64
2244 return 1;
2245 #else
2246 return num + 0x80000000 <= 0xffffffff;
2247 #endif
2248 } /* fits_in_signed_long() */
2250 static INLINE int
2251 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2253 #ifndef BFD64
2254 return 1;
2255 #else
2256 return num <= 0xffffffff;
2257 #endif
2258 } /* fits_in_unsigned_long() */
2260 static INLINE int
2261 fits_in_disp8 (offsetT num)
2263 int shift = i.memshift;
2264 unsigned int mask;
2266 if (shift == -1)
2267 abort ();
2269 mask = (1 << shift) - 1;
2271 /* Return 0 if NUM isn't properly aligned. */
2272 if ((num & mask))
2273 return 0;
2275 /* Check if NUM will fit in 8bit after shift. */
2276 return fits_in_signed_byte (num >> shift);
2279 static INLINE int
2280 fits_in_imm4 (offsetT num)
2282 return (num & 0xf) == num;
2285 static i386_operand_type
2286 smallest_imm_type (offsetT num)
2288 i386_operand_type t;
2290 operand_type_set (&t, 0);
2291 t.bitfield.imm64 = 1;
2293 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2295 /* This code is disabled on the 486 because all the Imm1 forms
2296 in the opcode table are slower on the i486. They're the
2297 versions with the implicitly specified single-position
2298 displacement, which has another syntax if you really want to
2299 use that form. */
2300 t.bitfield.imm1 = 1;
2301 t.bitfield.imm8 = 1;
2302 t.bitfield.imm8s = 1;
2303 t.bitfield.imm16 = 1;
2304 t.bitfield.imm32 = 1;
2305 t.bitfield.imm32s = 1;
2307 else if (fits_in_signed_byte (num))
2309 t.bitfield.imm8 = 1;
2310 t.bitfield.imm8s = 1;
2311 t.bitfield.imm16 = 1;
2312 t.bitfield.imm32 = 1;
2313 t.bitfield.imm32s = 1;
2315 else if (fits_in_unsigned_byte (num))
2317 t.bitfield.imm8 = 1;
2318 t.bitfield.imm16 = 1;
2319 t.bitfield.imm32 = 1;
2320 t.bitfield.imm32s = 1;
2322 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2324 t.bitfield.imm16 = 1;
2325 t.bitfield.imm32 = 1;
2326 t.bitfield.imm32s = 1;
2328 else if (fits_in_signed_long (num))
2330 t.bitfield.imm32 = 1;
2331 t.bitfield.imm32s = 1;
2333 else if (fits_in_unsigned_long (num))
2334 t.bitfield.imm32 = 1;
2336 return t;
2339 static offsetT
2340 offset_in_range (offsetT val, int size)
2342 addressT mask;
2344 switch (size)
2346 case 1: mask = ((addressT) 1 << 8) - 1; break;
2347 case 2: mask = ((addressT) 1 << 16) - 1; break;
2348 case 4: mask = ((addressT) 2 << 31) - 1; break;
2349 #ifdef BFD64
2350 case 8: mask = ((addressT) 2 << 63) - 1; break;
2351 #endif
2352 default: abort ();
2355 #ifdef BFD64
2356 /* If BFD64, sign extend val for 32bit address mode. */
2357 if (flag_code != CODE_64BIT
2358 || i.prefix[ADDR_PREFIX])
2359 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2360 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2361 #endif
2363 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2365 char buf1[40], buf2[40];
2367 sprint_value (buf1, val);
2368 sprint_value (buf2, val & mask);
2369 as_warn (_("%s shortened to %s"), buf1, buf2);
2371 return val & mask;
/* Result codes of add_prefix.  PREFIX_EXIST must stay zero: add_prefix
   tests its result for truth to tell "added" from "already present".  */
enum PREFIX_GROUP
{
  PREFIX_EXIST = 0,     /* A prefix of the same class was already set.  */
  PREFIX_LOCK,          /* A lock prefix was added.  */
  PREFIX_REP,           /* A rep/repne prefix was added.  */
  PREFIX_DS,            /* A ds prefix was added.  */
  PREFIX_OTHER          /* Some other prefix was added.  */
};
2383 /* Returns
2384 a. PREFIX_EXIST if attempting to add a prefix where one from the
2385 same class already exists.
2386 b. PREFIX_LOCK if lock prefix is added.
2387 c. PREFIX_REP if rep/repne prefix is added.
2388 d. PREFIX_DS if ds prefix is added.
2389 e. PREFIX_OTHER if other prefix is added.
2392 static enum PREFIX_GROUP
2393 add_prefix (unsigned int prefix)
2395 enum PREFIX_GROUP ret = PREFIX_OTHER;
2396 unsigned int q;
2398 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2399 && flag_code == CODE_64BIT)
2401 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2402 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2403 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2404 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2405 ret = PREFIX_EXIST;
2406 q = REX_PREFIX;
2408 else
2410 switch (prefix)
2412 default:
2413 abort ();
2415 case DS_PREFIX_OPCODE:
2416 ret = PREFIX_DS;
2417 /* Fall through. */
2418 case CS_PREFIX_OPCODE:
2419 case ES_PREFIX_OPCODE:
2420 case FS_PREFIX_OPCODE:
2421 case GS_PREFIX_OPCODE:
2422 case SS_PREFIX_OPCODE:
2423 q = SEG_PREFIX;
2424 break;
2426 case REPNE_PREFIX_OPCODE:
2427 case REPE_PREFIX_OPCODE:
2428 q = REP_PREFIX;
2429 ret = PREFIX_REP;
2430 break;
2432 case LOCK_PREFIX_OPCODE:
2433 q = LOCK_PREFIX;
2434 ret = PREFIX_LOCK;
2435 break;
2437 case FWAIT_OPCODE:
2438 q = WAIT_PREFIX;
2439 break;
2441 case ADDR_PREFIX_OPCODE:
2442 q = ADDR_PREFIX;
2443 break;
2445 case DATA_PREFIX_OPCODE:
2446 q = DATA_PREFIX;
2447 break;
2449 if (i.prefix[q] != 0)
2450 ret = PREFIX_EXIST;
2453 if (ret)
2455 if (!i.prefix[q])
2456 ++i.prefixes;
2457 i.prefix[q] |= prefix;
2459 else
2460 as_bad (_("same type of prefix used twice"));
2462 return ret;
2465 static void
2466 update_code_flag (int value, int check)
2468 PRINTF_LIKE ((*as_error));
2470 flag_code = (enum flag_code) value;
2471 if (flag_code == CODE_64BIT)
2473 cpu_arch_flags.bitfield.cpu64 = 1;
2474 cpu_arch_flags.bitfield.cpuno64 = 0;
2476 else
2478 cpu_arch_flags.bitfield.cpu64 = 0;
2479 cpu_arch_flags.bitfield.cpuno64 = 1;
2481 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2483 if (check)
2484 as_error = as_fatal;
2485 else
2486 as_error = as_bad;
2487 (*as_error) (_("64bit mode not supported on `%s'."),
2488 cpu_arch_name ? cpu_arch_name : default_arch);
2490 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2492 if (check)
2493 as_error = as_fatal;
2494 else
2495 as_error = as_bad;
2496 (*as_error) (_("32bit mode not supported on `%s'."),
2497 cpu_arch_name ? cpu_arch_name : default_arch);
2499 stackop_size = '\0';
/* Switch to code size VALUE via update_code_flag, with CHECK == 0 so
   that an unsupported mode is reported with as_bad, not as_fatal.  */

static void
set_code_flag (int value)
{
  const int fatal_on_error = 0;

  update_code_flag (value, fatal_on_error);
}
2508 static void
2509 set_16bit_gcc_code_flag (int new_code_flag)
2511 flag_code = (enum flag_code) new_code_flag;
2512 if (flag_code != CODE_16BIT)
2513 abort ();
2514 cpu_arch_flags.bitfield.cpu64 = 0;
2515 cpu_arch_flags.bitfield.cpuno64 = 1;
2516 stackop_size = LONG_MNEM_SUFFIX;
2519 static void
2520 set_intel_syntax (int syntax_flag)
2522 /* Find out if register prefixing is specified. */
2523 int ask_naked_reg = 0;
2525 SKIP_WHITESPACE ();
2526 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2528 char *string;
2529 int e = get_symbol_name (&string);
2531 if (strcmp (string, "prefix") == 0)
2532 ask_naked_reg = 1;
2533 else if (strcmp (string, "noprefix") == 0)
2534 ask_naked_reg = -1;
2535 else
2536 as_bad (_("bad argument to syntax directive."));
2537 (void) restore_line_pointer (e);
2539 demand_empty_rest_of_line ();
2541 intel_syntax = syntax_flag;
2543 if (ask_naked_reg == 0)
2544 allow_naked_reg = (intel_syntax
2545 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2546 else
2547 allow_naked_reg = (ask_naked_reg < 0);
2549 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2551 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2552 identifier_chars['$'] = intel_syntax ? '$' : 0;
2553 register_prefix = allow_naked_reg ? "" : "%";
2556 static void
2557 set_intel_mnemonic (int mnemonic_flag)
2559 intel_mnemonic = mnemonic_flag;
2562 static void
2563 set_allow_index_reg (int flag)
2565 allow_index_reg = flag;
2568 static void
2569 set_check (int what)
2571 enum check_kind *kind;
2572 const char *str;
2574 if (what)
2576 kind = &operand_check;
2577 str = "operand";
2579 else
2581 kind = &sse_check;
2582 str = "sse";
2585 SKIP_WHITESPACE ();
2587 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2589 char *string;
2590 int e = get_symbol_name (&string);
2592 if (strcmp (string, "none") == 0)
2593 *kind = check_none;
2594 else if (strcmp (string, "warning") == 0)
2595 *kind = check_warning;
2596 else if (strcmp (string, "error") == 0)
2597 *kind = check_error;
2598 else
2599 as_bad (_("bad argument to %s_check directive."), str);
2600 (void) restore_line_pointer (e);
2602 else
2603 as_bad (_("missing argument for %s_check directive"), str);
2605 demand_empty_rest_of_line ();
2608 static void
2609 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2610 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2612 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2613 static const char *arch;
2615 /* Intel LIOM is only supported on ELF. */
2616 if (!IS_ELF)
2617 return;
2619 if (!arch)
2621 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2622 use default_arch. */
2623 arch = cpu_arch_name;
2624 if (!arch)
2625 arch = default_arch;
2628 /* If we are targeting Intel MCU, we must enable it. */
2629 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2630 || new_flag.bitfield.cpuiamcu)
2631 return;
2633 /* If we are targeting Intel L1OM, we must enable it. */
2634 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2635 || new_flag.bitfield.cpul1om)
2636 return;
2638 /* If we are targeting Intel K1OM, we must enable it. */
2639 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2640 || new_flag.bitfield.cpuk1om)
2641 return;
2643 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2644 #endif
2647 static void
2648 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2650 SKIP_WHITESPACE ();
2652 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2654 char *string;
2655 int e = get_symbol_name (&string);
2656 unsigned int j;
2657 i386_cpu_flags flags;
2659 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2661 if (strcmp (string, cpu_arch[j].name) == 0)
2663 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2665 if (*string != '.')
2667 cpu_arch_name = cpu_arch[j].name;
2668 cpu_sub_arch_name = NULL;
2669 cpu_arch_flags = cpu_arch[j].flags;
2670 if (flag_code == CODE_64BIT)
2672 cpu_arch_flags.bitfield.cpu64 = 1;
2673 cpu_arch_flags.bitfield.cpuno64 = 0;
2675 else
2677 cpu_arch_flags.bitfield.cpu64 = 0;
2678 cpu_arch_flags.bitfield.cpuno64 = 1;
2680 cpu_arch_isa = cpu_arch[j].type;
2681 cpu_arch_isa_flags = cpu_arch[j].flags;
2682 if (!cpu_arch_tune_set)
2684 cpu_arch_tune = cpu_arch_isa;
2685 cpu_arch_tune_flags = cpu_arch_isa_flags;
2687 break;
2690 flags = cpu_flags_or (cpu_arch_flags,
2691 cpu_arch[j].flags);
2693 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2695 if (cpu_sub_arch_name)
2697 char *name = cpu_sub_arch_name;
2698 cpu_sub_arch_name = concat (name,
2699 cpu_arch[j].name,
2700 (const char *) NULL);
2701 free (name);
2703 else
2704 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2705 cpu_arch_flags = flags;
2706 cpu_arch_isa_flags = flags;
2708 else
2709 cpu_arch_isa_flags
2710 = cpu_flags_or (cpu_arch_isa_flags,
2711 cpu_arch[j].flags);
2712 (void) restore_line_pointer (e);
2713 demand_empty_rest_of_line ();
2714 return;
2718 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2720 /* Disable an ISA extension. */
2721 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2722 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2724 flags = cpu_flags_and_not (cpu_arch_flags,
2725 cpu_noarch[j].flags);
2726 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2728 if (cpu_sub_arch_name)
2730 char *name = cpu_sub_arch_name;
2731 cpu_sub_arch_name = concat (name, string,
2732 (const char *) NULL);
2733 free (name);
2735 else
2736 cpu_sub_arch_name = xstrdup (string);
2737 cpu_arch_flags = flags;
2738 cpu_arch_isa_flags = flags;
2740 (void) restore_line_pointer (e);
2741 demand_empty_rest_of_line ();
2742 return;
2745 j = ARRAY_SIZE (cpu_arch);
2748 if (j >= ARRAY_SIZE (cpu_arch))
2749 as_bad (_("no such architecture: `%s'"), string);
2751 *input_line_pointer = e;
2753 else
2754 as_bad (_("missing cpu architecture"));
2756 no_cond_jump_promotion = 0;
2757 if (*input_line_pointer == ','
2758 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2760 char *string;
2761 char e;
2763 ++input_line_pointer;
2764 e = get_symbol_name (&string);
2766 if (strcmp (string, "nojumps") == 0)
2767 no_cond_jump_promotion = 1;
2768 else if (strcmp (string, "jumps") == 0)
2770 else
2771 as_bad (_("no such architecture modifier: `%s'"), string);
2773 (void) restore_line_pointer (e);
2776 demand_empty_rest_of_line ();
2779 enum bfd_architecture
2780 i386_arch (void)
2782 if (cpu_arch_isa == PROCESSOR_L1OM)
2784 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2785 || flag_code != CODE_64BIT)
2786 as_fatal (_("Intel L1OM is 64bit ELF only"));
2787 return bfd_arch_l1om;
2789 else if (cpu_arch_isa == PROCESSOR_K1OM)
2791 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2792 || flag_code != CODE_64BIT)
2793 as_fatal (_("Intel K1OM is 64bit ELF only"));
2794 return bfd_arch_k1om;
2796 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2798 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2799 || flag_code == CODE_64BIT)
2800 as_fatal (_("Intel MCU is 32bit ELF only"));
2801 return bfd_arch_iamcu;
2803 else
2804 return bfd_arch_i386;
2807 unsigned long
2808 i386_mach (void)
2810 if (!strncmp (default_arch, "x86_64", 6))
2812 if (cpu_arch_isa == PROCESSOR_L1OM)
2814 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2815 || default_arch[6] != '\0')
2816 as_fatal (_("Intel L1OM is 64bit ELF only"));
2817 return bfd_mach_l1om;
2819 else if (cpu_arch_isa == PROCESSOR_K1OM)
2821 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2822 || default_arch[6] != '\0')
2823 as_fatal (_("Intel K1OM is 64bit ELF only"));
2824 return bfd_mach_k1om;
2826 else if (default_arch[6] == '\0')
2827 return bfd_mach_x86_64;
2828 else
2829 return bfd_mach_x64_32;
2831 else if (!strcmp (default_arch, "i386")
2832 || !strcmp (default_arch, "iamcu"))
2834 if (cpu_arch_isa == PROCESSOR_IAMCU)
2836 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2837 as_fatal (_("Intel MCU is 32bit ELF only"));
2838 return bfd_mach_i386_iamcu;
2840 else
2841 return bfd_mach_i386_i386;
2843 else
2844 as_fatal (_("unknown architecture"));
2847 void
2848 md_begin (void)
2850 const char *hash_err;
2852 /* Support pseudo prefixes like {disp32}. */
2853 lex_type ['{'] = LEX_BEGIN_NAME;
2855 /* Initialize op_hash hash table. */
2856 op_hash = hash_new ();
2859 const insn_template *optab;
2860 templates *core_optab;
2862 /* Setup for loop. */
2863 optab = i386_optab;
2864 core_optab = XNEW (templates);
2865 core_optab->start = optab;
2867 while (1)
2869 ++optab;
2870 if (optab->name == NULL
2871 || strcmp (optab->name, (optab - 1)->name) != 0)
2873 /* different name --> ship out current template list;
2874 add to hash table; & begin anew. */
2875 core_optab->end = optab;
2876 hash_err = hash_insert (op_hash,
2877 (optab - 1)->name,
2878 (void *) core_optab);
2879 if (hash_err)
2881 as_fatal (_("can't hash %s: %s"),
2882 (optab - 1)->name,
2883 hash_err);
2885 if (optab->name == NULL)
2886 break;
2887 core_optab = XNEW (templates);
2888 core_optab->start = optab;
2893 /* Initialize reg_hash hash table. */
2894 reg_hash = hash_new ();
2896 const reg_entry *regtab;
2897 unsigned int regtab_size = i386_regtab_size;
2899 for (regtab = i386_regtab; regtab_size--; regtab++)
2901 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
2902 if (hash_err)
2903 as_fatal (_("can't hash %s: %s"),
2904 regtab->reg_name,
2905 hash_err);
2909 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
2911 int c;
2912 char *p;
2914 for (c = 0; c < 256; c++)
2916 if (ISDIGIT (c))
2918 digit_chars[c] = c;
2919 mnemonic_chars[c] = c;
2920 register_chars[c] = c;
2921 operand_chars[c] = c;
2923 else if (ISLOWER (c))
2925 mnemonic_chars[c] = c;
2926 register_chars[c] = c;
2927 operand_chars[c] = c;
2929 else if (ISUPPER (c))
2931 mnemonic_chars[c] = TOLOWER (c);
2932 register_chars[c] = mnemonic_chars[c];
2933 operand_chars[c] = c;
2935 else if (c == '{' || c == '}')
2937 mnemonic_chars[c] = c;
2938 operand_chars[c] = c;
2941 if (ISALPHA (c) || ISDIGIT (c))
2942 identifier_chars[c] = c;
2943 else if (c >= 128)
2945 identifier_chars[c] = c;
2946 operand_chars[c] = c;
2950 #ifdef LEX_AT
2951 identifier_chars['@'] = '@';
2952 #endif
2953 #ifdef LEX_QM
2954 identifier_chars['?'] = '?';
2955 operand_chars['?'] = '?';
2956 #endif
2957 digit_chars['-'] = '-';
2958 mnemonic_chars['_'] = '_';
2959 mnemonic_chars['-'] = '-';
2960 mnemonic_chars['.'] = '.';
2961 identifier_chars['_'] = '_';
2962 identifier_chars['.'] = '.';
2964 for (p = operand_special_chars; *p != '\0'; p++)
2965 operand_chars[(unsigned char) *p] = *p;
2968 if (flag_code == CODE_64BIT)
2970 #if defined (OBJ_COFF) && defined (TE_PE)
2971 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
2972 ? 32 : 16);
2973 #else
2974 x86_dwarf2_return_column = 16;
2975 #endif
2976 x86_cie_data_alignment = -8;
2978 else
2980 x86_dwarf2_return_column = 8;
2981 x86_cie_data_alignment = -4;
2985 void
2986 i386_print_statistics (FILE *file)
2988 hash_print_statistics (file, "i386 opcode", op_hash);
2989 hash_print_statistics (file, "i386 register", reg_hash);
2992 #ifdef DEBUG386
2994 /* Debugging routines for md_assemble. */
2995 static void pte (insn_template *);
2996 static void pt (i386_operand_type);
2997 static void pe (expressionS *);
2998 static void ps (symbolS *);
3000 static void
3001 pi (char *line, i386_insn *x)
3003 unsigned int j;
3005 fprintf (stdout, "%s: template ", line);
3006 pte (&x->tm);
3007 fprintf (stdout, " address: base %s index %s scale %x\n",
3008 x->base_reg ? x->base_reg->reg_name : "none",
3009 x->index_reg ? x->index_reg->reg_name : "none",
3010 x->log2_scale_factor);
3011 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3012 x->rm.mode, x->rm.reg, x->rm.regmem);
3013 fprintf (stdout, " sib: base %x index %x scale %x\n",
3014 x->sib.base, x->sib.index, x->sib.scale);
3015 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3016 (x->rex & REX_W) != 0,
3017 (x->rex & REX_R) != 0,
3018 (x->rex & REX_X) != 0,
3019 (x->rex & REX_B) != 0);
3020 for (j = 0; j < x->operands; j++)
3022 fprintf (stdout, " #%d: ", j + 1);
3023 pt (x->types[j]);
3024 fprintf (stdout, "\n");
3025 if (x->types[j].bitfield.reg
3026 || x->types[j].bitfield.regmmx
3027 || x->types[j].bitfield.regsimd
3028 || x->types[j].bitfield.sreg2
3029 || x->types[j].bitfield.sreg3
3030 || x->types[j].bitfield.control
3031 || x->types[j].bitfield.debug
3032 || x->types[j].bitfield.test)
3033 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3034 if (operand_type_check (x->types[j], imm))
3035 pe (x->op[j].imms);
3036 if (operand_type_check (x->types[j], disp))
3037 pe (x->op[j].disps);
3041 static void
3042 pte (insn_template *t)
3044 unsigned int j;
3045 fprintf (stdout, " %d operands ", t->operands);
3046 fprintf (stdout, "opcode %x ", t->base_opcode);
3047 if (t->extension_opcode != None)
3048 fprintf (stdout, "ext %x ", t->extension_opcode);
3049 if (t->opcode_modifier.d)
3050 fprintf (stdout, "D");
3051 if (t->opcode_modifier.w)
3052 fprintf (stdout, "W");
3053 fprintf (stdout, "\n");
3054 for (j = 0; j < t->operands; j++)
3056 fprintf (stdout, " #%d type ", j + 1);
3057 pt (t->operand_types[j]);
3058 fprintf (stdout, "\n");
3062 static void
3063 pe (expressionS *e)
3065 fprintf (stdout, " operation %d\n", e->X_op);
3066 fprintf (stdout, " add_number %ld (%lx)\n",
3067 (long) e->X_add_number, (long) e->X_add_number);
3068 if (e->X_add_symbol)
3070 fprintf (stdout, " add_symbol ");
3071 ps (e->X_add_symbol);
3072 fprintf (stdout, "\n");
3074 if (e->X_op_symbol)
3076 fprintf (stdout, " op_symbol ");
3077 ps (e->X_op_symbol);
3078 fprintf (stdout, "\n");
3082 static void
3083 ps (symbolS *s)
3085 fprintf (stdout, "%s type %s%s",
3086 S_GET_NAME (s),
3087 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3088 segment_name (S_GET_SEGMENT (s)));
3091 static struct type_name
3093 i386_operand_type mask;
3094 const char *name;
3096 const type_names[] =
3098 { OPERAND_TYPE_REG8, "r8" },
3099 { OPERAND_TYPE_REG16, "r16" },
3100 { OPERAND_TYPE_REG32, "r32" },
3101 { OPERAND_TYPE_REG64, "r64" },
3102 { OPERAND_TYPE_IMM8, "i8" },
3103 { OPERAND_TYPE_IMM8, "i8s" },
3104 { OPERAND_TYPE_IMM16, "i16" },
3105 { OPERAND_TYPE_IMM32, "i32" },
3106 { OPERAND_TYPE_IMM32S, "i32s" },
3107 { OPERAND_TYPE_IMM64, "i64" },
3108 { OPERAND_TYPE_IMM1, "i1" },
3109 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3110 { OPERAND_TYPE_DISP8, "d8" },
3111 { OPERAND_TYPE_DISP16, "d16" },
3112 { OPERAND_TYPE_DISP32, "d32" },
3113 { OPERAND_TYPE_DISP32S, "d32s" },
3114 { OPERAND_TYPE_DISP64, "d64" },
3115 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3116 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3117 { OPERAND_TYPE_CONTROL, "control reg" },
3118 { OPERAND_TYPE_TEST, "test reg" },
3119 { OPERAND_TYPE_DEBUG, "debug reg" },
3120 { OPERAND_TYPE_FLOATREG, "FReg" },
3121 { OPERAND_TYPE_FLOATACC, "FAcc" },
3122 { OPERAND_TYPE_SREG2, "SReg2" },
3123 { OPERAND_TYPE_SREG3, "SReg3" },
3124 { OPERAND_TYPE_ACC, "Acc" },
3125 { OPERAND_TYPE_JUMPABSOLUTE, "Jump Absolute" },
3126 { OPERAND_TYPE_REGMMX, "rMMX" },
3127 { OPERAND_TYPE_REGXMM, "rXMM" },
3128 { OPERAND_TYPE_REGYMM, "rYMM" },
3129 { OPERAND_TYPE_REGZMM, "rZMM" },
3130 { OPERAND_TYPE_REGMASK, "Mask reg" },
3131 { OPERAND_TYPE_ESSEG, "es" },
3134 static void
3135 pt (i386_operand_type t)
3137 unsigned int j;
3138 i386_operand_type a;
3140 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3142 a = operand_type_and (t, type_names[j].mask);
3143 if (!operand_type_all_zero (&a))
3144 fprintf (stdout, "%s, ", type_names[j].name);
3146 fflush (stdout);
3149 #endif /* DEBUG386 */
3151 static bfd_reloc_code_real_type
3152 reloc (unsigned int size,
3153 int pcrel,
3154 int sign,
3155 bfd_reloc_code_real_type other)
3157 if (other != NO_RELOC)
3159 reloc_howto_type *rel;
3161 if (size == 8)
3162 switch (other)
3164 case BFD_RELOC_X86_64_GOT32:
3165 return BFD_RELOC_X86_64_GOT64;
3166 break;
3167 case BFD_RELOC_X86_64_GOTPLT64:
3168 return BFD_RELOC_X86_64_GOTPLT64;
3169 break;
3170 case BFD_RELOC_X86_64_PLTOFF64:
3171 return BFD_RELOC_X86_64_PLTOFF64;
3172 break;
3173 case BFD_RELOC_X86_64_GOTPC32:
3174 other = BFD_RELOC_X86_64_GOTPC64;
3175 break;
3176 case BFD_RELOC_X86_64_GOTPCREL:
3177 other = BFD_RELOC_X86_64_GOTPCREL64;
3178 break;
3179 case BFD_RELOC_X86_64_TPOFF32:
3180 other = BFD_RELOC_X86_64_TPOFF64;
3181 break;
3182 case BFD_RELOC_X86_64_DTPOFF32:
3183 other = BFD_RELOC_X86_64_DTPOFF64;
3184 break;
3185 default:
3186 break;
3189 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3190 if (other == BFD_RELOC_SIZE32)
3192 if (size == 8)
3193 other = BFD_RELOC_SIZE64;
3194 if (pcrel)
3196 as_bad (_("there are no pc-relative size relocations"));
3197 return NO_RELOC;
3200 #endif
3202 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3203 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3204 sign = -1;
3206 rel = bfd_reloc_type_lookup (stdoutput, other);
3207 if (!rel)
3208 as_bad (_("unknown relocation (%u)"), other);
3209 else if (size != bfd_get_reloc_size (rel))
3210 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3211 bfd_get_reloc_size (rel),
3212 size);
3213 else if (pcrel && !rel->pc_relative)
3214 as_bad (_("non-pc-relative relocation for pc-relative field"));
3215 else if ((rel->complain_on_overflow == complain_overflow_signed
3216 && !sign)
3217 || (rel->complain_on_overflow == complain_overflow_unsigned
3218 && sign > 0))
3219 as_bad (_("relocated field and relocation type differ in signedness"));
3220 else
3221 return other;
3222 return NO_RELOC;
3225 if (pcrel)
3227 if (!sign)
3228 as_bad (_("there are no unsigned pc-relative relocations"));
3229 switch (size)
3231 case 1: return BFD_RELOC_8_PCREL;
3232 case 2: return BFD_RELOC_16_PCREL;
3233 case 4: return BFD_RELOC_32_PCREL;
3234 case 8: return BFD_RELOC_64_PCREL;
3236 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3238 else
3240 if (sign > 0)
3241 switch (size)
3243 case 4: return BFD_RELOC_X86_64_32S;
3245 else
3246 switch (size)
3248 case 1: return BFD_RELOC_8;
3249 case 2: return BFD_RELOC_16;
3250 case 4: return BFD_RELOC_32;
3251 case 8: return BFD_RELOC_64;
3253 as_bad (_("cannot do %s %u byte relocation"),
3254 sign > 0 ? "signed" : "unsigned", size);
3257 return NO_RELOC;
3260 /* Here we decide which fixups can be adjusted to make them relative to
3261 the beginning of the section instead of the symbol. Basically we need
3262 to make sure that the dynamic relocations are done correctly, so in
3263 some cases we force the original symbol to be used. */
3266 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3268 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3269 if (!IS_ELF)
3270 return 1;
3272 /* Don't adjust pc-relative references to merge sections in 64-bit
3273 mode. */
3274 if (use_rela_relocations
3275 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3276 && fixP->fx_pcrel)
3277 return 0;
3279 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3280 and changed later by validate_fix. */
3281 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3282 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3283 return 0;
3285 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3286 for size relocations. */
3287 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3288 || fixP->fx_r_type == BFD_RELOC_SIZE64
3289 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3290 || fixP->fx_r_type == BFD_RELOC_386_PLT32
3291 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3292 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3293 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3294 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3295 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3296 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3297 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3298 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3299 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3300 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3301 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3302 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3303 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
3304 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3305 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3306 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3307 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3308 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3309 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3310 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3311 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3312 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3313 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3314 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3315 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3316 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3317 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3318 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3319 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3320 return 0;
3321 #endif
3322 return 1;
/* Classify MNEMONIC for Intel-syntax operand handling.

   Returns 0 for a mnemonic that does not start with 'f' and for
   fxsave/fxrstor (not really math ops), 2 for the integer ops ("fi..."),
   3 for the control ops (fldcw/fldenv, the non-waiting "fn..." forms
   other than fnop, frstor/frstpm, fsave, fstcw/fstdw/fstenv/fsts[gw])
   and 1 for every other 'f' mnemonic.

   Note that the value returned is meaningful only for opcodes with
   (memory) operands, hence the code here is free to improperly handle
   opcodes that have no operands (for better performance and smaller
   code).  In particular fclex, fdecstp, fdisi, femms, feni, fincstp,
   finit, fsetpm and the fs segment override prefix are not handled,
   because no call path can make opcodes without operands get here.  */

static int
intel_float_operand (const char *mnemonic)
{
  char second, third;
  int kind = 1;         /* Plain math op unless shown otherwise.  */

  if (*mnemonic != 'f')
    return 0;           /* non-math */

  second = mnemonic[1];
  if (second == 'i')
    return 2;           /* integer op */

  /* Only these second letters need a look at what follows.  */
  if (second != 'l' && second != 'n' && second != 'r'
      && second != 's' && second != 'x')
    return kind;

  third = mnemonic[2];

  if (second == 'l')
    {
      /* fldcw/fldenv */
      if (third == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
        kind = 3;
    }
  else if (second == 'n')
    {
      /* non-waiting control op, but not fnop */
      if (third != 'o')
        kind = 3;
    }
  else if (second == 'r')
    {
      /* frstor/frstpm */
      if (third == 's')
        kind = 3;
    }
  else if (second == 's')
    {
      if (third == 'a')
        kind = 3;       /* fsave */
      else if (third == 't')
        {
          /* fstcw, fstdw, fstenv, fsts[gw] */
          const char fourth = mnemonic[3];

          if (fourth == 'c' || fourth == 'd'
              || fourth == 'e' || fourth == 's')
            kind = 3;
        }
    }
  else
    {
      /* 'x': fxsave/fxrstor are not really math ops */
      if (third == 'r' || third == 's')
        kind = 0;
    }

  return kind;
}
3378 /* Build the VEX prefix. */
3380 static void
3381 build_vex_prefix (const insn_template *t)
3383 unsigned int register_specifier;
3384 unsigned int implied_prefix;
3385 unsigned int vector_length;
3386 unsigned int w;
3388 /* Check register specifier. */
3389 if (i.vex.register_specifier)
3391 register_specifier =
3392 ~register_number (i.vex.register_specifier) & 0xf;
3393 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3395 else
3396 register_specifier = 0xf;
3398 /* Use 2-byte VEX prefix by swapping destination and source operand
3399 if there are more than 1 register operand. */
3400 if (i.reg_operands > 1
3401 && i.vec_encoding != vex_encoding_vex3
3402 && i.dir_encoding == dir_encoding_default
3403 && i.operands == i.reg_operands
3404 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3405 && i.tm.opcode_modifier.vexopcode == VEX0F
3406 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3407 && i.rex == REX_B)
3409 unsigned int xchg = i.operands - 1;
3410 union i386_op temp_op;
3411 i386_operand_type temp_type;
3413 temp_type = i.types[xchg];
3414 i.types[xchg] = i.types[0];
3415 i.types[0] = temp_type;
3416 temp_op = i.op[xchg];
3417 i.op[xchg] = i.op[0];
3418 i.op[0] = temp_op;
3420 gas_assert (i.rm.mode == 3);
3422 i.rex = REX_R;
3423 xchg = i.rm.regmem;
3424 i.rm.regmem = i.rm.reg;
3425 i.rm.reg = xchg;
3427 if (i.tm.opcode_modifier.d)
3428 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3429 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3430 else /* Use the next insn. */
3431 i.tm = t[1];
3434 if (i.tm.opcode_modifier.vex == VEXScalar)
3435 vector_length = avxscalar;
3436 else if (i.tm.opcode_modifier.vex == VEX256)
3437 vector_length = 1;
3438 else
3440 unsigned int op;
3442 /* Determine vector length from the last multi-length vector
3443 operand. */
3444 vector_length = 0;
3445 for (op = t->operands; op--;)
3446 if (t->operand_types[op].bitfield.xmmword
3447 && t->operand_types[op].bitfield.ymmword
3448 && i.types[op].bitfield.ymmword)
3450 vector_length = 1;
3451 break;
3455 switch ((i.tm.base_opcode >> 8) & 0xff)
3457 case 0:
3458 implied_prefix = 0;
3459 break;
3460 case DATA_PREFIX_OPCODE:
3461 implied_prefix = 1;
3462 break;
3463 case REPE_PREFIX_OPCODE:
3464 implied_prefix = 2;
3465 break;
3466 case REPNE_PREFIX_OPCODE:
3467 implied_prefix = 3;
3468 break;
3469 default:
3470 abort ();
3473 /* Check the REX.W bit and VEXW. */
3474 if (i.tm.opcode_modifier.vexw == VEXWIG)
3475 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3476 else if (i.tm.opcode_modifier.vexw)
3477 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3478 else
3479 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3481 /* Use 2-byte VEX prefix if possible. */
3482 if (w == 0
3483 && i.vec_encoding != vex_encoding_vex3
3484 && i.tm.opcode_modifier.vexopcode == VEX0F
3485 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3487 /* 2-byte VEX prefix. */
3488 unsigned int r;
3490 i.vex.length = 2;
3491 i.vex.bytes[0] = 0xc5;
3493 /* Check the REX.R bit. */
3494 r = (i.rex & REX_R) ? 0 : 1;
3495 i.vex.bytes[1] = (r << 7
3496 | register_specifier << 3
3497 | vector_length << 2
3498 | implied_prefix);
3500 else
3502 /* 3-byte VEX prefix. */
3503 unsigned int m;
3505 i.vex.length = 3;
3507 switch (i.tm.opcode_modifier.vexopcode)
3509 case VEX0F:
3510 m = 0x1;
3511 i.vex.bytes[0] = 0xc4;
3512 break;
3513 case VEX0F38:
3514 m = 0x2;
3515 i.vex.bytes[0] = 0xc4;
3516 break;
3517 case VEX0F3A:
3518 m = 0x3;
3519 i.vex.bytes[0] = 0xc4;
3520 break;
3521 case XOP08:
3522 m = 0x8;
3523 i.vex.bytes[0] = 0x8f;
3524 break;
3525 case XOP09:
3526 m = 0x9;
3527 i.vex.bytes[0] = 0x8f;
3528 break;
3529 case XOP0A:
3530 m = 0xa;
3531 i.vex.bytes[0] = 0x8f;
3532 break;
3533 default:
3534 abort ();
3537 /* The high 3 bits of the second VEX byte are 1's compliment
3538 of RXB bits from REX. */
3539 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3541 i.vex.bytes[2] = (w << 7
3542 | register_specifier << 3
3543 | vector_length << 2
3544 | implied_prefix);
3548 static INLINE bfd_boolean
3549 is_evex_encoding (const insn_template *t)
3551 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3552 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3553 || t->opcode_modifier.staticrounding || t->opcode_modifier.sae;
3556 static INLINE bfd_boolean
3557 is_any_vex_encoding (const insn_template *t)
3559 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3560 || is_evex_encoding (t);
3563 /* Build the EVEX prefix. */
3565 static void
3566 build_evex_prefix (void)
3568 unsigned int register_specifier;
3569 unsigned int implied_prefix;
3570 unsigned int m, w;
3571 rex_byte vrex_used = 0;
3573 /* Check register specifier. */
3574 if (i.vex.register_specifier)
3576 gas_assert ((i.vrex & REX_X) == 0);
3578 register_specifier = i.vex.register_specifier->reg_num;
3579 if ((i.vex.register_specifier->reg_flags & RegRex))
3580 register_specifier += 8;
3581 /* The upper 16 registers are encoded in the fourth byte of the
3582 EVEX prefix. */
3583 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3584 i.vex.bytes[3] = 0x8;
3585 register_specifier = ~register_specifier & 0xf;
3587 else
3589 register_specifier = 0xf;
3591 /* Encode upper 16 vector index register in the fourth byte of
3592 the EVEX prefix. */
3593 if (!(i.vrex & REX_X))
3594 i.vex.bytes[3] = 0x8;
3595 else
3596 vrex_used |= REX_X;
3599 switch ((i.tm.base_opcode >> 8) & 0xff)
3601 case 0:
3602 implied_prefix = 0;
3603 break;
3604 case DATA_PREFIX_OPCODE:
3605 implied_prefix = 1;
3606 break;
3607 case REPE_PREFIX_OPCODE:
3608 implied_prefix = 2;
3609 break;
3610 case REPNE_PREFIX_OPCODE:
3611 implied_prefix = 3;
3612 break;
3613 default:
3614 abort ();
3617 /* 4 byte EVEX prefix. */
3618 i.vex.length = 4;
3619 i.vex.bytes[0] = 0x62;
3621 /* mmmm bits. */
3622 switch (i.tm.opcode_modifier.vexopcode)
3624 case VEX0F:
3625 m = 1;
3626 break;
3627 case VEX0F38:
3628 m = 2;
3629 break;
3630 case VEX0F3A:
3631 m = 3;
3632 break;
3633 default:
3634 abort ();
3635 break;
3638 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3639 bits from REX. */
3640 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3642 /* The fifth bit of the second EVEX byte is 1's compliment of the
3643 REX_R bit in VREX. */
3644 if (!(i.vrex & REX_R))
3645 i.vex.bytes[1] |= 0x10;
3646 else
3647 vrex_used |= REX_R;
3649 if ((i.reg_operands + i.imm_operands) == i.operands)
3651 /* When all operands are registers, the REX_X bit in REX is not
3652 used. We reuse it to encode the upper 16 registers, which is
3653 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3654 as 1's compliment. */
3655 if ((i.vrex & REX_B))
3657 vrex_used |= REX_B;
3658 i.vex.bytes[1] &= ~0x40;
3662 /* EVEX instructions shouldn't need the REX prefix. */
3663 i.vrex &= ~vrex_used;
3664 gas_assert (i.vrex == 0);
3666 /* Check the REX.W bit and VEXW. */
3667 if (i.tm.opcode_modifier.vexw == VEXWIG)
3668 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3669 else if (i.tm.opcode_modifier.vexw)
3670 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3671 else
3672 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3674 /* Encode the U bit. */
3675 implied_prefix |= 0x4;
3677 /* The third byte of the EVEX prefix. */
3678 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3680 /* The fourth byte of the EVEX prefix. */
3681 /* The zeroing-masking bit. */
3682 if (i.mask && i.mask->zeroing)
3683 i.vex.bytes[3] |= 0x80;
3685 /* Don't always set the broadcast bit if there is no RC. */
3686 if (!i.rounding)
3688 /* Encode the vector length. */
3689 unsigned int vec_length;
3691 if (!i.tm.opcode_modifier.evex
3692 || i.tm.opcode_modifier.evex == EVEXDYN)
3694 unsigned int op;
3696 /* Determine vector length from the last multi-length vector
3697 operand. */
3698 vec_length = 0;
3699 for (op = i.operands; op--;)
3700 if (i.tm.operand_types[op].bitfield.xmmword
3701 + i.tm.operand_types[op].bitfield.ymmword
3702 + i.tm.operand_types[op].bitfield.zmmword > 1)
3704 if (i.types[op].bitfield.zmmword)
3706 i.tm.opcode_modifier.evex = EVEX512;
3707 break;
3709 else if (i.types[op].bitfield.ymmword)
3711 i.tm.opcode_modifier.evex = EVEX256;
3712 break;
3714 else if (i.types[op].bitfield.xmmword)
3716 i.tm.opcode_modifier.evex = EVEX128;
3717 break;
3719 else if (i.broadcast && (int) op == i.broadcast->operand)
3721 switch (i.broadcast->bytes)
3723 case 64:
3724 i.tm.opcode_modifier.evex = EVEX512;
3725 break;
3726 case 32:
3727 i.tm.opcode_modifier.evex = EVEX256;
3728 break;
3729 case 16:
3730 i.tm.opcode_modifier.evex = EVEX128;
3731 break;
3732 default:
3733 abort ();
3735 break;
3739 if (op >= MAX_OPERANDS)
3740 abort ();
3743 switch (i.tm.opcode_modifier.evex)
3745 case EVEXLIG: /* LL' is ignored */
3746 vec_length = evexlig << 5;
3747 break;
3748 case EVEX128:
3749 vec_length = 0 << 5;
3750 break;
3751 case EVEX256:
3752 vec_length = 1 << 5;
3753 break;
3754 case EVEX512:
3755 vec_length = 2 << 5;
3756 break;
3757 default:
3758 abort ();
3759 break;
3761 i.vex.bytes[3] |= vec_length;
3762 /* Encode the broadcast bit. */
3763 if (i.broadcast)
3764 i.vex.bytes[3] |= 0x10;
3766 else
3768 if (i.rounding->type != saeonly)
3769 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3770 else
3771 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3774 if (i.mask && i.mask->mask)
3775 i.vex.bytes[3] |= i.mask->mask->reg_num;
3778 static void
3779 process_immext (void)
3781 expressionS *exp;
3783 if ((i.tm.cpu_flags.bitfield.cpusse3 || i.tm.cpu_flags.bitfield.cpusvme)
3784 && i.operands > 0)
3786 /* MONITOR/MWAIT as well as SVME instructions have fixed operands
3787 with an opcode suffix which is coded in the same place as an
3788 8-bit immediate field would be.
3789 Here we check those operands and remove them afterwards. */
3790 unsigned int x;
3792 for (x = 0; x < i.operands; x++)
3793 if (register_number (i.op[x].regs) != x)
3794 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3795 register_prefix, i.op[x].regs->reg_name, x + 1,
3796 i.tm.name);
3798 i.operands = 0;
3801 if (i.tm.cpu_flags.bitfield.cpumwaitx && i.operands > 0)
3803 /* MONITORX/MWAITX instructions have fixed operands with an opcode
3804 suffix which is coded in the same place as an 8-bit immediate
3805 field would be.
3806 Here we check those operands and remove them afterwards. */
3807 unsigned int x;
3809 if (i.operands != 3)
3810 abort();
3812 for (x = 0; x < 2; x++)
3813 if (register_number (i.op[x].regs) != x)
3814 goto bad_register_operand;
3816 /* Check for third operand for mwaitx/monitorx insn. */
3817 if (register_number (i.op[x].regs)
3818 != (x + (i.tm.extension_opcode == 0xfb)))
3820 bad_register_operand:
3821 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3822 register_prefix, i.op[x].regs->reg_name, x+1,
3823 i.tm.name);
3826 i.operands = 0;
3829 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3830 which is coded in the same place as an 8-bit immediate field
3831 would be. Here we fake an 8-bit immediate operand from the
3832 opcode suffix stored in tm.extension_opcode.
3834 AVX instructions also use this encoding, for some of
3835 3 argument instructions. */
3837 gas_assert (i.imm_operands <= 1
3838 && (i.operands <= 2
3839 || (is_any_vex_encoding (&i.tm)
3840 && i.operands <= 4)));
3842 exp = &im_expressions[i.imm_operands++];
3843 i.op[i.operands].imms = exp;
3844 i.types[i.operands] = imm8;
3845 i.operands++;
3846 exp->X_op = O_constant;
3847 exp->X_add_number = i.tm.extension_opcode;
3848 i.tm.extension_opcode = None;
3852 static int
3853 check_hle (void)
3855 switch (i.tm.opcode_modifier.hleprefixok)
3857 default:
3858 abort ();
3859 case HLEPrefixNone:
3860 as_bad (_("invalid instruction `%s' after `%s'"),
3861 i.tm.name, i.hle_prefix);
3862 return 0;
3863 case HLEPrefixLock:
3864 if (i.prefix[LOCK_PREFIX])
3865 return 1;
3866 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3867 return 0;
3868 case HLEPrefixAny:
3869 return 1;
3870 case HLEPrefixRelease:
3871 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3873 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3874 i.tm.name);
3875 return 0;
3877 if (i.mem_operands == 0
3878 || !operand_type_check (i.types[i.operands - 1], anymem))
3880 as_bad (_("memory destination needed for instruction `%s'"
3881 " after `xrelease'"), i.tm.name);
3882 return 0;
3884 return 1;
3888 /* Try the shortest encoding by shortening operand size. */
3890 static void
3891 optimize_encoding (void)
3893 int j;
3895 if (optimize_for_space
3896 && i.reg_operands == 1
3897 && i.imm_operands == 1
3898 && !i.types[1].bitfield.byte
3899 && i.op[0].imms->X_op == O_constant
3900 && fits_in_imm7 (i.op[0].imms->X_add_number)
3901 && ((i.tm.base_opcode == 0xa8
3902 && i.tm.extension_opcode == None)
3903 || (i.tm.base_opcode == 0xf6
3904 && i.tm.extension_opcode == 0x0)))
3906 /* Optimize: -Os:
3907 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
3909 unsigned int base_regnum = i.op[1].regs->reg_num;
3910 if (flag_code == CODE_64BIT || base_regnum < 4)
3912 i.types[1].bitfield.byte = 1;
3913 /* Ignore the suffix. */
3914 i.suffix = 0;
3915 if (base_regnum >= 4
3916 && !(i.op[1].regs->reg_flags & RegRex))
3918 /* Handle SP, BP, SI and DI registers. */
3919 if (i.types[1].bitfield.word)
3920 j = 16;
3921 else if (i.types[1].bitfield.dword)
3922 j = 32;
3923 else
3924 j = 48;
3925 i.op[1].regs -= j;
3929 else if (flag_code == CODE_64BIT
3930 && ((i.types[1].bitfield.qword
3931 && i.reg_operands == 1
3932 && i.imm_operands == 1
3933 && i.op[0].imms->X_op == O_constant
3934 && ((i.tm.base_opcode == 0xb0
3935 && i.tm.extension_opcode == None
3936 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
3937 || (fits_in_imm31 (i.op[0].imms->X_add_number)
3938 && (((i.tm.base_opcode == 0x24
3939 || i.tm.base_opcode == 0xa8)
3940 && i.tm.extension_opcode == None)
3941 || (i.tm.base_opcode == 0x80
3942 && i.tm.extension_opcode == 0x4)
3943 || ((i.tm.base_opcode == 0xf6
3944 || i.tm.base_opcode == 0xc6)
3945 && i.tm.extension_opcode == 0x0)))))
3946 || (i.types[0].bitfield.qword
3947 && ((i.reg_operands == 2
3948 && i.op[0].regs == i.op[1].regs
3949 && ((i.tm.base_opcode == 0x30
3950 || i.tm.base_opcode == 0x28)
3951 && i.tm.extension_opcode == None))
3952 || (i.reg_operands == 1
3953 && i.operands == 1
3954 && i.tm.base_opcode == 0x30
3955 && i.tm.extension_opcode == None)))))
3957 /* Optimize: -O:
3958 andq $imm31, %r64 -> andl $imm31, %r32
3959 testq $imm31, %r64 -> testl $imm31, %r32
3960 xorq %r64, %r64 -> xorl %r32, %r32
3961 subq %r64, %r64 -> subl %r32, %r32
3962 movq $imm31, %r64 -> movl $imm31, %r32
3963 movq $imm32, %r64 -> movl $imm32, %r32
3965 i.tm.opcode_modifier.norex64 = 1;
3966 if (i.tm.base_opcode == 0xb0 || i.tm.base_opcode == 0xc6)
3968 /* Handle
3969 movq $imm31, %r64 -> movl $imm31, %r32
3970 movq $imm32, %r64 -> movl $imm32, %r32
3972 i.tm.operand_types[0].bitfield.imm32 = 1;
3973 i.tm.operand_types[0].bitfield.imm32s = 0;
3974 i.tm.operand_types[0].bitfield.imm64 = 0;
3975 i.types[0].bitfield.imm32 = 1;
3976 i.types[0].bitfield.imm32s = 0;
3977 i.types[0].bitfield.imm64 = 0;
3978 i.types[1].bitfield.dword = 1;
3979 i.types[1].bitfield.qword = 0;
3980 if (i.tm.base_opcode == 0xc6)
3982 /* Handle
3983 movq $imm31, %r64 -> movl $imm31, %r32
3985 i.tm.base_opcode = 0xb0;
3986 i.tm.extension_opcode = None;
3987 i.tm.opcode_modifier.shortform = 1;
3988 i.tm.opcode_modifier.modrm = 0;
3992 else if (i.reg_operands == 3
3993 && i.op[0].regs == i.op[1].regs
3994 && !i.types[2].bitfield.xmmword
3995 && (i.tm.opcode_modifier.vex
3996 || ((!i.mask || i.mask->zeroing)
3997 && !i.rounding
3998 && is_evex_encoding (&i.tm)
3999 && (i.vec_encoding != vex_encoding_evex
4000 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4001 || i.tm.cpu_flags.bitfield.cpuavx512vl
4002 || (i.tm.operand_types[2].bitfield.zmmword
4003 && i.types[2].bitfield.ymmword))))
4004 && ((i.tm.base_opcode == 0x55
4005 || i.tm.base_opcode == 0x6655
4006 || i.tm.base_opcode == 0x66df
4007 || i.tm.base_opcode == 0x57
4008 || i.tm.base_opcode == 0x6657
4009 || i.tm.base_opcode == 0x66ef
4010 || i.tm.base_opcode == 0x66f8
4011 || i.tm.base_opcode == 0x66f9
4012 || i.tm.base_opcode == 0x66fa
4013 || i.tm.base_opcode == 0x66fb
4014 || i.tm.base_opcode == 0x42
4015 || i.tm.base_opcode == 0x6642
4016 || i.tm.base_opcode == 0x47
4017 || i.tm.base_opcode == 0x6647)
4018 && i.tm.extension_opcode == None))
4020 /* Optimize: -O1:
4021 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4022 vpsubq and vpsubw:
4023 EVEX VOP %zmmM, %zmmM, %zmmN
4024 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4025 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4026 EVEX VOP %ymmM, %ymmM, %ymmN
4027 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4028 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4029 VEX VOP %ymmM, %ymmM, %ymmN
4030 -> VEX VOP %xmmM, %xmmM, %xmmN
4031 VOP, one of vpandn and vpxor:
4032 VEX VOP %ymmM, %ymmM, %ymmN
4033 -> VEX VOP %xmmM, %xmmM, %xmmN
4034 VOP, one of vpandnd and vpandnq:
4035 EVEX VOP %zmmM, %zmmM, %zmmN
4036 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4037 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4038 EVEX VOP %ymmM, %ymmM, %ymmN
4039 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4040 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4041 VOP, one of vpxord and vpxorq:
4042 EVEX VOP %zmmM, %zmmM, %zmmN
4043 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4044 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4045 EVEX VOP %ymmM, %ymmM, %ymmN
4046 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4047 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4048 VOP, one of kxord and kxorq:
4049 VEX VOP %kM, %kM, %kN
4050 -> VEX kxorw %kM, %kM, %kN
4051 VOP, one of kandnd and kandnq:
4052 VEX VOP %kM, %kM, %kN
4053 -> VEX kandnw %kM, %kM, %kN
4055 if (is_evex_encoding (&i.tm))
4057 if (i.vec_encoding != vex_encoding_evex)
4059 i.tm.opcode_modifier.vex = VEX128;
4060 i.tm.opcode_modifier.vexw = VEXW0;
4061 i.tm.opcode_modifier.evex = 0;
4063 else if (optimize > 1)
4064 i.tm.opcode_modifier.evex = EVEX128;
4065 else
4066 return;
4068 else if (i.tm.operand_types[0].bitfield.regmask)
4070 i.tm.base_opcode &= 0xff;
4071 i.tm.opcode_modifier.vexw = VEXW0;
4073 else
4074 i.tm.opcode_modifier.vex = VEX128;
4076 if (i.tm.opcode_modifier.vex)
4077 for (j = 0; j < 3; j++)
4079 i.types[j].bitfield.xmmword = 1;
4080 i.types[j].bitfield.ymmword = 0;
4083 else if (i.vec_encoding != vex_encoding_evex
4084 && !i.types[0].bitfield.zmmword
4085 && !i.types[1].bitfield.zmmword
4086 && !i.mask
4087 && is_evex_encoding (&i.tm)
4088 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4089 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4090 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4091 && i.tm.extension_opcode == None)
4093 /* Optimize: -O1:
4094 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4095 vmovdqu32 and vmovdqu64:
4096 EVEX VOP %xmmM, %xmmN
4097 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4098 EVEX VOP %ymmM, %ymmN
4099 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4100 EVEX VOP %xmmM, mem
4101 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4102 EVEX VOP %ymmM, mem
4103 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4104 EVEX VOP mem, %xmmN
4105 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4106 EVEX VOP mem, %ymmN
4107 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4109 for (j = 0; j < 2; j++)
4110 if (operand_type_check (i.types[j], disp)
4111 && i.op[j].disps->X_op == O_constant)
4113 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4114 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4115 bytes, we choose EVEX Disp8 over VEX Disp32. */
4116 int evex_disp8, vex_disp8;
4117 unsigned int memshift = i.memshift;
4118 offsetT n = i.op[j].disps->X_add_number;
4120 evex_disp8 = fits_in_disp8 (n);
4121 i.memshift = 0;
4122 vex_disp8 = fits_in_disp8 (n);
4123 if (evex_disp8 != vex_disp8)
4125 i.memshift = memshift;
4126 return;
4129 i.types[j].bitfield.disp8 = vex_disp8;
4130 break;
4132 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4133 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4134 i.tm.opcode_modifier.vex
4135 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4136 i.tm.opcode_modifier.vexw = VEXW0;
4137 i.tm.opcode_modifier.evex = 0;
4138 i.tm.opcode_modifier.masking = 0;
4139 i.tm.opcode_modifier.disp8memshift = 0;
4140 i.memshift = 0;
4141 for (j = 0; j < 2; j++)
4142 if (operand_type_check (i.types[j], disp)
4143 && i.op[j].disps->X_op == O_constant)
4145 i.types[j].bitfield.disp8
4146 = fits_in_disp8 (i.op[j].disps->X_add_number);
4147 break;
4152 /* This is the guts of the machine-dependent assembler. LINE points to a
4153 machine dependent instruction. This function is supposed to emit
4154 the frags/bytes it assembles to. */
4156 void
4157 md_assemble (char *line)
4159 unsigned int j;
4160 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4161 const insn_template *t;
4163 /* Initialize globals. */
4164 memset (&i, '\0', sizeof (i));
4165 for (j = 0; j < MAX_OPERANDS; j++)
4166 i.reloc[j] = NO_RELOC;
4167 memset (disp_expressions, '\0', sizeof (disp_expressions));
4168 memset (im_expressions, '\0', sizeof (im_expressions));
4169 save_stack_p = save_stack;
4171 /* First parse an instruction mnemonic & call i386_operand for the operands.
4172 We assume that the scrubber has arranged it so that line[0] is the valid
4173 start of a (possibly prefixed) mnemonic. */
4175 line = parse_insn (line, mnemonic);
4176 if (line == NULL)
4177 return;
4178 mnem_suffix = i.suffix;
4180 line = parse_operands (line, mnemonic);
4181 this_operand = -1;
4182 xfree (i.memop1_string);
4183 i.memop1_string = NULL;
4184 if (line == NULL)
4185 return;
4187 /* Now we've parsed the mnemonic into a set of templates, and have the
4188 operands at hand. */
4190 /* All intel opcodes have reversed operands except for "bound" and
4191 "enter". We also don't reverse intersegment "jmp" and "call"
4192 instructions with 2 immediate operands so that the immediate segment
4193 precedes the offset, as it does when in AT&T mode. */
4194 if (intel_syntax
4195 && i.operands > 1
4196 && (strcmp (mnemonic, "bound") != 0)
4197 && (strcmp (mnemonic, "invlpga") != 0)
4198 && !(operand_type_check (i.types[0], imm)
4199 && operand_type_check (i.types[1], imm)))
4200 swap_operands ();
4202 /* The order of the immediates should be reversed
4203 for 2 immediates extrq and insertq instructions */
4204 if (i.imm_operands == 2
4205 && (strcmp (mnemonic, "extrq") == 0
4206 || strcmp (mnemonic, "insertq") == 0))
4207 swap_2_operands (0, 1);
4209 if (i.imm_operands)
4210 optimize_imm ();
4212 /* Don't optimize displacement for movabs since it only takes 64bit
4213 displacement. */
4214 if (i.disp_operands
4215 && i.disp_encoding != disp_encoding_32bit
4216 && (flag_code != CODE_64BIT
4217 || strcmp (mnemonic, "movabs") != 0))
4218 optimize_disp ();
4220 /* Next, we find a template that matches the given insn,
4221 making sure the overlap of the given operands types is consistent
4222 with the template operand types. */
4224 if (!(t = match_template (mnem_suffix)))
4225 return;
4227 if (sse_check != check_none
4228 && !i.tm.opcode_modifier.noavx
4229 && !i.tm.cpu_flags.bitfield.cpuavx
4230 && (i.tm.cpu_flags.bitfield.cpusse
4231 || i.tm.cpu_flags.bitfield.cpusse2
4232 || i.tm.cpu_flags.bitfield.cpusse3
4233 || i.tm.cpu_flags.bitfield.cpussse3
4234 || i.tm.cpu_flags.bitfield.cpusse4_1
4235 || i.tm.cpu_flags.bitfield.cpusse4_2
4236 || i.tm.cpu_flags.bitfield.cpupclmul
4237 || i.tm.cpu_flags.bitfield.cpuaes
4238 || i.tm.cpu_flags.bitfield.cpugfni))
4240 (sse_check == check_warning
4241 ? as_warn
4242 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4245 /* Zap movzx and movsx suffix. The suffix has been set from
4246 "word ptr" or "byte ptr" on the source operand in Intel syntax
4247 or extracted from mnemonic in AT&T syntax. But we'll use
4248 the destination register to choose the suffix for encoding. */
4249 if ((i.tm.base_opcode & ~9) == 0x0fb6)
4251 /* In Intel syntax, there must be a suffix. In AT&T syntax, if
4252 there is no suffix, the default will be byte extension. */
4253 if (i.reg_operands != 2
4254 && !i.suffix
4255 && intel_syntax)
4256 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4258 i.suffix = 0;
4261 if (i.tm.opcode_modifier.fwait)
4262 if (!add_prefix (FWAIT_OPCODE))
4263 return;
4265 /* Check if REP prefix is OK. */
4266 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4268 as_bad (_("invalid instruction `%s' after `%s'"),
4269 i.tm.name, i.rep_prefix);
4270 return;
4273 /* Check for lock without a lockable instruction. Destination operand
4274 must be memory unless it is xchg (0x86). */
4275 if (i.prefix[LOCK_PREFIX]
4276 && (!i.tm.opcode_modifier.islockable
4277 || i.mem_operands == 0
4278 || (i.tm.base_opcode != 0x86
4279 && !operand_type_check (i.types[i.operands - 1], anymem))))
4281 as_bad (_("expecting lockable instruction after `lock'"));
4282 return;
4285 /* Check for data size prefix on VEX/XOP/EVEX encoded insns. */
4286 if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4288 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4289 return;
4292 /* Check if HLE prefix is OK. */
4293 if (i.hle_prefix && !check_hle ())
4294 return;
4296 /* Check BND prefix. */
4297 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4298 as_bad (_("expecting valid branch instruction after `bnd'"));
4300 /* Check NOTRACK prefix. */
4301 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4302 as_bad (_("expecting indirect branch instruction after `notrack'"));
4304 if (i.tm.cpu_flags.bitfield.cpumpx)
4306 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4307 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4308 else if (flag_code != CODE_16BIT
4309 ? i.prefix[ADDR_PREFIX]
4310 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4311 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4314 /* Insert BND prefix. */
4315 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4317 if (!i.prefix[BND_PREFIX])
4318 add_prefix (BND_PREFIX_OPCODE);
4319 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4321 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4322 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4326 /* Check string instruction segment overrides. */
4327 if (i.tm.opcode_modifier.isstring && i.mem_operands != 0)
4329 if (!check_string ())
4330 return;
4331 i.disp_operands = 0;
4334 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4335 optimize_encoding ();
4337 if (!process_suffix ())
4338 return;
4340 /* Update operand types. */
4341 for (j = 0; j < i.operands; j++)
4342 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4344 /* Make still unresolved immediate matches conform to size of immediate
4345 given in i.suffix. */
4346 if (!finalize_imm ())
4347 return;
4349 if (i.types[0].bitfield.imm1)
4350 i.imm_operands = 0; /* kludge for shift insns. */
4352 /* We only need to check those implicit registers for instructions
4353 with 3 operands or less. */
4354 if (i.operands <= 3)
4355 for (j = 0; j < i.operands; j++)
4356 if (i.types[j].bitfield.inoutportreg
4357 || i.types[j].bitfield.shiftcount
4358 || (i.types[j].bitfield.acc && !i.types[j].bitfield.xmmword))
4359 i.reg_operands--;
4361 /* ImmExt should be processed after SSE2AVX. */
4362 if (!i.tm.opcode_modifier.sse2avx
4363 && i.tm.opcode_modifier.immext)
4364 process_immext ();
4366 /* For insns with operands there are more diddles to do to the opcode. */
4367 if (i.operands)
4369 if (!process_operands ())
4370 return;
4372 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4374 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4375 as_warn (_("translating to `%sp'"), i.tm.name);
4378 if (is_any_vex_encoding (&i.tm))
4380 if (flag_code == CODE_16BIT)
4382 as_bad (_("instruction `%s' isn't supported in 16-bit mode."),
4383 i.tm.name);
4384 return;
4387 if (i.tm.opcode_modifier.vex)
4388 build_vex_prefix (t);
4389 else
4390 build_evex_prefix ();
4393 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4394 instructions may define INT_OPCODE as well, so avoid this corner
4395 case for those instructions that use MODRM. */
4396 if (i.tm.base_opcode == INT_OPCODE
4397 && !i.tm.opcode_modifier.modrm
4398 && i.op[0].imms->X_add_number == 3)
4400 i.tm.base_opcode = INT3_OPCODE;
4401 i.imm_operands = 0;
4404 if ((i.tm.opcode_modifier.jump
4405 || i.tm.opcode_modifier.jumpbyte
4406 || i.tm.opcode_modifier.jumpdword)
4407 && i.op[0].disps->X_op == O_constant)
4409 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4410 the absolute address given by the constant. Since ix86 jumps and
4411 calls are pc relative, we need to generate a reloc. */
4412 i.op[0].disps->X_add_symbol = &abs_symbol;
4413 i.op[0].disps->X_op = O_symbol;
4416 if (i.tm.opcode_modifier.rex64)
4417 i.rex |= REX_W;
4419 /* For 8 bit registers we need an empty rex prefix. Also if the
4420 instruction already has a prefix, we need to convert old
4421 registers to new ones. */
4423 if ((i.types[0].bitfield.reg && i.types[0].bitfield.byte
4424 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4425 || (i.types[1].bitfield.reg && i.types[1].bitfield.byte
4426 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4427 || (((i.types[0].bitfield.reg && i.types[0].bitfield.byte)
4428 || (i.types[1].bitfield.reg && i.types[1].bitfield.byte))
4429 && i.rex != 0))
4431 int x;
4433 i.rex |= REX_OPCODE;
4434 for (x = 0; x < 2; x++)
4436 /* Look for 8 bit operand that uses old registers. */
4437 if (i.types[x].bitfield.reg && i.types[x].bitfield.byte
4438 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4440 /* In case it is "hi" register, give up. */
4441 if (i.op[x].regs->reg_num > 3)
4442 as_bad (_("can't encode register '%s%s' in an "
4443 "instruction requiring REX prefix."),
4444 register_prefix, i.op[x].regs->reg_name);
4446 /* Otherwise it is equivalent to the extended register.
4447 Since the encoding doesn't change this is merely
4448 cosmetic cleanup for debug output. */
4450 i.op[x].regs = i.op[x].regs + 8;
4455 if (i.rex == 0 && i.rex_encoding)
4457 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4458 that uses legacy register. If it is "hi" register, don't add
4459 the REX_OPCODE byte. */
4460 int x;
4461 for (x = 0; x < 2; x++)
4462 if (i.types[x].bitfield.reg
4463 && i.types[x].bitfield.byte
4464 && (i.op[x].regs->reg_flags & RegRex64) == 0
4465 && i.op[x].regs->reg_num > 3)
4467 i.rex_encoding = FALSE;
4468 break;
4471 if (i.rex_encoding)
4472 i.rex = REX_OPCODE;
4475 if (i.rex != 0)
4476 add_prefix (REX_OPCODE | i.rex);
4478 /* We are ready to output the insn. */
4479 output_insn ();
4482 static char *
4483 parse_insn (char *line, char *mnemonic)
4485 char *l = line;
4486 char *token_start = l;
4487 char *mnem_p;
4488 int supported;
4489 const insn_template *t;
4490 char *dot_p = NULL;
4492 while (1)
4494 mnem_p = mnemonic;
4495 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4497 if (*mnem_p == '.')
4498 dot_p = mnem_p;
4499 mnem_p++;
4500 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4502 as_bad (_("no such instruction: `%s'"), token_start);
4503 return NULL;
4505 l++;
4507 if (!is_space_char (*l)
4508 && *l != END_OF_INSN
4509 && (intel_syntax
4510 || (*l != PREFIX_SEPARATOR
4511 && *l != ',')))
4513 as_bad (_("invalid character %s in mnemonic"),
4514 output_invalid (*l));
4515 return NULL;
4517 if (token_start == l)
4519 if (!intel_syntax && *l == PREFIX_SEPARATOR)
4520 as_bad (_("expecting prefix; got nothing"));
4521 else
4522 as_bad (_("expecting mnemonic; got nothing"));
4523 return NULL;
4526 /* Look up instruction (or prefix) via hash table. */
4527 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4529 if (*l != END_OF_INSN
4530 && (!is_space_char (*l) || l[1] != END_OF_INSN)
4531 && current_templates
4532 && current_templates->start->opcode_modifier.isprefix)
4534 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4536 as_bad ((flag_code != CODE_64BIT
4537 ? _("`%s' is only supported in 64-bit mode")
4538 : _("`%s' is not supported in 64-bit mode")),
4539 current_templates->start->name);
4540 return NULL;
4542 /* If we are in 16-bit mode, do not allow addr16 or data16.
4543 Similarly, in 32-bit mode, do not allow addr32 or data32. */
4544 if ((current_templates->start->opcode_modifier.size == SIZE16
4545 || current_templates->start->opcode_modifier.size == SIZE32)
4546 && flag_code != CODE_64BIT
4547 && ((current_templates->start->opcode_modifier.size == SIZE32)
4548 ^ (flag_code == CODE_16BIT)))
4550 as_bad (_("redundant %s prefix"),
4551 current_templates->start->name);
4552 return NULL;
4554 if (current_templates->start->opcode_length == 0)
4556 /* Handle pseudo prefixes. */
4557 switch (current_templates->start->base_opcode)
4559 case 0x0:
4560 /* {disp8} */
4561 i.disp_encoding = disp_encoding_8bit;
4562 break;
4563 case 0x1:
4564 /* {disp32} */
4565 i.disp_encoding = disp_encoding_32bit;
4566 break;
4567 case 0x2:
4568 /* {load} */
4569 i.dir_encoding = dir_encoding_load;
4570 break;
4571 case 0x3:
4572 /* {store} */
4573 i.dir_encoding = dir_encoding_store;
4574 break;
4575 case 0x4:
4576 /* {vex2} */
4577 i.vec_encoding = vex_encoding_vex2;
4578 break;
4579 case 0x5:
4580 /* {vex3} */
4581 i.vec_encoding = vex_encoding_vex3;
4582 break;
4583 case 0x6:
4584 /* {evex} */
4585 i.vec_encoding = vex_encoding_evex;
4586 break;
4587 case 0x7:
4588 /* {rex} */
4589 i.rex_encoding = TRUE;
4590 break;
4591 case 0x8:
4592 /* {nooptimize} */
4593 i.no_optimize = TRUE;
4594 break;
4595 default:
4596 abort ();
4599 else
4601 /* Add prefix, checking for repeated prefixes. */
4602 switch (add_prefix (current_templates->start->base_opcode))
4604 case PREFIX_EXIST:
4605 return NULL;
4606 case PREFIX_DS:
4607 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4608 i.notrack_prefix = current_templates->start->name;
4609 break;
4610 case PREFIX_REP:
4611 if (current_templates->start->cpu_flags.bitfield.cpuhle)
4612 i.hle_prefix = current_templates->start->name;
4613 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4614 i.bnd_prefix = current_templates->start->name;
4615 else
4616 i.rep_prefix = current_templates->start->name;
4617 break;
4618 default:
4619 break;
4622 /* Skip past PREFIX_SEPARATOR and reset token_start. */
4623 token_start = ++l;
4625 else
4626 break;
4629 if (!current_templates)
4631 /* Deprecated functionality (new code should use pseudo-prefixes instead):
4632 Check if we should swap operand or force 32bit displacement in
4633 encoding. */
4634 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4635 i.dir_encoding = dir_encoding_swap;
4636 else if (mnem_p - 3 == dot_p
4637 && dot_p[1] == 'd'
4638 && dot_p[2] == '8')
4639 i.disp_encoding = disp_encoding_8bit;
4640 else if (mnem_p - 4 == dot_p
4641 && dot_p[1] == 'd'
4642 && dot_p[2] == '3'
4643 && dot_p[3] == '2')
4644 i.disp_encoding = disp_encoding_32bit;
4645 else
4646 goto check_suffix;
4647 mnem_p = dot_p;
4648 *dot_p = '\0';
4649 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4652 if (!current_templates)
4654 check_suffix:
4655 if (mnem_p > mnemonic)
4657 /* See if we can get a match by trimming off a suffix. */
4658 switch (mnem_p[-1])
4660 case WORD_MNEM_SUFFIX:
4661 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4662 i.suffix = SHORT_MNEM_SUFFIX;
4663 else
4664 /* Fall through. */
4665 case BYTE_MNEM_SUFFIX:
4666 case QWORD_MNEM_SUFFIX:
4667 i.suffix = mnem_p[-1];
4668 mnem_p[-1] = '\0';
4669 current_templates = (const templates *) hash_find (op_hash,
4670 mnemonic);
4671 break;
4672 case SHORT_MNEM_SUFFIX:
4673 case LONG_MNEM_SUFFIX:
4674 if (!intel_syntax)
4676 i.suffix = mnem_p[-1];
4677 mnem_p[-1] = '\0';
4678 current_templates = (const templates *) hash_find (op_hash,
4679 mnemonic);
4681 break;
4683 /* Intel Syntax. */
4684 case 'd':
4685 if (intel_syntax)
4687 if (intel_float_operand (mnemonic) == 1)
4688 i.suffix = SHORT_MNEM_SUFFIX;
4689 else
4690 i.suffix = LONG_MNEM_SUFFIX;
4691 mnem_p[-1] = '\0';
4692 current_templates = (const templates *) hash_find (op_hash,
4693 mnemonic);
4695 break;
4699 if (!current_templates)
4701 as_bad (_("no such instruction: `%s'"), token_start);
4702 return NULL;
4706 if (current_templates->start->opcode_modifier.jump
4707 || current_templates->start->opcode_modifier.jumpbyte)
4709 /* Check for a branch hint. We allow ",pt" and ",pn" for
4710 predict taken and predict not taken respectively.
4711 I'm not sure that branch hints actually do anything on loop
4712 and jcxz insns (JumpByte) for current Pentium4 chips. They
4713 may work in the future and it doesn't hurt to accept them
4714 now. */
4715 if (l[0] == ',' && l[1] == 'p')
4717 if (l[2] == 't')
4719 if (!add_prefix (DS_PREFIX_OPCODE))
4720 return NULL;
4721 l += 3;
4723 else if (l[2] == 'n')
4725 if (!add_prefix (CS_PREFIX_OPCODE))
4726 return NULL;
4727 l += 3;
4731 /* Any other comma loses. */
4732 if (*l == ',')
4734 as_bad (_("invalid character %s in mnemonic"),
4735 output_invalid (*l));
4736 return NULL;
4739 /* Check if instruction is supported on specified architecture. */
4740 supported = 0;
4741 for (t = current_templates->start; t < current_templates->end; ++t)
4743 supported |= cpu_flags_match (t);
4744 if (supported == CPU_FLAGS_PERFECT_MATCH)
4746 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4747 as_warn (_("use .code16 to ensure correct addressing mode"));
4749 return l;
4753 if (!(supported & CPU_FLAGS_64BIT_MATCH))
4754 as_bad (flag_code == CODE_64BIT
4755 ? _("`%s' is not supported in 64-bit mode")
4756 : _("`%s' is only supported in 64-bit mode"),
4757 current_templates->start->name);
4758 else
4759 as_bad (_("`%s' is not supported on `%s%s'"),
4760 current_templates->start->name,
4761 cpu_arch_name ? cpu_arch_name : default_arch,
4762 cpu_sub_arch_name ? cpu_sub_arch_name : "");
4764 return NULL;
4767 static char *
4768 parse_operands (char *l, const char *mnemonic)
4770 char *token_start;
4772 /* 1 if operand is pending after ','. */
4773 unsigned int expecting_operand = 0;
4775 /* Non-zero if operand parens not balanced. */
4776 unsigned int paren_not_balanced;
4778 while (*l != END_OF_INSN)
4780 /* Skip optional white space before operand. */
4781 if (is_space_char (*l))
4782 ++l;
4783 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4785 as_bad (_("invalid character %s before operand %d"),
4786 output_invalid (*l),
4787 i.operands + 1);
4788 return NULL;
4790 token_start = l; /* After white space. */
4791 paren_not_balanced = 0;
4792 while (paren_not_balanced || *l != ',')
4794 if (*l == END_OF_INSN)
4796 if (paren_not_balanced)
4798 if (!intel_syntax)
4799 as_bad (_("unbalanced parenthesis in operand %d."),
4800 i.operands + 1);
4801 else
4802 as_bad (_("unbalanced brackets in operand %d."),
4803 i.operands + 1);
4804 return NULL;
4806 else
4807 break; /* we are done */
4809 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4811 as_bad (_("invalid character %s in operand %d"),
4812 output_invalid (*l),
4813 i.operands + 1);
4814 return NULL;
4816 if (!intel_syntax)
4818 if (*l == '(')
4819 ++paren_not_balanced;
4820 if (*l == ')')
4821 --paren_not_balanced;
4823 else
4825 if (*l == '[')
4826 ++paren_not_balanced;
4827 if (*l == ']')
4828 --paren_not_balanced;
4830 l++;
4832 if (l != token_start)
4833 { /* Yes, we've read in another operand. */
4834 unsigned int operand_ok;
4835 this_operand = i.operands++;
4836 if (i.operands > MAX_OPERANDS)
4838 as_bad (_("spurious operands; (%d operands/instruction max)"),
4839 MAX_OPERANDS);
4840 return NULL;
4842 i.types[this_operand].bitfield.unspecified = 1;
4843 /* Now parse operand adding info to 'i' as we go along. */
4844 END_STRING_AND_SAVE (l);
4846 if (i.mem_operands > 1)
4848 as_bad (_("too many memory references for `%s'"),
4849 mnemonic);
4850 return 0;
4853 if (intel_syntax)
4854 operand_ok =
4855 i386_intel_operand (token_start,
4856 intel_float_operand (mnemonic));
4857 else
4858 operand_ok = i386_att_operand (token_start);
4860 RESTORE_END_STRING (l);
4861 if (!operand_ok)
4862 return NULL;
4864 else
4866 if (expecting_operand)
4868 expecting_operand_after_comma:
4869 as_bad (_("expecting operand after ','; got nothing"));
4870 return NULL;
4872 if (*l == ',')
4874 as_bad (_("expecting operand before ','; got nothing"));
4875 return NULL;
4879 /* Now *l must be either ',' or END_OF_INSN. */
4880 if (*l == ',')
4882 if (*++l == END_OF_INSN)
4884 /* Just skip it, if it's \n complain. */
4885 goto expecting_operand_after_comma;
4887 expecting_operand = 1;
4890 return l;
4893 static void
4894 swap_2_operands (int xchg1, int xchg2)
4896 union i386_op temp_op;
4897 i386_operand_type temp_type;
4898 unsigned int temp_flags;
4899 enum bfd_reloc_code_real temp_reloc;
4901 temp_type = i.types[xchg2];
4902 i.types[xchg2] = i.types[xchg1];
4903 i.types[xchg1] = temp_type;
4905 temp_flags = i.flags[xchg2];
4906 i.flags[xchg2] = i.flags[xchg1];
4907 i.flags[xchg1] = temp_flags;
4909 temp_op = i.op[xchg2];
4910 i.op[xchg2] = i.op[xchg1];
4911 i.op[xchg1] = temp_op;
4913 temp_reloc = i.reloc[xchg2];
4914 i.reloc[xchg2] = i.reloc[xchg1];
4915 i.reloc[xchg1] = temp_reloc;
4917 if (i.mask)
4919 if (i.mask->operand == xchg1)
4920 i.mask->operand = xchg2;
4921 else if (i.mask->operand == xchg2)
4922 i.mask->operand = xchg1;
4924 if (i.broadcast)
4926 if (i.broadcast->operand == xchg1)
4927 i.broadcast->operand = xchg2;
4928 else if (i.broadcast->operand == xchg2)
4929 i.broadcast->operand = xchg1;
4931 if (i.rounding)
4933 if (i.rounding->operand == xchg1)
4934 i.rounding->operand = xchg2;
4935 else if (i.rounding->operand == xchg2)
4936 i.rounding->operand = xchg1;
4940 static void
4941 swap_operands (void)
4943 switch (i.operands)
4945 case 5:
4946 case 4:
4947 swap_2_operands (1, i.operands - 2);
4948 /* Fall through. */
4949 case 3:
4950 case 2:
4951 swap_2_operands (0, i.operands - 1);
4952 break;
4953 default:
4954 abort ();
4957 if (i.mem_operands == 2)
4959 const seg_entry *temp_seg;
4960 temp_seg = i.seg[0];
4961 i.seg[0] = i.seg[1];
4962 i.seg[1] = temp_seg;
4966 /* Try to ensure constant immediates are represented in the smallest
4967 opcode possible. */
4968 static void
4969 optimize_imm (void)
4971 char guess_suffix = 0;
4972 int op;
4974 if (i.suffix)
4975 guess_suffix = i.suffix;
4976 else if (i.reg_operands)
4978 /* Figure out a suffix from the last register operand specified.
4979 We can't do this properly yet, ie. excluding InOutPortReg,
4980 but the following works for instructions with immediates.
4981 In any case, we can't set i.suffix yet. */
4982 for (op = i.operands; --op >= 0;)
4983 if (i.types[op].bitfield.reg && i.types[op].bitfield.byte)
4985 guess_suffix = BYTE_MNEM_SUFFIX;
4986 break;
4988 else if (i.types[op].bitfield.reg && i.types[op].bitfield.word)
4990 guess_suffix = WORD_MNEM_SUFFIX;
4991 break;
4993 else if (i.types[op].bitfield.reg && i.types[op].bitfield.dword)
4995 guess_suffix = LONG_MNEM_SUFFIX;
4996 break;
4998 else if (i.types[op].bitfield.reg && i.types[op].bitfield.qword)
5000 guess_suffix = QWORD_MNEM_SUFFIX;
5001 break;
5004 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5005 guess_suffix = WORD_MNEM_SUFFIX;
5007 for (op = i.operands; --op >= 0;)
5008 if (operand_type_check (i.types[op], imm))
5010 switch (i.op[op].imms->X_op)
5012 case O_constant:
5013 /* If a suffix is given, this operand may be shortened. */
5014 switch (guess_suffix)
5016 case LONG_MNEM_SUFFIX:
5017 i.types[op].bitfield.imm32 = 1;
5018 i.types[op].bitfield.imm64 = 1;
5019 break;
5020 case WORD_MNEM_SUFFIX:
5021 i.types[op].bitfield.imm16 = 1;
5022 i.types[op].bitfield.imm32 = 1;
5023 i.types[op].bitfield.imm32s = 1;
5024 i.types[op].bitfield.imm64 = 1;
5025 break;
5026 case BYTE_MNEM_SUFFIX:
5027 i.types[op].bitfield.imm8 = 1;
5028 i.types[op].bitfield.imm8s = 1;
5029 i.types[op].bitfield.imm16 = 1;
5030 i.types[op].bitfield.imm32 = 1;
5031 i.types[op].bitfield.imm32s = 1;
5032 i.types[op].bitfield.imm64 = 1;
5033 break;
5036 /* If this operand is at most 16 bits, convert it
5037 to a signed 16 bit number before trying to see
5038 whether it will fit in an even smaller size.
5039 This allows a 16-bit operand such as $0xffe0 to
5040 be recognised as within Imm8S range. */
5041 if ((i.types[op].bitfield.imm16)
5042 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5044 i.op[op].imms->X_add_number =
5045 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5047 #ifdef BFD64
5048 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5049 if ((i.types[op].bitfield.imm32)
5050 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5051 == 0))
5053 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5054 ^ ((offsetT) 1 << 31))
5055 - ((offsetT) 1 << 31));
5057 #endif
5058 i.types[op]
5059 = operand_type_or (i.types[op],
5060 smallest_imm_type (i.op[op].imms->X_add_number));
5062 /* We must avoid matching of Imm32 templates when 64bit
5063 only immediate is available. */
5064 if (guess_suffix == QWORD_MNEM_SUFFIX)
5065 i.types[op].bitfield.imm32 = 0;
5066 break;
5068 case O_absent:
5069 case O_register:
5070 abort ();
5072 /* Symbols and expressions. */
5073 default:
5074 /* Convert symbolic operand to proper sizes for matching, but don't
5075 prevent matching a set of insns that only supports sizes other
5076 than those matching the insn suffix. */
5078 i386_operand_type mask, allowed;
5079 const insn_template *t;
5081 operand_type_set (&mask, 0);
5082 operand_type_set (&allowed, 0);
5084 for (t = current_templates->start;
5085 t < current_templates->end;
5086 ++t)
5087 allowed = operand_type_or (allowed,
5088 t->operand_types[op]);
5089 switch (guess_suffix)
5091 case QWORD_MNEM_SUFFIX:
5092 mask.bitfield.imm64 = 1;
5093 mask.bitfield.imm32s = 1;
5094 break;
5095 case LONG_MNEM_SUFFIX:
5096 mask.bitfield.imm32 = 1;
5097 break;
5098 case WORD_MNEM_SUFFIX:
5099 mask.bitfield.imm16 = 1;
5100 break;
5101 case BYTE_MNEM_SUFFIX:
5102 mask.bitfield.imm8 = 1;
5103 break;
5104 default:
5105 break;
5107 allowed = operand_type_and (mask, allowed);
5108 if (!operand_type_all_zero (&allowed))
5109 i.types[op] = operand_type_and (i.types[op], mask);
5111 break;
5116 /* Try to use the smallest displacement type too. */
5117 static void
5118 optimize_disp (void)
5120 int op;
5122 for (op = i.operands; --op >= 0;)
5123 if (operand_type_check (i.types[op], disp))
5125 if (i.op[op].disps->X_op == O_constant)
5127 offsetT op_disp = i.op[op].disps->X_add_number;
5129 if (i.types[op].bitfield.disp16
5130 && (op_disp & ~(offsetT) 0xffff) == 0)
5132 /* If this operand is at most 16 bits, convert
5133 to a signed 16 bit number and don't use 64bit
5134 displacement. */
5135 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5136 i.types[op].bitfield.disp64 = 0;
5138 #ifdef BFD64
5139 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5140 if (i.types[op].bitfield.disp32
5141 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5143 /* If this operand is at most 32 bits, convert
5144 to a signed 32 bit number and don't use 64bit
5145 displacement. */
5146 op_disp &= (((offsetT) 2 << 31) - 1);
5147 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5148 i.types[op].bitfield.disp64 = 0;
5150 #endif
5151 if (!op_disp && i.types[op].bitfield.baseindex)
5153 i.types[op].bitfield.disp8 = 0;
5154 i.types[op].bitfield.disp16 = 0;
5155 i.types[op].bitfield.disp32 = 0;
5156 i.types[op].bitfield.disp32s = 0;
5157 i.types[op].bitfield.disp64 = 0;
5158 i.op[op].disps = 0;
5159 i.disp_operands--;
5161 else if (flag_code == CODE_64BIT)
5163 if (fits_in_signed_long (op_disp))
5165 i.types[op].bitfield.disp64 = 0;
5166 i.types[op].bitfield.disp32s = 1;
5168 if (i.prefix[ADDR_PREFIX]
5169 && fits_in_unsigned_long (op_disp))
5170 i.types[op].bitfield.disp32 = 1;
5172 if ((i.types[op].bitfield.disp32
5173 || i.types[op].bitfield.disp32s
5174 || i.types[op].bitfield.disp16)
5175 && fits_in_disp8 (op_disp))
5176 i.types[op].bitfield.disp8 = 1;
5178 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5179 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5181 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5182 i.op[op].disps, 0, i.reloc[op]);
5183 i.types[op].bitfield.disp8 = 0;
5184 i.types[op].bitfield.disp16 = 0;
5185 i.types[op].bitfield.disp32 = 0;
5186 i.types[op].bitfield.disp32s = 0;
5187 i.types[op].bitfield.disp64 = 0;
5189 else
5190 /* We only support 64bit displacement on constants. */
5191 i.types[op].bitfield.disp64 = 0;
5195 /* Return 1 if there is a match in broadcast bytes between operand
5196 GIVEN and instruction template T. */
5198 static INLINE int
5199 match_broadcast_size (const insn_template *t, unsigned int given)
5201 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5202 && i.types[given].bitfield.byte)
5203 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5204 && i.types[given].bitfield.word)
5205 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5206 && i.types[given].bitfield.dword)
5207 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5208 && i.types[given].bitfield.qword));
/* Validate the vector related aspects of the operands recorded in the
   global insn state `i' against template T.  In order, this looks at:
   the implicit AVX512VL requirement, vector index registers with and
   without VSIB addressing, the default mask, broadcast, masking,
   RC/SAE, and finally the scaling used for a compressed Disp8.
   Returns 0 when the operands are acceptable and 1, with i.error set
   to the reason, when they are not.  */
5211 /* Check if operands are valid for the instruction. */
5213 static int
5214 check_VecOperands (const insn_template *t)
5216 unsigned int op;
5217 i386_cpu_flags cpu;
5218 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
5220 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5221 any one operand are implicitly requiring AVX512VL support if the actual
5222 operand size is YMMword or XMMword. Since this function runs after
5223 template matching, there's no need to check for YMMword/XMMword in
5224 the template. */
5225 cpu = cpu_flags_and (t->cpu_flags, avx512);
5226 if (!cpu_flags_all_zero (&cpu)
5227 && !t->cpu_flags.bitfield.cpuavx512vl
5228 && !cpu_arch_flags.bitfield.cpuavx512vl)
5230 for (op = 0; op < t->operands; ++op)
5232 if (t->operand_types[op].bitfield.zmmword
5233 && (i.types[op].bitfield.ymmword
5234 || i.types[op].bitfield.xmmword))
5236 i.error = unsupported;
5237 return 1;
5242 /* Without VSIB byte, we can't have a vector register for index. */
5243 if (!t->opcode_modifier.vecsib
5244 && i.index_reg
5245 && (i.index_reg->reg_type.bitfield.xmmword
5246 || i.index_reg->reg_type.bitfield.ymmword
5247 || i.index_reg->reg_type.bitfield.zmmword))
5249 i.error = unsupported_vector_index_register;
5250 return 1;
5253 /* Check if default mask is allowed. */
5254 if (t->opcode_modifier.nodefmask
5255 && (!i.mask || i.mask->mask->reg_num == 0))
5257 i.error = no_default_mask;
5258 return 1;
5261 /* For VSIB byte, we need a vector register for index, and all vector
5262 registers must be distinct. */
5263 if (t->opcode_modifier.vecsib)
/* The index register must exist and have exactly the width the
   template's VSIB kind (128/256/512) calls for.  */
5265 if (!i.index_reg
5266 || !((t->opcode_modifier.vecsib == VecSIB128
5267 && i.index_reg->reg_type.bitfield.xmmword)
5268 || (t->opcode_modifier.vecsib == VecSIB256
5269 && i.index_reg->reg_type.bitfield.ymmword)
5270 || (t->opcode_modifier.vecsib == VecSIB512
5271 && i.index_reg->reg_type.bitfield.zmmword)))
5273 i.error = invalid_vsib_address;
5274 return 1;
/* A VSIB insn is expected to come either with two register operands
   or with a mask.  */
5277 gas_assert (i.reg_operands == 2 || i.mask);
5278 if (i.reg_operands == 2 && !i.mask)
/* Two registers and no mask: operands 0 and 2 are asserted to be
   XMM/YMM registers and, together with the index register, must be
   pairwise distinct.  */
5280 gas_assert (i.types[0].bitfield.regsimd);
5281 gas_assert (i.types[0].bitfield.xmmword
5282 || i.types[0].bitfield.ymmword);
5283 gas_assert (i.types[2].bitfield.regsimd);
5284 gas_assert (i.types[2].bitfield.xmmword
5285 || i.types[2].bitfield.ymmword);
/* NOTE: both `return 0' statements below leave the function at once,
   so none of the broadcast, masking, RC/SAE and Disp8 checks further
   down is run on these paths.  */
5286 if (operand_check == check_none)
5287 return 0;
5288 if (register_number (i.op[0].regs)
5289 != register_number (i.index_reg)
5290 && register_number (i.op[2].regs)
5291 != register_number (i.index_reg)
5292 && register_number (i.op[0].regs)
5293 != register_number (i.op[2].regs))
5294 return 0;
5295 if (operand_check == check_error)
5297 i.error = invalid_vector_register_set;
5298 return 1;
/* Reached only when operand_check is neither check_none nor
   check_error: warn and carry on with the remaining checks.  */
5300 as_warn (_("mask, index, and destination registers should be distinct"));
5302 else if (i.reg_operands == 1 && i.mask)
/* One register plus a mask: if operand 1 is a vector register it must
   not be the index register.  */
5304 if (i.types[1].bitfield.regsimd
5305 && (i.types[1].bitfield.xmmword
5306 || i.types[1].bitfield.ymmword
5307 || i.types[1].bitfield.zmmword)
5308 && (register_number (i.op[1].regs)
5309 == register_number (i.index_reg)))
5311 if (operand_check == check_error)
5313 i.error = invalid_vector_register_set;
5314 return 1;
5316 if (operand_check != check_none)
5317 as_warn (_("index and destination registers should be distinct"));
5322 /* Check if broadcast is supported by the instruction and is applied
5323 to the memory operand. */
5324 if (i.broadcast)
5326 i386_operand_type type, overlap;
5328 /* Check if specified broadcast is supported in this instruction,
5329 and its broadcast bytes match the memory operand. */
5330 op = i.broadcast->operand;
5331 if (!t->opcode_modifier.broadcast
5332 || !(i.flags[op] & Operand_Mem)
5333 || (!i.types[op].bitfield.unspecified
5334 && !match_broadcast_size (t, op)))
/* Shared error exit for every broadcast related failure below.  */
5336 bad_broadcast:
5337 i.error = unsupported_broadcast;
5338 return 1;
/* Size in bytes of the broadcast result: (1 << (broadcast - 1)) times
   i.broadcast->type.
   NOTE(review): presumably the first factor is the element size in
   bytes and i.broadcast->type the element count -- confirm.  */
5341 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5342 * i.broadcast->type);
/* Express that byte count as an operand size so that it can be
   matched against what the template accepts for this operand.  */
5343 operand_type_set (&type, 0);
5344 switch (i.broadcast->bytes)
5346 case 2:
5347 type.bitfield.word = 1;
5348 break;
5349 case 4:
5350 type.bitfield.dword = 1;
5351 break;
5352 case 8:
5353 type.bitfield.qword = 1;
5354 break;
5355 case 16:
5356 type.bitfield.xmmword = 1;
5357 break;
5358 case 32:
5359 type.bitfield.ymmword = 1;
5360 break;
5361 case 64:
5362 type.bitfield.zmmword = 1;
5363 break;
5364 default:
5365 goto bad_broadcast;
5368 overlap = operand_type_and (type, t->operand_types[op]);
5369 if (operand_type_all_zero (&overlap))
5370 goto bad_broadcast;
5372 if (t->opcode_modifier.checkregsize)
/* Every other operand has to pass operand_type_register_match when
   paired with the size computed for the broadcast operand.  */
5374 unsigned int j;
5376 type.bitfield.baseindex = 1;
5377 for (j = 0; j < i.operands; ++j)
5379 if (j != op
5380 && !operand_type_register_match(i.types[j],
5381 t->operand_types[j],
5382 type,
5383 t->operand_types[op]))
5384 goto bad_broadcast;
5388 /* If broadcast is supported in this instruction, we need to check if
5389 operand of one-element size isn't specified without broadcast. */
5390 else if (t->opcode_modifier.broadcast && i.mem_operands)
5392 /* Find memory operand. */
5393 for (op = 0; op < i.operands; op++)
5394 if (operand_type_check (i.types[op], anymem))
5395 break;
5396 gas_assert (op < i.operands);
5397 /* Check size of the memory operand. */
5398 if (match_broadcast_size (t, op))
5400 i.error = broadcast_needed;
5401 return 1;
5404 else
5405 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5407 /* Check if requested masking is supported. */
5408 if (i.mask)
5410 switch (t->opcode_modifier.masking)
5412 case BOTH_MASKING:
5413 break;
5414 case MERGING_MASKING:
/* The `case 0' label sits inside the body of this `if' on purpose:
   a template whose masking field is 0 shares the error exit with a
   zeroing request made on a merging-only template.  */
5415 if (i.mask->zeroing)
5417 case 0:
5418 i.error = unsupported_masking;
5419 return 1;
5421 break;
5422 case DYNAMIC_MASKING:
5423 /* Memory destinations allow only merging masking. */
5424 if (i.mask->zeroing && i.mem_operands)
5426 /* Find memory operand. */
5427 for (op = 0; op < i.operands; op++)
5428 if (i.flags[op] & Operand_Mem)
5429 break;
5430 gas_assert (op < i.operands);
/* Zeroing is refused when the memory operand is the last operand.  */
5431 if (op == i.operands - 1)
5433 i.error = unsupported_masking;
5434 return 1;
5437 break;
5438 default:
5439 abort ();
5443 /* Check if masking is applied to dest operand. */
5444 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5446 i.error = mask_not_on_destination;
5447 return 1;
5450 /* Check RC/SAE. */
5451 if (i.rounding)
/* A specifier other than saeonly needs a template with staticrounding;
   saeonly needs a template with sae and without staticrounding.  */
5453 if ((i.rounding->type != saeonly
5454 && !t->opcode_modifier.staticrounding)
5455 || (i.rounding->type == saeonly
5456 && (t->opcode_modifier.staticrounding
5457 || !t->opcode_modifier.sae)))
5459 i.error = unsupported_rc_sae;
5460 return 1;
5462 /* If the instruction has several immediate operands and one of
5463 them is rounding, the rounding operand should be the last
5464 immediate operand. */
5465 if (i.imm_operands > 1
5466 && i.rounding->operand != (int) (i.imm_operands - 1))
5468 i.error = rc_sae_operand_not_last_imm;
5469 return 1;
5473 /* Check vector Disp8 operand. */
5474 if (t->opcode_modifier.disp8memshift
5475 && i.disp_encoding != disp_encoding_32bit)
/* Pick i.memshift: from the broadcast element size when broadcasting,
   from the template when it gives a fixed shift, and otherwise (the
   DISP8_SHIFT_VL case) from the operand sizes as worked out below.  */
5477 if (i.broadcast)
5478 i.memshift = t->opcode_modifier.broadcast - 1;
5479 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5480 i.memshift = t->opcode_modifier.disp8memshift;
5481 else
5483 const i386_operand_type *type = NULL;
5485 i.memshift = 0;
5486 for (op = 0; op < i.operands; op++)
5487 if (operand_type_check (i.types[op], anymem))
/* Memory operand: for EVEXLIG templates the shift is 2, or 3 with a
   `q' suffix.  Otherwise remember which type describes its size: the
   template's when it allows at most one of XMM/YMM/ZMMword, else the
   parsed operand's if it has a specified size.  */
5489 if (t->opcode_modifier.evex == EVEXLIG)
5490 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5491 else if (t->operand_types[op].bitfield.xmmword
5492 + t->operand_types[op].bitfield.ymmword
5493 + t->operand_types[op].bitfield.zmmword <= 1)
5494 type = &t->operand_types[op];
5495 else if (!i.types[op].bitfield.unspecified)
5496 type = &i.types[op];
5498 else if (i.types[op].bitfield.regsimd
5499 && t->opcode_modifier.evex != EVEXLIG)
/* Vector register operand: keep the largest shift seen so far
   (4 for XMM, 5 for YMM, 6 for ZMM).  */
5501 if (i.types[op].bitfield.zmmword)
5502 i.memshift = 6;
5503 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5504 i.memshift = 5;
5505 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5506 i.memshift = 4;
/* A size taken from the memory operand overrides whatever the register
   operands suggested.  */
5509 if (type)
5511 if (type->bitfield.zmmword)
5512 i.memshift = 6;
5513 else if (type->bitfield.ymmword)
5514 i.memshift = 5;
5515 else if (type->bitfield.xmmword)
5516 i.memshift = 4;
5519 /* For the check in fits_in_disp8(). */
5520 if (i.memshift == 0)
5521 i.memshift = -1;
/* The first constant displacement that fits into a Disp8 settles the
   matter: it is marked Disp8 and the function returns with i.memshift
   left in place.  Constant displacements that do not fit lose Disp8.  */
5524 for (op = 0; op < i.operands; op++)
5525 if (operand_type_check (i.types[op], disp)
5526 && i.op[op].disps->X_op == O_constant)
5528 if (fits_in_disp8 (i.op[op].disps->X_add_number))
5530 i.types[op].bitfield.disp8 = 1;
5531 return 0;
5533 i.types[op].bitfield.disp8 = 0;
/* Reached when the Disp8 block above was skipped or found no constant
   displacement that fits: reset i.memshift to 0.  */
5537 i.memshift = 0;
5539 return 0;
5542 /* Check if operands are valid for the instruction. Update VEX
5543 operand types. */
5545 static int
5546 VEX_check_operands (const insn_template *t)
5548 if (i.vec_encoding == vex_encoding_evex)
5550 /* This instruction must be encoded with EVEX prefix. */
5551 if (!is_evex_encoding (t))
5553 i.error = unsupported;
5554 return 1;
5556 return 0;
5559 if (!t->opcode_modifier.vex)
5561 /* This instruction template doesn't have VEX prefix. */
5562 if (i.vec_encoding != vex_encoding_default)
5564 i.error = unsupported;
5565 return 1;
5567 return 0;
5570 /* Only check VEX_Imm4, which must be the first operand. */
5571 if (t->operand_types[0].bitfield.vec_imm4)
5573 if (i.op[0].imms->X_op != O_constant
5574 || !fits_in_imm4 (i.op[0].imms->X_add_number))
5576 i.error = bad_imm4;
5577 return 1;
5580 /* Turn off Imm8 so that update_imm won't complain. */
5581 i.types[0] = vec_imm4;
5584 return 0;
5587 static const insn_template *
5588 match_template (char mnem_suffix)
5590 /* Points to template once we've found it. */
5591 const insn_template *t;
5592 i386_operand_type overlap0, overlap1, overlap2, overlap3;
5593 i386_operand_type overlap4;
5594 unsigned int found_reverse_match;
5595 i386_opcode_modifier suffix_check, mnemsuf_check;
5596 i386_operand_type operand_types [MAX_OPERANDS];
5597 int addr_prefix_disp;
5598 unsigned int j;
5599 unsigned int found_cpu_match, size_match;
5600 unsigned int check_register;
5601 enum i386_error specific_error = 0;
5603 #if MAX_OPERANDS != 5
5604 # error "MAX_OPERANDS must be 5."
5605 #endif
5607 found_reverse_match = 0;
5608 addr_prefix_disp = -1;
5610 memset (&suffix_check, 0, sizeof (suffix_check));
5611 if (intel_syntax && i.broadcast)
5612 /* nothing */;
5613 else if (i.suffix == BYTE_MNEM_SUFFIX)
5614 suffix_check.no_bsuf = 1;
5615 else if (i.suffix == WORD_MNEM_SUFFIX)
5616 suffix_check.no_wsuf = 1;
5617 else if (i.suffix == SHORT_MNEM_SUFFIX)
5618 suffix_check.no_ssuf = 1;
5619 else if (i.suffix == LONG_MNEM_SUFFIX)
5620 suffix_check.no_lsuf = 1;
5621 else if (i.suffix == QWORD_MNEM_SUFFIX)
5622 suffix_check.no_qsuf = 1;
5623 else if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5624 suffix_check.no_ldsuf = 1;
5626 memset (&mnemsuf_check, 0, sizeof (mnemsuf_check));
5627 if (intel_syntax)
5629 switch (mnem_suffix)
5631 case BYTE_MNEM_SUFFIX: mnemsuf_check.no_bsuf = 1; break;
5632 case WORD_MNEM_SUFFIX: mnemsuf_check.no_wsuf = 1; break;
5633 case SHORT_MNEM_SUFFIX: mnemsuf_check.no_ssuf = 1; break;
5634 case LONG_MNEM_SUFFIX: mnemsuf_check.no_lsuf = 1; break;
5635 case QWORD_MNEM_SUFFIX: mnemsuf_check.no_qsuf = 1; break;
5639 /* Must have right number of operands. */
5640 i.error = number_of_operands_mismatch;
5642 for (t = current_templates->start; t < current_templates->end; t++)
5644 addr_prefix_disp = -1;
5645 found_reverse_match = 0;
5647 if (i.operands != t->operands)
5648 continue;
5650 /* Check processor support. */
5651 i.error = unsupported;
5652 found_cpu_match = (cpu_flags_match (t)
5653 == CPU_FLAGS_PERFECT_MATCH);
5654 if (!found_cpu_match)
5655 continue;
5657 /* Check AT&T mnemonic. */
5658 i.error = unsupported_with_intel_mnemonic;
5659 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5660 continue;
5662 /* Check AT&T/Intel syntax and Intel64/AMD64 ISA. */
5663 i.error = unsupported_syntax;
5664 if ((intel_syntax && t->opcode_modifier.attsyntax)
5665 || (!intel_syntax && t->opcode_modifier.intelsyntax)
5666 || (intel64 && t->opcode_modifier.amd64)
5667 || (!intel64 && t->opcode_modifier.intel64))
5668 continue;
5670 /* Check the suffix, except for some instructions in intel mode. */
5671 i.error = invalid_instruction_suffix;
5672 if ((!intel_syntax || !t->opcode_modifier.ignoresize)
5673 && ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5674 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5675 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5676 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5677 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5678 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf)))
5679 continue;
5680 /* In Intel mode all mnemonic suffixes must be explicitly allowed. */
5681 if ((t->opcode_modifier.no_bsuf && mnemsuf_check.no_bsuf)
5682 || (t->opcode_modifier.no_wsuf && mnemsuf_check.no_wsuf)
5683 || (t->opcode_modifier.no_lsuf && mnemsuf_check.no_lsuf)
5684 || (t->opcode_modifier.no_ssuf && mnemsuf_check.no_ssuf)
5685 || (t->opcode_modifier.no_qsuf && mnemsuf_check.no_qsuf)
5686 || (t->opcode_modifier.no_ldsuf && mnemsuf_check.no_ldsuf))
5687 continue;
5689 size_match = operand_size_match (t);
5690 if (!size_match)
5691 continue;
5693 for (j = 0; j < MAX_OPERANDS; j++)
5694 operand_types[j] = t->operand_types[j];
5696 /* In general, don't allow 64-bit operands in 32-bit mode. */
5697 if (i.suffix == QWORD_MNEM_SUFFIX
5698 && flag_code != CODE_64BIT
5699 && (intel_syntax
5700 ? (!t->opcode_modifier.ignoresize
5701 && !t->opcode_modifier.broadcast
5702 && !intel_float_operand (t->name))
5703 : intel_float_operand (t->name) != 2)
5704 && ((!operand_types[0].bitfield.regmmx
5705 && !operand_types[0].bitfield.regsimd)
5706 || (!operand_types[t->operands > 1].bitfield.regmmx
5707 && !operand_types[t->operands > 1].bitfield.regsimd))
5708 && (t->base_opcode != 0x0fc7
5709 || t->extension_opcode != 1 /* cmpxchg8b */))
5710 continue;
5712 /* In general, don't allow 32-bit operands on pre-386. */
5713 else if (i.suffix == LONG_MNEM_SUFFIX
5714 && !cpu_arch_flags.bitfield.cpui386
5715 && (intel_syntax
5716 ? (!t->opcode_modifier.ignoresize
5717 && !intel_float_operand (t->name))
5718 : intel_float_operand (t->name) != 2)
5719 && ((!operand_types[0].bitfield.regmmx
5720 && !operand_types[0].bitfield.regsimd)
5721 || (!operand_types[t->operands > 1].bitfield.regmmx
5722 && !operand_types[t->operands > 1].bitfield.regsimd)))
5723 continue;
5725 /* Do not verify operands when there are none. */
5726 else
5728 if (!t->operands)
5729 /* We've found a match; break out of loop. */
5730 break;
5733 /* Address size prefix will turn Disp64/Disp32/Disp16 operand
5734 into Disp32/Disp16/Disp32 operand. */
5735 if (i.prefix[ADDR_PREFIX] != 0)
5737 /* There should be only one Disp operand. */
5738 switch (flag_code)
5740 case CODE_16BIT:
5741 for (j = 0; j < MAX_OPERANDS; j++)
5743 if (operand_types[j].bitfield.disp16)
5745 addr_prefix_disp = j;
5746 operand_types[j].bitfield.disp32 = 1;
5747 operand_types[j].bitfield.disp16 = 0;
5748 break;
5751 break;
5752 case CODE_32BIT:
5753 for (j = 0; j < MAX_OPERANDS; j++)
5755 if (operand_types[j].bitfield.disp32)
5757 addr_prefix_disp = j;
5758 operand_types[j].bitfield.disp32 = 0;
5759 operand_types[j].bitfield.disp16 = 1;
5760 break;
5763 break;
5764 case CODE_64BIT:
5765 for (j = 0; j < MAX_OPERANDS; j++)
5767 if (operand_types[j].bitfield.disp64)
5769 addr_prefix_disp = j;
5770 operand_types[j].bitfield.disp64 = 0;
5771 operand_types[j].bitfield.disp32 = 1;
5772 break;
5775 break;
5779 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
5780 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5781 continue;
5783 /* We check register size if needed. */
5784 if (t->opcode_modifier.checkregsize)
5786 check_register = (1 << t->operands) - 1;
5787 if (i.broadcast)
5788 check_register &= ~(1 << i.broadcast->operand);
5790 else
5791 check_register = 0;
5793 overlap0 = operand_type_and (i.types[0], operand_types[0]);
5794 switch (t->operands)
5796 case 1:
5797 if (!operand_type_match (overlap0, i.types[0]))
5798 continue;
5799 break;
5800 case 2:
5801 /* xchg %eax, %eax is a special case. It is an alias for nop
5802 only in 32bit mode and we can use opcode 0x90. In 64bit
5803 mode, we can't use 0x90 for xchg %eax, %eax since it should
5804 zero-extend %eax to %rax. */
5805 if (flag_code == CODE_64BIT
5806 && t->base_opcode == 0x90
5807 && operand_type_equal (&i.types [0], &acc32)
5808 && operand_type_equal (&i.types [1], &acc32))
5809 continue;
5810 /* xrelease mov %eax, <disp> is another special case. It must not
5811 match the accumulator-only encoding of mov. */
5812 if (flag_code != CODE_64BIT
5813 && i.hle_prefix
5814 && t->base_opcode == 0xa0
5815 && i.types[0].bitfield.acc
5816 && operand_type_check (i.types[1], anymem))
5817 continue;
5818 /* Fall through. */
5820 case 3:
5821 if (!(size_match & MATCH_STRAIGHT))
5822 goto check_reverse;
5823 /* Reverse direction of operands if swapping is possible in the first
5824 place (operands need to be symmetric) and
5825 - the load form is requested, and the template is a store form,
5826 - the store form is requested, and the template is a load form,
5827 - the non-default (swapped) form is requested. */
5828 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5829 if (t->opcode_modifier.d && i.reg_operands == i.operands
5830 && !operand_type_all_zero (&overlap1))
5831 switch (i.dir_encoding)
5833 case dir_encoding_load:
5834 if (operand_type_check (operand_types[i.operands - 1], anymem)
5835 || operand_types[i.operands - 1].bitfield.regmem)
5836 goto check_reverse;
5837 break;
5839 case dir_encoding_store:
5840 if (!operand_type_check (operand_types[i.operands - 1], anymem)
5841 && !operand_types[i.operands - 1].bitfield.regmem)
5842 goto check_reverse;
5843 break;
5845 case dir_encoding_swap:
5846 goto check_reverse;
5848 case dir_encoding_default:
5849 break;
5851 /* If we want store form, we skip the current load. */
5852 if ((i.dir_encoding == dir_encoding_store
5853 || i.dir_encoding == dir_encoding_swap)
5854 && i.mem_operands == 0
5855 && t->opcode_modifier.load)
5856 continue;
5857 /* Fall through. */
5858 case 4:
5859 case 5:
5860 overlap1 = operand_type_and (i.types[1], operand_types[1]);
5861 if (!operand_type_match (overlap0, i.types[0])
5862 || !operand_type_match (overlap1, i.types[1])
5863 || ((check_register & 3) == 3
5864 && !operand_type_register_match (i.types[0],
5865 operand_types[0],
5866 i.types[1],
5867 operand_types[1])))
5869 /* Check if other direction is valid ... */
5870 if (!t->opcode_modifier.d)
5871 continue;
5873 check_reverse:
5874 if (!(size_match & MATCH_REVERSE))
5875 continue;
5876 /* Try reversing direction of operands. */
5877 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
5878 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
5879 if (!operand_type_match (overlap0, i.types[0])
5880 || !operand_type_match (overlap1, i.types[i.operands - 1])
5881 || (check_register
5882 && !operand_type_register_match (i.types[0],
5883 operand_types[i.operands - 1],
5884 i.types[i.operands - 1],
5885 operand_types[0])))
5887 /* Does not match either direction. */
5888 continue;
5890 /* found_reverse_match holds which of D or FloatR
5891 we've found. */
5892 if (!t->opcode_modifier.d)
5893 found_reverse_match = 0;
5894 else if (operand_types[0].bitfield.tbyte)
5895 found_reverse_match = Opcode_FloatD;
5896 else if (operand_types[0].bitfield.xmmword
5897 || operand_types[i.operands - 1].bitfield.xmmword
5898 || operand_types[0].bitfield.regmmx
5899 || operand_types[i.operands - 1].bitfield.regmmx
5900 || is_any_vex_encoding(t))
5901 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
5902 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
5903 else
5904 found_reverse_match = Opcode_D;
5905 if (t->opcode_modifier.floatr)
5906 found_reverse_match |= Opcode_FloatR;
5908 else
5910 /* Found a forward 2 operand match here. */
5911 switch (t->operands)
5913 case 5:
5914 overlap4 = operand_type_and (i.types[4],
5915 operand_types[4]);
5916 /* Fall through. */
5917 case 4:
5918 overlap3 = operand_type_and (i.types[3],
5919 operand_types[3]);
5920 /* Fall through. */
5921 case 3:
5922 overlap2 = operand_type_and (i.types[2],
5923 operand_types[2]);
5924 break;
5927 switch (t->operands)
5929 case 5:
5930 if (!operand_type_match (overlap4, i.types[4])
5931 || !operand_type_register_match (i.types[3],
5932 operand_types[3],
5933 i.types[4],
5934 operand_types[4]))
5935 continue;
5936 /* Fall through. */
5937 case 4:
5938 if (!operand_type_match (overlap3, i.types[3])
5939 || ((check_register & 0xa) == 0xa
5940 && !operand_type_register_match (i.types[1],
5941 operand_types[1],
5942 i.types[3],
5943 operand_types[3]))
5944 || ((check_register & 0xc) == 0xc
5945 && !operand_type_register_match (i.types[2],
5946 operand_types[2],
5947 i.types[3],
5948 operand_types[3])))
5949 continue;
5950 /* Fall through. */
5951 case 3:
5952 /* Here we make use of the fact that there are no
5953 reverse match 3 operand instructions. */
5954 if (!operand_type_match (overlap2, i.types[2])
5955 || ((check_register & 5) == 5
5956 && !operand_type_register_match (i.types[0],
5957 operand_types[0],
5958 i.types[2],
5959 operand_types[2]))
5960 || ((check_register & 6) == 6
5961 && !operand_type_register_match (i.types[1],
5962 operand_types[1],
5963 i.types[2],
5964 operand_types[2])))
5965 continue;
5966 break;
5969 /* Found either forward/reverse 2, 3 or 4 operand match here:
5970 slip through to break. */
5972 if (!found_cpu_match)
5973 continue;
5975 /* Check if vector and VEX operands are valid. */
5976 if (check_VecOperands (t) || VEX_check_operands (t))
5978 specific_error = i.error;
5979 continue;
5982 /* We've found a match; break out of loop. */
5983 break;
5986 if (t == current_templates->end)
5988 /* We found no match. */
5989 const char *err_msg;
5990 switch (specific_error ? specific_error : i.error)
5992 default:
5993 abort ();
5994 case operand_size_mismatch:
5995 err_msg = _("operand size mismatch");
5996 break;
5997 case operand_type_mismatch:
5998 err_msg = _("operand type mismatch");
5999 break;
6000 case register_type_mismatch:
6001 err_msg = _("register type mismatch");
6002 break;
6003 case number_of_operands_mismatch:
6004 err_msg = _("number of operands mismatch");
6005 break;
6006 case invalid_instruction_suffix:
6007 err_msg = _("invalid instruction suffix");
6008 break;
6009 case bad_imm4:
6010 err_msg = _("constant doesn't fit in 4 bits");
6011 break;
6012 case unsupported_with_intel_mnemonic:
6013 err_msg = _("unsupported with Intel mnemonic");
6014 break;
6015 case unsupported_syntax:
6016 err_msg = _("unsupported syntax");
6017 break;
6018 case unsupported:
6019 as_bad (_("unsupported instruction `%s'"),
6020 current_templates->start->name);
6021 return NULL;
6022 case invalid_vsib_address:
6023 err_msg = _("invalid VSIB address");
6024 break;
6025 case invalid_vector_register_set:
6026 err_msg = _("mask, index, and destination registers must be distinct");
6027 break;
6028 case unsupported_vector_index_register:
6029 err_msg = _("unsupported vector index register");
6030 break;
6031 case unsupported_broadcast:
6032 err_msg = _("unsupported broadcast");
6033 break;
6034 case broadcast_needed:
6035 err_msg = _("broadcast is needed for operand of such type");
6036 break;
6037 case unsupported_masking:
6038 err_msg = _("unsupported masking");
6039 break;
6040 case mask_not_on_destination:
6041 err_msg = _("mask not on destination operand");
6042 break;
6043 case no_default_mask:
6044 err_msg = _("default mask isn't allowed");
6045 break;
6046 case unsupported_rc_sae:
6047 err_msg = _("unsupported static rounding/sae");
6048 break;
6049 case rc_sae_operand_not_last_imm:
6050 if (intel_syntax)
6051 err_msg = _("RC/SAE operand must precede immediate operands");
6052 else
6053 err_msg = _("RC/SAE operand must follow immediate operands");
6054 break;
6055 case invalid_register_operand:
6056 err_msg = _("invalid register operand");
6057 break;
6059 as_bad (_("%s for `%s'"), err_msg,
6060 current_templates->start->name);
6061 return NULL;
6064 if (!quiet_warnings)
6066 if (!intel_syntax
6067 && (i.types[0].bitfield.jumpabsolute
6068 != operand_types[0].bitfield.jumpabsolute))
6070 as_warn (_("indirect %s without `*'"), t->name);
6073 if (t->opcode_modifier.isprefix
6074 && t->opcode_modifier.ignoresize)
6076 /* Warn them that a data or address size prefix doesn't
6077 affect assembly of the next line of code. */
6078 as_warn (_("stand-alone `%s' prefix"), t->name);
6082 /* Copy the template we found. */
6083 i.tm = *t;
6085 if (addr_prefix_disp != -1)
6086 i.tm.operand_types[addr_prefix_disp]
6087 = operand_types[addr_prefix_disp];
6089 if (found_reverse_match)
6091 /* If we found a reverse match we must alter the opcode
6092 direction bit. found_reverse_match holds bits to change
6093 (different for int & float insns). */
6095 i.tm.base_opcode ^= found_reverse_match;
6097 i.tm.operand_types[0] = operand_types[i.operands - 1];
6098 i.tm.operand_types[i.operands - 1] = operand_types[0];
6101 return t;
6104 static int
6105 check_string (void)
6107 int mem_op = operand_type_check (i.types[0], anymem) ? 0 : 1;
6108 if (i.tm.operand_types[mem_op].bitfield.esseg)
6110 if (i.seg[0] != NULL && i.seg[0] != &es)
6112 as_bad (_("`%s' operand %d must use `%ses' segment"),
6113 i.tm.name,
6114 mem_op + 1,
6115 register_prefix);
6116 return 0;
6118 /* There's only ever one segment override allowed per instruction.
6119 This instruction possibly has a legal segment override on the
6120 second operand, so copy the segment to where non-string
6121 instructions store it, allowing common code. */
6122 i.seg[0] = i.seg[1];
6124 else if (i.tm.operand_types[mem_op + 1].bitfield.esseg)
6126 if (i.seg[1] != NULL && i.seg[1] != &es)
6128 as_bad (_("`%s' operand %d must use `%ses' segment"),
6129 i.tm.name,
6130 mem_op + 2,
6131 register_prefix);
6132 return 0;
6135 return 1;
/* Settle the operand-size suffix (i.suffix) for the matched template in
   i.tm and apply its consequences.  The suffix comes, in order of
   preference, from the template's explicit size modifier, from the
   register operands, from stackop_size for defaultsize templates, or
   (Intel syntax only) from the current code size.  Register operands
   are validated against an explicit suffix via the check_*_reg helpers.
   Afterwards the opcode, the operand/address size prefixes and REX.W in
   i.rex are adjusted to match.  Returns 1 on success and 0 once an
   error has been reported or add_prefix has failed.  */
6138 static int
6139 process_suffix (void)
6141 /* If matched instruction specifies an explicit instruction mnemonic
6142 suffix, use it. */
6143 if (i.tm.opcode_modifier.size == SIZE16)
6144 i.suffix = WORD_MNEM_SUFFIX;
6145 else if (i.tm.opcode_modifier.size == SIZE32)
6146 i.suffix = LONG_MNEM_SUFFIX;
6147 else if (i.tm.opcode_modifier.size == SIZE64)
6148 i.suffix = QWORD_MNEM_SUFFIX;
6149 else if (i.reg_operands)
6151 /* If there's no instruction mnemonic suffix we try to invent one
6152 based on register operands. */
6153 if (!i.suffix)
6155 /* We take i.suffix from the last register operand specified,
6156 Destination register type is more significant than source
6157 register type. crc32 in SSE4.2 prefers source register
6158 type. */
6159 if (i.tm.base_opcode == 0xf20f38f0 && i.types[0].bitfield.reg)
6161 if (i.types[0].bitfield.byte)
6162 i.suffix = BYTE_MNEM_SUFFIX;
6163 else if (i.types[0].bitfield.word)
6164 i.suffix = WORD_MNEM_SUFFIX;
6165 else if (i.types[0].bitfield.dword)
6166 i.suffix = LONG_MNEM_SUFFIX;
6167 else if (i.types[0].bitfield.qword)
6168 i.suffix = QWORD_MNEM_SUFFIX;
6171 if (!i.suffix)
6173 int op;
6175 if (i.tm.base_opcode == 0xf20f38f0)
6177 /* We have to know the operand size for crc32. */
6178 as_bad (_("ambiguous memory operand size for `%s`"),
6179 i.tm.name);
6180 return 0;
/* Scan operands from last to first and take the size of the first
   general register found, ignoring operands the template marks as an
   I/O port register or a shift count.  */
6183 for (op = i.operands; --op >= 0;)
6184 if (!i.tm.operand_types[op].bitfield.inoutportreg
6185 && !i.tm.operand_types[op].bitfield.shiftcount)
6187 if (!i.types[op].bitfield.reg)
6188 continue;
6189 if (i.types[op].bitfield.byte)
6190 i.suffix = BYTE_MNEM_SUFFIX;
6191 else if (i.types[op].bitfield.word)
6192 i.suffix = WORD_MNEM_SUFFIX;
6193 else if (i.types[op].bitfield.dword)
6194 i.suffix = LONG_MNEM_SUFFIX;
6195 else if (i.types[op].bitfield.qword)
6196 i.suffix = QWORD_MNEM_SUFFIX;
6197 else
6198 continue;
6199 break;
/* A suffix was given explicitly.  In Intel syntax it is dropped when
   the template ignores operand size and does not accept that suffix;
   otherwise the register operands are checked against it.  */
6203 else if (i.suffix == BYTE_MNEM_SUFFIX)
6205 if (intel_syntax
6206 && i.tm.opcode_modifier.ignoresize
6207 && i.tm.opcode_modifier.no_bsuf)
6208 i.suffix = 0;
6209 else if (!check_byte_reg ())
6210 return 0;
6212 else if (i.suffix == LONG_MNEM_SUFFIX)
6214 if (intel_syntax
6215 && i.tm.opcode_modifier.ignoresize
6216 && i.tm.opcode_modifier.no_lsuf
6217 && !i.tm.opcode_modifier.todword
6218 && !i.tm.opcode_modifier.toqword)
6219 i.suffix = 0;
6220 else if (!check_long_reg ())
6221 return 0;
6223 else if (i.suffix == QWORD_MNEM_SUFFIX)
6225 if (intel_syntax
6226 && i.tm.opcode_modifier.ignoresize
6227 && i.tm.opcode_modifier.no_qsuf
6228 && !i.tm.opcode_modifier.todword
6229 && !i.tm.opcode_modifier.toqword)
6230 i.suffix = 0;
6231 else if (!check_qword_reg ())
6232 return 0;
6234 else if (i.suffix == WORD_MNEM_SUFFIX)
6236 if (intel_syntax
6237 && i.tm.opcode_modifier.ignoresize
6238 && i.tm.opcode_modifier.no_wsuf)
6239 i.suffix = 0;
6240 else if (!check_word_reg ())
6241 return 0;
6243 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6244 /* Do nothing if the instruction is going to ignore the prefix. */
6246 else
6247 abort ();
6249 else if (i.tm.opcode_modifier.defaultsize
6250 && !i.suffix
6251 /* exclude fldenv/frstor/fsave/fstenv */
6252 && i.tm.opcode_modifier.no_ssuf)
6254 if (stackop_size == LONG_MNEM_SUFFIX
6255 && i.tm.base_opcode == 0xcf)
6257 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6258 .code16gcc directive to support 16-bit mode with
6259 32-bit address. For IRET without a suffix, generate
6260 16-bit IRET (opcode 0xcf) to return from an interrupt
6261 handler. */
6262 i.suffix = WORD_MNEM_SUFFIX;
6263 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6265 else
6266 i.suffix = stackop_size;
/* Intel syntax with no suffix: for absolute jumps, jumpbyte and
   inter-segment jump templates, and [ls][gi]dt, choose the suffix that
   matches the current code size unless the template rejects it.  In
   64-bit mode a template that rejects the `q' suffix falls through to
   the 32-bit choice.  */
6268 else if (intel_syntax
6269 && !i.suffix
6270 && (i.tm.operand_types[0].bitfield.jumpabsolute
6271 || i.tm.opcode_modifier.jumpbyte
6272 || i.tm.opcode_modifier.jumpintersegment
6273 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6274 && i.tm.extension_opcode <= 3)))
6276 switch (flag_code)
6278 case CODE_64BIT:
6279 if (!i.tm.opcode_modifier.no_qsuf)
6281 i.suffix = QWORD_MNEM_SUFFIX;
6282 break;
6284 /* Fall through. */
6285 case CODE_32BIT:
6286 if (!i.tm.opcode_modifier.no_lsuf)
6287 i.suffix = LONG_MNEM_SUFFIX;
6288 break;
6289 case CODE_16BIT:
6290 if (!i.tm.opcode_modifier.no_wsuf)
6291 i.suffix = WORD_MNEM_SUFFIX;
6292 break;
/* Still no suffix at this point: reject the instruction if its operand
   size cannot be determined.  */
6296 if (!i.suffix)
6298 if (!intel_syntax)
6300 if (i.tm.opcode_modifier.w)
6302 as_bad (_("no instruction mnemonic suffix given and "
6303 "no register operands; can't size instruction"));
6304 return 0;
6307 else
6309 unsigned int suffixes;
/* Build a bit mask with one bit per suffix the template accepts.  */
6311 suffixes = !i.tm.opcode_modifier.no_bsuf;
6312 if (!i.tm.opcode_modifier.no_wsuf)
6313 suffixes |= 1 << 1;
6314 if (!i.tm.opcode_modifier.no_lsuf)
6315 suffixes |= 1 << 2;
6316 if (!i.tm.opcode_modifier.no_ldsuf)
6317 suffixes |= 1 << 3;
6318 if (!i.tm.opcode_modifier.no_ssuf)
6319 suffixes |= 1 << 4;
6320 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6321 suffixes |= 1 << 5;
/* (suffixes & (suffixes - 1)) is nonzero exactly when more than one
   bit is set in the mask.  */
6323 /* There is more than one suffix match. */
6324 if (i.tm.opcode_modifier.w
6325 || ((suffixes & (suffixes - 1))
6326 && !i.tm.opcode_modifier.defaultsize
6327 && !i.tm.opcode_modifier.ignoresize))
6329 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6330 return 0;
6335 /* Change the opcode based on the operand size given by i.suffix. */
6336 switch (i.suffix)
6338 /* Size floating point instruction. */
6339 case LONG_MNEM_SUFFIX:
6340 if (i.tm.opcode_modifier.floatmf)
/* floatmf templates only need bit 2 of the opcode flipped; nothing
   else in this switch applies to them.  */
6342 i.tm.base_opcode ^= 4;
6343 break;
6345 /* fall through */
6346 case WORD_MNEM_SUFFIX:
6347 case QWORD_MNEM_SUFFIX:
6348 /* It's not a byte, select word/dword operation. */
6349 if (i.tm.opcode_modifier.w)
6351 if (i.tm.opcode_modifier.shortform)
6352 i.tm.base_opcode |= 8;
6353 else
6354 i.tm.base_opcode |= 1;
6356 /* fall through */
6357 case SHORT_MNEM_SUFFIX:
6358 /* Now select between word & dword operations via the operand
6359 size prefix, except for instructions that will ignore this
6360 prefix anyway. */
6361 if (i.reg_operands > 0
6362 && i.types[0].bitfield.reg
6363 && i.tm.opcode_modifier.addrprefixopreg
6364 && (i.tm.opcode_modifier.immext
6365 || i.operands == 1))
6367 /* The address size override prefix changes the size of the
6368 first operand. */
6369 if ((flag_code == CODE_32BIT
6370 && i.op[0].regs->reg_type.bitfield.word)
6371 || (flag_code != CODE_32BIT
6372 && i.op[0].regs->reg_type.bitfield.dword))
6373 if (!add_prefix (ADDR_PREFIX_OPCODE))
6374 return 0;
6376 else if (i.suffix != QWORD_MNEM_SUFFIX
6377 && !i.tm.opcode_modifier.ignoresize
6378 && !i.tm.opcode_modifier.floatmf
6379 && !i.tm.opcode_modifier.vex
6380 && !i.tm.opcode_modifier.vexopcode
6381 && !is_evex_encoding (&i.tm)
6382 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6383 || (flag_code == CODE_64BIT
6384 && i.tm.opcode_modifier.jumpbyte)))
6386 unsigned int prefix = DATA_PREFIX_OPCODE;
6388 if (i.tm.opcode_modifier.jumpbyte) /* jcxz, loop */
6389 prefix = ADDR_PREFIX_OPCODE;
6391 if (!add_prefix (prefix))
6392 return 0;
6395 /* Set mode64 for an operand. */
6396 if (i.suffix == QWORD_MNEM_SUFFIX
6397 && flag_code == CODE_64BIT
6398 && !i.tm.opcode_modifier.norex64
6399 /* Special case for xchg %rax,%rax. It is NOP and doesn't
6400 need rex64. */
6401 && ! (i.operands == 2
6402 && i.tm.base_opcode == 0x90
6403 && i.tm.extension_opcode == None
6404 && operand_type_equal (&i.types [0], &acc64)
6405 && operand_type_equal (&i.types [1], &acc64)))
6406 i.rex |= REX_W;
6408 break;
6411 if (i.reg_operands != 0
6412 && i.operands > 1
6413 && i.tm.opcode_modifier.addrprefixopreg
6414 && !i.tm.opcode_modifier.immext)
6416 /* Check invalid register operand when the address size override
6417 prefix changes the size of register operands. */
6418 unsigned int op;
6419 enum { need_word, need_dword, need_qword } need;
/* Required register width: the address size prefix selects word in
   32-bit code and dword otherwise; without it the width follows the
   code size.  */
6421 if (flag_code == CODE_32BIT)
6422 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6423 else
6425 if (i.prefix[ADDR_PREFIX])
6426 need = need_dword;
6427 else
6428 need = flag_code == CODE_64BIT ? need_qword : need_word;
6431 for (op = 0; op < i.operands; op++)
6432 if (i.types[op].bitfield.reg
6433 && ((need == need_word
6434 && !i.op[op].regs->reg_type.bitfield.word)
6435 || (need == need_dword
6436 && !i.op[op].regs->reg_type.bitfield.dword)
6437 || (need == need_qword
6438 && !i.op[op].regs->reg_type.bitfield.qword)))
6440 as_bad (_("invalid register operand size for `%s'"),
6441 i.tm.name);
6442 return 0;
6446 return 1;
6449 static int
6450 check_byte_reg (void)
6452 int op;
6454 for (op = i.operands; --op >= 0;)
6456 /* Skip non-register operands. */
6457 if (!i.types[op].bitfield.reg)
6458 continue;
6460 /* If this is an eight bit register, it's OK. If it's the 16 or
6461 32 bit version of an eight bit register, we will just use the
6462 low portion, and that's OK too. */
6463 if (i.types[op].bitfield.byte)
6464 continue;
6466 /* I/O port address operands are OK too. */
6467 if (i.tm.operand_types[op].bitfield.inoutportreg)
6468 continue;
6470 /* crc32 doesn't generate this warning. */
6471 if (i.tm.base_opcode == 0xf20f38f0)
6472 continue;
6474 if ((i.types[op].bitfield.word
6475 || i.types[op].bitfield.dword
6476 || i.types[op].bitfield.qword)
6477 && i.op[op].regs->reg_num < 4
6478 /* Prohibit these changes in 64bit mode, since the lowering
6479 would be more complicated. */
6480 && flag_code != CODE_64BIT)
6482 #if REGISTER_WARNINGS
6483 if (!quiet_warnings)
6484 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6485 register_prefix,
6486 (i.op[op].regs + (i.types[op].bitfield.word
6487 ? REGNAM_AL - REGNAM_AX
6488 : REGNAM_AL - REGNAM_EAX))->reg_name,
6489 register_prefix,
6490 i.op[op].regs->reg_name,
6491 i.suffix);
6492 #endif
6493 continue;
6495 /* Any other register is bad. */
6496 if (i.types[op].bitfield.reg
6497 || i.types[op].bitfield.regmmx
6498 || i.types[op].bitfield.regsimd
6499 || i.types[op].bitfield.sreg2
6500 || i.types[op].bitfield.sreg3
6501 || i.types[op].bitfield.control
6502 || i.types[op].bitfield.debug
6503 || i.types[op].bitfield.test)
6505 as_bad (_("`%s%s' not allowed with `%s%c'"),
6506 register_prefix,
6507 i.op[op].regs->reg_name,
6508 i.tm.name,
6509 i.suffix);
6510 return 0;
6513 return 1;
6516 static int
6517 check_long_reg (void)
6519 int op;
6521 for (op = i.operands; --op >= 0;)
6522 /* Skip non-register operands. */
6523 if (!i.types[op].bitfield.reg)
6524 continue;
6525 /* Reject eight bit registers, except where the template requires
6526 them. (eg. movzb) */
6527 else if (i.types[op].bitfield.byte
6528 && (i.tm.operand_types[op].bitfield.reg
6529 || i.tm.operand_types[op].bitfield.acc)
6530 && (i.tm.operand_types[op].bitfield.word
6531 || i.tm.operand_types[op].bitfield.dword))
6533 as_bad (_("`%s%s' not allowed with `%s%c'"),
6534 register_prefix,
6535 i.op[op].regs->reg_name,
6536 i.tm.name,
6537 i.suffix);
6538 return 0;
6540 /* Warn if the e prefix on a general reg is missing. */
6541 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6542 && i.types[op].bitfield.word
6543 && (i.tm.operand_types[op].bitfield.reg
6544 || i.tm.operand_types[op].bitfield.acc)
6545 && i.tm.operand_types[op].bitfield.dword)
6547 /* Prohibit these changes in the 64bit mode, since the
6548 lowering is more complicated. */
6549 if (flag_code == CODE_64BIT)
6551 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6552 register_prefix, i.op[op].regs->reg_name,
6553 i.suffix);
6554 return 0;
6556 #if REGISTER_WARNINGS
6557 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6558 register_prefix,
6559 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
6560 register_prefix, i.op[op].regs->reg_name, i.suffix);
6561 #endif
6563 /* Warn if the r prefix on a general reg is present. */
6564 else if (i.types[op].bitfield.qword
6565 && (i.tm.operand_types[op].bitfield.reg
6566 || i.tm.operand_types[op].bitfield.acc)
6567 && i.tm.operand_types[op].bitfield.dword)
6569 if (intel_syntax
6570 && i.tm.opcode_modifier.toqword
6571 && !i.types[0].bitfield.regsimd)
6573 /* Convert to QWORD. We want REX byte. */
6574 i.suffix = QWORD_MNEM_SUFFIX;
6576 else
6578 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6579 register_prefix, i.op[op].regs->reg_name,
6580 i.suffix);
6581 return 0;
6584 return 1;
6587 static int
6588 check_qword_reg (void)
6590 int op;
6592 for (op = i.operands; --op >= 0; )
6593 /* Skip non-register operands. */
6594 if (!i.types[op].bitfield.reg)
6595 continue;
6596 /* Reject eight bit registers, except where the template requires
6597 them. (eg. movzb) */
6598 else if (i.types[op].bitfield.byte
6599 && (i.tm.operand_types[op].bitfield.reg
6600 || i.tm.operand_types[op].bitfield.acc)
6601 && (i.tm.operand_types[op].bitfield.word
6602 || i.tm.operand_types[op].bitfield.dword))
6604 as_bad (_("`%s%s' not allowed with `%s%c'"),
6605 register_prefix,
6606 i.op[op].regs->reg_name,
6607 i.tm.name,
6608 i.suffix);
6609 return 0;
6611 /* Warn if the r prefix on a general reg is missing. */
6612 else if ((i.types[op].bitfield.word
6613 || i.types[op].bitfield.dword)
6614 && (i.tm.operand_types[op].bitfield.reg
6615 || i.tm.operand_types[op].bitfield.acc)
6616 && i.tm.operand_types[op].bitfield.qword)
6618 /* Prohibit these changes in the 64bit mode, since the
6619 lowering is more complicated. */
6620 if (intel_syntax
6621 && i.tm.opcode_modifier.todword
6622 && !i.types[0].bitfield.regsimd)
6624 /* Convert to DWORD. We don't want REX byte. */
6625 i.suffix = LONG_MNEM_SUFFIX;
6627 else
6629 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6630 register_prefix, i.op[op].regs->reg_name,
6631 i.suffix);
6632 return 0;
6635 return 1;
6638 static int
6639 check_word_reg (void)
6641 int op;
6642 for (op = i.operands; --op >= 0;)
6643 /* Skip non-register operands. */
6644 if (!i.types[op].bitfield.reg)
6645 continue;
6646 /* Reject eight bit registers, except where the template requires
6647 them. (eg. movzb) */
6648 else if (i.types[op].bitfield.byte
6649 && (i.tm.operand_types[op].bitfield.reg
6650 || i.tm.operand_types[op].bitfield.acc)
6651 && (i.tm.operand_types[op].bitfield.word
6652 || i.tm.operand_types[op].bitfield.dword))
6654 as_bad (_("`%s%s' not allowed with `%s%c'"),
6655 register_prefix,
6656 i.op[op].regs->reg_name,
6657 i.tm.name,
6658 i.suffix);
6659 return 0;
6661 /* Warn if the e or r prefix on a general reg is present. */
6662 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6663 && (i.types[op].bitfield.dword
6664 || i.types[op].bitfield.qword)
6665 && (i.tm.operand_types[op].bitfield.reg
6666 || i.tm.operand_types[op].bitfield.acc)
6667 && i.tm.operand_types[op].bitfield.word)
6669 /* Prohibit these changes in the 64bit mode, since the
6670 lowering is more complicated. */
6671 if (flag_code == CODE_64BIT)
6673 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6674 register_prefix, i.op[op].regs->reg_name,
6675 i.suffix);
6676 return 0;
6678 #if REGISTER_WARNINGS
6679 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6680 register_prefix,
6681 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
6682 register_prefix, i.op[op].regs->reg_name, i.suffix);
6683 #endif
6685 return 1;
6688 static int
6689 update_imm (unsigned int j)
6691 i386_operand_type overlap = i.types[j];
6692 if ((overlap.bitfield.imm8
6693 || overlap.bitfield.imm8s
6694 || overlap.bitfield.imm16
6695 || overlap.bitfield.imm32
6696 || overlap.bitfield.imm32s
6697 || overlap.bitfield.imm64)
6698 && !operand_type_equal (&overlap, &imm8)
6699 && !operand_type_equal (&overlap, &imm8s)
6700 && !operand_type_equal (&overlap, &imm16)
6701 && !operand_type_equal (&overlap, &imm32)
6702 && !operand_type_equal (&overlap, &imm32s)
6703 && !operand_type_equal (&overlap, &imm64))
6705 if (i.suffix)
6707 i386_operand_type temp;
6709 operand_type_set (&temp, 0);
6710 if (i.suffix == BYTE_MNEM_SUFFIX)
6712 temp.bitfield.imm8 = overlap.bitfield.imm8;
6713 temp.bitfield.imm8s = overlap.bitfield.imm8s;
6715 else if (i.suffix == WORD_MNEM_SUFFIX)
6716 temp.bitfield.imm16 = overlap.bitfield.imm16;
6717 else if (i.suffix == QWORD_MNEM_SUFFIX)
6719 temp.bitfield.imm64 = overlap.bitfield.imm64;
6720 temp.bitfield.imm32s = overlap.bitfield.imm32s;
6722 else
6723 temp.bitfield.imm32 = overlap.bitfield.imm32;
6724 overlap = temp;
6726 else if (operand_type_equal (&overlap, &imm16_32_32s)
6727 || operand_type_equal (&overlap, &imm16_32)
6728 || operand_type_equal (&overlap, &imm16_32s))
6730 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6731 overlap = imm16;
6732 else
6733 overlap = imm32s;
6735 if (!operand_type_equal (&overlap, &imm8)
6736 && !operand_type_equal (&overlap, &imm8s)
6737 && !operand_type_equal (&overlap, &imm16)
6738 && !operand_type_equal (&overlap, &imm32)
6739 && !operand_type_equal (&overlap, &imm32s)
6740 && !operand_type_equal (&overlap, &imm64))
6742 as_bad (_("no instruction mnemonic suffix given; "
6743 "can't determine immediate size"));
6744 return 0;
6747 i.types[j] = overlap;
6749 return 1;
6752 static int
6753 finalize_imm (void)
6755 unsigned int j, n;
6757 /* Update the first 2 immediate operands. */
6758 n = i.operands > 2 ? 2 : i.operands;
6759 if (n)
6761 for (j = 0; j < n; j++)
6762 if (update_imm (j) == 0)
6763 return 0;
6765 /* The 3rd operand can't be immediate operand. */
6766 gas_assert (operand_type_check (i.types[2], imm) == 0);
6769 return 1;
/* Bring the operands of the matched instruction (i.tm) into their final
   shape.  Implicit operands are inserted, removed or duplicated as the
   template's modifiers require.  The register number is then merged
   into the opcode for shortform templates, or the ModRM byte is built
   through build_modrm_byte.  Finally a segment override prefix is added
   when an explicitly given segment differs from the default one.
   Returns 1 on success and 0 after an error (`pop cs', or add_prefix
   failing).  */
6772 static int
6773 process_operands (void)
6775 /* Default segment register this instruction will use for memory
6776 accesses. 0 means unknown. This is only for optimizing out
6777 unnecessary segment overrides. */
6778 const seg_entry *default_seg = 0;
6780 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
/* dest is the index of the current last operand; dupl is the slot just
   past it, which receives a copy of the destination.  */
6782 unsigned int dupl = i.operands;
6783 unsigned int dest = dupl - 1;
6784 unsigned int j;
6786 /* The destination must be an xmm register. */
6787 gas_assert (i.reg_operands
6788 && MAX_OPERANDS > dupl
6789 && operand_type_equal (&i.types[dest], &regxmm));
6791 if (i.tm.operand_types[0].bitfield.acc
6792 && i.tm.operand_types[0].bitfield.xmmword)
6794 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
6796 /* Keep xmm0 for instructions with VEX prefix and 3
6797 sources. */
6798 i.tm.operand_types[0].bitfield.acc = 0;
6799 i.tm.operand_types[0].bitfield.regsimd = 1;
6800 goto duplicate;
6802 else
6804 /* We remove the first xmm0 and keep the number of
6805 operands unchanged, which in fact duplicates the
6806 destination. */
6807 for (j = 1; j < i.operands; j++)
6809 i.op[j - 1] = i.op[j];
6810 i.types[j - 1] = i.types[j];
6811 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
6815 else if (i.tm.opcode_modifier.implicit1stxmm0)
6817 gas_assert ((MAX_OPERANDS - 1) > dupl
6818 && (i.tm.opcode_modifier.vexsources
6819 == VEX3SOURCES));
6821 /* Add the implicit xmm0 for instructions with VEX prefix
6822 and 3 sources. */
6823 for (j = i.operands; j > 0; j--)
6825 i.op[j] = i.op[j - 1];
6826 i.types[j] = i.types[j - 1];
6827 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
6829 i.op[0].regs
6830 = (const reg_entry *) hash_find (reg_hash, "xmm0");
6831 i.types[0] = regxmm;
6832 i.tm.operand_types[0] = regxmm;
/* Two operands are added here: the xmm0 inserted at the front and the
   copy of the destination appended below.  */
6834 i.operands += 2;
6835 i.reg_operands += 2;
6836 i.tm.operands += 2;
/* Everything moved up one slot, so both indices follow.  */
6838 dupl++;
6839 dest++;
6840 i.op[dupl] = i.op[dest];
6841 i.types[dupl] = i.types[dest];
6842 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6844 else
/* Also reached by the goto above: append a copy of the destination
   operand as one additional register operand.  */
6846 duplicate:
6847 i.operands++;
6848 i.reg_operands++;
6849 i.tm.operands++;
6851 i.op[dupl] = i.op[dest];
6852 i.types[dupl] = i.types[dest];
6853 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6856 if (i.tm.opcode_modifier.immext)
6857 process_immext ();
/* Not an sse2avx/vexvvvv template, but the template's first operand is
   an accumulator with xmmword set: drop that operand by shifting all
   later operands down one slot.  */
6859 else if (i.tm.operand_types[0].bitfield.acc
6860 && i.tm.operand_types[0].bitfield.xmmword)
6862 unsigned int j;
6864 for (j = 1; j < i.operands; j++)
6866 i.op[j - 1] = i.op[j];
6867 i.types[j - 1] = i.types[j];
6869 /* We need to adjust fields in i.tm since they are used by
6870 build_modrm_byte. */
6871 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
6874 i.operands--;
6875 i.reg_operands--;
6876 i.tm.operands--;
6878 else if (i.tm.opcode_modifier.implicitquadgroup)
6880 unsigned int regnum, first_reg_in_group, last_reg_in_group;
6882 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
6883 gas_assert (i.operands >= 2 && i.types[1].bitfield.regsimd);
6884 regnum = register_number (i.op[1].regs);
/* Round the register number down to a multiple of 4 to find the start
   of its group of four.  */
6885 first_reg_in_group = regnum & ~3;
6886 last_reg_in_group = first_reg_in_group + 3;
6887 if (regnum != first_reg_in_group)
6888 as_warn (_("source register `%s%s' implicitly denotes"
6889 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
6890 register_prefix, i.op[1].regs->reg_name,
6891 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
6892 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
6893 i.tm.name);
6895 else if (i.tm.opcode_modifier.regkludge)
6897 /* The imul $imm, %reg instruction is converted into
6898 imul $imm, %reg, %reg, and the clr %reg instruction
6899 is converted into xor %reg, %reg. */
6901 unsigned int first_reg_op;
6903 if (operand_type_check (i.types[0], reg))
6904 first_reg_op = 0;
6905 else
6906 first_reg_op = 1;
6907 /* Pretend we saw the extra register operand. */
6908 gas_assert (i.reg_operands == 1
6909 && i.op[first_reg_op + 1].regs == 0);
6910 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
6911 i.types[first_reg_op + 1] = i.types[first_reg_op];
6912 i.operands++;
6913 i.reg_operands++;
/* Short-form templates carry the register number in the opcode itself:
   shifted left by 3 for segment registers, in the low 3 bits
   otherwise.  */
6916 if (i.tm.opcode_modifier.shortform)
6918 if (i.types[0].bitfield.sreg2
6919 || i.types[0].bitfield.sreg3)
6921 if (i.tm.base_opcode == POP_SEG_SHORT
6922 && i.op[0].regs->reg_num == 1)
6924 as_bad (_("you can't `pop %scs'"), register_prefix);
6925 return 0;
6927 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
6928 if ((i.op[0].regs->reg_flags & RegRex) != 0)
6929 i.rex |= REX_B;
6931 else
6933 /* The register or float register operand is in operand
6934 0 or 1. */
6935 unsigned int op;
6937 if ((i.types[0].bitfield.reg && i.types[0].bitfield.tbyte)
6938 || operand_type_check (i.types[0], reg))
6939 op = 0;
6940 else
6941 op = 1;
6942 /* Register goes in low 3 bits of opcode. */
6943 i.tm.base_opcode |= i.op[op].regs->reg_num;
6944 if ((i.op[op].regs->reg_flags & RegRex) != 0)
6945 i.rex |= REX_B;
6946 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
6948 /* Warn about some common errors, but press on regardless.
6949 The first case can be generated by gcc (<= 2.8.1). */
6950 if (i.operands == 2)
6952 /* Reversed arguments on faddp, fsubp, etc. */
6953 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
6954 register_prefix, i.op[!intel_syntax].regs->reg_name,
6955 register_prefix, i.op[intel_syntax].regs->reg_name);
6957 else
6959 /* Extraneous `l' suffix on fp insn. */
6960 as_warn (_("translating to `%s %s%s'"), i.tm.name,
6961 register_prefix, i.op[0].regs->reg_name);
6966 else if (i.tm.opcode_modifier.modrm)
6968 /* The opcode is completed (modulo i.tm.extension_opcode which
6969 must be put into the modrm byte). Now, we make the modrm and
6970 index base bytes based on all the info we've collected. */
6972 default_seg = build_modrm_byte ();
/* The mask drops the low two opcode bits, so four consecutive opcodes
   starting at MOV_AX_DISP32 are matched here.  */
6974 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
6976 default_seg = &ds;
6978 else if (i.tm.opcode_modifier.isstring)
6980 /* For the string instructions that allow a segment override
6981 on one of their operands, the default segment is ds. */
6982 default_seg = &ds;
6985 if (i.tm.base_opcode == 0x8d /* lea */
6986 && i.seg[0]
6987 && !quiet_warnings)
6988 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
6990 /* If a segment was explicitly specified, and the specified segment
6991 is not the default, use an opcode prefix to select it. If we
6992 never figured out what the default segment is, then default_seg
6993 will be zero at this point, and the specified segment prefix will
6994 always be used. */
6995 if ((i.seg[0]) && (i.seg[0] != default_seg))
6997 if (!add_prefix (i.seg[0]->seg_prefix))
6998 return 0;
7000 return 1;
/* Build the ModRM information (and, where needed, the SIB fields, the
   REX/VREX bits and the VEX register specifier) for the instruction
   currently held in the global `i', using its matched template `i.tm'
   and the parsed operands.

   Side effects: fills in i.rm, i.sib, i.rex, i.vrex and
   i.vex.register_specifier as required; may append a synthesized imm8
   operand (VEX 3-source forms) or a zero displacement operand, and may
   rewrite the displacement-size bits of the memory operand's type.

   Returns the default segment implied by the addressing form that was
   selected (&ds or &ss), or 0 when no memory operand determined one.  */
7003 static const seg_entry *
7004 build_modrm_byte (void)
7006 const seg_entry *default_seg = 0;
7007 unsigned int source, dest;
7008 int vex_3_sources;
7010 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7011 if (vex_3_sources)
7013 unsigned int nds, reg_slot;
7014 expressionS *exp;
/* The destination is the last operand; the operand just before it is
   the one placed in i.vex.register_specifier below.  */
7016 dest = i.operands - 1;
7017 nds = dest - 1;
7019 /* There are 2 kinds of instructions:
7020 1. 5 operands: 4 register operands or 3 register operands
7021 plus 1 memory operand plus one Vec_Imm4 operand, VexXDS, and
7022 VexW0 or VexW1. The destination must be either XMM, YMM or
7023 ZMM register.
7024 2. 4 operands: 4 register operands or 3 register operands
7025 plus 1 memory operand, with VexXDS. */
7026 gas_assert ((i.reg_operands == 4
7027 || (i.reg_operands == 3 && i.mem_operands == 1))
7028 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7029 && i.tm.opcode_modifier.vexw
7030 && i.tm.operand_types[dest].bitfield.regsimd);
7032 /* If VexW1 is set, the first non-immediate operand is the source and
7033 the second non-immediate one is encoded in the immediate operand. */
7034 if (i.tm.opcode_modifier.vexw == VEXW1)
7036 source = i.imm_operands;
7037 reg_slot = i.imm_operands + 1;
7039 else
7041 source = i.imm_operands + 1;
7042 reg_slot = i.imm_operands;
7045 if (i.imm_operands == 0)
7047 /* When there is no immediate operand, generate an 8bit
7048 immediate operand to encode the first operand. */
7049 exp = &im_expressions[i.imm_operands++];
7050 i.op[i.operands].imms = exp;
7051 i.types[i.operands] = imm8;
7052 i.operands++;
7054 gas_assert (i.tm.operand_types[reg_slot].bitfield.regsimd);
/* The register number occupies the upper four bits of the new
   immediate byte.  */
7055 exp->X_op = O_constant;
7056 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7057 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7059 else
7061 unsigned int imm_slot;
7063 gas_assert (i.imm_operands == 1 && i.types[0].bitfield.vec_imm4);
7065 if (i.tm.opcode_modifier.immext)
7067 /* When ImmExt is set, the immediate byte is the last
7068 operand. */
7069 imm_slot = i.operands - 1;
7070 source--;
7071 reg_slot--;
7073 else
7075 imm_slot = 0;
7077 /* Turn on Imm8 so that output_imm will generate it. */
7078 i.types[imm_slot].bitfield.imm8 = 1;
7081 gas_assert (i.tm.operand_types[reg_slot].bitfield.regsimd);
/* Merge the register number into the upper four bits of the
   existing immediate.  */
7082 i.op[imm_slot].imms->X_add_number
7083 |= register_number (i.op[reg_slot].regs) << 4;
7084 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7087 gas_assert (i.tm.operand_types[nds].bitfield.regsimd);
7088 i.vex.register_specifier = i.op[nds].regs;
7090 else
7091 source = dest = 0;
7093 /* i.reg_operands MUST be the number of real register operands;
7094 implicit registers do not count. If there are 3 register
7095 operands, it must be an instruction with VexNDS. For an
7096 instruction with VexNDD, the destination register is encoded
7097 in VEX prefix. If there are 4 register operands, it must be
7098 an instruction with VEX prefix and 3 sources. */
7099 if (i.mem_operands == 0
7100 && ((i.reg_operands == 2
7101 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7102 || (i.reg_operands == 3
7103 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7104 || (i.reg_operands == 4 && vex_3_sources)))
/* Register-only form.  Work out SOURCE, the index of the first
   register operand, from the total operand count and the position
   of any immediate / shift-count operands.  */
7106 switch (i.operands)
7108 case 2:
7109 source = 0;
7110 break;
7111 case 3:
7112 /* When there are 3 operands, one of them may be immediate,
7113 which may be the first or the last operand. Otherwise,
7114 the first operand must be shift count register (cl) or it
7115 is an instruction with VexNDS. */
7116 gas_assert (i.imm_operands == 1
7117 || (i.imm_operands == 0
7118 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7119 || i.types[0].bitfield.shiftcount)));
7120 if (operand_type_check (i.types[0], imm)
7121 || i.types[0].bitfield.shiftcount)
7122 source = 1;
7123 else
7124 source = 0;
7125 break;
7126 case 4:
7127 /* When there are 4 operands, the first two must be 8bit
7128 immediate operands. The source operand will be the 3rd
7129 one.
7131 For instructions with VexNDS, if the first operand is
7132 an imm8, the source operand is the 2nd one. If the last
7133 operand is imm8, the source operand is the first one. */
7134 gas_assert ((i.imm_operands == 2
7135 && i.types[0].bitfield.imm8
7136 && i.types[1].bitfield.imm8)
7137 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7138 && i.imm_operands == 1
7139 && (i.types[0].bitfield.imm8
7140 || i.types[i.operands - 1].bitfield.imm8
7141 || i.rounding)));
7142 if (i.imm_operands == 2)
7143 source = 2;
7144 else
7146 if (i.types[0].bitfield.imm8)
7147 source = 1;
7148 else
7149 source = 0;
7151 break;
7152 case 5:
7153 if (is_evex_encoding (&i.tm))
7155 /* For EVEX instructions, when there are 5 operands, the
7156 first one must be immediate operand. If the second one
7157 is immediate operand, the source operand is the 3rd
7158 one. If the last one is immediate operand, the source
7159 operand is the 2nd one. */
7160 gas_assert (i.imm_operands == 2
7161 && i.tm.opcode_modifier.sae
7162 && operand_type_check (i.types[0], imm));
7163 if (operand_type_check (i.types[1], imm))
7164 source = 2;
7165 else if (operand_type_check (i.types[4], imm))
7166 source = 1;
7167 else
7168 abort ();
7170 break;
7171 default:
7172 abort ();
7175 if (!vex_3_sources)
7177 dest = source + 1;
7179 /* RC/SAE operand could be between DEST and SRC. That happens
7180 when one operand is GPR and the other one is XMM/YMM/ZMM
7181 register. */
7182 if (i.rounding && i.rounding->operand == (int) dest)
7183 dest++;
7185 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7187 /* For instructions with VexNDS, the register-only source
7188 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7189 register. It is encoded in VEX prefix. We need to
7190 clear RegMem bit before calling operand_type_equal. */
7192 i386_operand_type op;
7193 unsigned int vvvv;
7195 /* Check register-only source operand when two source
7196 operands are swapped. */
7197 if (!i.tm.operand_types[source].bitfield.baseindex
7198 && i.tm.operand_types[dest].bitfield.baseindex)
7200 vvvv = source;
7201 source = dest;
7203 else
7204 vvvv = dest;
7206 op = i.tm.operand_types[vvvv];
7207 op.bitfield.regmem = 0;
7208 if ((dest + 1) >= i.operands
7209 || ((!op.bitfield.reg
7210 || (!op.bitfield.dword && !op.bitfield.qword))
7211 && !op.bitfield.regsimd
7212 && !operand_type_equal (&op, &regmask)))
7213 abort ();
7214 i.vex.register_specifier = i.op[vvvv].regs;
7215 dest++;
/* Mode 3: the regmem field names a register, not a memory operand.  */
7219 i.rm.mode = 3;
7220 /* One of the register operands will be encoded in the i.rm.reg
7221 field, the other in the combined i.rm.mode and i.rm.regmem
7222 fields. If no form of this instruction supports a memory
7223 destination operand, then we assume the source operand may
7224 sometimes be a memory operand and so we need to store the
7225 destination in the i.rm.reg field. */
7226 if (!i.tm.operand_types[dest].bitfield.regmem
7227 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7229 i.rm.reg = i.op[dest].regs->reg_num;
7230 i.rm.regmem = i.op[source].regs->reg_num;
/* Record which MMX / vector register class this instruction uses.  */
7231 if (i.op[dest].regs->reg_type.bitfield.regmmx
7232 || i.op[source].regs->reg_type.bitfield.regmmx)
7233 i.has_regmmx = TRUE;
7234 else if (i.op[dest].regs->reg_type.bitfield.regsimd
7235 || i.op[source].regs->reg_type.bitfield.regsimd)
7237 if (i.types[dest].bitfield.zmmword
7238 || i.types[source].bitfield.zmmword)
7239 i.has_regzmm = TRUE;
7240 else if (i.types[dest].bitfield.ymmword
7241 || i.types[source].bitfield.ymmword)
7242 i.has_regymm = TRUE;
7243 else
7244 i.has_regxmm = TRUE;
7246 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7247 i.rex |= REX_R;
7248 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7249 i.vrex |= REX_R;
7250 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7251 i.rex |= REX_B;
7252 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7253 i.vrex |= REX_B;
7255 else
/* Otherwise the roles are reversed: SOURCE goes in the reg field
   and DEST in the regmem field.  */
7257 i.rm.reg = i.op[source].regs->reg_num;
7258 i.rm.regmem = i.op[dest].regs->reg_num;
7259 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7260 i.rex |= REX_B;
7261 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7262 i.vrex |= REX_B;
7263 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7264 i.rex |= REX_R;
7265 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7266 i.vrex |= REX_R;
/* Outside 64-bit mode a REX_R request is accepted only when the
   operand selected here is a control register; the bit is dropped
   and a LOCK prefix is added instead.  Anything else aborts.  */
7268 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7270 if (!i.types[i.tm.operand_types[0].bitfield.regmem].bitfield.control)
7271 abort ();
7272 i.rex &= ~REX_R;
7273 add_prefix (LOCK_PREFIX_OPCODE);
7276 else
7277 { /* If it's not 2 reg operands... */
7278 unsigned int mem;
7280 if (i.mem_operands)
7282 unsigned int fake_zero_displacement = 0;
7283 unsigned int op;
/* Locate the memory operand; OP indexes it for the rest of this
   branch.  */
7285 for (op = 0; op < i.operands; op++)
7286 if (operand_type_check (i.types[op], anymem))
7287 break;
7288 gas_assert (op < i.operands);
7290 if (i.tm.opcode_modifier.vecsib)
7292 if (i.index_reg->reg_num == RegIZ)
7293 abort ();
7295 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7296 if (!i.base_reg)
7298 i.sib.base = NO_BASE_REGISTER;
7299 i.sib.scale = i.log2_scale_factor;
7300 i.types[op].bitfield.disp8 = 0;
7301 i.types[op].bitfield.disp16 = 0;
7302 i.types[op].bitfield.disp64 = 0;
7303 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7305 /* Must be 32 bit */
7306 i.types[op].bitfield.disp32 = 1;
7307 i.types[op].bitfield.disp32s = 0;
7309 else
7311 i.types[op].bitfield.disp32 = 0;
7312 i.types[op].bitfield.disp32s = 1;
7315 i.sib.index = i.index_reg->reg_num;
7316 if ((i.index_reg->reg_flags & RegRex) != 0)
7317 i.rex |= REX_X;
7318 if ((i.index_reg->reg_flags & RegVRex) != 0)
7319 i.vrex |= REX_X;
/* Memory operands default to %ds; the %bp / %ebp / %esp based forms
   below switch this to %ss.  */
7322 default_seg = &ds;
7324 if (i.base_reg == 0)
7326 i.rm.mode = 0;
7327 if (!i.disp_operands)
7328 fake_zero_displacement = 1;
7329 if (i.index_reg == 0)
7331 i386_operand_type newdisp;
7333 gas_assert (!i.tm.opcode_modifier.vecsib);
7334 /* Operand is just <disp> */
7335 if (flag_code == CODE_64BIT)
7337 /* 64bit mode overwrites the 32bit absolute
7338 addressing by RIP relative addressing and
7339 absolute addressing is encoded by one of the
7340 redundant SIB forms. */
7341 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7342 i.sib.base = NO_BASE_REGISTER;
7343 i.sib.index = NO_INDEX_REGISTER;
7344 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7346 else if ((flag_code == CODE_16BIT)
7347 ^ (i.prefix[ADDR_PREFIX] != 0))
7349 i.rm.regmem = NO_BASE_REGISTER_16;
7350 newdisp = disp16;
7352 else
7354 i.rm.regmem = NO_BASE_REGISTER;
7355 newdisp = disp32;
/* Replace whatever displacement sizes were recorded with the single
   size chosen above.  */
7357 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7358 i.types[op] = operand_type_or (i.types[op], newdisp);
7360 else if (!i.tm.opcode_modifier.vecsib)
7362 /* !i.base_reg && i.index_reg */
7363 if (i.index_reg->reg_num == RegIZ)
7364 i.sib.index = NO_INDEX_REGISTER;
7365 else
7366 i.sib.index = i.index_reg->reg_num;
7367 i.sib.base = NO_BASE_REGISTER;
7368 i.sib.scale = i.log2_scale_factor;
7369 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7370 i.types[op].bitfield.disp8 = 0;
7371 i.types[op].bitfield.disp16 = 0;
7372 i.types[op].bitfield.disp64 = 0;
7373 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7375 /* Must be 32 bit */
7376 i.types[op].bitfield.disp32 = 1;
7377 i.types[op].bitfield.disp32s = 0;
7379 else
7381 i.types[op].bitfield.disp32 = 0;
7382 i.types[op].bitfield.disp32s = 1;
7384 if ((i.index_reg->reg_flags & RegRex) != 0)
7385 i.rex |= REX_X;
7388 /* RIP addressing for 64bit mode. */
7389 else if (i.base_reg->reg_num == RegIP)
7391 gas_assert (!i.tm.opcode_modifier.vecsib);
7392 i.rm.regmem = NO_BASE_REGISTER;
7393 i.types[op].bitfield.disp8 = 0;
7394 i.types[op].bitfield.disp16 = 0;
7395 i.types[op].bitfield.disp32 = 0;
7396 i.types[op].bitfield.disp32s = 1;
7397 i.types[op].bitfield.disp64 = 0;
7398 i.flags[op] |= Operand_PCrel;
7399 if (! i.disp_operands)
7400 fake_zero_displacement = 1;
/* Base register is a 16-bit (word) register.  */
7402 else if (i.base_reg->reg_type.bitfield.word)
7404 gas_assert (!i.tm.opcode_modifier.vecsib);
7405 switch (i.base_reg->reg_num)
7407 case 3: /* (%bx) */
7408 if (i.index_reg == 0)
7409 i.rm.regmem = 7;
7410 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
7411 i.rm.regmem = i.index_reg->reg_num - 6;
7412 break;
7413 case 5: /* (%bp) */
7414 default_seg = &ss;
7415 if (i.index_reg == 0)
7417 i.rm.regmem = 6;
7418 if (operand_type_check (i.types[op], disp) == 0)
7420 /* fake (%bp) into 0(%bp) */
7421 i.types[op].bitfield.disp8 = 1;
7422 fake_zero_displacement = 1;
7425 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
7426 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7427 break;
7428 default: /* (%si) -> 4 or (%di) -> 5 */
7429 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7431 i.rm.mode = mode_from_disp_size (i.types[op]);
7433 else /* i.base_reg and 32/64 bit mode */
7435 if (flag_code == CODE_64BIT
7436 && operand_type_check (i.types[op], disp))
7438 i.types[op].bitfield.disp16 = 0;
7439 i.types[op].bitfield.disp64 = 0;
7440 if (i.prefix[ADDR_PREFIX] == 0)
7442 i.types[op].bitfield.disp32 = 0;
7443 i.types[op].bitfield.disp32s = 1;
7445 else
7447 i.types[op].bitfield.disp32 = 1;
7448 i.types[op].bitfield.disp32s = 0;
7452 if (!i.tm.opcode_modifier.vecsib)
7453 i.rm.regmem = i.base_reg->reg_num;
7454 if ((i.base_reg->reg_flags & RegRex) != 0)
7455 i.rex |= REX_B;
7456 i.sib.base = i.base_reg->reg_num;
7457 /* x86-64 ignores REX prefix bit here to avoid decoder
7458 complications. */
7459 if (!(i.base_reg->reg_flags & RegRex)
7460 && (i.base_reg->reg_num == EBP_REG_NUM
7461 || i.base_reg->reg_num == ESP_REG_NUM))
7462 default_seg = &ss;
/* A base register numbered 5 with no displacement is given an
   explicit zero 8-bit displacement.  */
7463 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7465 fake_zero_displacement = 1;
7466 i.types[op].bitfield.disp8 = 1;
7468 i.sib.scale = i.log2_scale_factor;
7469 if (i.index_reg == 0)
7471 gas_assert (!i.tm.opcode_modifier.vecsib);
7472 /* <disp>(%esp) becomes two byte modrm with no index
7473 register. We've already stored the code for esp
7474 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7475 Any base register besides %esp will not use the
7476 extra modrm byte. */
7477 i.sib.index = NO_INDEX_REGISTER;
7479 else if (!i.tm.opcode_modifier.vecsib)
7481 if (i.index_reg->reg_num == RegIZ)
7482 i.sib.index = NO_INDEX_REGISTER;
7483 else
7484 i.sib.index = i.index_reg->reg_num;
7485 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7486 if ((i.index_reg->reg_flags & RegRex) != 0)
7487 i.rex |= REX_X;
/* The TLS descriptor call relocations force mode 0 regardless of the
   displacement present.  */
7490 if (i.disp_operands
7491 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7492 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7493 i.rm.mode = 0;
7494 else
/* An explicitly requested displacement encoding with no displacement
   written gets a zero displacement of the requested size.  */
7496 if (!fake_zero_displacement
7497 && !i.disp_operands
7498 && i.disp_encoding)
7500 fake_zero_displacement = 1;
7501 if (i.disp_encoding == disp_encoding_8bit)
7502 i.types[op].bitfield.disp8 = 1;
7503 else
7504 i.types[op].bitfield.disp32 = 1;
7506 i.rm.mode = mode_from_disp_size (i.types[op]);
7510 if (fake_zero_displacement)
7512 /* Fakes a zero displacement assuming that i.types[op]
7513 holds the correct displacement size. */
7514 expressionS *exp;
7516 gas_assert (i.op[op].disps == 0);
7517 exp = &disp_expressions[i.disp_operands++];
7518 i.op[op].disps = exp;
7519 exp->X_op = O_constant;
7520 exp->X_add_number = 0;
7521 exp->X_add_symbol = (symbolS *) 0;
7522 exp->X_op_symbol = (symbolS *) 0;
7525 mem = op;
7527 else
/* No memory operand: ~0 marks MEM as "none".  */
7528 mem = ~0;
7530 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7532 if (operand_type_check (i.types[0], imm))
7533 i.vex.register_specifier = NULL;
7534 else
7536 /* VEX.vvvv encodes one of the sources when the first
7537 operand is not an immediate. */
7538 if (i.tm.opcode_modifier.vexw == VEXW0)
7539 i.vex.register_specifier = i.op[0].regs;
7540 else
7541 i.vex.register_specifier = i.op[1].regs;
7544 /* Destination is a XMM register encoded in the ModRM.reg
7545 and VEX.R bit. */
7546 i.rm.reg = i.op[2].regs->reg_num;
7547 if ((i.op[2].regs->reg_flags & RegRex) != 0)
7548 i.rex |= REX_R;
7550 /* ModRM.rm and VEX.B encodes the other source. */
7551 if (!i.mem_operands)
7553 i.rm.mode = 3;
7555 if (i.tm.opcode_modifier.vexw == VEXW0)
7556 i.rm.regmem = i.op[1].regs->reg_num;
7557 else
7558 i.rm.regmem = i.op[0].regs->reg_num;
/* NOTE(review): REX_B is derived from operand 1 even when regmem was
   taken from operand 0 just above - confirm this is intended.  */
7560 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7561 i.rex |= REX_B;
7564 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7566 i.vex.register_specifier = i.op[2].regs;
7567 if (!i.mem_operands)
7569 i.rm.mode = 3;
7570 i.rm.regmem = i.op[1].regs->reg_num;
7571 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7572 i.rex |= REX_B;
7575 /* Fill in i.rm.reg or i.rm.regmem field with register operand
7576 (if any) based on i.tm.extension_opcode. Again, we must be
7577 careful to make sure that segment/control/debug/test/MMX
7578 registers are coded into the i.rm.reg field. */
7579 else if (i.reg_operands)
7581 unsigned int op;
7582 unsigned int vex_reg = ~0;
/* Find the first register operand, recording the vector / MMX
   register class when that is what it turns out to be.  */
7584 for (op = 0; op < i.operands; op++)
7586 if (i.types[op].bitfield.reg
7587 || i.types[op].bitfield.regbnd
7588 || i.types[op].bitfield.regmask
7589 || i.types[op].bitfield.sreg2
7590 || i.types[op].bitfield.sreg3
7591 || i.types[op].bitfield.control
7592 || i.types[op].bitfield.debug
7593 || i.types[op].bitfield.test)
7594 break;
7595 if (i.types[op].bitfield.regsimd)
7597 if (i.types[op].bitfield.zmmword)
7598 i.has_regzmm = TRUE;
7599 else if (i.types[op].bitfield.ymmword)
7600 i.has_regymm = TRUE;
7601 else
7602 i.has_regxmm = TRUE;
7603 break;
7605 if (i.types[op].bitfield.regmmx)
7607 i.has_regmmx = TRUE;
7608 break;
7612 if (vex_3_sources)
7613 op = dest;
7614 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7616 /* For instructions with VexNDS, the register-only
7617 source operand is encoded in VEX prefix. */
7618 gas_assert (mem != (unsigned int) ~0);
7620 if (op > mem)
7622 vex_reg = op++;
7623 gas_assert (op < i.operands);
7625 else
7627 /* Check register-only source operand when two source
7628 operands are swapped. */
7629 if (!i.tm.operand_types[op].bitfield.baseindex
7630 && i.tm.operand_types[op + 1].bitfield.baseindex)
7632 vex_reg = op;
7633 op += 2;
7634 gas_assert (mem == (vex_reg + 1)
7635 && op < i.operands);
7637 else
7639 vex_reg = op + 1;
7640 gas_assert (vex_reg < i.operands);
7644 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7646 /* For instructions with VexNDD, the register destination
7647 is encoded in VEX prefix. */
7648 if (i.mem_operands == 0)
7650 /* There is no memory operand. */
7651 gas_assert ((op + 2) == i.operands);
7652 vex_reg = op + 1;
7654 else
7656 /* There are only 2 non-immediate operands. */
7657 gas_assert (op < i.imm_operands + 2
7658 && i.operands == i.imm_operands + 2);
7659 vex_reg = i.imm_operands + 1;
7662 else
7663 gas_assert (op < i.operands);
/* If an operand was selected for the VEX prefix, check that its
   template type is a dword/qword general register, a SIMD register
   or a mask register before recording it.  */
7665 if (vex_reg != (unsigned int) ~0)
7667 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7669 if ((!type->bitfield.reg
7670 || (!type->bitfield.dword && !type->bitfield.qword))
7671 && !type->bitfield.regsimd
7672 && !operand_type_equal (type, &regmask))
7673 abort ();
7675 i.vex.register_specifier = i.op[vex_reg].regs;
7678 /* Don't set OP operand twice. */
7679 if (vex_reg != op)
7681 /* If there is an extension opcode to put here, the
7682 register number must be put into the regmem field. */
7683 if (i.tm.extension_opcode != None)
7685 i.rm.regmem = i.op[op].regs->reg_num;
7686 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7687 i.rex |= REX_B;
7688 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7689 i.vrex |= REX_B;
7691 else
7693 i.rm.reg = i.op[op].regs->reg_num;
7694 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7695 i.rex |= REX_R;
7696 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7697 i.vrex |= REX_R;
7701 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7702 must set it to 3 to indicate this is a register operand
7703 in the regmem field. */
7704 if (!i.mem_operands)
7705 i.rm.mode = 3;
7708 /* Fill in i.rm.reg field with extension opcode (if any). */
7709 if (i.tm.extension_opcode != None)
7710 i.rm.reg = i.tm.extension_opcode;
7712 return default_seg;
7715 static void
7716 output_branch (void)
7718 char *p;
7719 int size;
7720 int code16;
7721 int prefix;
7722 relax_substateT subtype;
7723 symbolS *sym;
7724 offsetT off;
7726 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7727 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7729 prefix = 0;
7730 if (i.prefix[DATA_PREFIX] != 0)
7732 prefix = 1;
7733 i.prefixes -= 1;
7734 code16 ^= CODE16;
7736 /* Pentium4 branch hints. */
7737 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7738 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7740 prefix++;
7741 i.prefixes--;
7743 if (i.prefix[REX_PREFIX] != 0)
7745 prefix++;
7746 i.prefixes--;
7749 /* BND prefixed jump. */
7750 if (i.prefix[BND_PREFIX] != 0)
7752 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7753 i.prefixes -= 1;
7756 if (i.prefixes != 0 && !intel_syntax)
7757 as_warn (_("skipping prefixes on this instruction"));
7759 /* It's always a symbol; End frag & setup for relax.
7760 Make sure there is enough room in this frag for the largest
7761 instruction we may generate in md_convert_frag. This is 2
7762 bytes for the opcode and room for the prefix and largest
7763 displacement. */
7764 frag_grow (prefix + 2 + 4);
7765 /* Prefix and 1 opcode byte go in fr_fix. */
7766 p = frag_more (prefix + 1);
7767 if (i.prefix[DATA_PREFIX] != 0)
7768 *p++ = DATA_PREFIX_OPCODE;
7769 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7770 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7771 *p++ = i.prefix[SEG_PREFIX];
7772 if (i.prefix[REX_PREFIX] != 0)
7773 *p++ = i.prefix[REX_PREFIX];
7774 *p = i.tm.base_opcode;
7776 if ((unsigned char) *p == JUMP_PC_RELATIVE)
7777 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7778 else if (cpu_arch_flags.bitfield.cpui386)
7779 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7780 else
7781 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7782 subtype |= code16;
7784 sym = i.op[0].disps->X_add_symbol;
7785 off = i.op[0].disps->X_add_number;
7787 if (i.op[0].disps->X_op != O_constant
7788 && i.op[0].disps->X_op != O_symbol)
7790 /* Handle complex expressions. */
7791 sym = make_expr_symbol (i.op[0].disps);
7792 off = 0;
7795 /* 1 possible extra opcode + 4 byte displacement go in var part.
7796 Pass reloc in fr_var. */
7797 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* Tell whether a branch to symbol S should carry a PLT32 relocation.
   Returns TRUE when it should, FALSE otherwise.  */

static bfd_boolean
need_plt32_p (symbolS *s)
{
  /* PLT32 relocation is ELF only.  */
  if (!IS_ELF)
    return FALSE;

#ifdef TE_SOLARIS
  /* Don't emit PLT32 relocation on Solaris: neither native linker nor
     krtld support it.  */
  return FALSE;
#endif

  /* Since there is no need to prepare for PLT branch on x86-64, we
     can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
     be used as a marker for 32-bit PC-relative branches.  Other
     object formats never get it.  */
  if (!object_64bit)
    return FALSE;

  /* Weak and undefined symbols need PLT32, and so does every other
     global symbol; only defined, non-weak, non-global symbols do not.
     NB: Symbols with non-default visibility are treated as normal
     global symbols so that PLT32 can serve as a marker for 32-bit
     PC-relative branches, which is useful for linker relaxation.  */
  if (S_IS_WEAK (s) || !S_IS_DEFINED (s) || S_IS_EXTERNAL (s))
    return TRUE;

  return FALSE;
}
#endif
7839 static void
7840 output_jump (void)
7842 char *p;
7843 int size;
7844 fixS *fixP;
7845 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
7847 if (i.tm.opcode_modifier.jumpbyte)
7849 /* This is a loop or jecxz type instruction. */
7850 size = 1;
7851 if (i.prefix[ADDR_PREFIX] != 0)
7853 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
7854 i.prefixes -= 1;
7856 /* Pentium4 branch hints. */
7857 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7858 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7860 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
7861 i.prefixes--;
7864 else
7866 int code16;
7868 code16 = 0;
7869 if (flag_code == CODE_16BIT)
7870 code16 = CODE16;
7872 if (i.prefix[DATA_PREFIX] != 0)
7874 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
7875 i.prefixes -= 1;
7876 code16 ^= CODE16;
7879 size = 4;
7880 if (code16)
7881 size = 2;
7884 if (i.prefix[REX_PREFIX] != 0)
7886 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
7887 i.prefixes -= 1;
7890 /* BND prefixed jump. */
7891 if (i.prefix[BND_PREFIX] != 0)
7893 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7894 i.prefixes -= 1;
7897 if (i.prefixes != 0 && !intel_syntax)
7898 as_warn (_("skipping prefixes on this instruction"));
7900 p = frag_more (i.tm.opcode_length + size);
7901 switch (i.tm.opcode_length)
7903 case 2:
7904 *p++ = i.tm.base_opcode >> 8;
7905 /* Fall through. */
7906 case 1:
7907 *p++ = i.tm.base_opcode;
7908 break;
7909 default:
7910 abort ();
7913 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7914 if (size == 4
7915 && jump_reloc == NO_RELOC
7916 && need_plt32_p (i.op[0].disps->X_add_symbol))
7917 jump_reloc = BFD_RELOC_X86_64_PLT32;
7918 #endif
7920 jump_reloc = reloc (size, 1, 1, jump_reloc);
7922 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7923 i.op[0].disps, 1, jump_reloc);
7925 /* All jumps handled here are signed, but don't use a signed limit
7926 check for 32 and 16 bit jumps as we want to allow wrap around at
7927 4G and 64k respectively. */
7928 if (size == 1)
7929 fixP->fx_signed = 1;
7932 static void
7933 output_interseg_jump (void)
7935 char *p;
7936 int size;
7937 int prefix;
7938 int code16;
7940 code16 = 0;
7941 if (flag_code == CODE_16BIT)
7942 code16 = CODE16;
7944 prefix = 0;
7945 if (i.prefix[DATA_PREFIX] != 0)
7947 prefix = 1;
7948 i.prefixes -= 1;
7949 code16 ^= CODE16;
7951 if (i.prefix[REX_PREFIX] != 0)
7953 prefix++;
7954 i.prefixes -= 1;
7957 size = 4;
7958 if (code16)
7959 size = 2;
7961 if (i.prefixes != 0 && !intel_syntax)
7962 as_warn (_("skipping prefixes on this instruction"));
7964 /* 1 opcode; 2 segment; offset */
7965 p = frag_more (prefix + 1 + 2 + size);
7967 if (i.prefix[DATA_PREFIX] != 0)
7968 *p++ = DATA_PREFIX_OPCODE;
7970 if (i.prefix[REX_PREFIX] != 0)
7971 *p++ = i.prefix[REX_PREFIX];
7973 *p++ = i.tm.base_opcode;
7974 if (i.op[1].imms->X_op == O_constant)
7976 offsetT n = i.op[1].imms->X_add_number;
7978 if (size == 2
7979 && !fits_in_unsigned_word (n)
7980 && !fits_in_signed_word (n))
7982 as_bad (_("16-bit jump out of range"));
7983 return;
7985 md_number_to_chars (p, n, size);
7987 else
7988 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7989 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
7990 if (i.op[0].imms->X_op != O_constant)
7991 as_bad (_("can't handle non absolute segment in `%s'"),
7992 i.tm.name);
7993 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* Write the .note.gnu.property section that records the ISA and
   feature bits accumulated in x86_isa_1_used and x86_feature_2_used.
   Does nothing unless the output is ELF and x86_used_note is set.  */
void
x86_cleanup (void)
{
  asection *saved_seg = now_seg;
  subsegT saved_subseg = now_subseg;
  asection *note_sec;
  char *cursor;
  unsigned int align_log2, align_mask;
  unsigned int isa_raw, isa_padded;
  unsigned int feat_raw, feat_padded;
  unsigned int descsz;
  unsigned int pad;

  if (!IS_ELF || !x86_used_note)
    return;

  x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;

  /* The .note.gnu.property section layout:

     Field      Length          Contents
     ----       ----            ----
     n_namsz    4               4
     n_descsz   4               The note descriptor size
     n_type     4               NT_GNU_PROPERTY_TYPE_0
     n_name     4               "GNU"
     n_desc     n_descsz        The program property array
     ....       ....            ....
   */

  /* Create the .note.gnu.property section.  */
  note_sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
  bfd_set_section_flags (stdoutput, note_sec,
                         (SEC_ALLOC
                          | SEC_LOAD
                          | SEC_DATA
                          | SEC_HAS_CONTENTS
                          | SEC_READONLY));

  /* Properties are 8 byte aligned for ELFCLASS64 and 4 byte aligned
     otherwise.  */
  if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
    align_log2 = 3;
  else
    align_log2 = 2;
  align_mask = (1u << align_log2) - 1;

  bfd_set_section_alignment (stdoutput, note_sec, align_log2);
  elf_section_type (note_sec) = SHT_NOTE;

  /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
     + 4-byte data, rounded up to the alignment.  */
  isa_raw = 4 + 4 + 4;
  isa_padded = (isa_raw + align_mask) & ~align_mask;

  /* GNU_PROPERTY_X86_FEATURE_2_USED follows with the same shape; its
     sizes are cumulative, i.e. they include the padded first
     property.  */
  feat_raw = isa_padded + 4 + 4 + 4;
  feat_padded = (feat_raw + align_mask) & ~align_mask;

  descsz = feat_padded;

  /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz.  */
  cursor = frag_more (4 + 4 + 4 + 4 + descsz);

  /* Note header: n_namsz, n_descsz, n_type, n_name.  */
  md_number_to_chars (cursor, (valueT) 4, 4);
  cursor += 4;
  md_number_to_chars (cursor, (valueT) descsz, 4);
  cursor += 4;
  md_number_to_chars (cursor, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
  cursor += 4;
  memcpy (cursor, "GNU", 4);
  cursor += 4;

  /* First property: type, data size, data, then zeroed padding.  */
  md_number_to_chars (cursor, (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
  cursor += 4;
  md_number_to_chars (cursor, (valueT) 4, 4);
  cursor += 4;
  md_number_to_chars (cursor, (valueT) x86_isa_1_used, 4);
  cursor += 4;
  pad = isa_padded - isa_raw;
  if (pad)
    memset (cursor, 0, pad);
  cursor += pad;

  /* Second property: type, data size, data, then zeroed padding.  */
  md_number_to_chars (cursor, (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
  cursor += 4;
  md_number_to_chars (cursor, (valueT) 4, 4);
  cursor += 4;
  md_number_to_chars (cursor, (valueT) x86_feature_2_used, 4);
  cursor += 4;
  pad = feat_padded - feat_raw;
  if (pad)
    memset (cursor, 0, pad);

  /* We probably can't restore the current segment, for there likely
     isn't one yet...  */
  if (saved_seg && saved_subseg)
    subseg_set (saved_seg, saved_subseg);
}
#endif
8117 static void
8118 output_insn (void)
8120 fragS *insn_start_frag;
8121 offsetT insn_start_off;
8123 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8124 if (IS_ELF && x86_used_note)
8126 if (i.tm.cpu_flags.bitfield.cpucmov)
8127 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8128 if (i.tm.cpu_flags.bitfield.cpusse)
8129 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8130 if (i.tm.cpu_flags.bitfield.cpusse2)
8131 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8132 if (i.tm.cpu_flags.bitfield.cpusse3)
8133 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
8134 if (i.tm.cpu_flags.bitfield.cpussse3)
8135 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
8136 if (i.tm.cpu_flags.bitfield.cpusse4_1)
8137 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
8138 if (i.tm.cpu_flags.bitfield.cpusse4_2)
8139 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
8140 if (i.tm.cpu_flags.bitfield.cpuavx)
8141 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
8142 if (i.tm.cpu_flags.bitfield.cpuavx2)
8143 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
8144 if (i.tm.cpu_flags.bitfield.cpufma)
8145 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
8146 if (i.tm.cpu_flags.bitfield.cpuavx512f)
8147 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
8148 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
8149 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
8150 if (i.tm.cpu_flags.bitfield.cpuavx512er)
8151 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
8152 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
8153 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
8154 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
8155 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
8156 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
8157 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
8158 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
8159 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
8160 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
8161 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
8162 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
8163 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
8164 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
8165 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
8166 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
8167 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
8168 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
8169 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
8170 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
8171 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
8172 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
8173 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
8174 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
8175 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
8177 if (i.tm.cpu_flags.bitfield.cpu8087
8178 || i.tm.cpu_flags.bitfield.cpu287
8179 || i.tm.cpu_flags.bitfield.cpu387
8180 || i.tm.cpu_flags.bitfield.cpu687
8181 || i.tm.cpu_flags.bitfield.cpufisttp)
8182 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
8183 /* Don't set GNU_PROPERTY_X86_FEATURE_2_MMX for prefetchtXXX nor
8184 Xfence instructions. */
8185 if (i.tm.base_opcode != 0xf18
8186 && i.tm.base_opcode != 0xf0d
8187 && i.tm.base_opcode != 0xfae
8188 && (i.has_regmmx
8189 || i.tm.cpu_flags.bitfield.cpummx
8190 || i.tm.cpu_flags.bitfield.cpua3dnow
8191 || i.tm.cpu_flags.bitfield.cpua3dnowa))
8192 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
8193 if (i.has_regxmm)
8194 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
8195 if (i.has_regymm)
8196 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
8197 if (i.has_regzmm)
8198 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
8199 if (i.tm.cpu_flags.bitfield.cpufxsr)
8200 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
8201 if (i.tm.cpu_flags.bitfield.cpuxsave)
8202 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
8203 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
8204 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
8205 if (i.tm.cpu_flags.bitfield.cpuxsavec)
8206 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
8208 #endif
8210 /* Tie dwarf2 debug info to the address at the start of the insn.
8211 We can't do this after the insn has been output as the current
8212 frag may have been closed off. eg. by frag_var. */
8213 dwarf2_emit_insn (0);
8215 insn_start_frag = frag_now;
8216 insn_start_off = frag_now_fix ();
8218 /* Output jumps. */
8219 if (i.tm.opcode_modifier.jump)
8220 output_branch ();
8221 else if (i.tm.opcode_modifier.jumpbyte
8222 || i.tm.opcode_modifier.jumpdword)
8223 output_jump ();
8224 else if (i.tm.opcode_modifier.jumpintersegment)
8225 output_interseg_jump ();
8226 else
8228 /* Output normal instructions here. */
8229 char *p;
8230 unsigned char *q;
8231 unsigned int j;
8232 unsigned int prefix;
8234 if (avoid_fence
8235 && i.tm.base_opcode == 0xfae
8236 && i.operands == 1
8237 && i.imm_operands == 1
8238 && (i.op[0].imms->X_add_number == 0xe8
8239 || i.op[0].imms->X_add_number == 0xf0
8240 || i.op[0].imms->X_add_number == 0xf8))
8242 /* Encode lfence, mfence, and sfence as
8243 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
8244 offsetT val = 0x240483f0ULL;
8245 p = frag_more (5);
8246 md_number_to_chars (p, val, 5);
8247 return;
8250 /* Some processors fail on LOCK prefix. This options makes
8251 assembler ignore LOCK prefix and serves as a workaround. */
8252 if (omit_lock_prefix)
8254 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
8255 return;
8256 i.prefix[LOCK_PREFIX] = 0;
8259 /* Since the VEX/EVEX prefix contains the implicit prefix, we
8260 don't need the explicit prefix. */
8261 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
8263 switch (i.tm.opcode_length)
8265 case 3:
8266 if (i.tm.base_opcode & 0xff000000)
8268 prefix = (i.tm.base_opcode >> 24) & 0xff;
8269 add_prefix (prefix);
8271 break;
8272 case 2:
8273 if ((i.tm.base_opcode & 0xff0000) != 0)
8275 prefix = (i.tm.base_opcode >> 16) & 0xff;
8276 if (!i.tm.cpu_flags.bitfield.cpupadlock
8277 || prefix != REPE_PREFIX_OPCODE
8278 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
8279 add_prefix (prefix);
8281 break;
8282 case 1:
8283 break;
8284 case 0:
8285 /* Check for pseudo prefixes. */
8286 as_bad_where (insn_start_frag->fr_file,
8287 insn_start_frag->fr_line,
8288 _("pseudo prefix without instruction"));
8289 return;
8290 default:
8291 abort ();
8294 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8295 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
8296 R_X86_64_GOTTPOFF relocation so that linker can safely
8297 perform IE->LE optimization. */
8298 if (x86_elf_abi == X86_64_X32_ABI
8299 && i.operands == 2
8300 && i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
8301 && i.prefix[REX_PREFIX] == 0)
8302 add_prefix (REX_OPCODE);
8303 #endif
8305 /* The prefix bytes. */
8306 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
8307 if (*q)
8308 FRAG_APPEND_1_CHAR (*q);
8310 else
8312 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
8313 if (*q)
8314 switch (j)
8316 case REX_PREFIX:
8317 /* REX byte is encoded in VEX prefix. */
8318 break;
8319 case SEG_PREFIX:
8320 case ADDR_PREFIX:
8321 FRAG_APPEND_1_CHAR (*q);
8322 break;
8323 default:
8324 /* There should be no other prefixes for instructions
8325 with VEX prefix. */
8326 abort ();
8329 /* For EVEX instructions i.vrex should become 0 after
8330 build_evex_prefix. For VEX instructions upper 16 registers
8331 aren't available, so VREX should be 0. */
8332 if (i.vrex)
8333 abort ();
8334 /* Now the VEX prefix. */
8335 p = frag_more (i.vex.length);
8336 for (j = 0; j < i.vex.length; j++)
8337 p[j] = i.vex.bytes[j];
8340 /* Now the opcode; be careful about word order here! */
8341 if (i.tm.opcode_length == 1)
8343 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
8345 else
8347 switch (i.tm.opcode_length)
8349 case 4:
8350 p = frag_more (4);
8351 *p++ = (i.tm.base_opcode >> 24) & 0xff;
8352 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8353 break;
8354 case 3:
8355 p = frag_more (3);
8356 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8357 break;
8358 case 2:
8359 p = frag_more (2);
8360 break;
8361 default:
8362 abort ();
8363 break;
8366 /* Put out high byte first: can't use md_number_to_chars! */
8367 *p++ = (i.tm.base_opcode >> 8) & 0xff;
8368 *p = i.tm.base_opcode & 0xff;
8371 /* Now the modrm byte and sib byte (if present). */
8372 if (i.tm.opcode_modifier.modrm)
8374 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
8375 | i.rm.reg << 3
8376 | i.rm.mode << 6));
8377 /* If i.rm.regmem == ESP (4)
8378 && i.rm.mode != (Register mode)
8379 && not 16 bit
8380 ==> need second modrm byte. */
8381 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
8382 && i.rm.mode != 3
8383 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
8384 FRAG_APPEND_1_CHAR ((i.sib.base << 0
8385 | i.sib.index << 3
8386 | i.sib.scale << 6));
8389 if (i.disp_operands)
8390 output_disp (insn_start_frag, insn_start_off);
8392 if (i.imm_operands)
8393 output_imm (insn_start_frag, insn_start_off);
8396 #ifdef DEBUG386
8397 if (flag_debug)
8399 pi ("" /*line*/, &i);
8401 #endif /* DEBUG386 */
8404 /* Return the size of the displacement operand N. */
8406 static int
8407 disp_size (unsigned int n)
8409 int size = 4;
8411 if (i.types[n].bitfield.disp64)
8412 size = 8;
8413 else if (i.types[n].bitfield.disp8)
8414 size = 1;
8415 else if (i.types[n].bitfield.disp16)
8416 size = 2;
8417 return size;
8420 /* Return the size of the immediate operand N. */
8422 static int
8423 imm_size (unsigned int n)
8425 int size = 4;
8426 if (i.types[n].bitfield.imm64)
8427 size = 8;
8428 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
8429 size = 1;
8430 else if (i.types[n].bitfield.imm16)
8431 size = 2;
8432 return size;
8435 static void
8436 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
8438 char *p;
8439 unsigned int n;
8441 for (n = 0; n < i.operands; n++)
8443 if (operand_type_check (i.types[n], disp))
8445 if (i.op[n].disps->X_op == O_constant)
8447 int size = disp_size (n);
8448 offsetT val = i.op[n].disps->X_add_number;
8450 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
8451 size);
8452 p = frag_more (size);
8453 md_number_to_chars (p, val, size);
8455 else
8457 enum bfd_reloc_code_real reloc_type;
8458 int size = disp_size (n);
8459 int sign = i.types[n].bitfield.disp32s;
8460 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
8461 fixS *fixP;
8463 /* We can't have 8 bit displacement here. */
8464 gas_assert (!i.types[n].bitfield.disp8);
8466 /* The PC relative address is computed relative
8467 to the instruction boundary, so in case immediate
8468 fields follows, we need to adjust the value. */
8469 if (pcrel && i.imm_operands)
8471 unsigned int n1;
8472 int sz = 0;
8474 for (n1 = 0; n1 < i.operands; n1++)
8475 if (operand_type_check (i.types[n1], imm))
8477 /* Only one immediate is allowed for PC
8478 relative address. */
8479 gas_assert (sz == 0);
8480 sz = imm_size (n1);
8481 i.op[n].disps->X_add_number -= sz;
8483 /* We should find the immediate. */
8484 gas_assert (sz != 0);
8487 p = frag_more (size);
8488 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
8489 if (GOT_symbol
8490 && GOT_symbol == i.op[n].disps->X_add_symbol
8491 && (((reloc_type == BFD_RELOC_32
8492 || reloc_type == BFD_RELOC_X86_64_32S
8493 || (reloc_type == BFD_RELOC_64
8494 && object_64bit))
8495 && (i.op[n].disps->X_op == O_symbol
8496 || (i.op[n].disps->X_op == O_add
8497 && ((symbol_get_value_expression
8498 (i.op[n].disps->X_op_symbol)->X_op)
8499 == O_subtract))))
8500 || reloc_type == BFD_RELOC_32_PCREL))
8502 offsetT add;
8504 if (insn_start_frag == frag_now)
8505 add = (p - frag_now->fr_literal) - insn_start_off;
8506 else
8508 fragS *fr;
8510 add = insn_start_frag->fr_fix - insn_start_off;
8511 for (fr = insn_start_frag->fr_next;
8512 fr && fr != frag_now; fr = fr->fr_next)
8513 add += fr->fr_fix;
8514 add += p - frag_now->fr_literal;
8517 if (!object_64bit)
8519 reloc_type = BFD_RELOC_386_GOTPC;
8520 i.op[n].imms->X_add_number += add;
8522 else if (reloc_type == BFD_RELOC_64)
8523 reloc_type = BFD_RELOC_X86_64_GOTPC64;
8524 else
8525 /* Don't do the adjustment for x86-64, as there
8526 the pcrel addressing is relative to the _next_
8527 insn, and that is taken care of in other code. */
8528 reloc_type = BFD_RELOC_X86_64_GOTPC32;
8530 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
8531 size, i.op[n].disps, pcrel,
8532 reloc_type);
8533 /* Check for "call/jmp *mem", "mov mem, %reg",
8534 "test %reg, mem" and "binop mem, %reg" where binop
8535 is one of adc, add, and, cmp, or, sbb, sub, xor
8536 instructions without data prefix. Always generate
8537 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
8538 if (i.prefix[DATA_PREFIX] == 0
8539 && (generate_relax_relocations
8540 || (!object_64bit
8541 && i.rm.mode == 0
8542 && i.rm.regmem == 5))
8543 && (i.rm.mode == 2
8544 || (i.rm.mode == 0 && i.rm.regmem == 5))
8545 && ((i.operands == 1
8546 && i.tm.base_opcode == 0xff
8547 && (i.rm.reg == 2 || i.rm.reg == 4))
8548 || (i.operands == 2
8549 && (i.tm.base_opcode == 0x8b
8550 || i.tm.base_opcode == 0x85
8551 || (i.tm.base_opcode & 0xc7) == 0x03))))
8553 if (object_64bit)
8555 fixP->fx_tcbit = i.rex != 0;
8556 if (i.base_reg
8557 && (i.base_reg->reg_num == RegIP))
8558 fixP->fx_tcbit2 = 1;
8560 else
8561 fixP->fx_tcbit2 = 1;
8568 static void
8569 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
8571 char *p;
8572 unsigned int n;
8574 for (n = 0; n < i.operands; n++)
8576 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
8577 if (i.rounding && (int) n == i.rounding->operand)
8578 continue;
8580 if (operand_type_check (i.types[n], imm))
8582 if (i.op[n].imms->X_op == O_constant)
8584 int size = imm_size (n);
8585 offsetT val;
8587 val = offset_in_range (i.op[n].imms->X_add_number,
8588 size);
8589 p = frag_more (size);
8590 md_number_to_chars (p, val, size);
8592 else
8594 /* Not absolute_section.
8595 Need a 32-bit fixup (don't support 8bit
8596 non-absolute imms). Try to support other
8597 sizes ... */
8598 enum bfd_reloc_code_real reloc_type;
8599 int size = imm_size (n);
8600 int sign;
8602 if (i.types[n].bitfield.imm32s
8603 && (i.suffix == QWORD_MNEM_SUFFIX
8604 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
8605 sign = 1;
8606 else
8607 sign = 0;
8609 p = frag_more (size);
8610 reloc_type = reloc (size, 0, sign, i.reloc[n]);
8612 /* This is tough to explain. We end up with this one if we
8613 * have operands that look like
8614 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
8615 * obtain the absolute address of the GOT, and it is strongly
8616 * preferable from a performance point of view to avoid using
8617 * a runtime relocation for this. The actual sequence of
8618 * instructions often look something like:
8620 * call .L66
8621 * .L66:
8622 * popl %ebx
8623 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
8625 * The call and pop essentially return the absolute address
8626 * of the label .L66 and store it in %ebx. The linker itself
8627 * will ultimately change the first operand of the addl so
8628 * that %ebx points to the GOT, but to keep things simple, the
8629 * .o file must have this operand set so that it generates not
8630 * the absolute address of .L66, but the absolute address of
8631 * itself. This allows the linker itself simply treat a GOTPC
8632 * relocation as asking for a pcrel offset to the GOT to be
8633 * added in, and the addend of the relocation is stored in the
8634 * operand field for the instruction itself.
8636 * Our job here is to fix the operand so that it would add
8637 * the correct offset so that %ebx would point to itself. The
8638 * thing that is tricky is that .-.L66 will point to the
8639 * beginning of the instruction, so we need to further modify
8640 * the operand so that it will point to itself. There are
8641 * other cases where you have something like:
8643 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
8645 * and here no correction would be required. Internally in
8646 * the assembler we treat operands of this form as not being
8647 * pcrel since the '.' is explicitly mentioned, and I wonder
8648 * whether it would simplify matters to do it this way. Who
8649 * knows. In earlier versions of the PIC patches, the
8650 * pcrel_adjust field was used to store the correction, but
8651 * since the expression is not pcrel, I felt it would be
8652 * confusing to do it this way. */
8654 if ((reloc_type == BFD_RELOC_32
8655 || reloc_type == BFD_RELOC_X86_64_32S
8656 || reloc_type == BFD_RELOC_64)
8657 && GOT_symbol
8658 && GOT_symbol == i.op[n].imms->X_add_symbol
8659 && (i.op[n].imms->X_op == O_symbol
8660 || (i.op[n].imms->X_op == O_add
8661 && ((symbol_get_value_expression
8662 (i.op[n].imms->X_op_symbol)->X_op)
8663 == O_subtract))))
8665 offsetT add;
8667 if (insn_start_frag == frag_now)
8668 add = (p - frag_now->fr_literal) - insn_start_off;
8669 else
8671 fragS *fr;
8673 add = insn_start_frag->fr_fix - insn_start_off;
8674 for (fr = insn_start_frag->fr_next;
8675 fr && fr != frag_now; fr = fr->fr_next)
8676 add += fr->fr_fix;
8677 add += p - frag_now->fr_literal;
8680 if (!object_64bit)
8681 reloc_type = BFD_RELOC_386_GOTPC;
8682 else if (size == 4)
8683 reloc_type = BFD_RELOC_X86_64_GOTPC32;
8684 else if (size == 8)
8685 reloc_type = BFD_RELOC_X86_64_GOTPC64;
8686 i.op[n].imms->X_add_number += add;
8688 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8689 i.op[n].imms, 0, reloc_type);
8695 /* x86_cons_fix_new is called via the expression parsing code when a
8696 reloc is needed. We use this hook to get the correct .got reloc. */
8697 static int cons_sign = -1;
8699 void
8700 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
8701 expressionS *exp, bfd_reloc_code_real_type r)
8703 r = reloc (len, 0, cons_sign, r);
8705 #ifdef TE_PE
8706 if (exp->X_op == O_secrel)
8708 exp->X_op = O_symbol;
8709 r = BFD_RELOC_32_SECREL;
8711 #endif
8713 fix_new_exp (frag, off, len, exp, 0, r);
8716 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
8717 purpose of the `.dc.a' internal pseudo-op. */
8720 x86_address_bytes (void)
8722 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
8723 return 4;
8724 return stdoutput->arch_info->bits_per_address / 8;
#if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
    || defined (LEX_AT)
# define lex_got(reloc, adjust, types) NULL
#else
/* Parse operands of the form
   <symbol>@GOTOFF+<nnn>
   and similar .plt or .got references.

   If we find one, set up the correct relocation in REL and copy the
   input string, minus the `@GOTOFF' into a malloc'd buffer for
   parsing by the calling routine.  Return this buffer, and if ADJUST
   is non-null set it to the length of the string we removed from the
   input line.  If TYPES is non-null it receives the operand types the
   relocation permits.  Otherwise return NULL.  */
static char *
lex_got (enum bfd_reloc_code_real *rel,
         int *adjust,
         i386_operand_type *types)
{
  /* Some of the relocations depend on the size of what field is to
     be relocated.  But in our callers i386_immediate and i386_displacement
     we don't yet know the operand size (this will be set by insn
     matching).  Hence we record the word32 relocation here,
     and adjust the reloc according to the real size in reloc().  */
  static const struct {
    const char *str;
    int len;
    const enum bfd_reloc_code_real rel[2];
    const i386_operand_type types64;
  } gotrel[] = {
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
    { STRING_COMMA_LEN ("SIZE"),      { BFD_RELOC_SIZE32,
                                        BFD_RELOC_SIZE32 },
      OPERAND_TYPE_IMM32_64 },
#endif
    { STRING_COMMA_LEN ("PLTOFF"),   { _dummy_first_bfd_reloc_code_real,
                                       BFD_RELOC_X86_64_PLTOFF64 },
      OPERAND_TYPE_IMM64 },
    { STRING_COMMA_LEN ("PLT"),      { BFD_RELOC_386_PLT32,
                                       BFD_RELOC_X86_64_PLT32    },
      OPERAND_TYPE_IMM32_32S_DISP32 },
    { STRING_COMMA_LEN ("GOTPLT"),   { _dummy_first_bfd_reloc_code_real,
                                       BFD_RELOC_X86_64_GOTPLT64 },
      OPERAND_TYPE_IMM64_DISP64 },
    { STRING_COMMA_LEN ("GOTOFF"),   { BFD_RELOC_386_GOTOFF,
                                       BFD_RELOC_X86_64_GOTOFF64 },
      OPERAND_TYPE_IMM64_DISP64 },
    { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
                                       BFD_RELOC_X86_64_GOTPCREL },
      OPERAND_TYPE_IMM32_32S_DISP32 },
    { STRING_COMMA_LEN ("TLSGD"),    { BFD_RELOC_386_TLS_GD,
                                       BFD_RELOC_X86_64_TLSGD    },
      OPERAND_TYPE_IMM32_32S_DISP32 },
    { STRING_COMMA_LEN ("TLSLDM"),   { BFD_RELOC_386_TLS_LDM,
                                       _dummy_first_bfd_reloc_code_real },
      OPERAND_TYPE_NONE },
    { STRING_COMMA_LEN ("TLSLD"),    { _dummy_first_bfd_reloc_code_real,
                                       BFD_RELOC_X86_64_TLSLD    },
      OPERAND_TYPE_IMM32_32S_DISP32 },
    { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
                                       BFD_RELOC_X86_64_GOTTPOFF },
      OPERAND_TYPE_IMM32_32S_DISP32 },
    { STRING_COMMA_LEN ("TPOFF"),    { BFD_RELOC_386_TLS_LE_32,
                                       BFD_RELOC_X86_64_TPOFF32  },
      OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
    { STRING_COMMA_LEN ("NTPOFF"),   { BFD_RELOC_386_TLS_LE,
                                       _dummy_first_bfd_reloc_code_real },
      OPERAND_TYPE_NONE },
    { STRING_COMMA_LEN ("DTPOFF"),   { BFD_RELOC_386_TLS_LDO_32,
                                       BFD_RELOC_X86_64_DTPOFF32 },
      OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
    { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
                                       _dummy_first_bfd_reloc_code_real },
      OPERAND_TYPE_NONE },
    { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
                                       _dummy_first_bfd_reloc_code_real },
      OPERAND_TYPE_NONE },
    { STRING_COMMA_LEN ("GOT"),      { BFD_RELOC_386_GOT32,
                                       BFD_RELOC_X86_64_GOT32    },
      OPERAND_TYPE_IMM32_32S_64_DISP32 },
    { STRING_COMMA_LEN ("TLSDESC"),  { BFD_RELOC_386_TLS_GOTDESC,
                                       BFD_RELOC_X86_64_GOTPC32_TLSDESC },
      OPERAND_TYPE_IMM32_32S_DISP32 },
    { STRING_COMMA_LEN ("TLSCALL"),  { BFD_RELOC_386_TLS_DESC_CALL,
                                       BFD_RELOC_X86_64_TLSDESC_CALL },
      OPERAND_TYPE_IMM32_32S_DISP32 },
  };
  char *cp;
  unsigned int j;

#if defined (OBJ_MAYBE_ELF)
  if (!IS_ELF)
    return NULL;
#endif

  /* Find the '@' within the current operand, if there is one.  */
  for (cp = input_line_pointer; *cp != '@'; cp++)
    if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
      return NULL;

  for (j = 0; j < ARRAY_SIZE (gotrel); j++)
    {
      const int toklen = gotrel[j].len;
      int removed = toklen;
      int first, second;
      char *tmpbuf, *past_reloc;

      if (strncasecmp (cp + 1, gotrel[j].str, toklen) != 0)
        continue;

      if (gotrel[j].rel[object_64bit] == 0)
        {
          as_bad (_("@%s reloc is not supported with %d-bit output format"),
                  gotrel[j].str, 1 << (5 + object_64bit));
          return NULL;
        }

      *rel = gotrel[j].rel[object_64bit];

      if (types)
        {
          if (flag_code != CODE_64BIT)
            {
              types->bitfield.imm32 = 1;
              types->bitfield.disp32 = 1;
            }
          else
            *types = gotrel[j].types64;
        }

      /* Every entry except the first one causes the GOT symbol to be
         created if it does not exist yet.  */
      if (j != 0 && GOT_symbol == NULL)
        GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);

      /* The length of the first part of our input line.  */
      first = cp - input_line_pointer;

      /* The second part goes from after the reloc token until
         (and including) an end_of_line char or comma.  */
      past_reloc = cp + 1 + toklen;
      cp = past_reloc;
      while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
        ++cp;
      second = cp + 1 - past_reloc;

      /* Allocate and copy string.  The trailing NUL shouldn't
         be necessary, but be safe.  */
      tmpbuf = XNEWVEC (char, first + second + 2);
      memcpy (tmpbuf, input_line_pointer, first);
      if (second != 0 && *past_reloc != ' ')
        /* Replace the relocation token with ' ', so that
           errors like foo@GOTOFF1 will be detected.  */
        tmpbuf[first++] = ' ';
      else
        /* Increment length by 1 if the relocation token is
           removed.  */
        removed++;
      if (adjust)
        *adjust = removed;
      memcpy (tmpbuf + first, past_reloc, second);
      tmpbuf[first + second] = '\0';
      return tmpbuf;
    }

  /* Might be a symbol version string.  Don't as_bad here.  */
  return NULL;
}
#endif
#ifdef TE_PE
#ifdef lex_got
#undef lex_got
#endif
/* Parse operands of the form
   <symbol>@SECREL32+<nnn>

   If we find one, set up the correct relocation in REL and copy the
   input string, minus the `@SECREL32' into a malloc'd buffer for
   parsing by the calling routine.  Return this buffer, and if ADJUST
   is non-null set it to the length of the string we removed from the
   input line.  If TYPES is non-null it receives the operand types the
   relocation permits.  Otherwise return NULL.

   This function is copied from the ELF version above adjusted for PE targets.  */

static char *
lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
         int *adjust ATTRIBUTE_UNUSED,
         i386_operand_type *types)
{
  static const struct
  {
    const char *str;
    int len;
    const enum bfd_reloc_code_real rel[2];
    const i386_operand_type types64;
  }
  gotrel[] =
  {
    { STRING_COMMA_LEN ("SECREL32"),    { BFD_RELOC_32_SECREL,
                                          BFD_RELOC_32_SECREL },
      OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
  };

  char *cp;
  unsigned j;

  /* Find the '@' within the current operand, if there is one.  */
  for (cp = input_line_pointer; *cp != '@'; cp++)
    if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
      return NULL;

  for (j = 0; j < ARRAY_SIZE (gotrel); j++)
    {
      int len = gotrel[j].len;

      if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
        {
          if (gotrel[j].rel[object_64bit] != 0)
            {
              int first, second;
              char *tmpbuf, *past_reloc;

              *rel = gotrel[j].rel[object_64bit];

              if (types)
                {
                  if (flag_code != CODE_64BIT)
                    {
                      types->bitfield.imm32 = 1;
                      types->bitfield.disp32 = 1;
                    }
                  else
                    *types = gotrel[j].types64;
                }

              /* The length of the first part of our input line.  */
              first = cp - input_line_pointer;

              /* The second part goes from after the reloc token until
                 (and including) an end_of_line char or comma.  */
              past_reloc = cp + 1 + len;
              cp = past_reloc;
              while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
                ++cp;
              second = cp + 1 - past_reloc;

              /* Allocate and copy string.  The trailing NUL shouldn't
                 be necessary, but be safe.  */
              tmpbuf = XNEWVEC (char, first + second + 2);
              memcpy (tmpbuf, input_line_pointer, first);
              if (second != 0 && *past_reloc != ' ')
                /* Replace the relocation token with ' ', so that
                   errors like foo@SECREL321 will be detected.  The
                   blank stands in for the '@', so exactly LEN
                   characters were dropped.  */
                tmpbuf[first++] = ' ';
              else
                /* The token was removed without a replacement, so the
                   '@' is gone as well: LEN + 1 characters were
                   dropped.  Reporting only LEN would leave the caller
                   one character short when it maps its position back
                   onto the original line.  */
                len++;
              if (adjust)
                *adjust = len;
              memcpy (tmpbuf + first, past_reloc, second);
              tmpbuf[first + second] = '\0';
              return tmpbuf;
            }

          as_bad (_("@%s reloc is not supported with %d-bit output format"),
                  gotrel[j].str, 1 << (5 + object_64bit));
          return NULL;
        }
    }

  /* Might be a symbol version string.  Don't as_bad here.  */
  return NULL;
}

#endif /* TE_PE */
8995 bfd_reloc_code_real_type
8996 x86_cons (expressionS *exp, int size)
8998 bfd_reloc_code_real_type got_reloc = NO_RELOC;
9000 intel_syntax = -intel_syntax;
9002 exp->X_md = 0;
9003 if (size == 4 || (object_64bit && size == 8))
9005 /* Handle @GOTOFF and the like in an expression. */
9006 char *save;
9007 char *gotfree_input_line;
9008 int adjust = 0;
9010 save = input_line_pointer;
9011 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9012 if (gotfree_input_line)
9013 input_line_pointer = gotfree_input_line;
9015 expression (exp);
9017 if (gotfree_input_line)
9019 /* expression () has merrily parsed up to the end of line,
9020 or a comma - in the wrong buffer. Transfer how far
9021 input_line_pointer has moved to the right buffer. */
9022 input_line_pointer = (save
9023 + (input_line_pointer - gotfree_input_line)
9024 + adjust);
9025 free (gotfree_input_line);
9026 if (exp->X_op == O_constant
9027 || exp->X_op == O_absent
9028 || exp->X_op == O_illegal
9029 || exp->X_op == O_register
9030 || exp->X_op == O_big)
9032 char c = *input_line_pointer;
9033 *input_line_pointer = 0;
9034 as_bad (_("missing or invalid expression `%s'"), save);
9035 *input_line_pointer = c;
9037 else if ((got_reloc == BFD_RELOC_386_PLT32
9038 || got_reloc == BFD_RELOC_X86_64_PLT32)
9039 && exp->X_op != O_symbol)
9041 char c = *input_line_pointer;
9042 *input_line_pointer = 0;
9043 as_bad (_("invalid PLT expression `%s'"), save);
9044 *input_line_pointer = c;
9048 else
9049 expression (exp);
9051 intel_syntax = -intel_syntax;
9053 if (intel_syntax)
9054 i386_intel_simplify (exp);
9056 return got_reloc;
9059 static void
9060 signed_cons (int size)
9062 if (flag_code == CODE_64BIT)
9063 cons_sign = 1;
9064 cons (size);
9065 cons_sign = -1;
#ifdef TE_PE
/* Handle a comma-separated list of expressions, emitting each one as
   a 4-byte value.  Plain symbol expressions are turned into O_secrel
   expressions before being emitted.  */

static void
pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
{
  expressionS exp;

  for (;;)
    {
      expression (&exp);
      if (exp.X_op == O_symbol)
        exp.X_op = O_secrel;

      emit_expr (&exp, 4);

      /* Another item follows only after a comma.  */
      if (*input_line_pointer != ',')
        break;
      input_line_pointer++;
    }

  demand_empty_rest_of_line ();
}
#endif
9089 /* Handle Vector operations. */
9091 static char *
9092 check_VecOperations (char *op_string, char *op_end)
9094 const reg_entry *mask;
9095 const char *saved;
9096 char *end_op;
9098 while (*op_string
9099 && (op_end == NULL || op_string < op_end))
9101 saved = op_string;
9102 if (*op_string == '{')
9104 op_string++;
9106 /* Check broadcasts. */
9107 if (strncmp (op_string, "1to", 3) == 0)
9109 int bcst_type;
9111 if (i.broadcast)
9112 goto duplicated_vec_op;
9114 op_string += 3;
9115 if (*op_string == '8')
9116 bcst_type = 8;
9117 else if (*op_string == '4')
9118 bcst_type = 4;
9119 else if (*op_string == '2')
9120 bcst_type = 2;
9121 else if (*op_string == '1'
9122 && *(op_string+1) == '6')
9124 bcst_type = 16;
9125 op_string++;
9127 else
9129 as_bad (_("Unsupported broadcast: `%s'"), saved);
9130 return NULL;
9132 op_string++;
9134 broadcast_op.type = bcst_type;
9135 broadcast_op.operand = this_operand;
9136 broadcast_op.bytes = 0;
9137 i.broadcast = &broadcast_op;
9139 /* Check masking operation. */
9140 else if ((mask = parse_register (op_string, &end_op)) != NULL)
9142 /* k0 can't be used for write mask. */
9143 if (!mask->reg_type.bitfield.regmask || mask->reg_num == 0)
9145 as_bad (_("`%s%s' can't be used for write mask"),
9146 register_prefix, mask->reg_name);
9147 return NULL;
9150 if (!i.mask)
9152 mask_op.mask = mask;
9153 mask_op.zeroing = 0;
9154 mask_op.operand = this_operand;
9155 i.mask = &mask_op;
9157 else
9159 if (i.mask->mask)
9160 goto duplicated_vec_op;
9162 i.mask->mask = mask;
9164 /* Only "{z}" is allowed here. No need to check
9165 zeroing mask explicitly. */
9166 if (i.mask->operand != this_operand)
9168 as_bad (_("invalid write mask `%s'"), saved);
9169 return NULL;
9173 op_string = end_op;
9175 /* Check zeroing-flag for masking operation. */
9176 else if (*op_string == 'z')
9178 if (!i.mask)
9180 mask_op.mask = NULL;
9181 mask_op.zeroing = 1;
9182 mask_op.operand = this_operand;
9183 i.mask = &mask_op;
9185 else
9187 if (i.mask->zeroing)
9189 duplicated_vec_op:
9190 as_bad (_("duplicated `%s'"), saved);
9191 return NULL;
9194 i.mask->zeroing = 1;
9196 /* Only "{%k}" is allowed here. No need to check mask
9197 register explicitly. */
9198 if (i.mask->operand != this_operand)
9200 as_bad (_("invalid zeroing-masking `%s'"),
9201 saved);
9202 return NULL;
9206 op_string++;
9208 else
9209 goto unknown_vec_op;
9211 if (*op_string != '}')
9213 as_bad (_("missing `}' in `%s'"), saved);
9214 return NULL;
9216 op_string++;
9218 /* Strip whitespace since the addition of pseudo prefixes
9219 changed how the scrubber treats '{'. */
9220 if (is_space_char (*op_string))
9221 ++op_string;
9223 continue;
9225 unknown_vec_op:
9226 /* We don't know this one. */
9227 as_bad (_("unknown vector operation: `%s'"), saved);
9228 return NULL;
9231 if (i.mask && i.mask->zeroing && !i.mask->mask)
9233 as_bad (_("zeroing-masking only allowed with write mask"));
9234 return NULL;
9237 return op_string;
9240 static int
9241 i386_immediate (char *imm_start)
9243 char *save_input_line_pointer;
9244 char *gotfree_input_line;
9245 segT exp_seg = 0;
9246 expressionS *exp;
9247 i386_operand_type types;
9249 operand_type_set (&types, ~0);
9251 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9253 as_bad (_("at most %d immediate operands are allowed"),
9254 MAX_IMMEDIATE_OPERANDS);
9255 return 0;
9258 exp = &im_expressions[i.imm_operands++];
9259 i.op[this_operand].imms = exp;
9261 if (is_space_char (*imm_start))
9262 ++imm_start;
9264 save_input_line_pointer = input_line_pointer;
9265 input_line_pointer = imm_start;
9267 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9268 if (gotfree_input_line)
9269 input_line_pointer = gotfree_input_line;
9271 exp_seg = expression (exp);
9273 SKIP_WHITESPACE ();
9275 /* Handle vector operations. */
9276 if (*input_line_pointer == '{')
9278 input_line_pointer = check_VecOperations (input_line_pointer,
9279 NULL);
9280 if (input_line_pointer == NULL)
9281 return 0;
9284 if (*input_line_pointer)
9285 as_bad (_("junk `%s' after expression"), input_line_pointer);
9287 input_line_pointer = save_input_line_pointer;
9288 if (gotfree_input_line)
9290 free (gotfree_input_line);
9292 if (exp->X_op == O_constant || exp->X_op == O_register)
9293 exp->X_op = O_illegal;
9296 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9299 static int
9300 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9301 i386_operand_type types, const char *imm_start)
9303 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9305 if (imm_start)
9306 as_bad (_("missing or invalid immediate expression `%s'"),
9307 imm_start);
9308 return 0;
9310 else if (exp->X_op == O_constant)
9312 /* Size it properly later. */
9313 i.types[this_operand].bitfield.imm64 = 1;
9314 /* If not 64bit, sign extend val. */
9315 if (flag_code != CODE_64BIT
9316 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9317 exp->X_add_number
9318 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
9320 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9321 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9322 && exp_seg != absolute_section
9323 && exp_seg != text_section
9324 && exp_seg != data_section
9325 && exp_seg != bss_section
9326 && exp_seg != undefined_section
9327 && !bfd_is_com_section (exp_seg))
9329 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9330 return 0;
9332 #endif
9333 else if (!intel_syntax && exp_seg == reg_section)
9335 if (imm_start)
9336 as_bad (_("illegal immediate register operand %s"), imm_start);
9337 return 0;
9339 else
9341 /* This is an address. The size of the address will be
9342 determined later, depending on destination register,
9343 suffix, or the default for the section. */
9344 i.types[this_operand].bitfield.imm8 = 1;
9345 i.types[this_operand].bitfield.imm16 = 1;
9346 i.types[this_operand].bitfield.imm32 = 1;
9347 i.types[this_operand].bitfield.imm32s = 1;
9348 i.types[this_operand].bitfield.imm64 = 1;
9349 i.types[this_operand] = operand_type_and (i.types[this_operand],
9350 types);
9353 return 1;
9356 static char *
9357 i386_scale (char *scale)
9359 offsetT val;
9360 char *save = input_line_pointer;
9362 input_line_pointer = scale;
9363 val = get_absolute_expression ();
9365 switch (val)
9367 case 1:
9368 i.log2_scale_factor = 0;
9369 break;
9370 case 2:
9371 i.log2_scale_factor = 1;
9372 break;
9373 case 4:
9374 i.log2_scale_factor = 2;
9375 break;
9376 case 8:
9377 i.log2_scale_factor = 3;
9378 break;
9379 default:
9381 char sep = *input_line_pointer;
9383 *input_line_pointer = '\0';
9384 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
9385 scale);
9386 *input_line_pointer = sep;
9387 input_line_pointer = save;
9388 return NULL;
9391 if (i.log2_scale_factor != 0 && i.index_reg == 0)
9393 as_warn (_("scale factor of %d without an index register"),
9394 1 << i.log2_scale_factor);
9395 i.log2_scale_factor = 0;
9397 scale = input_line_pointer;
9398 input_line_pointer = save;
9399 return scale;
/* Parse the text in [DISP_START, DISP_END) as the displacement of the
   operand currently being processed (this_operand).

   The next slot of disp_expressions is claimed for the result.  Before
   the expression is evaluated, the displacement widths permitted by the
   code size, the prefixes seen so far and the kind of instruction are
   OR-ed into i.types[this_operand].  input_line_pointer is pointed at
   the displacement text while parsing and put back afterwards.

   Returns 0 if MAX_MEMORY_OPERANDS displacements were already seen;
   otherwise returns the result of i386_finalize_displacement.  */
9402 static int
9403 i386_displacement (char *disp_start, char *disp_end)
9405 expressionS *exp;
9406 segT exp_seg = 0;
9407 char *save_input_line_pointer;
9408 char *gotfree_input_line;
9409 int override;
9410 i386_operand_type bigdisp, types = anydisp;
9411 int ret;
9413 if (i.disp_operands == MAX_MEMORY_OPERANDS)
9415 as_bad (_("at most %d displacement operands are allowed"),
9416 MAX_MEMORY_OPERANDS);
9417 return 0;
/* Build in BIGDISP the set of acceptable displacement widths.  Absolute
   jumps and everything that is not a jump are sized by the address size
   (first arm); the remaining jumps are sized by the data size (else
   arm).  */
9420 operand_type_set (&bigdisp, 0);
9421 if ((i.types[this_operand].bitfield.jumpabsolute)
9422 || (!current_templates->start->opcode_modifier.jump
9423 && !current_templates->start->opcode_modifier.jumpdword))
9425 bigdisp.bitfield.disp32 = 1;
9426 override = (i.prefix[ADDR_PREFIX] != 0);
9427 if (flag_code == CODE_64BIT)
9429 if (!override)
9431 bigdisp.bitfield.disp32s = 1;
9432 bigdisp.bitfield.disp64 = 1;
9435 else if ((flag_code == CODE_16BIT) ^ override)
9437 bigdisp.bitfield.disp32 = 0;
9438 bigdisp.bitfield.disp16 = 1;
9441 else
9443 /* For PC-relative branches, the width of the displacement
9444 is dependent upon data size, not address size. */
9445 override = (i.prefix[DATA_PREFIX] != 0);
9446 if (flag_code == CODE_64BIT)
9448 if (override || i.suffix == WORD_MNEM_SUFFIX)
9449 bigdisp.bitfield.disp16 = 1;
9450 else
9452 bigdisp.bitfield.disp32 = 1;
9453 bigdisp.bitfield.disp32s = 1;
9456 else
/* Outside 64-bit mode a mnemonic suffix selecting the non-default
   operand size counts the same as a data size prefix.  */
9458 if (!override)
9459 override = (i.suffix == (flag_code != CODE_16BIT
9460 ? WORD_MNEM_SUFFIX
9461 : LONG_MNEM_SUFFIX));
9462 bigdisp.bitfield.disp32 = 1;
9463 if ((flag_code == CODE_16BIT) ^ override)
9465 bigdisp.bitfield.disp32 = 0;
9466 bigdisp.bitfield.disp16 = 1;
9470 i.types[this_operand] = operand_type_or (i.types[this_operand],
9471 bigdisp);
9473 exp = &disp_expressions[i.disp_operands];
9474 i.op[this_operand].disps = exp;
9475 i.disp_operands++;
9476 save_input_line_pointer = input_line_pointer;
9477 input_line_pointer = disp_start;
/* NOTE(review): END_STRING_AND_SAVE / RESTORE_END_STRING presumably
   NUL-terminate the text at the given position for the duration of the
   parse and then restore the saved character -- confirm against the
   macro definitions.  */
9478 END_STRING_AND_SAVE (disp_end);
9480 #ifndef GCC_ASM_O_HACK
9481 #define GCC_ASM_O_HACK 0
9482 #endif
9483 #if GCC_ASM_O_HACK
/* NOTE(review): this block is compiled only when GCC_ASM_O_HACK is
   non-zero (the default set just above is 0).  It refers to
   displacement_string_end, which is not declared in this function.  */
9484 END_STRING_AND_SAVE (disp_end + 1);
9485 if (i.types[this_operand].bitfield.baseIndex
9486 && displacement_string_end[-1] == '+')
9488 /* This hack is to avoid a warning when using the "o"
9489 constraint within gcc asm statements.
9490 For instance:
9492 #define _set_tssldt_desc(n,addr,limit,type) \
9493 __asm__ __volatile__ ( \
9494 "movw %w2,%0\n\t" \
9495 "movw %w1,2+%0\n\t" \
9496 "rorl $16,%1\n\t" \
9497 "movb %b1,4+%0\n\t" \
9498 "movb %4,5+%0\n\t" \
9499 "movb $0,6+%0\n\t" \
9500 "movb %h1,7+%0\n\t" \
9501 "rorl $16,%1" \
9502 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
9504 This works great except that the output assembler ends
9505 up looking a bit weird if it turns out that there is
9506 no offset. You end up producing code that looks like:
9508 #APP
9509 movw $235,(%eax)
9510 movw %dx,2+(%eax)
9511 rorl $16,%edx
9512 movb %dl,4+(%eax)
9513 movb $137,5+(%eax)
9514 movb $0,6+(%eax)
9515 movb %dh,7+(%eax)
9516 rorl $16,%edx
9517 #NO_APP
9519 So here we provide the missing zero. */
9521 *displacement_string_end = '0';
9523 #endif
/* lex_got may hand back a buffer to parse in place of the original
   text; that buffer is released with free () once parsing is done.  */
9524 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9525 if (gotfree_input_line)
9526 input_line_pointer = gotfree_input_line;
9528 exp_seg = expression (exp);
9530 SKIP_WHITESPACE ();
9531 if (*input_line_pointer)
9532 as_bad (_("junk `%s' after expression"), input_line_pointer);
9533 #if GCC_ASM_O_HACK
9534 RESTORE_END_STRING (disp_end + 1);
9535 #endif
9536 input_line_pointer = save_input_line_pointer;
9537 if (gotfree_input_line)
9539 free (gotfree_input_line);
/* When a buffer from lex_got was parsed, a bare constant or register
   result is turned into O_illegal so that finalization rejects it.  */
9541 if (exp->X_op == O_constant || exp->X_op == O_register)
9542 exp->X_op = O_illegal;
/* Finalize while the string is still terminated at DISP_END, since
   DISP_START is quoted in diagnostics.  */
9545 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
9547 RESTORE_END_STRING (disp_end);
9549 return ret;
9552 static int
9553 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9554 i386_operand_type types, const char *disp_start)
9556 i386_operand_type bigdisp;
9557 int ret = 1;
9559 /* We do this to make sure that the section symbol is in
9560 the symbol table. We will ultimately change the relocation
9561 to be relative to the beginning of the section. */
9562 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
9563 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
9564 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9566 if (exp->X_op != O_symbol)
9567 goto inv_disp;
9569 if (S_IS_LOCAL (exp->X_add_symbol)
9570 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
9571 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
9572 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
9573 exp->X_op = O_subtract;
9574 exp->X_op_symbol = GOT_symbol;
9575 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
9576 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
9577 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9578 i.reloc[this_operand] = BFD_RELOC_64;
9579 else
9580 i.reloc[this_operand] = BFD_RELOC_32;
9583 else if (exp->X_op == O_absent
9584 || exp->X_op == O_illegal
9585 || exp->X_op == O_big)
9587 inv_disp:
9588 as_bad (_("missing or invalid displacement expression `%s'"),
9589 disp_start);
9590 ret = 0;
9593 else if (flag_code == CODE_64BIT
9594 && !i.prefix[ADDR_PREFIX]
9595 && exp->X_op == O_constant)
9597 /* Since displacement is signed extended to 64bit, don't allow
9598 disp32 and turn off disp32s if they are out of range. */
9599 i.types[this_operand].bitfield.disp32 = 0;
9600 if (!fits_in_signed_long (exp->X_add_number))
9602 i.types[this_operand].bitfield.disp32s = 0;
9603 if (i.types[this_operand].bitfield.baseindex)
9605 as_bad (_("0x%lx out range of signed 32bit displacement"),
9606 (long) exp->X_add_number);
9607 ret = 0;
9612 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9613 else if (exp->X_op != O_constant
9614 && OUTPUT_FLAVOR == bfd_target_aout_flavour
9615 && exp_seg != absolute_section
9616 && exp_seg != text_section
9617 && exp_seg != data_section
9618 && exp_seg != bss_section
9619 && exp_seg != undefined_section
9620 && !bfd_is_com_section (exp_seg))
9622 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9623 ret = 0;
9625 #endif
9627 /* Check if this is a displacement only operand. */
9628 bigdisp = i.types[this_operand];
9629 bigdisp.bitfield.disp8 = 0;
9630 bigdisp.bitfield.disp16 = 0;
9631 bigdisp.bitfield.disp32 = 0;
9632 bigdisp.bitfield.disp32s = 0;
9633 bigdisp.bitfield.disp64 = 0;
9634 if (operand_type_all_zero (&bigdisp))
9635 i.types[this_operand] = operand_type_and (i.types[this_operand],
9636 types);
9638 return ret;
9641 /* Return the active addressing mode, taking address override and
9642 registers forming the address into consideration. Update the
9643 address override prefix if necessary. */
9645 static enum flag_code
9646 i386_addressing_mode (void)
9648 enum flag_code addr_mode;
9650 if (i.prefix[ADDR_PREFIX])
9651 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
9652 else
9654 addr_mode = flag_code;
9656 #if INFER_ADDR_PREFIX
9657 if (i.mem_operands == 0)
9659 /* Infer address prefix from the first memory operand. */
9660 const reg_entry *addr_reg = i.base_reg;
9662 if (addr_reg == NULL)
9663 addr_reg = i.index_reg;
9665 if (addr_reg)
9667 if (addr_reg->reg_type.bitfield.dword)
9668 addr_mode = CODE_32BIT;
9669 else if (flag_code != CODE_64BIT
9670 && addr_reg->reg_type.bitfield.word)
9671 addr_mode = CODE_16BIT;
9673 if (addr_mode != flag_code)
9675 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
9676 i.prefixes += 1;
9677 /* Change the size of any displacement too. At most one
9678 of Disp16 or Disp32 is set.
9679 FIXME. There doesn't seem to be any real need for
9680 separate Disp16 and Disp32 flags. The same goes for
9681 Imm16 and Imm32. Removing them would probably clean
9682 up the code quite a lot. */
9683 if (flag_code != CODE_64BIT
9684 && (i.types[this_operand].bitfield.disp16
9685 || i.types[this_operand].bitfield.disp32))
9686 i.types[this_operand]
9687 = operand_type_xor (i.types[this_operand], disp16_32);
9691 #endif
9694 return addr_mode;
9697 /* Make sure the memory operand we've been dealt is valid.
9698 Return 1 on success, 0 on a failure. */
/* OPERAND_STRING is used only in diagnostics.  The operand itself is
   judged from i.base_reg, i.index_reg, i.log2_scale_factor and
   i.types[this_operand], using the mode that i386_addressing_mode ()
   reports.

   A string instruction whose address is not the expected register
   normally only draws a warning and still counts as success.  The one
   exception is a second memory operand whose base register has the
   wrong size, which is rejected.  */
9700 static int
9701 i386_index_check (const char *operand_string)
9703 const char *kind = "base/index";
9704 enum flag_code addr_mode = i386_addressing_mode ();
9706 if (current_templates->start->opcode_modifier.isstring
9707 && !current_templates->start->opcode_modifier.immext
9708 && (current_templates->end[-1].opcode_modifier.isstring
9709 || i.mem_operands))
9711 /* Memory operands of string insns are special in that they only allow
9712 a single register (rDI, rSI, or rBX) as their memory address. */
9713 const reg_entry *expected_reg;
/* Both tables are indexed by ADDR_MODE.  NOTE(review): the row order
   (32-bit, 16-bit, 64-bit names) presumably mirrors the enum flag_code
   values -- confirm against its definition.  */
9714 static const char *di_si[][2] =
9716 { "esi", "edi" },
9717 { "si", "di" },
9718 { "rsi", "rdi" }
9720 static const char *bx[] = { "ebx", "bx", "rbx" };
9722 kind = "string address";
9724 if (current_templates->start->opcode_modifier.repprefixok)
/* Pick the template operand that describes this memory operand; its
   esseg bit then selects between the two columns of di_si.  */
9726 i386_operand_type type = current_templates->end[-1].operand_types[0];
9728 if (!type.bitfield.baseindex
9729 || ((!i.mem_operands != !intel_syntax)
9730 && current_templates->end[-1].operand_types[1]
9731 .bitfield.baseindex))
9732 type = current_templates->end[-1].operand_types[1];
9733 expected_reg = hash_find (reg_hash,
9734 di_si[addr_mode][type.bitfield.esseg]);
9737 else
9738 expected_reg = hash_find (reg_hash, bx[addr_mode]);
9740 if (i.base_reg != expected_reg
9741 || i.index_reg
9742 || operand_type_check (i.types[this_operand], disp))
9744 /* The second memory operand must have the same size as
9745 the first one. */
9746 if (i.mem_operands
9747 && i.base_reg
9748 && !((addr_mode == CODE_64BIT
9749 && i.base_reg->reg_type.bitfield.qword)
9750 || (addr_mode == CODE_32BIT
9751 ? i.base_reg->reg_type.bitfield.dword
9752 : i.base_reg->reg_type.bitfield.word)))
9753 goto bad_address;
/* Any other mismatch is only warned about; the operand is accepted.  */
9755 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
9756 operand_string,
9757 intel_syntax ? '[' : '(',
9758 register_prefix,
9759 expected_reg->reg_name,
9760 intel_syntax ? ']' : ')');
9761 return 1;
9763 else
9764 return 1;
/* Common failure exit.  It is also the target of the gotos in the
   non-string checks further down; KIND names what was being checked.  */
9766 bad_address:
9767 as_bad (_("`%s' is not a valid %s expression"),
9768 operand_string, kind);
9769 return 0;
9771 else
9773 if (addr_mode != CODE_16BIT)
9775 /* 32-bit/64-bit checks. */
/* Rejected here: a base register of the wrong width, an IP-relative
   base combined with an index, RegIZ as base, and a non-vector index
   register that has the wrong width or is not usable as base/index.  */
9776 if ((i.base_reg
9777 && ((addr_mode == CODE_64BIT
9778 ? !i.base_reg->reg_type.bitfield.qword
9779 : !i.base_reg->reg_type.bitfield.dword)
9780 || (i.index_reg && i.base_reg->reg_num == RegIP)
9781 || i.base_reg->reg_num == RegIZ))
9782 || (i.index_reg
9783 && !i.index_reg->reg_type.bitfield.xmmword
9784 && !i.index_reg->reg_type.bitfield.ymmword
9785 && !i.index_reg->reg_type.bitfield.zmmword
9786 && ((addr_mode == CODE_64BIT
9787 ? !i.index_reg->reg_type.bitfield.qword
9788 : !i.index_reg->reg_type.bitfield.dword)
9789 || !i.index_reg->reg_type.bitfield.baseindex)))
9790 goto bad_address;
9792 /* bndmk, bndldx, and bndstx have special restrictions. */
9793 if (current_templates->start->base_opcode == 0xf30f1b
9794 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
9796 /* They cannot use RIP-relative addressing. */
9797 if (i.base_reg && i.base_reg->reg_num == RegIP)
9799 as_bad (_("`%s' cannot be used here"), operand_string);
9800 return 0;
9803 /* bndldx and bndstx ignore their scale factor. */
9804 if (current_templates->start->base_opcode != 0xf30f1b
9805 && i.log2_scale_factor)
9806 as_warn (_("register scaling is being ignored here"));
9809 else
9811 /* 16-bit checks. */
/* Both registers must be 16-bit base/index registers.  An index is
   accepted only together with a base, with the base numbered below 6,
   the index numbered 6 or above, and no scaling.  */
9812 if ((i.base_reg
9813 && (!i.base_reg->reg_type.bitfield.word
9814 || !i.base_reg->reg_type.bitfield.baseindex))
9815 || (i.index_reg
9816 && (!i.index_reg->reg_type.bitfield.word
9817 || !i.index_reg->reg_type.bitfield.baseindex
9818 || !(i.base_reg
9819 && i.base_reg->reg_num < 6
9820 && i.index_reg->reg_num >= 6
9821 && i.log2_scale_factor == 0))))
9822 goto bad_address;
9825 return 1;
9828 /* Handle vector immediates. */
9830 static int
9831 RC_SAE_immediate (const char *imm_start)
9833 unsigned int match_found, j;
9834 const char *pstr = imm_start;
9835 expressionS *exp;
9837 if (*pstr != '{')
9838 return 0;
9840 pstr++;
9841 match_found = 0;
9842 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
9844 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
9846 if (!i.rounding)
9848 rc_op.type = RC_NamesTable[j].type;
9849 rc_op.operand = this_operand;
9850 i.rounding = &rc_op;
9852 else
9854 as_bad (_("duplicated `%s'"), imm_start);
9855 return 0;
9857 pstr += RC_NamesTable[j].len;
9858 match_found = 1;
9859 break;
9862 if (!match_found)
9863 return 0;
9865 if (*pstr++ != '}')
9867 as_bad (_("Missing '}': '%s'"), imm_start);
9868 return 0;
9870 /* RC/SAE immediate string should contain nothing more. */;
9871 if (*pstr != 0)
9873 as_bad (_("Junk after '}': '%s'"), imm_start);
9874 return 0;
9877 exp = &im_expressions[i.imm_operands++];
9878 i.op[this_operand].imms = exp;
9880 exp->X_op = O_constant;
9881 exp->X_add_number = 0;
9882 exp->X_add_symbol = (symbolS *) 0;
9883 exp->X_op_symbol = (symbolS *) 0;
9885 i.types[this_operand].bitfield.imm8 = 1;
9886 return 1;
9889 /* Only string instructions can have a second memory operand, so
9890 reduce current_templates to just those if it contains any. */
9891 static int
9892 maybe_adjust_templates (void)
9894 const insn_template *t;
9896 gas_assert (i.mem_operands == 1);
9898 for (t = current_templates->start; t < current_templates->end; ++t)
9899 if (t->opcode_modifier.isstring)
9900 break;
9902 if (t < current_templates->end)
9904 static templates aux_templates;
9905 bfd_boolean recheck;
9907 aux_templates.start = t;
9908 for (; t < current_templates->end; ++t)
9909 if (!t->opcode_modifier.isstring)
9910 break;
9911 aux_templates.end = t;
9913 /* Determine whether to re-check the first memory operand. */
9914 recheck = (aux_templates.start != current_templates->start
9915 || t != current_templates->end);
9917 current_templates = &aux_templates;
9919 if (recheck)
9921 i.mem_operands = 0;
9922 if (i.memop1_string != NULL
9923 && i386_index_check (i.memop1_string) == 0)
9924 return 0;
9925 i.mem_operands = 1;
9929 return 1;
9932 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
9933 on error. */
/* The operand is classified in this order: a register (possibly a
   segment register followed by `:', which turns it into a segment
   override of a memory reference), an immediate introduced by
   IMMEDIATE_PREFIX, an RC/SAE specifier, and finally a memory
   reference.  Anything else is reported as an invalid operand.
   OPERAND_STRING may be modified temporarily or, on some error paths,
   permanently truncated.  */
9935 static int
9936 i386_att_operand (char *operand_string)
9938 const reg_entry *r;
9939 char *end_op;
9940 char *op_string = operand_string;
9942 if (is_space_char (*op_string))
9943 ++op_string;
9945 /* We check for an absolute prefix (differentiating,
9946 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
9947 if (*op_string == ABSOLUTE_PREFIX)
9949 ++op_string;
9950 if (is_space_char (*op_string))
9951 ++op_string;
9952 i.types[this_operand].bitfield.jumpabsolute = 1;
9955 /* Check if operand is a register. */
9956 if ((r = parse_register (op_string, &end_op)) != NULL)
9958 i386_operand_type temp;
9960 /* Check for a segment override by searching for ':' after a
9961 segment register. */
9962 op_string = end_op;
9963 if (is_space_char (*op_string))
9964 ++op_string;
9965 if (*op_string == ':'
9966 && (r->reg_type.bitfield.sreg2
9967 || r->reg_type.bitfield.sreg3))
/* Record the override for the memory operand about to be parsed;
   i.seg is indexed by the number of memory operands seen so far.  */
9969 switch (r->reg_num)
9971 case 0:
9972 i.seg[i.mem_operands] = &es;
9973 break;
9974 case 1:
9975 i.seg[i.mem_operands] = &cs;
9976 break;
9977 case 2:
9978 i.seg[i.mem_operands] = &ss;
9979 break;
9980 case 3:
9981 i.seg[i.mem_operands] = &ds;
9982 break;
9983 case 4:
9984 i.seg[i.mem_operands] = &fs;
9985 break;
9986 case 5:
9987 i.seg[i.mem_operands] = &gs;
9988 break;
9991 /* Skip the ':' and whitespace. */
9992 ++op_string;
9993 if (is_space_char (*op_string))
9994 ++op_string;
9996 if (!is_digit_char (*op_string)
9997 && !is_identifier_char (*op_string)
9998 && *op_string != '('
9999 && *op_string != ABSOLUTE_PREFIX)
10001 as_bad (_("bad memory operand `%s'"), op_string);
10002 return 0;
10004 /* Handle case of %es:*foo. */
10005 if (*op_string == ABSOLUTE_PREFIX)
10007 ++op_string;
10008 if (is_space_char (*op_string))
10009 ++op_string;
10010 i.types[this_operand].bitfield.jumpabsolute = 1;
/* Continue in the memory reference branch below with OP_STRING
   pointing just past the segment override.  */
10012 goto do_memory_reference;
10015 /* Handle vector operations. */
10016 if (*op_string == '{')
10018 op_string = check_VecOperations (op_string, NULL);
10019 if (op_string == NULL)
10020 return 0;
10023 if (*op_string)
10025 as_bad (_("junk `%s' after register"), op_string);
10026 return 0;
/* A plain register operand: merge its type into the operand type with
   the baseindex bit cleared.  */
10028 temp = r->reg_type;
10029 temp.bitfield.baseindex = 0;
10030 i.types[this_operand] = operand_type_or (i.types[this_operand],
10031 temp);
10032 i.types[this_operand].bitfield.unspecified = 0;
10033 i.op[this_operand].regs = r;
10034 i.reg_operands++;
10036 else if (*op_string == REGISTER_PREFIX)
10038 as_bad (_("bad register name `%s'"), op_string);
10039 return 0;
10041 else if (*op_string == IMMEDIATE_PREFIX)
10043 ++op_string;
10044 if (i.types[this_operand].bitfield.jumpabsolute)
10046 as_bad (_("immediate operand illegal with absolute jump"));
10047 return 0;
10049 if (!i386_immediate (op_string))
10050 return 0;
/* Note that the RC/SAE check looks at the unmodified OPERAND_STRING,
   not at OP_STRING.  */
10052 else if (RC_SAE_immediate (operand_string))
10054 /* If it is a RC or SAE immediate, do nothing. */
10057 else if (is_digit_char (*op_string)
10058 || is_identifier_char (*op_string)
10059 || *op_string == '"'
10060 || *op_string == '(')
10062 /* This is a memory reference of some sort. */
10063 char *base_string;
10065 /* Start and end of displacement string expression (if found). */
10066 char *displacement_string_start;
10067 char *displacement_string_end;
10068 char *vop_start;
10070 do_memory_reference:
/* A second memory operand is only possible for string instructions;
   maybe_adjust_templates narrows the template list accordingly.  */
10071 if (i.mem_operands == 1 && !maybe_adjust_templates ())
10072 return 0;
10073 if ((i.mem_operands == 1
10074 && !current_templates->start->opcode_modifier.isstring)
10075 || i.mem_operands == 2)
10077 as_bad (_("too many memory references for `%s'"),
10078 current_templates->start->name);
10079 return 0;
10082 /* Check for base index form. We detect the base index form by
10083 looking for an ')' at the end of the operand, searching
10084 for the '(' matching it, and finding a REGISTER_PREFIX or ','
10085 after the '('. */
10086 base_string = op_string + strlen (op_string);
10088 /* Handle vector operations. */
/* Vector operations trail the memory reference, so once they have been
   processed the address expression is taken to end where they start.  */
10089 vop_start = strchr (op_string, '{');
10090 if (vop_start && vop_start < base_string)
10092 if (check_VecOperations (vop_start, base_string) == NULL)
10093 return 0;
10094 base_string = vop_start;
10097 --base_string;
10098 if (is_space_char (*base_string))
10099 --base_string;
10101 /* If we only have a displacement, set-up for it to be parsed later. */
10102 displacement_string_start = op_string;
10103 displacement_string_end = base_string + 1;
10105 if (*base_string == ')')
10107 char *temp_string;
10108 unsigned int parens_balanced = 1;
10109 /* We've already checked that the number of left & right ()'s are
10110 equal, so this loop will not be infinite. */
10113 base_string--;
10114 if (*base_string == ')')
10115 parens_balanced++;
10116 if (*base_string == '(')
10117 parens_balanced--;
10119 while (parens_balanced);
/* TEMP_STRING remembers the matching '('; the displacement ends there
   if this turns out to be a base/index form.  */
10121 temp_string = base_string;
10123 /* Skip past '(' and whitespace. */
10124 ++base_string;
10125 if (is_space_char (*base_string))
10126 ++base_string;
10128 if (*base_string == ','
10129 || ((i.base_reg = parse_register (base_string, &end_op))
10130 != NULL))
10132 displacement_string_end = temp_string;
10134 i.types[this_operand].bitfield.baseindex = 1;
10136 if (i.base_reg)
10138 base_string = end_op;
10139 if (is_space_char (*base_string))
10140 ++base_string;
10143 /* There may be an index reg or scale factor here. */
10144 if (*base_string == ',')
10146 ++base_string;
10147 if (is_space_char (*base_string))
10148 ++base_string;
10150 if ((i.index_reg = parse_register (base_string, &end_op))
10151 != NULL)
10153 base_string = end_op;
10154 if (is_space_char (*base_string))
10155 ++base_string;
10156 if (*base_string == ',')
10158 ++base_string;
10159 if (is_space_char (*base_string))
10160 ++base_string;
10162 else if (*base_string != ')')
10164 as_bad (_("expecting `,' or `)' "
10165 "after index register in `%s'"),
10166 operand_string);
10167 return 0;
10170 else if (*base_string == REGISTER_PREFIX)
/* Cut the operand at the next ',' so that only the offending register
   name is quoted.  The cut is not undone.  */
10172 end_op = strchr (base_string, ',');
10173 if (end_op)
10174 *end_op = '\0';
10175 as_bad (_("bad register name `%s'"), base_string);
10176 return 0;
10179 /* Check for scale factor. */
10180 if (*base_string != ')')
10182 char *end_scale = i386_scale (base_string);
10184 if (!end_scale)
10185 return 0;
10187 base_string = end_scale;
10188 if (is_space_char (*base_string))
10189 ++base_string;
10190 if (*base_string != ')')
10192 as_bad (_("expecting `)' "
10193 "after scale factor in `%s'"),
10194 operand_string);
10195 return 0;
10198 else if (!i.index_reg)
10200 as_bad (_("expecting index register or scale factor "
10201 "after `,'; got '%c'"),
10202 *base_string);
10203 return 0;
10206 else if (*base_string != ')')
10208 as_bad (_("expecting `,' or `)' "
10209 "after base register in `%s'"),
10210 operand_string);
10211 return 0;
10214 else if (*base_string == REGISTER_PREFIX)
10216 end_op = strchr (base_string, ',');
10217 if (end_op)
10218 *end_op = '\0';
10219 as_bad (_("bad register name `%s'"), base_string);
10220 return 0;
10224 /* If there's an expression beginning the operand, parse it,
10225 assuming displacement_string_start and
10226 displacement_string_end are meaningful. */
10227 if (displacement_string_start != displacement_string_end)
10229 if (!i386_displacement (displacement_string_start,
10230 displacement_string_end))
10231 return 0;
10234 /* Special case for (%dx) while doing input/output op. */
/* Such an operand takes the type of the port register and is not
   counted as a memory operand.  */
10235 if (i.base_reg
10236 && i.base_reg->reg_type.bitfield.inoutportreg
10237 && i.index_reg == 0
10238 && i.log2_scale_factor == 0
10239 && i.seg[i.mem_operands] == 0
10240 && !operand_type_check (i.types[this_operand], disp))
10242 i.types[this_operand] = i.base_reg->reg_type;
10243 return 1;
10246 if (i386_index_check (operand_string) == 0)
10247 return 0;
10248 i.flags[this_operand] |= Operand_Mem;
/* Keep a copy of the first memory operand's text:
   maybe_adjust_templates re-checks it through i.memop1_string.  */
10249 if (i.mem_operands == 0)
10250 i.memop1_string = xstrdup (operand_string);
10251 i.mem_operands++;
10253 else
10255 /* It's not a memory operand; argh! */
10256 as_bad (_("invalid char %s beginning operand %d `%s'"),
10257 output_invalid (*op_string),
10258 this_operand + 1,
10259 op_string);
10260 return 0;
10262 return 1; /* Normal return. */
10265 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10266 that an rs_machine_dependent frag may reach. */
10268 unsigned int
10269 i386_frag_max_var (fragS *frag)
10271 /* The only relaxable frags are for jumps.
10272 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
10273 gas_assert (frag->fr_type == rs_machine_dependent);
10274 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* Return non-zero if a branch to FR_SYMBOL can be resolved by the
   assembler, and zero if a relocation has to be kept for it.  FR_VAR
   is either NO_RELOC or the PLT relocation requested for the
   branch.  */
static int
elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
{
  /* STT_GNU_IFUNC symbol must go through PLT.  */
  if ((symbol_get_bfdsym (fr_symbol)->flags
       & BSF_GNU_INDIRECT_FUNCTION) != 0)
    return 0;

  /* A symbol that is not external may be weak or local; only the
     latter is resolved here.  */
  if (!S_IS_EXTERNAL (fr_symbol))
    return S_IS_WEAK (fr_symbol) ? 0 : 1;

  /* Global symbols with non-default visibility can't be preempted.  */
  if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
    return 1;

  if (fr_var != NO_RELOC)
    {
      enum bfd_reloc_code_real requested = (enum bfd_reloc_code_real) fr_var;

      /* Symbol with PLT relocation may be preempted.  */
      if (requested == BFD_RELOC_386_PLT32
          || requested == BFD_RELOC_X86_64_PLT32)
        return 0;

      /* No other relocation is expected here.  */
      abort ();
    }

  /* Global symbols with default visibility in a shared library may be
     preempted by another definition.  */
  return shared ? 0 : 1;
}
#endif
10311 /* md_estimate_size_before_relax()
10313 Called just before relax() for rs_machine_dependent frags. The x86
10314 assembler uses these frags to handle variable size jump
10315 instructions.
10317 Any symbol that is now undefined will not become defined.
10318 Return the correct fr_subtype in the frag.
10319 Return the initial "guess for variable size of frag" to caller.
10320 The guess is actually the growth beyond the fixed part. Whatever
10321 we do to grow the fixed or variable part contributes to our
10322 returned value. */
/* Two outcomes are possible.  If the target cannot be resolved within
   SEGMENT, the jump is converted to its long form right here, a fixup
   is emitted, and the number of bytes added to the fixed part is
   returned.  Otherwise the frag is left alone and the length recorded
   in md_relax_table for its current state is returned.  */
10325 md_estimate_size_before_relax (fragS *fragP, segT segment)
10327 /* We've already got fragP->fr_subtype right; all we have to do is
10328 check for un-relaxable symbols. On an ELF system, we can't relax
10329 an externally visible symbol, because it may be overridden by a
10330 shared library. */
10331 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
10332 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10333 || (IS_ELF
10334 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
10335 fragP->fr_var))
10336 #endif
10337 #if defined (OBJ_COFF) && defined (TE_PE)
10338 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
10339 && S_IS_WEAK (fragP->fr_symbol))
10340 #endif
10343 /* Symbol is undefined in this segment, or we need to keep a
10344 reloc so that weak symbols can be overridden. */
10345 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
10346 enum bfd_reloc_code_real reloc_type;
10347 unsigned char *opcode;
10348 int old_fr_fix;
/* fr_var holds either NO_RELOC or an explicit relocation code, which
   then takes precedence over the defaults chosen below.
   NOTE(review): presumably stored there when the frag was created --
   confirm at the frag creation site.  */
10350 if (fragP->fr_var != NO_RELOC)
10351 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
10352 else if (size == 2)
10353 reloc_type = BFD_RELOC_16_PCREL;
10354 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10355 else if (need_plt32_p (fragP->fr_symbol))
10356 reloc_type = BFD_RELOC_X86_64_PLT32;
10357 #endif
10358 else
10359 reloc_type = BFD_RELOC_32_PCREL;
10361 old_fr_fix = fragP->fr_fix;
10362 opcode = (unsigned char *) fragP->fr_opcode;
10364 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
10366 case UNCOND_JUMP:
10367 /* Make jmp (0xeb) a (d)word displacement jump. */
10368 opcode[0] = 0xe9;
10369 fragP->fr_fix += size;
10370 fix_new (fragP, old_fr_fix, size,
10371 fragP->fr_symbol,
10372 fragP->fr_offset, 1,
10373 reloc_type);
10374 break;
10376 case COND_JUMP86:
/* Only the 16-bit form is special-cased here; every other COND_JUMP86
   frag is handled exactly like COND_JUMP below.  */
10377 if (size == 2
10378 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
10380 /* Negate the condition, and branch past an
10381 unconditional jump. */
10382 opcode[0] ^= 1;
10383 opcode[1] = 3;
10384 /* Insert an unconditional jump. */
10385 opcode[2] = 0xe9;
10386 /* We added two extra opcode bytes, and have a two byte
10387 offset. */
10388 fragP->fr_fix += 2 + 2;
10389 fix_new (fragP, old_fr_fix + 2, 2,
10390 fragP->fr_symbol,
10391 fragP->fr_offset, 1,
10392 reloc_type);
10393 break;
10395 /* Fall through. */
10397 case COND_JUMP:
/* With promotion disabled and no explicit relocation, keep the
   one-byte displacement and emit a signed 8-bit PC-relative fixup
   instead of widening the jump.  */
10398 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
10400 fixS *fixP;
10402 fragP->fr_fix += 1;
10403 fixP = fix_new (fragP, old_fr_fix, 1,
10404 fragP->fr_symbol,
10405 fragP->fr_offset, 1,
10406 BFD_RELOC_8_PCREL);
10407 fixP->fx_signed = 1;
10408 break;
10411 /* This changes the byte-displacement jump 0x7N
10412 to the (d)word-displacement jump 0x0f,0x8N. */
10413 opcode[1] = opcode[0] + 0x10;
10414 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10415 /* We've added an opcode byte. */
10416 fragP->fr_fix += 1 + size;
10417 fix_new (fragP, old_fr_fix + 1, size,
10418 fragP->fr_symbol,
10419 fragP->fr_offset, 1,
10420 reloc_type);
10421 break;
10423 default:
10424 BAD_CASE (fragP->fr_subtype);
10425 break;
/* The jump now has its final form, so report how many bytes were added
   to the fixed part.  NOTE(review): frag_wane presumably retires the
   frag from further relaxation -- confirm against its definition.  */
10427 frag_wane (fragP);
10428 return fragP->fr_fix - old_fr_fix;
10431 /* Guess size depending on current relax state. Initially the relax
10432 state will correspond to a short jump and we return 1, because
10433 the variable part of the frag (the branch offset) is one byte
10434 long. However, we can relax a section more than once and in that
10435 case we must either set fr_subtype back to the unrelaxed state,
10436 or return the value for the appropriate branch. */
10437 return md_relax_table[fragP->fr_subtype].rlx_length;
10440 /* Called after relax() is finished.
10442 In: Address of frag.
10443 fr_type == rs_machine_dependent.
10444 fr_subtype is what the address relaxed to.
10446 Out: Any fixSs and constants are set up.
10447 Caller will turn frag into a ".space 0". */
10449 void
10450 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
10451 fragS *fragP)
10453 unsigned char *opcode;
10454 unsigned char *where_to_put_displacement = NULL;
10455 offsetT target_address;
10456 offsetT opcode_address;
10457 unsigned int extension = 0;
10458 offsetT displacement_from_opcode_start;
10460 opcode = (unsigned char *) fragP->fr_opcode;
10462 /* Address we want to reach in file space. */
10463 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
10465 /* Address opcode resides at in file space. */
10466 opcode_address = fragP->fr_address + fragP->fr_fix;
10468 /* Displacement from opcode start to fill into instruction. */
10469 displacement_from_opcode_start = target_address - opcode_address;
10471 if ((fragP->fr_subtype & BIG) == 0)
10473 /* Don't have to change opcode. */
10474 extension = 1; /* 1 opcode + 1 displacement */
10475 where_to_put_displacement = &opcode[1];
10477 else
10479 if (no_cond_jump_promotion
10480 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
10481 as_warn_where (fragP->fr_file, fragP->fr_line,
10482 _("long jump required"));
10484 switch (fragP->fr_subtype)
10486 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
10487 extension = 4; /* 1 opcode + 4 displacement */
10488 opcode[0] = 0xe9;
10489 where_to_put_displacement = &opcode[1];
10490 break;
10492 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
10493 extension = 2; /* 1 opcode + 2 displacement */
10494 opcode[0] = 0xe9;
10495 where_to_put_displacement = &opcode[1];
10496 break;
10498 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
10499 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
10500 extension = 5; /* 2 opcode + 4 displacement */
10501 opcode[1] = opcode[0] + 0x10;
10502 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10503 where_to_put_displacement = &opcode[2];
10504 break;
10506 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
10507 extension = 3; /* 2 opcode + 2 displacement */
10508 opcode[1] = opcode[0] + 0x10;
10509 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10510 where_to_put_displacement = &opcode[2];
10511 break;
10513 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
10514 extension = 4;
10515 opcode[0] ^= 1;
10516 opcode[1] = 3;
10517 opcode[2] = 0xe9;
10518 where_to_put_displacement = &opcode[3];
10519 break;
10521 default:
10522 BAD_CASE (fragP->fr_subtype);
10523 break;
10527 /* If size if less then four we are sure that the operand fits,
10528 but if it's 4, then it could be that the displacement is larger
10529 then -/+ 2GB. */
10530 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
10531 && object_64bit
10532 && ((addressT) (displacement_from_opcode_start - extension
10533 + ((addressT) 1 << 31))
10534 > (((addressT) 2 << 31) - 1)))
10536 as_bad_where (fragP->fr_file, fragP->fr_line,
10537 _("jump target out of range"));
10538 /* Make us emit 0. */
10539 displacement_from_opcode_start = extension;
10541 /* Now put displacement after opcode. */
10542 md_number_to_chars ((char *) where_to_put_displacement,
10543 (valueT) (displacement_from_opcode_start - extension),
10544 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
10545 fragP->fr_fix += extension;
10548 /* Apply a fixup (fixP) to segment data, once it has been determined
10549 by our caller that we have all the info we need to fix it up.
10551 Parameter valP is the pointer to the value of the bits.
10553 On the 386, immediates, displacements, and data pointers are all in
10554 the same (little-endian) format, so we don't need to care about which
10555 we are handling. */
/* Unless TE_Mach is defined, the adjusted value is stored back through
   valP.  On the normal path the value (or zero, when the addend is kept
   in fx_addnumber instead) is written into the frag with
   md_number_to_chars.  fx_done is set when the fixup has no symbol.
   The ELF TLS descriptor-call and vtable relocation types return early
   with fx_done cleared, before anything is written.  */
10557 void
10558 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
/* P addresses the bytes to patch: fx_where bytes into the frag's
   fr_literal.  */
10560 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
10561 valueT value = *valP;
10563 #if !defined (TE_Mach)
/* A pc-relative fixup that still carries an absolute relocation type is
   switched to the *_PCREL type of the same width; every other type is
   left untouched.  */
10564 if (fixP->fx_pcrel)
10566 switch (fixP->fx_r_type)
10568 default:
10569 break;
10571 case BFD_RELOC_64:
10572 fixP->fx_r_type = BFD_RELOC_64_PCREL;
10573 break;
10574 case BFD_RELOC_32:
10575 case BFD_RELOC_X86_64_32S:
10576 fixP->fx_r_type = BFD_RELOC_32_PCREL;
10577 break;
10578 case BFD_RELOC_16:
10579 fixP->fx_r_type = BFD_RELOC_16_PCREL;
10580 break;
10581 case BFD_RELOC_8:
10582 fixP->fx_r_type = BFD_RELOC_8_PCREL;
10583 break;
/* The adjustments below apply only to pc-relative relocations against a
   symbol when RELA relocations are not in use.  */
10587 if (fixP->fx_addsy != NULL
10588 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
10589 || fixP->fx_r_type == BFD_RELOC_64_PCREL
10590 || fixP->fx_r_type == BFD_RELOC_16_PCREL
10591 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
10592 && !use_rela_relocations)
10594 /* This is a hack. There should be a better way to handle this.
10595 This covers for the fact that bfd_install_relocation will
10596 subtract the current location (for partial_inplace, PC relative
10597 relocations); see more below. */
10598 #ifndef OBJ_AOUT
10599 if (IS_ELF
10600 #ifdef TE_PE
10601 || OUTPUT_FLAVOR == bfd_target_coff_flavour
10602 #endif
10604 value += fixP->fx_where + fixP->fx_frag->fr_address;
10605 #endif
10606 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10607 if (IS_ELF)
10609 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
10611 if ((sym_seg == seg
10612 || (symbol_section_p (fixP->fx_addsy)
10613 && sym_seg != absolute_section))
10614 && !generic_force_reloc (fixP))
10616 /* Yes, we add the values in twice. This is because
10617 bfd_install_relocation subtracts them out again. I think
10618 bfd_install_relocation is broken, but I don't dare change
10619 it. FIXME. */
10620 value += fixP->fx_where + fixP->fx_frag->fr_address;
10623 #endif
10624 #if defined (OBJ_COFF) && defined (TE_PE)
10625 /* For some reason, the PE format does not store a
10626 section address offset for a PC relative symbol. */
10627 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
10628 || S_IS_WEAK (fixP->fx_addsy))
10629 value += md_pcrel_from (fixP);
10630 #endif
10632 #if defined (OBJ_COFF) && defined (TE_PE)
10633 if (fixP->fx_addsy != NULL
10634 && S_IS_WEAK (fixP->fx_addsy)
10635 /* PR 16858: Do not modify weak function references. */
10636 && ! fixP->fx_pcrel)
10638 #if !defined (TE_PEP)
10639 /* For x86 PE weak function symbols are neither PC-relative
10640 nor do they set S_IS_FUNCTION. So the only reliable way
10641 to detect them is to check the flags of their containing
10642 section. */
10643 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
10644 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
10646 else
10647 #endif
10648 value -= S_GET_VALUE (fixP->fx_addsy);
10650 #endif
10652 /* Fix a few things - the dynamic linker expects certain values here,
10653 and we must not disappoint it. */
10654 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10655 if (IS_ELF && fixP->fx_addsy)
10656 switch (fixP->fx_r_type)
10658 case BFD_RELOC_386_PLT32:
10659 case BFD_RELOC_X86_64_PLT32:
10660 /* Make the jump instruction point to the address of the operand.
10661 At runtime we merely add the offset to the actual PLT entry.
10662 NB: Subtract the offset size only for jump instructions. */
10663 if (fixP->fx_pcrel)
10664 value = -4;
10665 break;
10667 case BFD_RELOC_386_TLS_GD:
10668 case BFD_RELOC_386_TLS_LDM:
10669 case BFD_RELOC_386_TLS_IE_32:
10670 case BFD_RELOC_386_TLS_IE:
10671 case BFD_RELOC_386_TLS_GOTIE:
10672 case BFD_RELOC_386_TLS_GOTDESC:
10673 case BFD_RELOC_X86_64_TLSGD:
10674 case BFD_RELOC_X86_64_TLSLD:
10675 case BFD_RELOC_X86_64_GOTTPOFF:
10676 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10677 value = 0; /* Fully resolved at runtime. No addend. */
10678 /* Fallthrough */
10679 case BFD_RELOC_386_TLS_LE:
10680 case BFD_RELOC_386_TLS_LDO_32:
10681 case BFD_RELOC_386_TLS_LE_32:
10682 case BFD_RELOC_X86_64_DTPOFF32:
10683 case BFD_RELOC_X86_64_DTPOFF64:
10684 case BFD_RELOC_X86_64_TPOFF32:
10685 case BFD_RELOC_X86_64_TPOFF64:
10686 S_SET_THREAD_LOCAL (fixP->fx_addsy);
10687 break;
/* These two return at once: neither *valP nor the frag contents are
   updated, and the relocation is kept (fx_done == 0).  */
10689 case BFD_RELOC_386_TLS_DESC_CALL:
10690 case BFD_RELOC_X86_64_TLSDESC_CALL:
10691 value = 0; /* Fully resolved at runtime. No addend. */
10692 S_SET_THREAD_LOCAL (fixP->fx_addsy);
10693 fixP->fx_done = 0;
10694 return;
10696 case BFD_RELOC_VTABLE_INHERIT:
10697 case BFD_RELOC_VTABLE_ENTRY:
10698 fixP->fx_done = 0;
10699 return;
10701 default:
10702 break;
10704 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
/* Hand the adjusted value back to the caller.  */
10705 *valP = value;
10706 #endif /* !defined (TE_Mach) */
10708 /* Are we finished with this relocation now? */
10709 if (fixP->fx_addsy == NULL)
10710 fixP->fx_done = 1;
10711 #if defined (OBJ_COFF) && defined (TE_PE)
10712 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
10714 fixP->fx_done = 0;
10715 /* Remember value for tc_gen_reloc. */
10716 fixP->fx_addnumber = value;
10717 /* Clear out the frag for now. */
10718 value = 0;
10720 #endif
/* With RELA relocations the addend travels in fx_addnumber and zero is
   written into the section contents; overflow checking is switched off
   for this fixup.  */
10721 else if (use_rela_relocations)
10723 fixP->fx_no_overflow = 1;
10724 /* Remember value for tc_gen_reloc. */
10725 fixP->fx_addnumber = value;
10726 value = 0;
/* Store fx_size bytes of the final value at P.  */
10729 md_number_to_chars (p, value, fixP->fx_size);
10732 const char *
10733 md_atof (int type, char *litP, int *sizeP)
10735 /* This outputs the LITTLENUMs in REVERSE order;
10736 in accord with the bigendian 386. */
10737 return ieee_md_atof (type, litP, sizeP, FALSE);
/* Static scratch space for output_invalid.  The longest text written is
   "(0x" followed by the hex digits of one unsigned char and ")".  */
static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];

/* Format character C for use in a diagnostic: printable characters are
   shown quoted, anything else as a parenthesised hex byte.  The result
   lives in a static buffer that the next call overwrites.  */

static char *
output_invalid (int c)
{
  if (!ISPRINT (c))
    {
      snprintf (output_invalid_buf, sizeof (output_invalid_buf),
		"(0x%x)", (unsigned char) c);
      return output_invalid_buf;
    }

  snprintf (output_invalid_buf, sizeof (output_invalid_buf),
	    "'%c'", c);
  return output_invalid_buf;
}
10754 /* REG_STRING starts *before* REGISTER_PREFIX. */
10756 static const reg_entry *
10757 parse_real_register (char *reg_string, char **end_op)
10759 char *s = reg_string;
10760 char *p;
10761 char reg_name_given[MAX_REG_NAME_SIZE + 1];
10762 const reg_entry *r;
10764 /* Skip possible REGISTER_PREFIX and possible whitespace. */
10765 if (*s == REGISTER_PREFIX)
10766 ++s;
10768 if (is_space_char (*s))
10769 ++s;
10771 p = reg_name_given;
10772 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
10774 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
10775 return (const reg_entry *) NULL;
10776 s++;
10779 /* For naked regs, make sure that we are not dealing with an identifier.
10780 This prevents confusing an identifier like `eax_var' with register
10781 `eax'. */
10782 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
10783 return (const reg_entry *) NULL;
10785 *end_op = s;
10787 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
10789 /* Handle floating point regs, allowing spaces in the (i) part. */
10790 if (r == i386_regtab /* %st is first entry of table */)
10792 if (!cpu_arch_flags.bitfield.cpu8087
10793 && !cpu_arch_flags.bitfield.cpu287
10794 && !cpu_arch_flags.bitfield.cpu387)
10795 return (const reg_entry *) NULL;
10797 if (is_space_char (*s))
10798 ++s;
10799 if (*s == '(')
10801 ++s;
10802 if (is_space_char (*s))
10803 ++s;
10804 if (*s >= '0' && *s <= '7')
10806 int fpr = *s - '0';
10807 ++s;
10808 if (is_space_char (*s))
10809 ++s;
10810 if (*s == ')')
10812 *end_op = s + 1;
10813 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
10814 know (r);
10815 return r + fpr;
10818 /* We have "%st(" then garbage. */
10819 return (const reg_entry *) NULL;
10823 if (r == NULL || allow_pseudo_reg)
10824 return r;
10826 if (operand_type_all_zero (&r->reg_type))
10827 return (const reg_entry *) NULL;
10829 if ((r->reg_type.bitfield.dword
10830 || r->reg_type.bitfield.sreg3
10831 || r->reg_type.bitfield.control
10832 || r->reg_type.bitfield.debug
10833 || r->reg_type.bitfield.test)
10834 && !cpu_arch_flags.bitfield.cpui386)
10835 return (const reg_entry *) NULL;
10837 if (r->reg_type.bitfield.regmmx && !cpu_arch_flags.bitfield.cpummx)
10838 return (const reg_entry *) NULL;
10840 if (!cpu_arch_flags.bitfield.cpuavx512f)
10842 if (r->reg_type.bitfield.zmmword || r->reg_type.bitfield.regmask)
10843 return (const reg_entry *) NULL;
10845 if (!cpu_arch_flags.bitfield.cpuavx)
10847 if (r->reg_type.bitfield.ymmword)
10848 return (const reg_entry *) NULL;
10850 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
10851 return (const reg_entry *) NULL;
10855 if (r->reg_type.bitfield.regbnd && !cpu_arch_flags.bitfield.cpumpx)
10856 return (const reg_entry *) NULL;
10858 /* Don't allow fake index register unless allow_index_reg isn't 0. */
10859 if (!allow_index_reg && r->reg_num == RegIZ)
10860 return (const reg_entry *) NULL;
10862 /* Upper 16 vector registers are only available with VREX in 64bit
10863 mode, and require EVEX encoding. */
10864 if (r->reg_flags & RegVRex)
10866 if (!cpu_arch_flags.bitfield.cpuavx512f
10867 || flag_code != CODE_64BIT)
10868 return (const reg_entry *) NULL;
10870 i.vec_encoding = vex_encoding_evex;
10873 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
10874 && (!cpu_arch_flags.bitfield.cpulm || !r->reg_type.bitfield.control)
10875 && flag_code != CODE_64BIT)
10876 return (const reg_entry *) NULL;
10878 if (r->reg_type.bitfield.sreg3 && r->reg_num == RegFlat && !intel_syntax)
10879 return (const reg_entry *) NULL;
10881 return r;
10884 /* REG_STRING starts *before* REGISTER_PREFIX. */
10886 static const reg_entry *
10887 parse_register (char *reg_string, char **end_op)
10889 const reg_entry *r;
10891 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
10892 r = parse_real_register (reg_string, end_op);
10893 else
10894 r = NULL;
10895 if (!r)
10897 char *save = input_line_pointer;
10898 char c;
10899 symbolS *symbolP;
10901 input_line_pointer = reg_string;
10902 c = get_symbol_name (&reg_string);
10903 symbolP = symbol_find (reg_string);
10904 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
10906 const expressionS *e = symbol_get_value_expression (symbolP);
10908 know (e->X_op == O_register);
10909 know (e->X_add_number >= 0
10910 && (valueT) e->X_add_number < i386_regtab_size);
10911 r = i386_regtab + e->X_add_number;
10912 if ((r->reg_flags & RegVRex))
10913 i.vec_encoding = vex_encoding_evex;
10914 *end_op = input_line_pointer;
10916 *input_line_pointer = c;
10917 input_line_pointer = save;
10919 return r;
10923 i386_parse_name (char *name, expressionS *e, char *nextcharP)
10925 const reg_entry *r;
10926 char *end = input_line_pointer;
10928 *end = *nextcharP;
10929 r = parse_register (name, &input_line_pointer);
10930 if (r && end <= input_line_pointer)
10932 *nextcharP = *input_line_pointer;
10933 *input_line_pointer = 0;
10934 e->X_op = O_register;
10935 e->X_add_number = r - i386_regtab;
10936 return 1;
10938 input_line_pointer = end;
10939 *end = 0;
10940 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
10943 void
10944 md_operand (expressionS *e)
10946 char *end;
10947 const reg_entry *r;
10949 switch (*input_line_pointer)
10951 case REGISTER_PREFIX:
10952 r = parse_real_register (input_line_pointer, &end);
10953 if (r)
10955 e->X_op = O_register;
10956 e->X_add_number = r - i386_regtab;
10957 input_line_pointer = end;
10959 break;
10961 case '[':
10962 gas_assert (intel_syntax);
10963 end = input_line_pointer++;
10964 expression (e);
10965 if (*input_line_pointer == ']')
10967 ++input_line_pointer;
10968 e->X_op_symbol = make_expr_symbol (e);
10969 e->X_add_symbol = NULL;
10970 e->X_add_number = 0;
10971 e->X_op = O_index;
10973 else
10975 e->X_op = O_absent;
10976 input_line_pointer = end;
10978 break;
/* Short option letters for the x86 target, in getopt string form.
   Builds with ELF support also list k, V, Q (with an argument) and s,
   which md_parse_option handles under the same condition.  O takes an
   optional argument.  */
10983 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10984 const char *md_shortopts = "kVQ:sqnO::";
10985 #else
10986 const char *md_shortopts = "qnO::";
10987 #endif
/* Codes for the x86 long options, numbered consecutively from
   OPTION_MD_BASE.  They appear as the last field of the md_longopts
   entries and are the values md_parse_option switches on.  */
10989 #define OPTION_32 (OPTION_MD_BASE + 0)
10990 #define OPTION_64 (OPTION_MD_BASE + 1)
10991 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
10992 #define OPTION_MARCH (OPTION_MD_BASE + 3)
10993 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
10994 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
10995 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
10996 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
10997 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
10998 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
10999 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
11000 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
11001 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
11002 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
11003 #define OPTION_X32 (OPTION_MD_BASE + 14)
11004 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
11005 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
11006 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
11007 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
11008 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
11009 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
11010 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
11011 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
11012 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
11013 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
11014 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
11015 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
/* Long options for the x86 target.  Each entry gives the option name,
   whether it takes an argument, and the OPTION_* code stored in the last
   field.  Several entries are only present for particular object
   formats.  The table ends with an entry whose name is NULL.  */
11017 struct option md_longopts[] =
11019 {"32", no_argument, NULL, OPTION_32},
11020 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11021 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
11022 {"64", no_argument, NULL, OPTION_64},
11023 #endif
11024 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11025 {"x32", no_argument, NULL, OPTION_X32},
11026 {"mshared", no_argument, NULL, OPTION_MSHARED},
11027 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
11028 #endif
11029 {"divide", no_argument, NULL, OPTION_DIVIDE},
11030 {"march", required_argument, NULL, OPTION_MARCH},
11031 {"mtune", required_argument, NULL, OPTION_MTUNE},
11032 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
11033 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
11034 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
11035 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
11036 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
11037 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
11038 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
11039 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
11040 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
11041 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
11042 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
11043 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
11044 # if defined (TE_PE) || defined (TE_PEP)
11045 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
11046 #endif
11047 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
11048 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
11049 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
11050 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
11051 {"mamd64", no_argument, NULL, OPTION_MAMD64},
11052 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
11053 {NULL, no_argument, NULL, 0}
/* Size of the whole table in bytes, not the number of entries.  */
11055 size_t md_longopts_size = sizeof (md_longopts);
/* Handle one x86-specific command-line option.

   C is either a short option character or one of the OPTION_* codes;
   ARG is the option's argument (NULL when -O is given without one).
   Returns 1 when the option was recognised here and 0 when it was not.
   An unacceptable argument is reported with as_fatal.  */
11058 md_parse_option (int c, const char *arg)
11060 unsigned int j;
11061 char *arch, *next, *saved;
11063 switch (c)
11065 case 'n':
11066 optimize_align_code = 0;
11067 break;
11069 case 'q':
11070 quiet_warnings = 1;
11071 break;
11073 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11074 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
11075 should be emitted or not. FIXME: Not implemented. */
11076 case 'Q':
11077 break;
11079 /* -V: SVR4 argument to print version ID. */
11080 case 'V':
11081 print_version_id ();
11082 break;
11084 /* -k: Ignore for FreeBSD compatibility. */
11085 case 'k':
11086 break;
11088 case 's':
11089 /* -s: On i386 Solaris, this tells the native assembler to use
11090 .stab instead of .stab.excl. We always use .stab anyhow. */
11091 break;
11093 case OPTION_MSHARED:
11094 shared = 1;
11095 break;
11097 case OPTION_X86_USED_NOTE:
11098 if (strcasecmp (arg, "yes") == 0)
11099 x86_used_note = 1;
11100 else if (strcasecmp (arg, "no") == 0)
11101 x86_used_note = 0;
11102 else
11103 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
11104 break;
11107 #endif
11108 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11109 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
/* --64 is accepted only when one of the x86-64 targets appears in the
   list returned by bfd_target_list; the list is freed afterwards.  */
11110 case OPTION_64:
11112 const char **list, **l;
11114 list = bfd_target_list ();
11115 for (l = list; *l != NULL; l++)
11116 if (CONST_STRNEQ (*l, "elf64-x86-64")
11117 || strcmp (*l, "coff-x86-64") == 0
11118 || strcmp (*l, "pe-x86-64") == 0
11119 || strcmp (*l, "pei-x86-64") == 0
11120 || strcmp (*l, "mach-o-x86-64") == 0)
11122 default_arch = "x86_64";
11123 break;
11125 if (*l == NULL)
11126 as_fatal (_("no compiled in support for x86_64"));
11127 free (list);
11129 break;
11130 #endif
11132 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* --x32 follows the same pattern as --64 but is limited to ELF and
   looks for an elf32-x86-64 target.  */
11133 case OPTION_X32:
11134 if (IS_ELF)
11136 const char **list, **l;
11138 list = bfd_target_list ();
11139 for (l = list; *l != NULL; l++)
11140 if (CONST_STRNEQ (*l, "elf32-x86-64"))
11142 default_arch = "x86_64:32";
11143 break;
11145 if (*l == NULL)
11146 as_fatal (_("no compiled in support for 32bit x86_64"));
11147 free (list);
11149 else
11150 as_fatal (_("32bit x86_64 is only supported for ELF"));
11151 break;
11152 #endif
11154 case OPTION_32:
11155 default_arch = "i386";
11156 break;
/* --divide: with SVR4_COMMENT_CHARS defined, i386_comment_chars is
   replaced by a newly allocated copy with every '/' removed; otherwise
   the option does nothing.  */
11158 case OPTION_DIVIDE:
11159 #ifdef SVR4_COMMENT_CHARS
11161 char *n, *t;
11162 const char *s;
11164 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
11165 t = n;
11166 for (s = i386_comment_chars; *s != '\0'; s++)
11167 if (*s != '/')
11168 *t++ = *s;
11169 *t = '\0';
11170 i386_comment_chars = n;
11172 #endif
11173 break;
/* -march: a private copy of ARG is split at each '+'.  Every component
   is looked up in cpu_arch, either as a processor name or as an
   extension (extension entries are stored with a leading '.'), and if
   it is not found there, in cpu_noarch as an extension to disable.  A
   component found in neither table is fatal.  */
11175 case OPTION_MARCH:
11176 saved = xstrdup (arg);
11177 arch = saved;
11178 /* Allow -march=+nosse. */
11179 if (*arch == '+')
11180 arch++;
11183 if (*arch == '.')
11184 as_fatal (_("invalid -march= option: `%s'"), arg);
11185 next = strchr (arch, '+');
11186 if (next)
11187 *next++ = '\0';
11188 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11190 if (strcmp (arch, cpu_arch [j].name) == 0)
11192 /* Processor. */
11193 if (! cpu_arch[j].flags.bitfield.cpui386)
11194 continue;
11196 cpu_arch_name = cpu_arch[j].name;
11197 cpu_sub_arch_name = NULL;
11198 cpu_arch_flags = cpu_arch[j].flags;
11199 cpu_arch_isa = cpu_arch[j].type;
11200 cpu_arch_isa_flags = cpu_arch[j].flags;
11201 if (!cpu_arch_tune_set)
11203 cpu_arch_tune = cpu_arch_isa;
11204 cpu_arch_tune_flags = cpu_arch_isa_flags;
11206 break;
11208 else if (*cpu_arch [j].name == '.'
11209 && strcmp (arch, cpu_arch [j].name + 1) == 0)
11211 /* ISA extension. */
11212 i386_cpu_flags flags;
11214 flags = cpu_flags_or (cpu_arch_flags,
11215 cpu_arch[j].flags);
11217 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
11219 if (cpu_sub_arch_name)
11221 char *name = cpu_sub_arch_name;
11222 cpu_sub_arch_name = concat (name,
11223 cpu_arch[j].name,
11224 (const char *) NULL);
11225 free (name);
11227 else
11228 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
11229 cpu_arch_flags = flags;
11230 cpu_arch_isa_flags = flags;
11232 else
11233 cpu_arch_isa_flags
11234 = cpu_flags_or (cpu_arch_isa_flags,
11235 cpu_arch[j].flags);
11236 break;
11240 if (j >= ARRAY_SIZE (cpu_arch))
11242 /* Disable an ISA extension. */
11243 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
11244 if (strcmp (arch, cpu_noarch [j].name) == 0)
11246 i386_cpu_flags flags;
11248 flags = cpu_flags_and_not (cpu_arch_flags,
11249 cpu_noarch[j].flags);
11250 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
11252 if (cpu_sub_arch_name)
11254 char *name = cpu_sub_arch_name;
/* NOTE(review): unlike the enable path above, the old
   cpu_sub_arch_name is not part of the new string here, so earlier
   extension names are dropped - confirm this is intended.  */
11255 cpu_sub_arch_name = concat (arch,
11256 (const char *) NULL);
11257 free (name);
11259 else
11260 cpu_sub_arch_name = xstrdup (arch);
11261 cpu_arch_flags = flags;
11262 cpu_arch_isa_flags = flags;
11264 break;
/* Not in cpu_noarch either: force J past the end of cpu_arch so the
   check below reports the error.  */
11267 if (j >= ARRAY_SIZE (cpu_noarch))
11268 j = ARRAY_SIZE (cpu_arch);
11271 if (j >= ARRAY_SIZE (cpu_arch))
11272 as_fatal (_("invalid -march= option: `%s'"), arg);
11274 arch = next;
11276 while (next != NULL);
11277 free (saved);
11278 break;
/* -mtune: ARG must match a cpu_arch name exactly; a leading '.' is
   rejected up front.  */
11280 case OPTION_MTUNE:
11281 if (*arg == '.')
11282 as_fatal (_("invalid -mtune= option: `%s'"), arg);
11283 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11285 if (strcmp (arg, cpu_arch [j].name) == 0)
11287 cpu_arch_tune_set = 1;
11288 cpu_arch_tune = cpu_arch [j].type;
11289 cpu_arch_tune_flags = cpu_arch[j].flags;
11290 break;
11293 if (j >= ARRAY_SIZE (cpu_arch))
11294 as_fatal (_("invalid -mtune= option: `%s'"), arg);
11295 break;
11297 case OPTION_MMNEMONIC:
11298 if (strcasecmp (arg, "att") == 0)
11299 intel_mnemonic = 0;
11300 else if (strcasecmp (arg, "intel") == 0)
11301 intel_mnemonic = 1;
11302 else
11303 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
11304 break;
11306 case OPTION_MSYNTAX:
11307 if (strcasecmp (arg, "att") == 0)
11308 intel_syntax = 0;
11309 else if (strcasecmp (arg, "intel") == 0)
11310 intel_syntax = 1;
11311 else
11312 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
11313 break;
11315 case OPTION_MINDEX_REG:
11316 allow_index_reg = 1;
11317 break;
11319 case OPTION_MNAKED_REG:
11320 allow_naked_reg = 1;
11321 break;
11323 case OPTION_MSSE2AVX:
11324 sse2avx = 1;
11325 break;
11327 case OPTION_MSSE_CHECK:
11328 if (strcasecmp (arg, "error") == 0)
11329 sse_check = check_error;
11330 else if (strcasecmp (arg, "warning") == 0)
11331 sse_check = check_warning;
11332 else if (strcasecmp (arg, "none") == 0)
11333 sse_check = check_none;
11334 else
11335 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
11336 break;
11338 case OPTION_MOPERAND_CHECK:
11339 if (strcasecmp (arg, "error") == 0)
11340 operand_check = check_error;
11341 else if (strcasecmp (arg, "warning") == 0)
11342 operand_check = check_warning;
11343 else if (strcasecmp (arg, "none") == 0)
11344 operand_check = check_none;
11345 else
11346 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
11347 break;
11349 case OPTION_MAVXSCALAR:
11350 if (strcasecmp (arg, "128") == 0)
11351 avxscalar = vex128;
11352 else if (strcasecmp (arg, "256") == 0)
11353 avxscalar = vex256;
11354 else
11355 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
11356 break;
11358 case OPTION_MVEXWIG:
11359 if (strcmp (arg, "0") == 0)
11360 vexwig = evexw0;
11361 else if (strcmp (arg, "1") == 0)
11362 vexwig = evexw1;
11363 else
11364 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
11365 break;
11367 case OPTION_MADD_BND_PREFIX:
11368 add_bnd_prefix = 1;
11369 break;
11371 case OPTION_MEVEXLIG:
11372 if (strcmp (arg, "128") == 0)
11373 evexlig = evexl128;
11374 else if (strcmp (arg, "256") == 0)
11375 evexlig = evexl256;
11376 else if (strcmp (arg, "512") == 0)
11377 evexlig = evexl512;
11378 else
11379 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
11380 break;
11382 case OPTION_MEVEXRCIG:
11383 if (strcmp (arg, "rne") == 0)
11384 evexrcig = rne;
11385 else if (strcmp (arg, "rd") == 0)
11386 evexrcig = rd;
11387 else if (strcmp (arg, "ru") == 0)
11388 evexrcig = ru;
11389 else if (strcmp (arg, "rz") == 0)
11390 evexrcig = rz;
11391 else
11392 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
11393 break;
11395 case OPTION_MEVEXWIG:
11396 if (strcmp (arg, "0") == 0)
11397 evexwig = evexw0;
11398 else if (strcmp (arg, "1") == 0)
11399 evexwig = evexw1;
11400 else
11401 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
11402 break;
11404 # if defined (TE_PE) || defined (TE_PEP)
11405 case OPTION_MBIG_OBJ:
11406 use_big_obj = 1;
11407 break;
11408 #endif
11410 case OPTION_MOMIT_LOCK_PREFIX:
11411 if (strcasecmp (arg, "yes") == 0)
11412 omit_lock_prefix = 1;
11413 else if (strcasecmp (arg, "no") == 0)
11414 omit_lock_prefix = 0;
11415 else
11416 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
11417 break;
11419 case OPTION_MFENCE_AS_LOCK_ADD:
11420 if (strcasecmp (arg, "yes") == 0)
11421 avoid_fence = 1;
11422 else if (strcasecmp (arg, "no") == 0)
11423 avoid_fence = 0;
11424 else
11425 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
11426 break;
11428 case OPTION_MRELAX_RELOCATIONS:
11429 if (strcasecmp (arg, "yes") == 0)
11430 generate_relax_relocations = 1;
11431 else if (strcasecmp (arg, "no") == 0)
11432 generate_relax_relocations = 0;
11433 else
11434 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
11435 break;
11437 case OPTION_MAMD64:
11438 intel64 = 0;
11439 break;
11441 case OPTION_MINTEL64:
11442 intel64 = 1;
11443 break;
/* -O: no argument selects level 1, an argument starting with 's'
   selects size optimization with every encoding optimization enabled,
   and any other argument is converted with atoi.  */
11445 case 'O':
11446 if (arg == NULL)
11448 optimize = 1;
11449 /* Turn off -Os. */
11450 optimize_for_space = 0;
11452 else if (*arg == 's')
11454 optimize_for_space = 1;
11455 /* Turn on all encoding optimizations. */
11456 optimize = INT_MAX;
11458 else
/* NOTE(review): atoi reports no errors, so a non-numeric argument is
   not diagnosed here.  */
11460 optimize = atoi (arg);
11461 /* Turn off -Os. */
11462 optimize_for_space = 0;
11464 break;
11466 default:
11467 return 0;
11469 return 1;
11472 #define MESSAGE_TEMPLATE \
11475 static char *
11476 output_message (FILE *stream, char *p, char *message, char *start,
11477 int *left_p, const char *name, int len)
11479 int size = sizeof (MESSAGE_TEMPLATE);
11480 int left = *left_p;
11482 /* Reserve 2 spaces for ", " or ",\0" */
11483 left -= len + 2;
11485 /* Check if there is any room. */
11486 if (left >= 0)
11488 if (p != start)
11490 *p++ = ',';
11491 *p++ = ' ';
11493 p = mempcpy (p, name, len);
11495 else
11497 /* Output the current message now and start a new one. */
11498 *p++ = ',';
11499 *p = '\0';
11500 fprintf (stream, "%s\n", message);
11501 p = start;
11502 left = size - (start - message) - len - 2;
11504 gas_assert (left >= 0);
11506 p = mempcpy (p, name, len);
11509 *left_p = left;
11510 return p;
11513 static void
11514 show_arch (FILE *stream, int ext, int check)
11516 static char message[] = MESSAGE_TEMPLATE;
11517 char *start = message + 27;
11518 char *p;
11519 int size = sizeof (MESSAGE_TEMPLATE);
11520 int left;
11521 const char *name;
11522 int len;
11523 unsigned int j;
11525 p = start;
11526 left = size - (start - message);
11527 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11529 /* Should it be skipped? */
11530 if (cpu_arch [j].skip)
11531 continue;
11533 name = cpu_arch [j].name;
11534 len = cpu_arch [j].len;
11535 if (*name == '.')
11537 /* It is an extension. Skip if we aren't asked to show it. */
11538 if (ext)
11540 name++;
11541 len--;
11543 else
11544 continue;
11546 else if (ext)
11548 /* It is an processor. Skip if we show only extension. */
11549 continue;
11551 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
11553 /* It is an impossible processor - skip. */
11554 continue;
11557 p = output_message (stream, p, message, start, &left, name, len);
11560 /* Display disabled extensions. */
11561 if (ext)
11562 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
11564 name = cpu_noarch [j].name;
11565 len = cpu_noarch [j].len;
11566 p = output_message (stream, p, message, start, &left, name,
11567 len);
11570 *p = '\0';
11571 fprintf (stream, "%s\n", message);
/* Print the x86-specific part of the option summary to STREAM.  Which
   entries appear depends on the object-format macros the assembler was
   built with, and a few defaults are chosen from compile-time
   settings.  */
11574 void
11575 md_show_usage (FILE *stream)
11577 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11578 fprintf (stream, _("\
11579 -Q ignored\n\
11580 -V print assembler version number\n\
11581 -k ignored\n"));
11582 #endif
11583 fprintf (stream, _("\
11584 -n Do not optimize code alignment\n\
11585 -q quieten some warnings\n"));
11586 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11587 fprintf (stream, _("\
11588 -s ignored\n"));
11589 #endif
11590 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11591 || defined (TE_PE) || defined (TE_PEP))
11592 fprintf (stream, _("\
11593 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
11594 #endif
11595 #ifdef SVR4_COMMENT_CHARS
11596 fprintf (stream, _("\
11597 --divide do not treat `/' as a comment character\n"));
11598 #else
11599 fprintf (stream, _("\
11600 --divide ignored\n"));
11601 #endif
11602 fprintf (stream, _("\
11603 -march=CPU[,+EXTENSION...]\n\
11604 generate code for CPU and EXTENSION, CPU is one of:\n"));
/* Processors only, leaving out entries without the cpui386 flag.  */
11605 show_arch (stream, 0, 1);
11606 fprintf (stream, _("\
11607 EXTENSION is combination of:\n"));
/* Extensions only, followed by the cpu_noarch names.  */
11608 show_arch (stream, 1, 0);
11609 fprintf (stream, _("\
11610 -mtune=CPU optimize for CPU, CPU is one of:\n"));
/* Processors only, without the cpui386 filter.  */
11611 show_arch (stream, 0, 0);
11612 fprintf (stream, _("\
11613 -msse2avx encode SSE instructions with VEX prefix\n"));
11614 fprintf (stream, _("\
11615 -msse-check=[none|error|warning] (default: warning)\n\
11616 check SSE instructions\n"));
11617 fprintf (stream, _("\
11618 -moperand-check=[none|error|warning] (default: warning)\n\
11619 check operand combinations for validity\n"));
11620 fprintf (stream, _("\
11621 -mavxscalar=[128|256] (default: 128)\n\
11622 encode scalar AVX instructions with specific vector\n\
11623 length\n"));
11624 fprintf (stream, _("\
11625 -mvexwig=[0|1] (default: 0)\n\
11626 encode VEX instructions with specific VEX.W value\n\
11627 for VEX.W bit ignored instructions\n"));
11628 fprintf (stream, _("\
11629 -mevexlig=[128|256|512] (default: 128)\n\
11630 encode scalar EVEX instructions with specific vector\n\
11631 length\n"));
11632 fprintf (stream, _("\
11633 -mevexwig=[0|1] (default: 0)\n\
11634 encode EVEX instructions with specific EVEX.W value\n\
11635 for EVEX.W bit ignored instructions\n"));
11636 fprintf (stream, _("\
11637 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
11638 encode EVEX instructions with specific EVEX.RC value\n\
11639 for SAE-only ignored instructions\n"));
11640 fprintf (stream, _("\
11641 -mmnemonic=[att|intel] "));
/* The default printed for -mmnemonic follows SYSV386_COMPAT.  */
11642 if (SYSV386_COMPAT)
11643 fprintf (stream, _("(default: att)\n"));
11644 else
11645 fprintf (stream, _("(default: intel)\n"));
11646 fprintf (stream, _("\
11647 use AT&T/Intel mnemonic\n"));
11648 fprintf (stream, _("\
11649 -msyntax=[att|intel] (default: att)\n\
11650 use AT&T/Intel syntax\n"));
11651 fprintf (stream, _("\
11652 -mindex-reg support pseudo index registers\n"));
11653 fprintf (stream, _("\
11654 -mnaked-reg don't require `%%' prefix for registers\n"));
11655 fprintf (stream, _("\
11656 -madd-bnd-prefix add BND prefix for all valid branches\n"));
11657 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11658 fprintf (stream, _("\
11659 -mshared disable branch optimization for shared code\n"));
11660 fprintf (stream, _("\
11661 -mx86-used-note=[no|yes] "));
/* The default printed for -mx86-used-note follows
   DEFAULT_X86_USED_NOTE.  */
11662 if (DEFAULT_X86_USED_NOTE)
11663 fprintf (stream, _("(default: yes)\n"));
11664 else
11665 fprintf (stream, _("(default: no)\n"));
11666 fprintf (stream, _("\
11667 generate x86 used ISA and feature properties\n"));
11668 #endif
11669 #if defined (TE_PE) || defined (TE_PEP)
11670 fprintf (stream, _("\
11671 -mbig-obj generate big object files\n"));
11672 #endif
11673 fprintf (stream, _("\
11674 -momit-lock-prefix=[no|yes] (default: no)\n\
11675 strip all lock prefixes\n"));
11676 fprintf (stream, _("\
11677 -mfence-as-lock-add=[no|yes] (default: no)\n\
11678 encode lfence, mfence and sfence as\n\
11679 lock addl $0x0, (%%{re}sp)\n"));
11680 fprintf (stream, _("\
11681 -mrelax-relocations=[no|yes] "));
/* The default printed for -mrelax-relocations follows
   DEFAULT_GENERATE_X86_RELAX_RELOCATIONS.  */
11682 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
11683 fprintf (stream, _("(default: yes)\n"));
11684 else
11685 fprintf (stream, _("(default: no)\n"));
11686 fprintf (stream, _("\
11687 generate relax relocations\n"));
11688 fprintf (stream, _("\
11689 -mamd64 accept only AMD64 ISA [default]\n"));
11690 fprintf (stream, _("\
11691 -mintel64 accept only Intel64 ISA\n"));
11694 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
11695 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11696 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
11698 /* Pick the target format to use. */
11700 const char *
11701 i386_target_format (void)
11703 if (!strncmp (default_arch, "x86_64", 6))
11705 update_code_flag (CODE_64BIT, 1);
11706 if (default_arch[6] == '\0')
11707 x86_elf_abi = X86_64_ABI;
11708 else
11709 x86_elf_abi = X86_64_X32_ABI;
11711 else if (!strcmp (default_arch, "i386"))
11712 update_code_flag (CODE_32BIT, 1);
11713 else if (!strcmp (default_arch, "iamcu"))
11715 update_code_flag (CODE_32BIT, 1);
11716 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
11718 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
11719 cpu_arch_name = "iamcu";
11720 cpu_sub_arch_name = NULL;
11721 cpu_arch_flags = iamcu_flags;
11722 cpu_arch_isa = PROCESSOR_IAMCU;
11723 cpu_arch_isa_flags = iamcu_flags;
11724 if (!cpu_arch_tune_set)
11726 cpu_arch_tune = cpu_arch_isa;
11727 cpu_arch_tune_flags = cpu_arch_isa_flags;
11730 else if (cpu_arch_isa != PROCESSOR_IAMCU)
11731 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
11732 cpu_arch_name);
11734 else
11735 as_fatal (_("unknown architecture"));
11737 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
11738 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
11739 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
11740 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
11742 switch (OUTPUT_FLAVOR)
11744 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
11745 case bfd_target_aout_flavour:
11746 return AOUT_TARGET_FORMAT;
11747 #endif
11748 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
11749 # if defined (TE_PE) || defined (TE_PEP)
11750 case bfd_target_coff_flavour:
11751 if (flag_code == CODE_64BIT)
11752 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
11753 else
11754 return "pe-i386";
11755 # elif defined (TE_GO32)
11756 case bfd_target_coff_flavour:
11757 return "coff-go32";
11758 # else
11759 case bfd_target_coff_flavour:
11760 return "coff-i386";
11761 # endif
11762 #endif
11763 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
11764 case bfd_target_elf_flavour:
11766 const char *format;
11768 switch (x86_elf_abi)
11770 default:
11771 format = ELF_TARGET_FORMAT;
11772 break;
11773 case X86_64_ABI:
11774 use_rela_relocations = 1;
11775 object_64bit = 1;
11776 format = ELF_TARGET_FORMAT64;
11777 break;
11778 case X86_64_X32_ABI:
11779 use_rela_relocations = 1;
11780 object_64bit = 1;
11781 disallow_64bit_reloc = 1;
11782 format = ELF_TARGET_FORMAT32;
11783 break;
11785 if (cpu_arch_isa == PROCESSOR_L1OM)
11787 if (x86_elf_abi != X86_64_ABI)
11788 as_fatal (_("Intel L1OM is 64bit only"));
11789 return ELF_TARGET_L1OM_FORMAT;
11791 else if (cpu_arch_isa == PROCESSOR_K1OM)
11793 if (x86_elf_abi != X86_64_ABI)
11794 as_fatal (_("Intel K1OM is 64bit only"));
11795 return ELF_TARGET_K1OM_FORMAT;
11797 else if (cpu_arch_isa == PROCESSOR_IAMCU)
11799 if (x86_elf_abi != I386_ABI)
11800 as_fatal (_("Intel MCU is 32bit only"));
11801 return ELF_TARGET_IAMCU_FORMAT;
11803 else
11804 return format;
11806 #endif
11807 #if defined (OBJ_MACH_O)
11808 case bfd_target_mach_o_flavour:
11809 if (flag_code == CODE_64BIT)
11811 use_rela_relocations = 1;
11812 object_64bit = 1;
11813 return "mach-o-x86-64";
11815 else
11816 return "mach-o-i386";
11817 #endif
11818 default:
11819 abort ();
11820 return NULL;
11824 #endif /* OBJ_MAYBE_ more than one */
11826 symbolS *
11827 md_undefined_symbol (char *name)
11829 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
11830 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
11831 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
11832 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
11834 if (!GOT_symbol)
11836 if (symbol_find (name))
11837 as_bad (_("GOT already in symbol table"));
11838 GOT_symbol = symbol_new (name, undefined_section,
11839 (valueT) 0, &zero_address_frag);
11841 return GOT_symbol;
11843 return 0;
11846 /* Round up a section size to the appropriate boundary. */
11848 valueT
11849 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
11851 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
11852 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
11854 /* For a.out, force the section size to be aligned. If we don't do
11855 this, BFD will align it for us, but it will not write out the
11856 final bytes of the section. This may be a bug in BFD, but it is
11857 easier to fix it here since that is how the other a.out targets
11858 work. */
11859 int align;
11861 align = bfd_get_section_alignment (stdoutput, segment);
11862 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
11864 #endif
11866 return size;
11869 /* On the i386, PC-relative offsets are relative to the start of the
11870 next instruction. That is, the address of the offset, plus its
11871 size, since the offset is always the last part of the insn. */
11873 long
11874 md_pcrel_from (fixS *fixP)
11876 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
11879 #ifndef I386COFF
11881 static void
11882 s_bss (int ignore ATTRIBUTE_UNUSED)
11884 int temp;
11886 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11887 if (IS_ELF)
11888 obj_elf_section_change_hook ();
11889 #endif
11890 temp = get_absolute_expression ();
11891 subseg_set (bss_section, (subsegT) temp);
11892 demand_empty_rest_of_line ();
11895 #endif
11897 void
11898 i386_validate_fix (fixS *fixp)
11900 if (fixp->fx_subsy)
11902 if (fixp->fx_subsy == GOT_symbol)
11904 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
11906 if (!object_64bit)
11907 abort ();
11908 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11909 if (fixp->fx_tcbit2)
11910 fixp->fx_r_type = (fixp->fx_tcbit
11911 ? BFD_RELOC_X86_64_REX_GOTPCRELX
11912 : BFD_RELOC_X86_64_GOTPCRELX);
11913 else
11914 #endif
11915 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
11917 else
11919 if (!object_64bit)
11920 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
11921 else
11922 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
11924 fixp->fx_subsy = 0;
11927 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11928 else if (!object_64bit)
11930 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
11931 && fixp->fx_tcbit2)
11932 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
11934 #endif
11937 arelent *
11938 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
11940 arelent *rel;
11941 bfd_reloc_code_real_type code;
11943 switch (fixp->fx_r_type)
11945 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11946 case BFD_RELOC_SIZE32:
11947 case BFD_RELOC_SIZE64:
11948 if (S_IS_DEFINED (fixp->fx_addsy)
11949 && !S_IS_EXTERNAL (fixp->fx_addsy))
11951 /* Resolve size relocation against local symbol to size of
11952 the symbol plus addend. */
11953 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
11954 if (fixp->fx_r_type == BFD_RELOC_SIZE32
11955 && !fits_in_unsigned_long (value))
11956 as_bad_where (fixp->fx_file, fixp->fx_line,
11957 _("symbol size computation overflow"));
11958 fixp->fx_addsy = NULL;
11959 fixp->fx_subsy = NULL;
11960 md_apply_fix (fixp, (valueT *) &value, NULL);
11961 return NULL;
11963 #endif
11964 /* Fall through. */
11966 case BFD_RELOC_X86_64_PLT32:
11967 case BFD_RELOC_X86_64_GOT32:
11968 case BFD_RELOC_X86_64_GOTPCREL:
11969 case BFD_RELOC_X86_64_GOTPCRELX:
11970 case BFD_RELOC_X86_64_REX_GOTPCRELX:
11971 case BFD_RELOC_386_PLT32:
11972 case BFD_RELOC_386_GOT32:
11973 case BFD_RELOC_386_GOT32X:
11974 case BFD_RELOC_386_GOTOFF:
11975 case BFD_RELOC_386_GOTPC:
11976 case BFD_RELOC_386_TLS_GD:
11977 case BFD_RELOC_386_TLS_LDM:
11978 case BFD_RELOC_386_TLS_LDO_32:
11979 case BFD_RELOC_386_TLS_IE_32:
11980 case BFD_RELOC_386_TLS_IE:
11981 case BFD_RELOC_386_TLS_GOTIE:
11982 case BFD_RELOC_386_TLS_LE_32:
11983 case BFD_RELOC_386_TLS_LE:
11984 case BFD_RELOC_386_TLS_GOTDESC:
11985 case BFD_RELOC_386_TLS_DESC_CALL:
11986 case BFD_RELOC_X86_64_TLSGD:
11987 case BFD_RELOC_X86_64_TLSLD:
11988 case BFD_RELOC_X86_64_DTPOFF32:
11989 case BFD_RELOC_X86_64_DTPOFF64:
11990 case BFD_RELOC_X86_64_GOTTPOFF:
11991 case BFD_RELOC_X86_64_TPOFF32:
11992 case BFD_RELOC_X86_64_TPOFF64:
11993 case BFD_RELOC_X86_64_GOTOFF64:
11994 case BFD_RELOC_X86_64_GOTPC32:
11995 case BFD_RELOC_X86_64_GOT64:
11996 case BFD_RELOC_X86_64_GOTPCREL64:
11997 case BFD_RELOC_X86_64_GOTPC64:
11998 case BFD_RELOC_X86_64_GOTPLT64:
11999 case BFD_RELOC_X86_64_PLTOFF64:
12000 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12001 case BFD_RELOC_X86_64_TLSDESC_CALL:
12002 case BFD_RELOC_RVA:
12003 case BFD_RELOC_VTABLE_ENTRY:
12004 case BFD_RELOC_VTABLE_INHERIT:
12005 #ifdef TE_PE
12006 case BFD_RELOC_32_SECREL:
12007 #endif
12008 code = fixp->fx_r_type;
12009 break;
12010 case BFD_RELOC_X86_64_32S:
12011 if (!fixp->fx_pcrel)
12013 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
12014 code = fixp->fx_r_type;
12015 break;
12017 /* Fall through. */
12018 default:
12019 if (fixp->fx_pcrel)
12021 switch (fixp->fx_size)
12023 default:
12024 as_bad_where (fixp->fx_file, fixp->fx_line,
12025 _("can not do %d byte pc-relative relocation"),
12026 fixp->fx_size);
12027 code = BFD_RELOC_32_PCREL;
12028 break;
12029 case 1: code = BFD_RELOC_8_PCREL; break;
12030 case 2: code = BFD_RELOC_16_PCREL; break;
12031 case 4: code = BFD_RELOC_32_PCREL; break;
12032 #ifdef BFD64
12033 case 8: code = BFD_RELOC_64_PCREL; break;
12034 #endif
12037 else
12039 switch (fixp->fx_size)
12041 default:
12042 as_bad_where (fixp->fx_file, fixp->fx_line,
12043 _("can not do %d byte relocation"),
12044 fixp->fx_size);
12045 code = BFD_RELOC_32;
12046 break;
12047 case 1: code = BFD_RELOC_8; break;
12048 case 2: code = BFD_RELOC_16; break;
12049 case 4: code = BFD_RELOC_32; break;
12050 #ifdef BFD64
12051 case 8: code = BFD_RELOC_64; break;
12052 #endif
12055 break;
12058 if ((code == BFD_RELOC_32
12059 || code == BFD_RELOC_32_PCREL
12060 || code == BFD_RELOC_X86_64_32S)
12061 && GOT_symbol
12062 && fixp->fx_addsy == GOT_symbol)
12064 if (!object_64bit)
12065 code = BFD_RELOC_386_GOTPC;
12066 else
12067 code = BFD_RELOC_X86_64_GOTPC32;
12069 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
12070 && GOT_symbol
12071 && fixp->fx_addsy == GOT_symbol)
12073 code = BFD_RELOC_X86_64_GOTPC64;
12076 rel = XNEW (arelent);
12077 rel->sym_ptr_ptr = XNEW (asymbol *);
12078 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
12080 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
12082 if (!use_rela_relocations)
12084 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
12085 vtable entry to be used in the relocation's section offset. */
12086 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
12087 rel->address = fixp->fx_offset;
12088 #if defined (OBJ_COFF) && defined (TE_PE)
12089 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
12090 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
12091 else
12092 #endif
12093 rel->addend = 0;
12095 /* Use the rela in 64bit mode. */
12096 else
12098 if (disallow_64bit_reloc)
12099 switch (code)
12101 case BFD_RELOC_X86_64_DTPOFF64:
12102 case BFD_RELOC_X86_64_TPOFF64:
12103 case BFD_RELOC_64_PCREL:
12104 case BFD_RELOC_X86_64_GOTOFF64:
12105 case BFD_RELOC_X86_64_GOT64:
12106 case BFD_RELOC_X86_64_GOTPCREL64:
12107 case BFD_RELOC_X86_64_GOTPC64:
12108 case BFD_RELOC_X86_64_GOTPLT64:
12109 case BFD_RELOC_X86_64_PLTOFF64:
12110 as_bad_where (fixp->fx_file, fixp->fx_line,
12111 _("cannot represent relocation type %s in x32 mode"),
12112 bfd_get_reloc_code_name (code));
12113 break;
12114 default:
12115 break;
12118 if (!fixp->fx_pcrel)
12119 rel->addend = fixp->fx_offset;
12120 else
12121 switch (code)
12123 case BFD_RELOC_X86_64_PLT32:
12124 case BFD_RELOC_X86_64_GOT32:
12125 case BFD_RELOC_X86_64_GOTPCREL:
12126 case BFD_RELOC_X86_64_GOTPCRELX:
12127 case BFD_RELOC_X86_64_REX_GOTPCRELX:
12128 case BFD_RELOC_X86_64_TLSGD:
12129 case BFD_RELOC_X86_64_TLSLD:
12130 case BFD_RELOC_X86_64_GOTTPOFF:
12131 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12132 case BFD_RELOC_X86_64_TLSDESC_CALL:
12133 rel->addend = fixp->fx_offset - fixp->fx_size;
12134 break;
12135 default:
12136 rel->addend = (section->vma
12137 - fixp->fx_size
12138 + fixp->fx_addnumber
12139 + md_pcrel_from (fixp));
12140 break;
12144 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
12145 if (rel->howto == NULL)
12147 as_bad_where (fixp->fx_file, fixp->fx_line,
12148 _("cannot represent relocation type %s"),
12149 bfd_get_reloc_code_name (code));
12150 /* Set howto to a garbage value so that we can keep going. */
12151 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
12152 gas_assert (rel->howto != NULL);
12155 return rel;
12158 #include "tc-i386-intel.c"
12160 void
12161 tc_x86_parse_to_dw2regnum (expressionS *exp)
12163 int saved_naked_reg;
12164 char saved_register_dot;
12166 saved_naked_reg = allow_naked_reg;
12167 allow_naked_reg = 1;
12168 saved_register_dot = register_chars['.'];
12169 register_chars['.'] = '.';
12170 allow_pseudo_reg = 1;
12171 expression_and_evaluate (exp);
12172 allow_pseudo_reg = 0;
12173 register_chars['.'] = saved_register_dot;
12174 allow_naked_reg = saved_naked_reg;
12176 if (exp->X_op == O_register && exp->X_add_number >= 0)
12178 if ((addressT) exp->X_add_number < i386_regtab_size)
12180 exp->X_op = O_constant;
12181 exp->X_add_number = i386_regtab[exp->X_add_number]
12182 .dw2_regnum[flag_code >> 1];
12184 else
12185 exp->X_op = O_illegal;
12189 void
12190 tc_x86_frame_initial_instructions (void)
12192 static unsigned int sp_regno[2];
12194 if (!sp_regno[flag_code >> 1])
12196 char *saved_input = input_line_pointer;
12197 char sp[][4] = {"esp", "rsp"};
12198 expressionS exp;
12200 input_line_pointer = sp[flag_code >> 1];
12201 tc_x86_parse_to_dw2regnum (&exp);
12202 gas_assert (exp.X_op == O_constant);
12203 sp_regno[flag_code >> 1] = exp.X_add_number;
12204 input_line_pointer = saved_input;
12207 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
12208 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
12212 x86_dwarf2_addr_size (void)
12214 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12215 if (x86_elf_abi == X86_64_X32_ABI)
12216 return 4;
12217 #endif
12218 return bfd_arch_bits_per_address (stdoutput) / 8;
12222 i386_elf_section_type (const char *str, size_t len)
12224 if (flag_code == CODE_64BIT
12225 && len == sizeof ("unwind") - 1
12226 && strncmp (str, "unwind", 6) == 0)
12227 return SHT_X86_64_UNWIND;
12229 return -1;
12232 #ifdef TE_SOLARIS
12233 void
12234 i386_solaris_fix_up_eh_frame (segT sec)
12236 if (flag_code == CODE_64BIT)
12237 elf_section_type (sec) = SHT_X86_64_UNWIND;
12239 #endif
12241 #ifdef TE_PE
12242 void
12243 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
12245 expressionS exp;
12247 exp.X_op = O_secrel;
12248 exp.X_add_symbol = symbol;
12249 exp.X_add_number = 0;
12250 emit_expr (&exp, size);
12252 #endif
12254 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12255 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
12257 bfd_vma
12258 x86_64_section_letter (int letter, const char **ptr_msg)
12260 if (flag_code == CODE_64BIT)
12262 if (letter == 'l')
12263 return SHF_X86_64_LARGE;
12265 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
12267 else
12268 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
12269 return -1;
12272 bfd_vma
12273 x86_64_section_word (char *str, size_t len)
12275 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
12276 return SHF_X86_64_LARGE;
12278 return -1;
12281 static void
12282 handle_large_common (int small ATTRIBUTE_UNUSED)
12284 if (flag_code != CODE_64BIT)
12286 s_comm_internal (0, elf_common_parse);
12287 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
12289 else
12291 static segT lbss_section;
12292 asection *saved_com_section_ptr = elf_com_section_ptr;
12293 asection *saved_bss_section = bss_section;
12295 if (lbss_section == NULL)
12297 flagword applicable;
12298 segT seg = now_seg;
12299 subsegT subseg = now_subseg;
12301 /* The .lbss section is for local .largecomm symbols. */
12302 lbss_section = subseg_new (".lbss", 0);
12303 applicable = bfd_applicable_section_flags (stdoutput);
12304 bfd_set_section_flags (stdoutput, lbss_section,
12305 applicable & SEC_ALLOC);
12306 seg_info (lbss_section)->bss = 1;
12308 subseg_set (seg, subseg);
12311 elf_com_section_ptr = &_bfd_elf_large_com_section;
12312 bss_section = lbss_section;
12314 s_comm_internal (0, elf_common_parse);
12316 elf_com_section_ptr = saved_com_section_ptr;
12317 bss_section = saved_bss_section;
12320 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */