* config/tc-xtensa.c (xg_translate_sysreg_op): Remove has_underbar
[binutils.git] / gas / config / tc-i386.c
blobf42a9a4705b23b68e71c53f2ea419cc3686092ed
1 /* i386.c -- Assemble code for the Intel 80386
2 Copyright 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999,
3 2000, 2001, 2002, 2003, 2004, 2005, 2006
4 Free Software Foundation, Inc.
6 This file is part of GAS, the GNU Assembler.
8 GAS is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 2, or (at your option)
11 any later version.
13 GAS is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GAS; see the file COPYING. If not, write to the Free
20 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
21 02110-1301, USA. */
23 /* Intel 80386 machine specific gas.
24 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
25 x86_64 support by Jan Hubicka (jh@suse.cz)
26 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
27 Bugs & suggestions are completely welcome. This is free software.
28 Please help us make it better. */
30 #include "as.h"
31 #include "safe-ctype.h"
32 #include "subsegs.h"
33 #include "dwarf2dbg.h"
34 #include "dw2gencfi.h"
35 #include "opcode/i386.h"
36 #include "elf/x86-64.h"
38 #ifndef REGISTER_WARNINGS
39 #define REGISTER_WARNINGS 1
40 #endif
42 #ifndef INFER_ADDR_PREFIX
43 #define INFER_ADDR_PREFIX 1
44 #endif
46 #ifndef SCALE1_WHEN_NO_INDEX
47 /* Specifying a scale factor besides 1 when there is no index is
48 futile. eg. `mov (%ebx,2),%al' does exactly the same as
49 `mov (%ebx),%al'. To slavishly follow what the programmer
50 specified, set SCALE1_WHEN_NO_INDEX to 0. */
51 #define SCALE1_WHEN_NO_INDEX 1
52 #endif
54 #ifndef DEFAULT_ARCH
55 #define DEFAULT_ARCH "i386"
56 #endif
58 #ifndef INLINE
59 #if __GNUC__ >= 2
60 #define INLINE __inline__
61 #else
62 #define INLINE
63 #endif
64 #endif
66 static INLINE unsigned int mode_from_disp_size PARAMS ((unsigned int));
67 static INLINE int fits_in_signed_byte PARAMS ((offsetT));
68 static INLINE int fits_in_unsigned_byte PARAMS ((offsetT));
69 static INLINE int fits_in_unsigned_word PARAMS ((offsetT));
70 static INLINE int fits_in_signed_word PARAMS ((offsetT));
71 static INLINE int fits_in_unsigned_long PARAMS ((offsetT));
72 static INLINE int fits_in_signed_long PARAMS ((offsetT));
73 static int smallest_imm_type PARAMS ((offsetT));
74 static offsetT offset_in_range PARAMS ((offsetT, int));
75 static int add_prefix PARAMS ((unsigned int));
76 static void set_code_flag PARAMS ((int));
77 static void set_16bit_gcc_code_flag PARAMS ((int));
78 static void set_intel_syntax PARAMS ((int));
79 static void set_cpu_arch PARAMS ((int));
80 #ifdef TE_PE
81 static void pe_directive_secrel PARAMS ((int));
82 #endif
83 static void signed_cons PARAMS ((int));
84 static char *output_invalid PARAMS ((int c));
85 static int i386_operand PARAMS ((char *operand_string));
86 static int i386_intel_operand PARAMS ((char *operand_string, int got_a_float));
87 static const reg_entry *parse_register PARAMS ((char *reg_string,
88 char **end_op));
89 static char *parse_insn PARAMS ((char *, char *));
90 static char *parse_operands PARAMS ((char *, const char *));
91 static void swap_operands PARAMS ((void));
92 static void optimize_imm PARAMS ((void));
93 static void optimize_disp PARAMS ((void));
94 static int match_template PARAMS ((void));
95 static int check_string PARAMS ((void));
96 static int process_suffix PARAMS ((void));
97 static int check_byte_reg PARAMS ((void));
98 static int check_long_reg PARAMS ((void));
99 static int check_qword_reg PARAMS ((void));
100 static int check_word_reg PARAMS ((void));
101 static int finalize_imm PARAMS ((void));
102 static int process_operands PARAMS ((void));
103 static const seg_entry *build_modrm_byte PARAMS ((void));
104 static void output_insn PARAMS ((void));
105 static void output_branch PARAMS ((void));
106 static void output_jump PARAMS ((void));
107 static void output_interseg_jump PARAMS ((void));
108 static void output_imm PARAMS ((fragS *insn_start_frag,
109 offsetT insn_start_off));
110 static void output_disp PARAMS ((fragS *insn_start_frag,
111 offsetT insn_start_off));
112 #ifndef I386COFF
113 static void s_bss PARAMS ((int));
114 #endif
115 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
116 static void handle_large_common (int small ATTRIBUTE_UNUSED);
117 #endif
119 static const char *default_arch = DEFAULT_ARCH;
121 /* 'md_assemble ()' gathers together information and puts it into a
122 i386_insn. */
124 union i386_op
126 expressionS *disps;
127 expressionS *imms;
128 const reg_entry *regs;
131 struct _i386_insn
133 /* TM holds the template for the insn were currently assembling. */
134 template tm;
136 /* SUFFIX holds the instruction mnemonic suffix if given.
137 (e.g. 'l' for 'movl') */
138 char suffix;
140 /* OPERANDS gives the number of given operands. */
141 unsigned int operands;
143 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
144 of given register, displacement, memory operands and immediate
145 operands. */
146 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
148 /* TYPES [i] is the type (see above #defines) which tells us how to
149 use OP[i] for the corresponding operand. */
150 unsigned int types[MAX_OPERANDS];
152 /* Displacement expression, immediate expression, or register for each
153 operand. */
154 union i386_op op[MAX_OPERANDS];
156 /* Flags for operands. */
157 unsigned int flags[MAX_OPERANDS];
158 #define Operand_PCrel 1
160 /* Relocation type for operand */
161 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
163 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
164 the base index byte below. */
165 const reg_entry *base_reg;
166 const reg_entry *index_reg;
167 unsigned int log2_scale_factor;
169 /* SEG gives the seg_entries of this insn. They are zero unless
170 explicit segment overrides are given. */
171 const seg_entry *seg[2];
173 /* PREFIX holds all the given prefix opcodes (usually null).
174 PREFIXES is the number of prefix opcodes. */
175 unsigned int prefixes;
176 unsigned char prefix[MAX_PREFIXES];
178 /* RM and SIB are the modrm byte and the sib byte where the
179 addressing modes of this insn are encoded. */
181 modrm_byte rm;
182 rex_byte rex;
183 sib_byte sib;
186 typedef struct _i386_insn i386_insn;
188 /* List of chars besides those in app.c:symbol_chars that can start an
189 operand. Used to prevent the scrubber eating vital white-space. */
190 const char extra_symbol_chars[] = "*%-(["
191 #ifdef LEX_AT
193 #endif
194 #ifdef LEX_QM
196 #endif
199 #if (defined (TE_I386AIX) \
200 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
201 && !defined (TE_GNU) \
202 && !defined (TE_LINUX) \
203 && !defined (TE_NETWARE) \
204 && !defined (TE_FreeBSD) \
205 && !defined (TE_NetBSD)))
206 /* This array holds the chars that always start a comment. If the
207 pre-processor is disabled, these aren't very useful. The option
208 --divide will remove '/' from this list. */
209 const char *i386_comment_chars = "#/";
210 #define SVR4_COMMENT_CHARS 1
211 #define PREFIX_SEPARATOR '\\'
213 #else
214 const char *i386_comment_chars = "#";
215 #define PREFIX_SEPARATOR '/'
216 #endif
218 /* This array holds the chars that only start a comment at the beginning of
219 a line. If the line seems to have the form '# 123 filename'
220 .line and .file directives will appear in the pre-processed output.
221 Note that input_file.c hand checks for '#' at the beginning of the
222 first line of the input file. This is because the compiler outputs
223 #NO_APP at the beginning of its output.
224 Also note that comments started like this one will always work if
225 '/' isn't otherwise defined. */
226 const char line_comment_chars[] = "#/";
228 const char line_separator_chars[] = ";";
230 /* Chars that can be used to separate mant from exp in floating point
231 nums. */
232 const char EXP_CHARS[] = "eE";
234 /* Chars that mean this number is a floating point constant
235 As in 0f12.456
236 or 0d1.2345e12. */
237 const char FLT_CHARS[] = "fFdDxX";
239 /* Tables for lexical analysis. */
240 static char mnemonic_chars[256];
241 static char register_chars[256];
242 static char operand_chars[256];
243 static char identifier_chars[256];
244 static char digit_chars[256];
246 /* Lexical macros. */
247 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
248 #define is_operand_char(x) (operand_chars[(unsigned char) x])
249 #define is_register_char(x) (register_chars[(unsigned char) x])
250 #define is_space_char(x) ((x) == ' ')
251 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
252 #define is_digit_char(x) (digit_chars[(unsigned char) x])
254 /* All non-digit non-letter characters that may occur in an operand. */
255 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
257 /* md_assemble() always leaves the strings it's passed unaltered. To
258 effect this we maintain a stack of saved characters that we've smashed
259 with '\0's (indicating end of strings for various sub-fields of the
260 assembler instruction). */
261 static char save_stack[32];
262 static char *save_stack_p;
263 #define END_STRING_AND_SAVE(s) \
264 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
265 #define RESTORE_END_STRING(s) \
266 do { *(s) = *--save_stack_p; } while (0)
268 /* The instruction we're assembling. */
269 static i386_insn i;
271 /* Possible templates for current insn. */
272 static const templates *current_templates;
274 /* Per instruction expressionS buffers: 2 displacements & 2 immediate max. */
275 static expressionS disp_expressions[2], im_expressions[2];
277 /* Current operand we are working on. */
278 static int this_operand;
280 /* We support four different modes. FLAG_CODE variable is used to distinguish
281 these. */
283 enum flag_code {
284 CODE_32BIT,
285 CODE_16BIT,
286 CODE_64BIT };
287 #define NUM_FLAG_CODE ((int) CODE_64BIT + 1)
289 static enum flag_code flag_code;
290 static unsigned int object_64bit;
291 static int use_rela_relocations = 0;
293 /* The names used to print error messages. */
294 static const char *flag_code_names[] =
296 "32",
297 "16",
298 "64"
301 /* 1 for intel syntax,
302 0 if att syntax. */
303 static int intel_syntax = 0;
305 /* 1 if register prefix % not required. */
306 static int allow_naked_reg = 0;
308 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
309 leave, push, and pop instructions so that gcc has the same stack
310 frame as in 32 bit mode. */
311 static char stackop_size = '\0';
313 /* Non-zero to optimize code alignment. */
314 int optimize_align_code = 1;
316 /* Non-zero to quieten some warnings. */
317 static int quiet_warnings = 0;
319 /* CPU name. */
320 static const char *cpu_arch_name = NULL;
321 static const char *cpu_sub_arch_name = NULL;
323 /* CPU feature flags. */
324 static unsigned int cpu_arch_flags = CpuUnknownFlags | CpuNo64;
326 /* If set, conditional jumps are not automatically promoted to handle
327 larger than a byte offset. */
328 static unsigned int no_cond_jump_promotion = 0;
330 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
331 static symbolS *GOT_symbol;
333 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
334 unsigned int x86_dwarf2_return_column;
336 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
337 int x86_cie_data_alignment;
339 /* Interface to relax_segment.
340 There are 3 major relax states for 386 jump insns because the
341 different types of jumps add different sizes to frags when we're
342 figuring out what sort of jump to choose to reach a given label. */
344 /* Types. */
345 #define UNCOND_JUMP 0
346 #define COND_JUMP 1
347 #define COND_JUMP86 2
349 /* Sizes. */
350 #define CODE16 1
351 #define SMALL 0
352 #define SMALL16 (SMALL | CODE16)
353 #define BIG 2
354 #define BIG16 (BIG | CODE16)
356 #ifndef INLINE
357 #ifdef __GNUC__
358 #define INLINE __inline__
359 #else
360 #define INLINE
361 #endif
362 #endif
364 #define ENCODE_RELAX_STATE(type, size) \
365 ((relax_substateT) (((type) << 2) | (size)))
366 #define TYPE_FROM_RELAX_STATE(s) \
367 ((s) >> 2)
368 #define DISP_SIZE_FROM_RELAX_STATE(s) \
369 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
371 /* This table is used by relax_frag to promote short jumps to long
372 ones where necessary. SMALL (short) jumps may be promoted to BIG
373 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
374 don't allow a short jump in a 32 bit code segment to be promoted to
375 a 16 bit offset jump because it's slower (requires data size
376 prefix), and doesn't work, unless the destination is in the bottom
377 64k of the code segment (The top 16 bits of eip are zeroed). */
379 const relax_typeS md_relax_table[] =
381 /* The fields are:
382 1) most positive reach of this state,
383 2) most negative reach of this state,
384 3) how many bytes this mode will have in the variable part of the frag
385 4) which index into the table to try if we can't fit into this one. */
387 /* UNCOND_JUMP states. */
388 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
389 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
390 /* dword jmp adds 4 bytes to frag:
391 0 extra opcode bytes, 4 displacement bytes. */
392 {0, 0, 4, 0},
393 /* word jmp adds 2 byte2 to frag:
394 0 extra opcode bytes, 2 displacement bytes. */
395 {0, 0, 2, 0},
397 /* COND_JUMP states. */
398 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
399 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
400 /* dword conditionals adds 5 bytes to frag:
401 1 extra opcode byte, 4 displacement bytes. */
402 {0, 0, 5, 0},
403 /* word conditionals add 3 bytes to frag:
404 1 extra opcode byte, 2 displacement bytes. */
405 {0, 0, 3, 0},
407 /* COND_JUMP86 states. */
408 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
409 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
410 /* dword conditionals adds 5 bytes to frag:
411 1 extra opcode byte, 4 displacement bytes. */
412 {0, 0, 5, 0},
413 /* word conditionals add 4 bytes to frag:
414 1 displacement byte and a 3 byte long branch insn. */
415 {0, 0, 4, 0}
418 static const arch_entry cpu_arch[] = {
419 {"i8086", Cpu086 },
420 {"i186", Cpu086|Cpu186 },
421 {"i286", Cpu086|Cpu186|Cpu286 },
422 {"i386", Cpu086|Cpu186|Cpu286|Cpu386 },
423 {"i486", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486 },
424 {"i586", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586 },
425 {"i686", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686 },
426 {"pentium", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586 },
427 {"pentiumpro",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686 },
428 {"pentiumii", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuMMX },
429 {"pentiumiii",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuMMX|CpuMMX2|CpuSSE },
430 {"pentium4", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuP4|CpuMMX|CpuMMX2|CpuSSE|CpuSSE2 },
431 {"prescott", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuP4|CpuMMX|CpuMMX2|CpuSSE|CpuSSE2|CpuPNI },
432 {"k6", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|CpuK6|CpuMMX },
433 {"k6_2", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|CpuK6|CpuMMX|Cpu3dnow },
434 {"athlon", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA },
435 {"sledgehammer",Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuSledgehammer|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA|CpuSSE|CpuSSE2 },
436 {"opteron", Cpu086|Cpu186|Cpu286|Cpu386|Cpu486|Cpu586|Cpu686|CpuK6|CpuAthlon|CpuSledgehammer|CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA|CpuSSE|CpuSSE2 },
437 {".mmx", CpuMMX },
438 {".sse", CpuMMX|CpuMMX2|CpuSSE },
439 {".sse2", CpuMMX|CpuMMX2|CpuSSE|CpuSSE2 },
440 {".sse3", CpuMMX|CpuMMX2|CpuSSE|CpuSSE2|CpuSSE3 },
441 {".3dnow", CpuMMX|Cpu3dnow },
442 {".3dnowa", CpuMMX|CpuMMX2|Cpu3dnow|Cpu3dnowA },
443 {".padlock", CpuPadLock },
444 {".pacifica", CpuSVME },
445 {".svme", CpuSVME },
446 {NULL, 0 }
449 const pseudo_typeS md_pseudo_table[] =
451 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
452 {"align", s_align_bytes, 0},
453 #else
454 {"align", s_align_ptwo, 0},
455 #endif
456 {"arch", set_cpu_arch, 0},
457 #ifndef I386COFF
458 {"bss", s_bss, 0},
459 #endif
460 {"ffloat", float_cons, 'f'},
461 {"dfloat", float_cons, 'd'},
462 {"tfloat", float_cons, 'x'},
463 {"value", cons, 2},
464 {"slong", signed_cons, 4},
465 {"noopt", s_ignore, 0},
466 {"optim", s_ignore, 0},
467 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
468 {"code16", set_code_flag, CODE_16BIT},
469 {"code32", set_code_flag, CODE_32BIT},
470 {"code64", set_code_flag, CODE_64BIT},
471 {"intel_syntax", set_intel_syntax, 1},
472 {"att_syntax", set_intel_syntax, 0},
473 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
474 {"largecomm", handle_large_common, 0},
475 #else
476 {"file", (void (*) PARAMS ((int))) dwarf2_directive_file, 0},
477 {"loc", dwarf2_directive_loc, 0},
478 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
479 #endif
480 #ifdef TE_PE
481 {"secrel32", pe_directive_secrel, 0},
482 #endif
483 {0, 0, 0}
486 /* For interface with expression (). */
487 extern char *input_line_pointer;
489 /* Hash table for instruction mnemonic lookup. */
490 static struct hash_control *op_hash;
492 /* Hash table for register lookup. */
493 static struct hash_control *reg_hash;
495 void
496 i386_align_code (fragP, count)
497 fragS *fragP;
498 int count;
500 /* Various efficient no-op patterns for aligning code labels.
501 Note: Don't try to assemble the instructions in the comments.
502 0L and 0w are not legal. */
503 static const char f32_1[] =
504 {0x90}; /* nop */
505 static const char f32_2[] =
506 {0x89,0xf6}; /* movl %esi,%esi */
507 static const char f32_3[] =
508 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
509 static const char f32_4[] =
510 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
511 static const char f32_5[] =
512 {0x90, /* nop */
513 0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
514 static const char f32_6[] =
515 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
516 static const char f32_7[] =
517 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
518 static const char f32_8[] =
519 {0x90, /* nop */
520 0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
521 static const char f32_9[] =
522 {0x89,0xf6, /* movl %esi,%esi */
523 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
524 static const char f32_10[] =
525 {0x8d,0x76,0x00, /* leal 0(%esi),%esi */
526 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
527 static const char f32_11[] =
528 {0x8d,0x74,0x26,0x00, /* leal 0(%esi,1),%esi */
529 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
530 static const char f32_12[] =
531 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
532 0x8d,0xbf,0x00,0x00,0x00,0x00}; /* leal 0L(%edi),%edi */
533 static const char f32_13[] =
534 {0x8d,0xb6,0x00,0x00,0x00,0x00, /* leal 0L(%esi),%esi */
535 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
536 static const char f32_14[] =
537 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00, /* leal 0L(%esi,1),%esi */
538 0x8d,0xbc,0x27,0x00,0x00,0x00,0x00}; /* leal 0L(%edi,1),%edi */
539 static const char f32_15[] =
540 {0xeb,0x0d,0x90,0x90,0x90,0x90,0x90, /* jmp .+15; lotsa nops */
541 0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90};
542 static const char f16_3[] =
543 {0x8d,0x74,0x00}; /* lea 0(%esi),%esi */
544 static const char f16_4[] =
545 {0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
546 static const char f16_5[] =
547 {0x90, /* nop */
548 0x8d,0xb4,0x00,0x00}; /* lea 0w(%si),%si */
549 static const char f16_6[] =
550 {0x89,0xf6, /* mov %si,%si */
551 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
552 static const char f16_7[] =
553 {0x8d,0x74,0x00, /* lea 0(%si),%si */
554 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
555 static const char f16_8[] =
556 {0x8d,0xb4,0x00,0x00, /* lea 0w(%si),%si */
557 0x8d,0xbd,0x00,0x00}; /* lea 0w(%di),%di */
558 static const char *const f32_patt[] = {
559 f32_1, f32_2, f32_3, f32_4, f32_5, f32_6, f32_7, f32_8,
560 f32_9, f32_10, f32_11, f32_12, f32_13, f32_14, f32_15
562 static const char *const f16_patt[] = {
563 f32_1, f32_2, f16_3, f16_4, f16_5, f16_6, f16_7, f16_8,
564 f32_15, f32_15, f32_15, f32_15, f32_15, f32_15, f32_15
567 if (count <= 0 || count > 15)
568 return;
570 /* The recommended way to pad 64bit code is to use NOPs preceded by
571 maximally four 0x66 prefixes. Balance the size of nops. */
572 if (flag_code == CODE_64BIT)
574 int i;
575 int nnops = (count + 3) / 4;
576 int len = count / nnops;
577 int remains = count - nnops * len;
578 int pos = 0;
580 for (i = 0; i < remains; i++)
582 memset (fragP->fr_literal + fragP->fr_fix + pos, 0x66, len);
583 fragP->fr_literal[fragP->fr_fix + pos + len] = 0x90;
584 pos += len + 1;
586 for (; i < nnops; i++)
588 memset (fragP->fr_literal + fragP->fr_fix + pos, 0x66, len - 1);
589 fragP->fr_literal[fragP->fr_fix + pos + len - 1] = 0x90;
590 pos += len;
593 else
594 if (flag_code == CODE_16BIT)
596 memcpy (fragP->fr_literal + fragP->fr_fix,
597 f16_patt[count - 1], count);
598 if (count > 8)
599 /* Adjust jump offset. */
600 fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
602 else
603 memcpy (fragP->fr_literal + fragP->fr_fix,
604 f32_patt[count - 1], count);
605 fragP->fr_var = count;
608 static INLINE unsigned int
609 mode_from_disp_size (t)
610 unsigned int t;
612 return (t & Disp8) ? 1 : (t & (Disp16 | Disp32 | Disp32S)) ? 2 : 0;
615 static INLINE int
616 fits_in_signed_byte (num)
617 offsetT num;
619 return (num >= -128) && (num <= 127);
622 static INLINE int
623 fits_in_unsigned_byte (num)
624 offsetT num;
626 return (num & 0xff) == num;
629 static INLINE int
630 fits_in_unsigned_word (num)
631 offsetT num;
633 return (num & 0xffff) == num;
636 static INLINE int
637 fits_in_signed_word (num)
638 offsetT num;
640 return (-32768 <= num) && (num <= 32767);
642 static INLINE int
643 fits_in_signed_long (num)
644 offsetT num ATTRIBUTE_UNUSED;
646 #ifndef BFD64
647 return 1;
648 #else
649 return (!(((offsetT) -1 << 31) & num)
650 || (((offsetT) -1 << 31) & num) == ((offsetT) -1 << 31));
651 #endif
652 } /* fits_in_signed_long() */
653 static INLINE int
654 fits_in_unsigned_long (num)
655 offsetT num ATTRIBUTE_UNUSED;
657 #ifndef BFD64
658 return 1;
659 #else
660 return (num & (((offsetT) 2 << 31) - 1)) == num;
661 #endif
662 } /* fits_in_unsigned_long() */
664 static int
665 smallest_imm_type (num)
666 offsetT num;
668 if (cpu_arch_flags != (Cpu086 | Cpu186 | Cpu286 | Cpu386 | Cpu486 | CpuNo64))
670 /* This code is disabled on the 486 because all the Imm1 forms
671 in the opcode table are slower on the i486. They're the
672 versions with the implicitly specified single-position
673 displacement, which has another syntax if you really want to
674 use that form. */
675 if (num == 1)
676 return Imm1 | Imm8 | Imm8S | Imm16 | Imm32 | Imm32S | Imm64;
678 return (fits_in_signed_byte (num)
679 ? (Imm8S | Imm8 | Imm16 | Imm32 | Imm32S | Imm64)
680 : fits_in_unsigned_byte (num)
681 ? (Imm8 | Imm16 | Imm32 | Imm32S | Imm64)
682 : (fits_in_signed_word (num) || fits_in_unsigned_word (num))
683 ? (Imm16 | Imm32 | Imm32S | Imm64)
684 : fits_in_signed_long (num)
685 ? (Imm32 | Imm32S | Imm64)
686 : fits_in_unsigned_long (num)
687 ? (Imm32 | Imm64)
688 : Imm64);
691 static offsetT
692 offset_in_range (val, size)
693 offsetT val;
694 int size;
696 addressT mask;
698 switch (size)
700 case 1: mask = ((addressT) 1 << 8) - 1; break;
701 case 2: mask = ((addressT) 1 << 16) - 1; break;
702 case 4: mask = ((addressT) 2 << 31) - 1; break;
703 #ifdef BFD64
704 case 8: mask = ((addressT) 2 << 63) - 1; break;
705 #endif
706 default: abort ();
709 /* If BFD64, sign extend val. */
710 if (!use_rela_relocations)
711 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
712 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
714 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
716 char buf1[40], buf2[40];
718 sprint_value (buf1, val);
719 sprint_value (buf2, val & mask);
720 as_warn (_("%s shortened to %s"), buf1, buf2);
722 return val & mask;
725 /* Returns 0 if attempting to add a prefix where one from the same
726 class already exists, 1 if non rep/repne added, 2 if rep/repne
727 added. */
728 static int
729 add_prefix (prefix)
730 unsigned int prefix;
732 int ret = 1;
733 unsigned int q;
735 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
736 && flag_code == CODE_64BIT)
738 if ((i.prefix[REX_PREFIX] & prefix & REX_MODE64)
739 || ((i.prefix[REX_PREFIX] & (REX_EXTX | REX_EXTY | REX_EXTZ))
740 && (prefix & (REX_EXTX | REX_EXTY | REX_EXTZ))))
741 ret = 0;
742 q = REX_PREFIX;
744 else
746 switch (prefix)
748 default:
749 abort ();
751 case CS_PREFIX_OPCODE:
752 case DS_PREFIX_OPCODE:
753 case ES_PREFIX_OPCODE:
754 case FS_PREFIX_OPCODE:
755 case GS_PREFIX_OPCODE:
756 case SS_PREFIX_OPCODE:
757 q = SEG_PREFIX;
758 break;
760 case REPNE_PREFIX_OPCODE:
761 case REPE_PREFIX_OPCODE:
762 ret = 2;
763 /* fall thru */
764 case LOCK_PREFIX_OPCODE:
765 q = LOCKREP_PREFIX;
766 break;
768 case FWAIT_OPCODE:
769 q = WAIT_PREFIX;
770 break;
772 case ADDR_PREFIX_OPCODE:
773 q = ADDR_PREFIX;
774 break;
776 case DATA_PREFIX_OPCODE:
777 q = DATA_PREFIX;
778 break;
780 if (i.prefix[q] != 0)
781 ret = 0;
784 if (ret)
786 if (!i.prefix[q])
787 ++i.prefixes;
788 i.prefix[q] |= prefix;
790 else
791 as_bad (_("same type of prefix used twice"));
793 return ret;
796 static void
797 set_code_flag (value)
798 int value;
800 flag_code = value;
801 cpu_arch_flags &= ~(Cpu64 | CpuNo64);
802 cpu_arch_flags |= (flag_code == CODE_64BIT ? Cpu64 : CpuNo64);
803 if (value == CODE_64BIT && !(cpu_arch_flags & CpuSledgehammer))
805 as_bad (_("64bit mode not supported on this CPU."));
807 if (value == CODE_32BIT && !(cpu_arch_flags & Cpu386))
809 as_bad (_("32bit mode not supported on this CPU."));
811 stackop_size = '\0';
814 static void
815 set_16bit_gcc_code_flag (new_code_flag)
816 int new_code_flag;
818 flag_code = new_code_flag;
819 cpu_arch_flags &= ~(Cpu64 | CpuNo64);
820 cpu_arch_flags |= (flag_code == CODE_64BIT ? Cpu64 : CpuNo64);
821 stackop_size = LONG_MNEM_SUFFIX;
824 static void
825 set_intel_syntax (syntax_flag)
826 int syntax_flag;
828 /* Find out if register prefixing is specified. */
829 int ask_naked_reg = 0;
831 SKIP_WHITESPACE ();
832 if (!is_end_of_line[(unsigned char) *input_line_pointer])
834 char *string = input_line_pointer;
835 int e = get_symbol_end ();
837 if (strcmp (string, "prefix") == 0)
838 ask_naked_reg = 1;
839 else if (strcmp (string, "noprefix") == 0)
840 ask_naked_reg = -1;
841 else
842 as_bad (_("bad argument to syntax directive."));
843 *input_line_pointer = e;
845 demand_empty_rest_of_line ();
847 intel_syntax = syntax_flag;
849 if (ask_naked_reg == 0)
850 allow_naked_reg = (intel_syntax
851 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
852 else
853 allow_naked_reg = (ask_naked_reg < 0);
855 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
856 identifier_chars['$'] = intel_syntax ? '$' : 0;
859 static void
860 set_cpu_arch (dummy)
861 int dummy ATTRIBUTE_UNUSED;
863 SKIP_WHITESPACE ();
865 if (!is_end_of_line[(unsigned char) *input_line_pointer])
867 char *string = input_line_pointer;
868 int e = get_symbol_end ();
869 int i;
871 for (i = 0; cpu_arch[i].name; i++)
873 if (strcmp (string, cpu_arch[i].name) == 0)
875 if (*string != '.')
877 cpu_arch_name = cpu_arch[i].name;
878 cpu_sub_arch_name = NULL;
879 cpu_arch_flags = (cpu_arch[i].flags
880 | (flag_code == CODE_64BIT ? Cpu64 : CpuNo64));
881 break;
883 if ((cpu_arch_flags | cpu_arch[i].flags) != cpu_arch_flags)
885 cpu_sub_arch_name = cpu_arch[i].name;
886 cpu_arch_flags |= cpu_arch[i].flags;
888 *input_line_pointer = e;
889 demand_empty_rest_of_line ();
890 return;
893 if (!cpu_arch[i].name)
894 as_bad (_("no such architecture: `%s'"), string);
896 *input_line_pointer = e;
898 else
899 as_bad (_("missing cpu architecture"));
901 no_cond_jump_promotion = 0;
902 if (*input_line_pointer == ','
903 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
905 char *string = ++input_line_pointer;
906 int e = get_symbol_end ();
908 if (strcmp (string, "nojumps") == 0)
909 no_cond_jump_promotion = 1;
910 else if (strcmp (string, "jumps") == 0)
912 else
913 as_bad (_("no such architecture modifier: `%s'"), string);
915 *input_line_pointer = e;
918 demand_empty_rest_of_line ();
921 unsigned long
922 i386_mach ()
924 if (!strcmp (default_arch, "x86_64"))
925 return bfd_mach_x86_64;
926 else if (!strcmp (default_arch, "i386"))
927 return bfd_mach_i386_i386;
928 else
929 as_fatal (_("Unknown architecture"));
932 void
933 md_begin ()
935 const char *hash_err;
937 /* Initialize op_hash hash table. */
938 op_hash = hash_new ();
941 const template *optab;
942 templates *core_optab;
944 /* Setup for loop. */
945 optab = i386_optab;
946 core_optab = (templates *) xmalloc (sizeof (templates));
947 core_optab->start = optab;
949 while (1)
951 ++optab;
952 if (optab->name == NULL
953 || strcmp (optab->name, (optab - 1)->name) != 0)
955 /* different name --> ship out current template list;
956 add to hash table; & begin anew. */
957 core_optab->end = optab;
958 hash_err = hash_insert (op_hash,
959 (optab - 1)->name,
960 (PTR) core_optab);
961 if (hash_err)
963 as_fatal (_("Internal Error: Can't hash %s: %s"),
964 (optab - 1)->name,
965 hash_err);
967 if (optab->name == NULL)
968 break;
969 core_optab = (templates *) xmalloc (sizeof (templates));
970 core_optab->start = optab;
975 /* Initialize reg_hash hash table. */
976 reg_hash = hash_new ();
978 const reg_entry *regtab;
980 for (regtab = i386_regtab;
981 regtab < i386_regtab + sizeof (i386_regtab) / sizeof (i386_regtab[0]);
982 regtab++)
984 hash_err = hash_insert (reg_hash, regtab->reg_name, (PTR) regtab);
985 if (hash_err)
986 as_fatal (_("Internal Error: Can't hash %s: %s"),
987 regtab->reg_name,
988 hash_err);
992 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
994 int c;
995 char *p;
997 for (c = 0; c < 256; c++)
999 if (ISDIGIT (c))
1001 digit_chars[c] = c;
1002 mnemonic_chars[c] = c;
1003 register_chars[c] = c;
1004 operand_chars[c] = c;
1006 else if (ISLOWER (c))
1008 mnemonic_chars[c] = c;
1009 register_chars[c] = c;
1010 operand_chars[c] = c;
1012 else if (ISUPPER (c))
1014 mnemonic_chars[c] = TOLOWER (c);
1015 register_chars[c] = mnemonic_chars[c];
1016 operand_chars[c] = c;
1019 if (ISALPHA (c) || ISDIGIT (c))
1020 identifier_chars[c] = c;
1021 else if (c >= 128)
1023 identifier_chars[c] = c;
1024 operand_chars[c] = c;
1028 #ifdef LEX_AT
1029 identifier_chars['@'] = '@';
1030 #endif
1031 #ifdef LEX_QM
1032 identifier_chars['?'] = '?';
1033 operand_chars['?'] = '?';
1034 #endif
1035 digit_chars['-'] = '-';
1036 mnemonic_chars['-'] = '-';
1037 identifier_chars['_'] = '_';
1038 identifier_chars['.'] = '.';
1040 for (p = operand_special_chars; *p != '\0'; p++)
1041 operand_chars[(unsigned char) *p] = *p;
1044 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1045 if (IS_ELF)
1047 record_alignment (text_section, 2);
1048 record_alignment (data_section, 2);
1049 record_alignment (bss_section, 2);
1051 #endif
1053 if (flag_code == CODE_64BIT)
1055 x86_dwarf2_return_column = 16;
1056 x86_cie_data_alignment = -8;
1058 else
1060 x86_dwarf2_return_column = 8;
1061 x86_cie_data_alignment = -4;
1065 void
1066 i386_print_statistics (file)
1067 FILE *file;
1069 hash_print_statistics (file, "i386 opcode", op_hash);
1070 hash_print_statistics (file, "i386 register", reg_hash);
1073 #ifdef DEBUG386
1075 /* Debugging routines for md_assemble. */
1076 static void pi PARAMS ((char *, i386_insn *));
1077 static void pte PARAMS ((template *));
1078 static void pt PARAMS ((unsigned int));
1079 static void pe PARAMS ((expressionS *));
1080 static void ps PARAMS ((symbolS *));
1082 static void
1083 pi (line, x)
1084 char *line;
1085 i386_insn *x;
1087 unsigned int i;
1089 fprintf (stdout, "%s: template ", line);
1090 pte (&x->tm);
1091 fprintf (stdout, " address: base %s index %s scale %x\n",
1092 x->base_reg ? x->base_reg->reg_name : "none",
1093 x->index_reg ? x->index_reg->reg_name : "none",
1094 x->log2_scale_factor);
1095 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
1096 x->rm.mode, x->rm.reg, x->rm.regmem);
1097 fprintf (stdout, " sib: base %x index %x scale %x\n",
1098 x->sib.base, x->sib.index, x->sib.scale);
1099 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
1100 (x->rex & REX_MODE64) != 0,
1101 (x->rex & REX_EXTX) != 0,
1102 (x->rex & REX_EXTY) != 0,
1103 (x->rex & REX_EXTZ) != 0);
1104 for (i = 0; i < x->operands; i++)
1106 fprintf (stdout, " #%d: ", i + 1);
1107 pt (x->types[i]);
1108 fprintf (stdout, "\n");
1109 if (x->types[i]
1110 & (Reg | SReg2 | SReg3 | Control | Debug | Test | RegMMX | RegXMM))
1111 fprintf (stdout, "%s\n", x->op[i].regs->reg_name);
1112 if (x->types[i] & Imm)
1113 pe (x->op[i].imms);
1114 if (x->types[i] & Disp)
1115 pe (x->op[i].disps);
1119 static void
1120 pte (t)
1121 template *t;
1123 unsigned int i;
1124 fprintf (stdout, " %d operands ", t->operands);
1125 fprintf (stdout, "opcode %x ", t->base_opcode);
1126 if (t->extension_opcode != None)
1127 fprintf (stdout, "ext %x ", t->extension_opcode);
1128 if (t->opcode_modifier & D)
1129 fprintf (stdout, "D");
1130 if (t->opcode_modifier & W)
1131 fprintf (stdout, "W");
1132 fprintf (stdout, "\n");
1133 for (i = 0; i < t->operands; i++)
1135 fprintf (stdout, " #%d type ", i + 1);
1136 pt (t->operand_types[i]);
1137 fprintf (stdout, "\n");
1141 static void
1142 pe (e)
1143 expressionS *e;
1145 fprintf (stdout, " operation %d\n", e->X_op);
1146 fprintf (stdout, " add_number %ld (%lx)\n",
1147 (long) e->X_add_number, (long) e->X_add_number);
1148 if (e->X_add_symbol)
1150 fprintf (stdout, " add_symbol ");
1151 ps (e->X_add_symbol);
1152 fprintf (stdout, "\n");
1154 if (e->X_op_symbol)
1156 fprintf (stdout, " op_symbol ");
1157 ps (e->X_op_symbol);
1158 fprintf (stdout, "\n");
1162 static void
1163 ps (s)
1164 symbolS *s;
1166 fprintf (stdout, "%s type %s%s",
1167 S_GET_NAME (s),
1168 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
1169 segment_name (S_GET_SEGMENT (s)));
1172 struct type_name
1174 unsigned int mask;
1175 char *tname;
1178 static const type_names[] =
1180 { Reg8, "r8" },
1181 { Reg16, "r16" },
1182 { Reg32, "r32" },
1183 { Reg64, "r64" },
1184 { Imm8, "i8" },
1185 { Imm8S, "i8s" },
1186 { Imm16, "i16" },
1187 { Imm32, "i32" },
1188 { Imm32S, "i32s" },
1189 { Imm64, "i64" },
1190 { Imm1, "i1" },
1191 { BaseIndex, "BaseIndex" },
1192 { Disp8, "d8" },
1193 { Disp16, "d16" },
1194 { Disp32, "d32" },
1195 { Disp32S, "d32s" },
1196 { Disp64, "d64" },
1197 { InOutPortReg, "InOutPortReg" },
1198 { ShiftCount, "ShiftCount" },
1199 { Control, "control reg" },
1200 { Test, "test reg" },
1201 { Debug, "debug reg" },
1202 { FloatReg, "FReg" },
1203 { FloatAcc, "FAcc" },
1204 { SReg2, "SReg2" },
1205 { SReg3, "SReg3" },
1206 { Acc, "Acc" },
1207 { JumpAbsolute, "Jump Absolute" },
1208 { RegMMX, "rMMX" },
1209 { RegXMM, "rXMM" },
1210 { EsSeg, "es" },
1211 { 0, "" }
1214 static void
1215 pt (t)
1216 unsigned int t;
1218 const struct type_name *ty;
1220 for (ty = type_names; ty->mask; ty++)
1221 if (t & ty->mask)
1222 fprintf (stdout, "%s, ", ty->tname);
1223 fflush (stdout);
1226 #endif /* DEBUG386 */
1228 static bfd_reloc_code_real_type
1229 reloc (unsigned int size,
1230 int pcrel,
1231 int sign,
1232 bfd_reloc_code_real_type other)
1234 if (other != NO_RELOC)
1236 reloc_howto_type *reloc;
1238 if (size == 8)
1239 switch (other)
1241 case BFD_RELOC_X86_64_TPOFF32:
1242 other = BFD_RELOC_X86_64_TPOFF64;
1243 break;
1244 case BFD_RELOC_X86_64_DTPOFF32:
1245 other = BFD_RELOC_X86_64_DTPOFF64;
1246 break;
1247 default:
1248 break;
1251 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
1252 if (size == 4 && flag_code != CODE_64BIT)
1253 sign = -1;
1255 reloc = bfd_reloc_type_lookup (stdoutput, other);
1256 if (!reloc)
1257 as_bad (_("unknown relocation (%u)"), other);
1258 else if (size != bfd_get_reloc_size (reloc))
1259 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
1260 bfd_get_reloc_size (reloc),
1261 size);
1262 else if (pcrel && !reloc->pc_relative)
1263 as_bad (_("non-pc-relative relocation for pc-relative field"));
1264 else if ((reloc->complain_on_overflow == complain_overflow_signed
1265 && !sign)
1266 || (reloc->complain_on_overflow == complain_overflow_unsigned
1267 && sign > 0))
1268 as_bad (_("relocated field and relocation type differ in signedness"));
1269 else
1270 return other;
1271 return NO_RELOC;
1274 if (pcrel)
1276 if (!sign)
1277 as_bad (_("there are no unsigned pc-relative relocations"));
1278 switch (size)
1280 case 1: return BFD_RELOC_8_PCREL;
1281 case 2: return BFD_RELOC_16_PCREL;
1282 case 4: return BFD_RELOC_32_PCREL;
1283 case 8: return BFD_RELOC_64_PCREL;
1285 as_bad (_("cannot do %u byte pc-relative relocation"), size);
1287 else
1289 if (sign > 0)
1290 switch (size)
1292 case 4: return BFD_RELOC_X86_64_32S;
1294 else
1295 switch (size)
1297 case 1: return BFD_RELOC_8;
1298 case 2: return BFD_RELOC_16;
1299 case 4: return BFD_RELOC_32;
1300 case 8: return BFD_RELOC_64;
1302 as_bad (_("cannot do %s %u byte relocation"),
1303 sign > 0 ? "signed" : "unsigned", size);
1306 abort ();
1307 return BFD_RELOC_NONE;
1310 /* Here we decide which fixups can be adjusted to make them relative to
1311 the beginning of the section instead of the symbol. Basically we need
1312 to make sure that the dynamic relocations are done correctly, so in
1313 some cases we force the original symbol to be used. */
1316 tc_i386_fix_adjustable (fixP)
1317 fixS *fixP ATTRIBUTE_UNUSED;
1319 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1320 if (!IS_ELF)
1321 return 1;
1323 /* Don't adjust pc-relative references to merge sections in 64-bit
1324 mode. */
1325 if (use_rela_relocations
1326 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
1327 && fixP->fx_pcrel)
1328 return 0;
1330 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
1331 and changed later by validate_fix. */
1332 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
1333 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
1334 return 0;
1336 /* adjust_reloc_syms doesn't know about the GOT. */
1337 if (fixP->fx_r_type == BFD_RELOC_386_GOTOFF
1338 || fixP->fx_r_type == BFD_RELOC_386_PLT32
1339 || fixP->fx_r_type == BFD_RELOC_386_GOT32
1340 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
1341 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
1342 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
1343 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
1344 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
1345 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
1346 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
1347 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
1348 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
1349 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
1350 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
1351 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
1352 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
1353 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
1354 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
1355 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
1356 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
1357 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
1358 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
1359 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
1360 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
1361 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
1362 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
1363 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
1364 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
1365 return 0;
1366 #endif
1367 return 1;
1370 static int intel_float_operand PARAMS ((const char *mnemonic));
1372 static int
1373 intel_float_operand (mnemonic)
1374 const char *mnemonic;
1376 /* Note that the value returned is meaningful only for opcodes with (memory)
1377 operands, hence the code here is free to improperly handle opcodes that
1378 have no operands (for better performance and smaller code). */
1380 if (mnemonic[0] != 'f')
1381 return 0; /* non-math */
1383 switch (mnemonic[1])
1385 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
1386 the fs segment override prefix not currently handled because no
1387 call path can make opcodes without operands get here */
1388 case 'i':
1389 return 2 /* integer op */;
1390 case 'l':
1391 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
1392 return 3; /* fldcw/fldenv */
1393 break;
1394 case 'n':
1395 if (mnemonic[2] != 'o' /* fnop */)
1396 return 3; /* non-waiting control op */
1397 break;
1398 case 'r':
1399 if (mnemonic[2] == 's')
1400 return 3; /* frstor/frstpm */
1401 break;
1402 case 's':
1403 if (mnemonic[2] == 'a')
1404 return 3; /* fsave */
1405 if (mnemonic[2] == 't')
1407 switch (mnemonic[3])
1409 case 'c': /* fstcw */
1410 case 'd': /* fstdw */
1411 case 'e': /* fstenv */
1412 case 's': /* fsts[gw] */
1413 return 3;
1416 break;
1417 case 'x':
1418 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
1419 return 0; /* fxsave/fxrstor are not really math ops */
1420 break;
1423 return 1;
1426 /* This is the guts of the machine-dependent assembler. LINE points to a
1427 machine dependent instruction. This function is supposed to emit
1428 the frags/bytes it assembles to. */
1430 void
1431 md_assemble (line)
1432 char *line;
1434 int j;
1435 char mnemonic[MAX_MNEM_SIZE];
1437 /* Initialize globals. */
1438 memset (&i, '\0', sizeof (i));
1439 for (j = 0; j < MAX_OPERANDS; j++)
1440 i.reloc[j] = NO_RELOC;
1441 memset (disp_expressions, '\0', sizeof (disp_expressions));
1442 memset (im_expressions, '\0', sizeof (im_expressions));
1443 save_stack_p = save_stack;
1445 /* First parse an instruction mnemonic & call i386_operand for the operands.
1446 We assume that the scrubber has arranged it so that line[0] is the valid
1447 start of a (possibly prefixed) mnemonic. */
1449 line = parse_insn (line, mnemonic);
1450 if (line == NULL)
1451 return;
1453 line = parse_operands (line, mnemonic);
1454 if (line == NULL)
1455 return;
1457 /* Now we've parsed the mnemonic into a set of templates, and have the
1458 operands at hand. */
1460 /* All intel opcodes have reversed operands except for "bound" and
1461 "enter". We also don't reverse intersegment "jmp" and "call"
1462 instructions with 2 immediate operands so that the immediate segment
1463 precedes the offset, as it does when in AT&T mode. "enter" and the
1464 intersegment "jmp" and "call" instructions are the only ones that
1465 have two immediate operands. */
1466 if (intel_syntax && i.operands > 1
1467 && (strcmp (mnemonic, "bound") != 0)
1468 && (strcmp (mnemonic, "invlpga") != 0)
1469 && !((i.types[0] & Imm) && (i.types[1] & Imm)))
1470 swap_operands ();
1472 if (i.imm_operands)
1473 optimize_imm ();
1475 /* Don't optimize displacement for movabs since it only takes 64bit
1476 displacement. */
1477 if (i.disp_operands
1478 && (flag_code != CODE_64BIT
1479 || strcmp (mnemonic, "movabs") != 0))
1480 optimize_disp ();
1482 /* Next, we find a template that matches the given insn,
1483 making sure the overlap of the given operands types is consistent
1484 with the template operand types. */
1486 if (!match_template ())
1487 return;
1489 if (intel_syntax)
1491 /* Undo SYSV386_COMPAT brokenness when in Intel mode. See i386.h */
1492 if (SYSV386_COMPAT
1493 && (i.tm.base_opcode & 0xfffffde0) == 0xdce0)
1494 i.tm.base_opcode ^= FloatR;
1496 /* Zap movzx and movsx suffix. The suffix may have been set from
1497 "word ptr" or "byte ptr" on the source operand, but we'll use
1498 the suffix later to choose the destination register. */
1499 if ((i.tm.base_opcode & ~9) == 0x0fb6)
1501 if (i.reg_operands < 2
1502 && !i.suffix
1503 && (~i.tm.opcode_modifier
1504 & (No_bSuf
1505 | No_wSuf
1506 | No_lSuf
1507 | No_sSuf
1508 | No_xSuf
1509 | No_qSuf)))
1510 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
1512 i.suffix = 0;
1516 if (i.tm.opcode_modifier & FWait)
1517 if (!add_prefix (FWAIT_OPCODE))
1518 return;
1520 /* Check string instruction segment overrides. */
1521 if ((i.tm.opcode_modifier & IsString) != 0 && i.mem_operands != 0)
1523 if (!check_string ())
1524 return;
1527 if (!process_suffix ())
1528 return;
1530 /* Make still unresolved immediate matches conform to size of immediate
1531 given in i.suffix. */
1532 if (!finalize_imm ())
1533 return;
1535 if (i.types[0] & Imm1)
1536 i.imm_operands = 0; /* kludge for shift insns. */
1537 if (i.types[0] & ImplicitRegister)
1538 i.reg_operands--;
1539 if (i.types[1] & ImplicitRegister)
1540 i.reg_operands--;
1541 if (i.types[2] & ImplicitRegister)
1542 i.reg_operands--;
1544 if (i.tm.opcode_modifier & ImmExt)
1546 expressionS *exp;
1548 if ((i.tm.cpu_flags & CpuPNI) && i.operands > 0)
1550 /* These Intel Prescott New Instructions have the fixed
1551 operands with an opcode suffix which is coded in the same
1552 place as an 8-bit immediate field would be. Here we check
1553 those operands and remove them afterwards. */
1554 unsigned int x;
1556 for (x = 0; x < i.operands; x++)
1557 if (i.op[x].regs->reg_num != x)
1558 as_bad (_("can't use register '%%%s' as operand %d in '%s'."),
1559 i.op[x].regs->reg_name, x + 1, i.tm.name);
1560 i.operands = 0;
1563 /* These AMD 3DNow! and Intel Katmai New Instructions have an
1564 opcode suffix which is coded in the same place as an 8-bit
1565 immediate field would be. Here we fake an 8-bit immediate
1566 operand from the opcode suffix stored in tm.extension_opcode. */
1568 assert (i.imm_operands == 0 && i.operands <= 2 && 2 < MAX_OPERANDS);
1570 exp = &im_expressions[i.imm_operands++];
1571 i.op[i.operands].imms = exp;
1572 i.types[i.operands++] = Imm8;
1573 exp->X_op = O_constant;
1574 exp->X_add_number = i.tm.extension_opcode;
1575 i.tm.extension_opcode = None;
1578 /* For insns with operands there are more diddles to do to the opcode. */
1579 if (i.operands)
1581 if (!process_operands ())
1582 return;
1584 else if (!quiet_warnings && (i.tm.opcode_modifier & Ugh) != 0)
1586 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
1587 as_warn (_("translating to `%sp'"), i.tm.name);
1590 /* Handle conversion of 'int $3' --> special int3 insn. */
1591 if (i.tm.base_opcode == INT_OPCODE && i.op[0].imms->X_add_number == 3)
1593 i.tm.base_opcode = INT3_OPCODE;
1594 i.imm_operands = 0;
1597 if ((i.tm.opcode_modifier & (Jump | JumpByte | JumpDword))
1598 && i.op[0].disps->X_op == O_constant)
1600 /* Convert "jmp constant" (and "call constant") to a jump (call) to
1601 the absolute address given by the constant. Since ix86 jumps and
1602 calls are pc relative, we need to generate a reloc. */
1603 i.op[0].disps->X_add_symbol = &abs_symbol;
1604 i.op[0].disps->X_op = O_symbol;
1607 if ((i.tm.opcode_modifier & Rex64) != 0)
1608 i.rex |= REX_MODE64;
1610 /* For 8 bit registers we need an empty rex prefix. Also if the
1611 instruction already has a prefix, we need to convert old
1612 registers to new ones. */
1614 if (((i.types[0] & Reg8) != 0
1615 && (i.op[0].regs->reg_flags & RegRex64) != 0)
1616 || ((i.types[1] & Reg8) != 0
1617 && (i.op[1].regs->reg_flags & RegRex64) != 0)
1618 || (((i.types[0] & Reg8) != 0 || (i.types[1] & Reg8) != 0)
1619 && i.rex != 0))
1621 int x;
1623 i.rex |= REX_OPCODE;
1624 for (x = 0; x < 2; x++)
1626 /* Look for 8 bit operand that uses old registers. */
1627 if ((i.types[x] & Reg8) != 0
1628 && (i.op[x].regs->reg_flags & RegRex64) == 0)
1630 /* In case it is "hi" register, give up. */
1631 if (i.op[x].regs->reg_num > 3)
1632 as_bad (_("can't encode register '%%%s' in an instruction requiring REX prefix."),
1633 i.op[x].regs->reg_name);
1635 /* Otherwise it is equivalent to the extended register.
1636 Since the encoding doesn't change this is merely
1637 cosmetic cleanup for debug output. */
1639 i.op[x].regs = i.op[x].regs + 8;
1644 if (i.rex != 0)
1645 add_prefix (REX_OPCODE | i.rex);
1647 /* We are ready to output the insn. */
1648 output_insn ();
1651 static char *
1652 parse_insn (line, mnemonic)
1653 char *line;
1654 char *mnemonic;
1656 char *l = line;
1657 char *token_start = l;
1658 char *mnem_p;
1659 int supported;
1660 const template *t;
1662 /* Non-zero if we found a prefix only acceptable with string insns. */
1663 const char *expecting_string_instruction = NULL;
1665 while (1)
1667 mnem_p = mnemonic;
1668 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
1670 mnem_p++;
1671 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
1673 as_bad (_("no such instruction: `%s'"), token_start);
1674 return NULL;
1676 l++;
1678 if (!is_space_char (*l)
1679 && *l != END_OF_INSN
1680 && (intel_syntax
1681 || (*l != PREFIX_SEPARATOR
1682 && *l != ',')))
1684 as_bad (_("invalid character %s in mnemonic"),
1685 output_invalid (*l));
1686 return NULL;
1688 if (token_start == l)
1690 if (!intel_syntax && *l == PREFIX_SEPARATOR)
1691 as_bad (_("expecting prefix; got nothing"));
1692 else
1693 as_bad (_("expecting mnemonic; got nothing"));
1694 return NULL;
1697 /* Look up instruction (or prefix) via hash table. */
1698 current_templates = hash_find (op_hash, mnemonic);
1700 if (*l != END_OF_INSN
1701 && (!is_space_char (*l) || l[1] != END_OF_INSN)
1702 && current_templates
1703 && (current_templates->start->opcode_modifier & IsPrefix))
1705 if (current_templates->start->cpu_flags
1706 & (flag_code != CODE_64BIT ? Cpu64 : CpuNo64))
1708 as_bad ((flag_code != CODE_64BIT
1709 ? _("`%s' is only supported in 64-bit mode")
1710 : _("`%s' is not supported in 64-bit mode")),
1711 current_templates->start->name);
1712 return NULL;
1714 /* If we are in 16-bit mode, do not allow addr16 or data16.
1715 Similarly, in 32-bit mode, do not allow addr32 or data32. */
1716 if ((current_templates->start->opcode_modifier & (Size16 | Size32))
1717 && flag_code != CODE_64BIT
1718 && (((current_templates->start->opcode_modifier & Size32) != 0)
1719 ^ (flag_code == CODE_16BIT)))
1721 as_bad (_("redundant %s prefix"),
1722 current_templates->start->name);
1723 return NULL;
1725 /* Add prefix, checking for repeated prefixes. */
1726 switch (add_prefix (current_templates->start->base_opcode))
1728 case 0:
1729 return NULL;
1730 case 2:
1731 expecting_string_instruction = current_templates->start->name;
1732 break;
1734 /* Skip past PREFIX_SEPARATOR and reset token_start. */
1735 token_start = ++l;
1737 else
1738 break;
1741 if (!current_templates)
1743 /* See if we can get a match by trimming off a suffix. */
1744 switch (mnem_p[-1])
1746 case WORD_MNEM_SUFFIX:
1747 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
1748 i.suffix = SHORT_MNEM_SUFFIX;
1749 else
1750 case BYTE_MNEM_SUFFIX:
1751 case QWORD_MNEM_SUFFIX:
1752 i.suffix = mnem_p[-1];
1753 mnem_p[-1] = '\0';
1754 current_templates = hash_find (op_hash, mnemonic);
1755 break;
1756 case SHORT_MNEM_SUFFIX:
1757 case LONG_MNEM_SUFFIX:
1758 if (!intel_syntax)
1760 i.suffix = mnem_p[-1];
1761 mnem_p[-1] = '\0';
1762 current_templates = hash_find (op_hash, mnemonic);
1764 break;
1766 /* Intel Syntax. */
1767 case 'd':
1768 if (intel_syntax)
1770 if (intel_float_operand (mnemonic) == 1)
1771 i.suffix = SHORT_MNEM_SUFFIX;
1772 else
1773 i.suffix = LONG_MNEM_SUFFIX;
1774 mnem_p[-1] = '\0';
1775 current_templates = hash_find (op_hash, mnemonic);
1777 break;
1779 if (!current_templates)
1781 as_bad (_("no such instruction: `%s'"), token_start);
1782 return NULL;
1786 if (current_templates->start->opcode_modifier & (Jump | JumpByte))
1788 /* Check for a branch hint. We allow ",pt" and ",pn" for
1789 predict taken and predict not taken respectively.
1790 I'm not sure that branch hints actually do anything on loop
1791 and jcxz insns (JumpByte) for current Pentium4 chips. They
1792 may work in the future and it doesn't hurt to accept them
1793 now. */
1794 if (l[0] == ',' && l[1] == 'p')
1796 if (l[2] == 't')
1798 if (!add_prefix (DS_PREFIX_OPCODE))
1799 return NULL;
1800 l += 3;
1802 else if (l[2] == 'n')
1804 if (!add_prefix (CS_PREFIX_OPCODE))
1805 return NULL;
1806 l += 3;
1810 /* Any other comma loses. */
1811 if (*l == ',')
1813 as_bad (_("invalid character %s in mnemonic"),
1814 output_invalid (*l));
1815 return NULL;
1818 /* Check if instruction is supported on specified architecture. */
1819 supported = 0;
1820 for (t = current_templates->start; t < current_templates->end; ++t)
1822 if (!((t->cpu_flags & ~(Cpu64 | CpuNo64))
1823 & ~(cpu_arch_flags & ~(Cpu64 | CpuNo64))))
1824 supported |= 1;
1825 if (!(t->cpu_flags & (flag_code == CODE_64BIT ? CpuNo64 : Cpu64)))
1826 supported |= 2;
1828 if (!(supported & 2))
1830 as_bad (flag_code == CODE_64BIT
1831 ? _("`%s' is not supported in 64-bit mode")
1832 : _("`%s' is only supported in 64-bit mode"),
1833 current_templates->start->name);
1834 return NULL;
1836 if (!(supported & 1))
1838 as_warn (_("`%s' is not supported on `%s%s'"),
1839 current_templates->start->name,
1840 cpu_arch_name,
1841 cpu_sub_arch_name ? cpu_sub_arch_name : "");
1843 else if ((Cpu386 & ~cpu_arch_flags) && (flag_code != CODE_16BIT))
1845 as_warn (_("use .code16 to ensure correct addressing mode"));
1848 /* Check for rep/repne without a string instruction. */
1849 if (expecting_string_instruction)
1851 static templates override;
1853 for (t = current_templates->start; t < current_templates->end; ++t)
1854 if (t->opcode_modifier & IsString)
1855 break;
1856 if (t >= current_templates->end)
1858 as_bad (_("expecting string instruction after `%s'"),
1859 expecting_string_instruction);
1860 return NULL;
1862 for (override.start = t; t < current_templates->end; ++t)
1863 if (!(t->opcode_modifier & IsString))
1864 break;
1865 override.end = t;
1866 current_templates = &override;
1869 return l;
1872 static char *
1873 parse_operands (l, mnemonic)
1874 char *l;
1875 const char *mnemonic;
1877 char *token_start;
1879 /* 1 if operand is pending after ','. */
1880 unsigned int expecting_operand = 0;
1882 /* Non-zero if operand parens not balanced. */
1883 unsigned int paren_not_balanced;
1885 while (*l != END_OF_INSN)
1887 /* Skip optional white space before operand. */
1888 if (is_space_char (*l))
1889 ++l;
1890 if (!is_operand_char (*l) && *l != END_OF_INSN)
1892 as_bad (_("invalid character %s before operand %d"),
1893 output_invalid (*l),
1894 i.operands + 1);
1895 return NULL;
1897 token_start = l; /* after white space */
1898 paren_not_balanced = 0;
1899 while (paren_not_balanced || *l != ',')
1901 if (*l == END_OF_INSN)
1903 if (paren_not_balanced)
1905 if (!intel_syntax)
1906 as_bad (_("unbalanced parenthesis in operand %d."),
1907 i.operands + 1);
1908 else
1909 as_bad (_("unbalanced brackets in operand %d."),
1910 i.operands + 1);
1911 return NULL;
1913 else
1914 break; /* we are done */
1916 else if (!is_operand_char (*l) && !is_space_char (*l))
1918 as_bad (_("invalid character %s in operand %d"),
1919 output_invalid (*l),
1920 i.operands + 1);
1921 return NULL;
1923 if (!intel_syntax)
1925 if (*l == '(')
1926 ++paren_not_balanced;
1927 if (*l == ')')
1928 --paren_not_balanced;
1930 else
1932 if (*l == '[')
1933 ++paren_not_balanced;
1934 if (*l == ']')
1935 --paren_not_balanced;
1937 l++;
1939 if (l != token_start)
1940 { /* Yes, we've read in another operand. */
1941 unsigned int operand_ok;
1942 this_operand = i.operands++;
1943 if (i.operands > MAX_OPERANDS)
1945 as_bad (_("spurious operands; (%d operands/instruction max)"),
1946 MAX_OPERANDS);
1947 return NULL;
1949 /* Now parse operand adding info to 'i' as we go along. */
1950 END_STRING_AND_SAVE (l);
1952 if (intel_syntax)
1953 operand_ok =
1954 i386_intel_operand (token_start,
1955 intel_float_operand (mnemonic));
1956 else
1957 operand_ok = i386_operand (token_start);
1959 RESTORE_END_STRING (l);
1960 if (!operand_ok)
1961 return NULL;
1963 else
1965 if (expecting_operand)
1967 expecting_operand_after_comma:
1968 as_bad (_("expecting operand after ','; got nothing"));
1969 return NULL;
1971 if (*l == ',')
1973 as_bad (_("expecting operand before ','; got nothing"));
1974 return NULL;
1978 /* Now *l must be either ',' or END_OF_INSN. */
1979 if (*l == ',')
1981 if (*++l == END_OF_INSN)
1983 /* Just skip it, if it's \n complain. */
1984 goto expecting_operand_after_comma;
1986 expecting_operand = 1;
1989 return l;
1992 static void
1993 swap_operands ()
1995 union i386_op temp_op;
1996 unsigned int temp_type;
1997 enum bfd_reloc_code_real temp_reloc;
1998 int xchg1 = 0;
1999 int xchg2 = 0;
2001 if (i.operands == 2)
2003 xchg1 = 0;
2004 xchg2 = 1;
2006 else if (i.operands == 3)
2008 xchg1 = 0;
2009 xchg2 = 2;
2011 temp_type = i.types[xchg2];
2012 i.types[xchg2] = i.types[xchg1];
2013 i.types[xchg1] = temp_type;
2014 temp_op = i.op[xchg2];
2015 i.op[xchg2] = i.op[xchg1];
2016 i.op[xchg1] = temp_op;
2017 temp_reloc = i.reloc[xchg2];
2018 i.reloc[xchg2] = i.reloc[xchg1];
2019 i.reloc[xchg1] = temp_reloc;
2021 if (i.mem_operands == 2)
2023 const seg_entry *temp_seg;
2024 temp_seg = i.seg[0];
2025 i.seg[0] = i.seg[1];
2026 i.seg[1] = temp_seg;
2030 /* Try to ensure constant immediates are represented in the smallest
2031 opcode possible. */
2032 static void
2033 optimize_imm ()
2035 char guess_suffix = 0;
2036 int op;
2038 if (i.suffix)
2039 guess_suffix = i.suffix;
2040 else if (i.reg_operands)
2042 /* Figure out a suffix from the last register operand specified.
2043 We can't do this properly yet, ie. excluding InOutPortReg,
2044 but the following works for instructions with immediates.
2045 In any case, we can't set i.suffix yet. */
2046 for (op = i.operands; --op >= 0;)
2047 if (i.types[op] & Reg)
2049 if (i.types[op] & Reg8)
2050 guess_suffix = BYTE_MNEM_SUFFIX;
2051 else if (i.types[op] & Reg16)
2052 guess_suffix = WORD_MNEM_SUFFIX;
2053 else if (i.types[op] & Reg32)
2054 guess_suffix = LONG_MNEM_SUFFIX;
2055 else if (i.types[op] & Reg64)
2056 guess_suffix = QWORD_MNEM_SUFFIX;
2057 break;
2060 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
2061 guess_suffix = WORD_MNEM_SUFFIX;
2063 for (op = i.operands; --op >= 0;)
2064 if (i.types[op] & Imm)
2066 switch (i.op[op].imms->X_op)
2068 case O_constant:
2069 /* If a suffix is given, this operand may be shortened. */
2070 switch (guess_suffix)
2072 case LONG_MNEM_SUFFIX:
2073 i.types[op] |= Imm32 | Imm64;
2074 break;
2075 case WORD_MNEM_SUFFIX:
2076 i.types[op] |= Imm16 | Imm32S | Imm32 | Imm64;
2077 break;
2078 case BYTE_MNEM_SUFFIX:
2079 i.types[op] |= Imm16 | Imm8 | Imm8S | Imm32S | Imm32 | Imm64;
2080 break;
2083 /* If this operand is at most 16 bits, convert it
2084 to a signed 16 bit number before trying to see
2085 whether it will fit in an even smaller size.
2086 This allows a 16-bit operand such as $0xffe0 to
2087 be recognised as within Imm8S range. */
2088 if ((i.types[op] & Imm16)
2089 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
2091 i.op[op].imms->X_add_number =
2092 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
2094 if ((i.types[op] & Imm32)
2095 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
2096 == 0))
2098 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
2099 ^ ((offsetT) 1 << 31))
2100 - ((offsetT) 1 << 31));
2102 i.types[op] |= smallest_imm_type (i.op[op].imms->X_add_number);
2104 /* We must avoid matching of Imm32 templates when 64bit
2105 only immediate is available. */
2106 if (guess_suffix == QWORD_MNEM_SUFFIX)
2107 i.types[op] &= ~Imm32;
2108 break;
2110 case O_absent:
2111 case O_register:
2112 abort ();
2114 /* Symbols and expressions. */
2115 default:
2116 /* Convert symbolic operand to proper sizes for matching, but don't
2117 prevent matching a set of insns that only supports sizes other
2118 than those matching the insn suffix. */
2120 unsigned int mask, allowed = 0;
2121 const template *t;
2123 for (t = current_templates->start; t < current_templates->end; ++t)
2124 allowed |= t->operand_types[op];
2125 switch (guess_suffix)
2127 case QWORD_MNEM_SUFFIX:
2128 mask = Imm64 | Imm32S;
2129 break;
2130 case LONG_MNEM_SUFFIX:
2131 mask = Imm32;
2132 break;
2133 case WORD_MNEM_SUFFIX:
2134 mask = Imm16;
2135 break;
2136 case BYTE_MNEM_SUFFIX:
2137 mask = Imm8;
2138 break;
2139 default:
2140 mask = 0;
2141 break;
2143 if (mask & allowed)
2144 i.types[op] &= mask;
2146 break;
2151 /* Try to use the smallest displacement type too. */
2152 static void
2153 optimize_disp ()
2155 int op;
2157 for (op = i.operands; --op >= 0;)
2158 if (i.types[op] & Disp)
2160 if (i.op[op].disps->X_op == O_constant)
2162 offsetT disp = i.op[op].disps->X_add_number;
2164 if ((i.types[op] & Disp16)
2165 && (disp & ~(offsetT) 0xffff) == 0)
2167 /* If this operand is at most 16 bits, convert
2168 to a signed 16 bit number and don't use 64bit
2169 displacement. */
2170 disp = (((disp & 0xffff) ^ 0x8000) - 0x8000);
2171 i.types[op] &= ~Disp64;
2173 if ((i.types[op] & Disp32)
2174 && (disp & ~(((offsetT) 2 << 31) - 1)) == 0)
2176 /* If this operand is at most 32 bits, convert
2177 to a signed 32 bit number and don't use 64bit
2178 displacement. */
2179 disp &= (((offsetT) 2 << 31) - 1);
2180 disp = (disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
2181 i.types[op] &= ~Disp64;
2183 if (!disp && (i.types[op] & BaseIndex))
2185 i.types[op] &= ~Disp;
2186 i.op[op].disps = 0;
2187 i.disp_operands--;
2189 else if (flag_code == CODE_64BIT)
2191 if (fits_in_signed_long (disp))
2193 i.types[op] &= ~Disp64;
2194 i.types[op] |= Disp32S;
2196 if (fits_in_unsigned_long (disp))
2197 i.types[op] |= Disp32;
2199 if ((i.types[op] & (Disp32 | Disp32S | Disp16))
2200 && fits_in_signed_byte (disp))
2201 i.types[op] |= Disp8;
2203 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
2204 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
2206 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
2207 i.op[op].disps, 0, i.reloc[op]);
2208 i.types[op] &= ~Disp;
2210 else
2211 /* We only support 64bit displacement on constants. */
2212 i.types[op] &= ~Disp64;
2216 static int
2217 match_template ()
2219 /* Points to template once we've found it. */
2220 const template *t;
2221 unsigned int overlap0, overlap1, overlap2;
2222 unsigned int found_reverse_match;
2223 int suffix_check;
2225 #define MATCH(overlap, given, template) \
2226 ((overlap & ~JumpAbsolute) \
2227 && (((given) & (BaseIndex | JumpAbsolute)) \
2228 == ((overlap) & (BaseIndex | JumpAbsolute))))
2230 /* If given types r0 and r1 are registers they must be of the same type
2231 unless the expected operand type register overlap is null.
2232 Note that Acc in a template matches every size of reg. */
2233 #define CONSISTENT_REGISTER_MATCH(m0, g0, t0, m1, g1, t1) \
2234 (((g0) & Reg) == 0 || ((g1) & Reg) == 0 \
2235 || ((g0) & Reg) == ((g1) & Reg) \
2236 || ((((m0) & Acc) ? Reg : (t0)) & (((m1) & Acc) ? Reg : (t1)) & Reg) == 0 )
2238 overlap0 = 0;
2239 overlap1 = 0;
2240 overlap2 = 0;
2241 found_reverse_match = 0;
2242 suffix_check = (i.suffix == BYTE_MNEM_SUFFIX
2243 ? No_bSuf
2244 : (i.suffix == WORD_MNEM_SUFFIX
2245 ? No_wSuf
2246 : (i.suffix == SHORT_MNEM_SUFFIX
2247 ? No_sSuf
2248 : (i.suffix == LONG_MNEM_SUFFIX
2249 ? No_lSuf
2250 : (i.suffix == QWORD_MNEM_SUFFIX
2251 ? No_qSuf
2252 : (i.suffix == LONG_DOUBLE_MNEM_SUFFIX
2253 ? No_xSuf : 0))))));
2255 t = current_templates->start;
2256 if (i.suffix == QWORD_MNEM_SUFFIX
2257 && flag_code != CODE_64BIT
2258 && (intel_syntax
2259 ? !(t->opcode_modifier & IgnoreSize)
2260 && !intel_float_operand (t->name)
2261 : intel_float_operand (t->name) != 2)
2262 && (!(t->operand_types[0] & (RegMMX | RegXMM))
2263 || !(t->operand_types[t->operands > 1] & (RegMMX | RegXMM)))
2264 && (t->base_opcode != 0x0fc7
2265 || t->extension_opcode != 1 /* cmpxchg8b */))
2266 t = current_templates->end;
2267 for (; t < current_templates->end; t++)
2269 /* Must have right number of operands. */
2270 if (i.operands != t->operands)
2271 continue;
2273 /* Check the suffix, except for some instructions in intel mode. */
2274 if ((t->opcode_modifier & suffix_check)
2275 && !(intel_syntax
2276 && (t->opcode_modifier & IgnoreSize)))
2277 continue;
2279 /* Do not verify operands when there are none. */
2280 else if (!t->operands)
2282 if (t->cpu_flags & ~cpu_arch_flags)
2283 continue;
2284 /* We've found a match; break out of loop. */
2285 break;
2288 overlap0 = i.types[0] & t->operand_types[0];
2289 switch (t->operands)
2291 case 1:
2292 if (!MATCH (overlap0, i.types[0], t->operand_types[0]))
2293 continue;
2294 break;
2295 case 2:
2296 case 3:
2297 overlap1 = i.types[1] & t->operand_types[1];
2298 if (!MATCH (overlap0, i.types[0], t->operand_types[0])
2299 || !MATCH (overlap1, i.types[1], t->operand_types[1])
2300 /* monitor in SSE3 is a very special case. The first
2301 register and the second register may have differnet
2302 sizes. */
2303 || !((t->base_opcode == 0x0f01
2304 && t->extension_opcode == 0xc8)
2305 || CONSISTENT_REGISTER_MATCH (overlap0, i.types[0],
2306 t->operand_types[0],
2307 overlap1, i.types[1],
2308 t->operand_types[1])))
2310 /* Check if other direction is valid ... */
2311 if ((t->opcode_modifier & (D | FloatD)) == 0)
2312 continue;
2314 /* Try reversing direction of operands. */
2315 overlap0 = i.types[0] & t->operand_types[1];
2316 overlap1 = i.types[1] & t->operand_types[0];
2317 if (!MATCH (overlap0, i.types[0], t->operand_types[1])
2318 || !MATCH (overlap1, i.types[1], t->operand_types[0])
2319 || !CONSISTENT_REGISTER_MATCH (overlap0, i.types[0],
2320 t->operand_types[1],
2321 overlap1, i.types[1],
2322 t->operand_types[0]))
2324 /* Does not match either direction. */
2325 continue;
2327 /* found_reverse_match holds which of D or FloatDR
2328 we've found. */
2329 found_reverse_match = t->opcode_modifier & (D | FloatDR);
2331 /* Found a forward 2 operand match here. */
2332 else if (t->operands == 3)
2334 /* Here we make use of the fact that there are no
2335 reverse match 3 operand instructions, and all 3
2336 operand instructions only need to be checked for
2337 register consistency between operands 2 and 3. */
2338 overlap2 = i.types[2] & t->operand_types[2];
2339 if (!MATCH (overlap2, i.types[2], t->operand_types[2])
2340 || !CONSISTENT_REGISTER_MATCH (overlap1, i.types[1],
2341 t->operand_types[1],
2342 overlap2, i.types[2],
2343 t->operand_types[2]))
2345 continue;
2347 /* Found either forward/reverse 2 or 3 operand match here:
2348 slip through to break. */
2350 if (t->cpu_flags & ~cpu_arch_flags)
2352 found_reverse_match = 0;
2353 continue;
2355 /* We've found a match; break out of loop. */
2356 break;
2359 if (t == current_templates->end)
2361 /* We found no match. */
2362 as_bad (_("suffix or operands invalid for `%s'"),
2363 current_templates->start->name);
2364 return 0;
2367 if (!quiet_warnings)
2369 if (!intel_syntax
2370 && ((i.types[0] & JumpAbsolute)
2371 != (t->operand_types[0] & JumpAbsolute)))
2373 as_warn (_("indirect %s without `*'"), t->name);
2376 if ((t->opcode_modifier & (IsPrefix | IgnoreSize))
2377 == (IsPrefix | IgnoreSize))
2379 /* Warn them that a data or address size prefix doesn't
2380 affect assembly of the next line of code. */
2381 as_warn (_("stand-alone `%s' prefix"), t->name);
2385 /* Copy the template we found. */
2386 i.tm = *t;
2387 if (found_reverse_match)
2389 /* If we found a reverse match we must alter the opcode
2390 direction bit. found_reverse_match holds bits to change
2391 (different for int & float insns). */
2393 i.tm.base_opcode ^= found_reverse_match;
2395 i.tm.operand_types[0] = t->operand_types[1];
2396 i.tm.operand_types[1] = t->operand_types[0];
2399 return 1;
2402 static int
2403 check_string ()
2405 int mem_op = (i.types[0] & AnyMem) ? 0 : 1;
2406 if ((i.tm.operand_types[mem_op] & EsSeg) != 0)
2408 if (i.seg[0] != NULL && i.seg[0] != &es)
2410 as_bad (_("`%s' operand %d must use `%%es' segment"),
2411 i.tm.name,
2412 mem_op + 1);
2413 return 0;
2415 /* There's only ever one segment override allowed per instruction.
2416 This instruction possibly has a legal segment override on the
2417 second operand, so copy the segment to where non-string
2418 instructions store it, allowing common code. */
2419 i.seg[0] = i.seg[1];
2421 else if ((i.tm.operand_types[mem_op + 1] & EsSeg) != 0)
2423 if (i.seg[1] != NULL && i.seg[1] != &es)
2425 as_bad (_("`%s' operand %d must use `%%es' segment"),
2426 i.tm.name,
2427 mem_op + 2);
2428 return 0;
2431 return 1;
2434 static int
2435 process_suffix (void)
2437 /* If matched instruction specifies an explicit instruction mnemonic
2438 suffix, use it. */
2439 if (i.tm.opcode_modifier & (Size16 | Size32 | Size64))
2441 if (i.tm.opcode_modifier & Size16)
2442 i.suffix = WORD_MNEM_SUFFIX;
2443 else if (i.tm.opcode_modifier & Size64)
2444 i.suffix = QWORD_MNEM_SUFFIX;
2445 else
2446 i.suffix = LONG_MNEM_SUFFIX;
2448 else if (i.reg_operands)
2450 /* If there's no instruction mnemonic suffix we try to invent one
2451 based on register operands. */
2452 if (!i.suffix)
2454 /* We take i.suffix from the last register operand specified,
2455 Destination register type is more significant than source
2456 register type. */
2457 int op;
2459 for (op = i.operands; --op >= 0;)
2460 if ((i.types[op] & Reg)
2461 && !(i.tm.operand_types[op] & InOutPortReg))
2463 i.suffix = ((i.types[op] & Reg8) ? BYTE_MNEM_SUFFIX :
2464 (i.types[op] & Reg16) ? WORD_MNEM_SUFFIX :
2465 (i.types[op] & Reg64) ? QWORD_MNEM_SUFFIX :
2466 LONG_MNEM_SUFFIX);
2467 break;
2470 else if (i.suffix == BYTE_MNEM_SUFFIX)
2472 if (!check_byte_reg ())
2473 return 0;
2475 else if (i.suffix == LONG_MNEM_SUFFIX)
2477 if (!check_long_reg ())
2478 return 0;
2480 else if (i.suffix == QWORD_MNEM_SUFFIX)
2482 if (!check_qword_reg ())
2483 return 0;
2485 else if (i.suffix == WORD_MNEM_SUFFIX)
2487 if (!check_word_reg ())
2488 return 0;
2490 else if (intel_syntax && (i.tm.opcode_modifier & IgnoreSize))
2491 /* Do nothing if the instruction is going to ignore the prefix. */
2493 else
2494 abort ();
2496 else if ((i.tm.opcode_modifier & DefaultSize)
2497 && !i.suffix
2498 /* exclude fldenv/frstor/fsave/fstenv */
2499 && (i.tm.opcode_modifier & No_sSuf))
2501 i.suffix = stackop_size;
2503 else if (intel_syntax
2504 && !i.suffix
2505 && ((i.tm.operand_types[0] & JumpAbsolute)
2506 || (i.tm.opcode_modifier & (JumpByte|JumpInterSegment))
2507 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
2508 && i.tm.extension_opcode <= 3)))
2510 switch (flag_code)
2512 case CODE_64BIT:
2513 if (!(i.tm.opcode_modifier & No_qSuf))
2515 i.suffix = QWORD_MNEM_SUFFIX;
2516 break;
2518 case CODE_32BIT:
2519 if (!(i.tm.opcode_modifier & No_lSuf))
2520 i.suffix = LONG_MNEM_SUFFIX;
2521 break;
2522 case CODE_16BIT:
2523 if (!(i.tm.opcode_modifier & No_wSuf))
2524 i.suffix = WORD_MNEM_SUFFIX;
2525 break;
2529 if (!i.suffix)
2531 if (!intel_syntax)
2533 if (i.tm.opcode_modifier & W)
2535 as_bad (_("no instruction mnemonic suffix given and no register operands; can't size instruction"));
2536 return 0;
2539 else
2541 unsigned int suffixes = ~i.tm.opcode_modifier
2542 & (No_bSuf
2543 | No_wSuf
2544 | No_lSuf
2545 | No_sSuf
2546 | No_xSuf
2547 | No_qSuf);
2549 if ((i.tm.opcode_modifier & W)
2550 || ((suffixes & (suffixes - 1))
2551 && !(i.tm.opcode_modifier & (DefaultSize | IgnoreSize))))
2553 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
2554 return 0;
2559 /* Change the opcode based on the operand size given by i.suffix;
2560 We don't need to change things for byte insns. */
2562 if (i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
2564 /* It's not a byte, select word/dword operation. */
2565 if (i.tm.opcode_modifier & W)
2567 if (i.tm.opcode_modifier & ShortForm)
2568 i.tm.base_opcode |= 8;
2569 else
2570 i.tm.base_opcode |= 1;
2573 /* Now select between word & dword operations via the operand
2574 size prefix, except for instructions that will ignore this
2575 prefix anyway. */
2576 if (i.tm.base_opcode == 0x0f01 && i.tm.extension_opcode == 0xc8)
2578 /* monitor in SSE3 is a very special case. The default size
2579 of AX is the size of mode. The address size override
2580 prefix will change the size of AX. */
2581 if (i.op->regs[0].reg_type &
2582 (flag_code == CODE_32BIT ? Reg16 : Reg32))
2583 if (!add_prefix (ADDR_PREFIX_OPCODE))
2584 return 0;
2586 else if (i.suffix != QWORD_MNEM_SUFFIX
2587 && i.suffix != LONG_DOUBLE_MNEM_SUFFIX
2588 && !(i.tm.opcode_modifier & (IgnoreSize | FloatMF))
2589 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
2590 || (flag_code == CODE_64BIT
2591 && (i.tm.opcode_modifier & JumpByte))))
2593 unsigned int prefix = DATA_PREFIX_OPCODE;
2595 if (i.tm.opcode_modifier & JumpByte) /* jcxz, loop */
2596 prefix = ADDR_PREFIX_OPCODE;
2598 if (!add_prefix (prefix))
2599 return 0;
2602 /* Set mode64 for an operand. */
2603 if (i.suffix == QWORD_MNEM_SUFFIX
2604 && flag_code == CODE_64BIT
2605 && (i.tm.opcode_modifier & NoRex64) == 0)
2606 i.rex |= REX_MODE64;
2608 /* Size floating point instruction. */
2609 if (i.suffix == LONG_MNEM_SUFFIX)
2610 if (i.tm.opcode_modifier & FloatMF)
2611 i.tm.base_opcode ^= 4;
2614 return 1;
2617 static int
2618 check_byte_reg (void)
2620 int op;
2622 for (op = i.operands; --op >= 0;)
2624 /* If this is an eight bit register, it's OK. If it's the 16 or
2625 32 bit version of an eight bit register, we will just use the
2626 low portion, and that's OK too. */
2627 if (i.types[op] & Reg8)
2628 continue;
2630 /* movzx and movsx should not generate this warning. */
2631 if (intel_syntax
2632 && (i.tm.base_opcode == 0xfb7
2633 || i.tm.base_opcode == 0xfb6
2634 || i.tm.base_opcode == 0x63
2635 || i.tm.base_opcode == 0xfbe
2636 || i.tm.base_opcode == 0xfbf))
2637 continue;
2639 if ((i.types[op] & WordReg) && i.op[op].regs->reg_num < 4)
2641 /* Prohibit these changes in the 64bit mode, since the
2642 lowering is more complicated. */
2643 if (flag_code == CODE_64BIT
2644 && (i.tm.operand_types[op] & InOutPortReg) == 0)
2646 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2647 i.op[op].regs->reg_name,
2648 i.suffix);
2649 return 0;
2651 #if REGISTER_WARNINGS
2652 if (!quiet_warnings
2653 && (i.tm.operand_types[op] & InOutPortReg) == 0)
2654 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2655 (i.op[op].regs + (i.types[op] & Reg16
2656 ? REGNAM_AL - REGNAM_AX
2657 : REGNAM_AL - REGNAM_EAX))->reg_name,
2658 i.op[op].regs->reg_name,
2659 i.suffix);
2660 #endif
2661 continue;
2663 /* Any other register is bad. */
2664 if (i.types[op] & (Reg | RegMMX | RegXMM
2665 | SReg2 | SReg3
2666 | Control | Debug | Test
2667 | FloatReg | FloatAcc))
2669 as_bad (_("`%%%s' not allowed with `%s%c'"),
2670 i.op[op].regs->reg_name,
2671 i.tm.name,
2672 i.suffix);
2673 return 0;
2676 return 1;
2679 static int
2680 check_long_reg ()
2682 int op;
2684 for (op = i.operands; --op >= 0;)
2685 /* Reject eight bit registers, except where the template requires
2686 them. (eg. movzb) */
2687 if ((i.types[op] & Reg8) != 0
2688 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2690 as_bad (_("`%%%s' not allowed with `%s%c'"),
2691 i.op[op].regs->reg_name,
2692 i.tm.name,
2693 i.suffix);
2694 return 0;
2696 /* Warn if the e prefix on a general reg is missing. */
2697 else if ((!quiet_warnings || flag_code == CODE_64BIT)
2698 && (i.types[op] & Reg16) != 0
2699 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2701 /* Prohibit these changes in the 64bit mode, since the
2702 lowering is more complicated. */
2703 if (flag_code == CODE_64BIT)
2705 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2706 i.op[op].regs->reg_name,
2707 i.suffix);
2708 return 0;
2710 #if REGISTER_WARNINGS
2711 else
2712 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2713 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
2714 i.op[op].regs->reg_name,
2715 i.suffix);
2716 #endif
2718 /* Warn if the r prefix on a general reg is missing. */
2719 else if ((i.types[op] & Reg64) != 0
2720 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2722 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2723 i.op[op].regs->reg_name,
2724 i.suffix);
2725 return 0;
2727 return 1;
2730 static int
2731 check_qword_reg ()
2733 int op;
2735 for (op = i.operands; --op >= 0; )
2736 /* Reject eight bit registers, except where the template requires
2737 them. (eg. movzb) */
2738 if ((i.types[op] & Reg8) != 0
2739 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2741 as_bad (_("`%%%s' not allowed with `%s%c'"),
2742 i.op[op].regs->reg_name,
2743 i.tm.name,
2744 i.suffix);
2745 return 0;
2747 /* Warn if the e prefix on a general reg is missing. */
2748 else if (((i.types[op] & Reg16) != 0
2749 || (i.types[op] & Reg32) != 0)
2750 && (i.tm.operand_types[op] & (Reg32 | Acc)) != 0)
2752 /* Prohibit these changes in the 64bit mode, since the
2753 lowering is more complicated. */
2754 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2755 i.op[op].regs->reg_name,
2756 i.suffix);
2757 return 0;
2759 return 1;
2762 static int
2763 check_word_reg ()
2765 int op;
2766 for (op = i.operands; --op >= 0;)
2767 /* Reject eight bit registers, except where the template requires
2768 them. (eg. movzb) */
2769 if ((i.types[op] & Reg8) != 0
2770 && (i.tm.operand_types[op] & (Reg16 | Reg32 | Acc)) != 0)
2772 as_bad (_("`%%%s' not allowed with `%s%c'"),
2773 i.op[op].regs->reg_name,
2774 i.tm.name,
2775 i.suffix);
2776 return 0;
2778 /* Warn if the e prefix on a general reg is present. */
2779 else if ((!quiet_warnings || flag_code == CODE_64BIT)
2780 && (i.types[op] & Reg32) != 0
2781 && (i.tm.operand_types[op] & (Reg16 | Acc)) != 0)
2783 /* Prohibit these changes in the 64bit mode, since the
2784 lowering is more complicated. */
2785 if (flag_code == CODE_64BIT)
2787 as_bad (_("Incorrect register `%%%s' used with `%c' suffix"),
2788 i.op[op].regs->reg_name,
2789 i.suffix);
2790 return 0;
2792 else
2793 #if REGISTER_WARNINGS
2794 as_warn (_("using `%%%s' instead of `%%%s' due to `%c' suffix"),
2795 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
2796 i.op[op].regs->reg_name,
2797 i.suffix);
2798 #endif
2800 return 1;
2803 static int
2804 finalize_imm ()
2806 unsigned int overlap0, overlap1, overlap2;
2808 overlap0 = i.types[0] & i.tm.operand_types[0];
2809 if ((overlap0 & (Imm8 | Imm8S | Imm16 | Imm32 | Imm32S | Imm64))
2810 && overlap0 != Imm8 && overlap0 != Imm8S
2811 && overlap0 != Imm16 && overlap0 != Imm32S
2812 && overlap0 != Imm32 && overlap0 != Imm64)
2814 if (i.suffix)
2816 overlap0 &= (i.suffix == BYTE_MNEM_SUFFIX
2817 ? Imm8 | Imm8S
2818 : (i.suffix == WORD_MNEM_SUFFIX
2819 ? Imm16
2820 : (i.suffix == QWORD_MNEM_SUFFIX
2821 ? Imm64 | Imm32S
2822 : Imm32)));
2824 else if (overlap0 == (Imm16 | Imm32S | Imm32)
2825 || overlap0 == (Imm16 | Imm32)
2826 || overlap0 == (Imm16 | Imm32S))
2828 overlap0 = ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0)
2829 ? Imm16 : Imm32S);
2831 if (overlap0 != Imm8 && overlap0 != Imm8S
2832 && overlap0 != Imm16 && overlap0 != Imm32S
2833 && overlap0 != Imm32 && overlap0 != Imm64)
2835 as_bad (_("no instruction mnemonic suffix given; can't determine immediate size"));
2836 return 0;
2839 i.types[0] = overlap0;
2841 overlap1 = i.types[1] & i.tm.operand_types[1];
2842 if ((overlap1 & (Imm8 | Imm8S | Imm16 | Imm32S | Imm32 | Imm64))
2843 && overlap1 != Imm8 && overlap1 != Imm8S
2844 && overlap1 != Imm16 && overlap1 != Imm32S
2845 && overlap1 != Imm32 && overlap1 != Imm64)
2847 if (i.suffix)
2849 overlap1 &= (i.suffix == BYTE_MNEM_SUFFIX
2850 ? Imm8 | Imm8S
2851 : (i.suffix == WORD_MNEM_SUFFIX
2852 ? Imm16
2853 : (i.suffix == QWORD_MNEM_SUFFIX
2854 ? Imm64 | Imm32S
2855 : Imm32)));
2857 else if (overlap1 == (Imm16 | Imm32 | Imm32S)
2858 || overlap1 == (Imm16 | Imm32)
2859 || overlap1 == (Imm16 | Imm32S))
2861 overlap1 = ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0)
2862 ? Imm16 : Imm32S);
2864 if (overlap1 != Imm8 && overlap1 != Imm8S
2865 && overlap1 != Imm16 && overlap1 != Imm32S
2866 && overlap1 != Imm32 && overlap1 != Imm64)
2868 as_bad (_("no instruction mnemonic suffix given; can't determine immediate size %x %c"),overlap1, i.suffix);
2869 return 0;
2872 i.types[1] = overlap1;
2874 overlap2 = i.types[2] & i.tm.operand_types[2];
2875 assert ((overlap2 & Imm) == 0);
2876 i.types[2] = overlap2;
2878 return 1;
2881 static int
2882 process_operands ()
2884 /* Default segment register this instruction will use for memory
2885 accesses. 0 means unknown. This is only for optimizing out
2886 unnecessary segment overrides. */
2887 const seg_entry *default_seg = 0;
2889 /* The imul $imm, %reg instruction is converted into
2890 imul $imm, %reg, %reg, and the clr %reg instruction
2891 is converted into xor %reg, %reg. */
2892 if (i.tm.opcode_modifier & regKludge)
2894 unsigned int first_reg_op = (i.types[0] & Reg) ? 0 : 1;
2895 /* Pretend we saw the extra register operand. */
2896 assert (i.op[first_reg_op + 1].regs == 0);
2897 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
2898 i.types[first_reg_op + 1] = i.types[first_reg_op];
2899 i.reg_operands = 2;
2902 if (i.tm.opcode_modifier & ShortForm)
2904 /* The register or float register operand is in operand 0 or 1. */
2905 unsigned int op = (i.types[0] & (Reg | FloatReg)) ? 0 : 1;
2906 /* Register goes in low 3 bits of opcode. */
2907 i.tm.base_opcode |= i.op[op].regs->reg_num;
2908 if ((i.op[op].regs->reg_flags & RegRex) != 0)
2909 i.rex |= REX_EXTZ;
2910 if (!quiet_warnings && (i.tm.opcode_modifier & Ugh) != 0)
2912 /* Warn about some common errors, but press on regardless.
2913 The first case can be generated by gcc (<= 2.8.1). */
2914 if (i.operands == 2)
2916 /* Reversed arguments on faddp, fsubp, etc. */
2917 as_warn (_("translating to `%s %%%s,%%%s'"), i.tm.name,
2918 i.op[1].regs->reg_name,
2919 i.op[0].regs->reg_name);
2921 else
2923 /* Extraneous `l' suffix on fp insn. */
2924 as_warn (_("translating to `%s %%%s'"), i.tm.name,
2925 i.op[0].regs->reg_name);
2929 else if (i.tm.opcode_modifier & Modrm)
2931 /* The opcode is completed (modulo i.tm.extension_opcode which
2932 must be put into the modrm byte). Now, we make the modrm and
2933 index base bytes based on all the info we've collected. */
2935 default_seg = build_modrm_byte ();
2937 else if (i.tm.opcode_modifier & (Seg2ShortForm | Seg3ShortForm))
2939 if (i.tm.base_opcode == POP_SEG_SHORT
2940 && i.op[0].regs->reg_num == 1)
2942 as_bad (_("you can't `pop %%cs'"));
2943 return 0;
2945 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
2946 if ((i.op[0].regs->reg_flags & RegRex) != 0)
2947 i.rex |= REX_EXTZ;
2949 else if ((i.tm.base_opcode & ~(D | W)) == MOV_AX_DISP32)
2951 default_seg = &ds;
2953 else if ((i.tm.opcode_modifier & IsString) != 0)
2955 /* For the string instructions that allow a segment override
2956 on one of their operands, the default segment is ds. */
2957 default_seg = &ds;
2960 if ((i.tm.base_opcode == 0x8d /* lea */
2961 || (i.tm.cpu_flags & CpuSVME))
2962 && i.seg[0] && !quiet_warnings)
2963 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
2965 /* If a segment was explicitly specified, and the specified segment
2966 is not the default, use an opcode prefix to select it. If we
2967 never figured out what the default segment is, then default_seg
2968 will be zero at this point, and the specified segment prefix will
2969 always be used. */
2970 if ((i.seg[0]) && (i.seg[0] != default_seg))
2972 if (!add_prefix (i.seg[0]->seg_prefix))
2973 return 0;
2975 return 1;
2978 static const seg_entry *
2979 build_modrm_byte ()
2981 const seg_entry *default_seg = 0;
2983 /* i.reg_operands MUST be the number of real register operands;
2984 implicit registers do not count. */
2985 if (i.reg_operands == 2)
2987 unsigned int source, dest;
2988 source = ((i.types[0]
2989 & (Reg | RegMMX | RegXMM
2990 | SReg2 | SReg3
2991 | Control | Debug | Test))
2992 ? 0 : 1);
2993 dest = source + 1;
2995 i.rm.mode = 3;
2996 /* One of the register operands will be encoded in the i.tm.reg
2997 field, the other in the combined i.tm.mode and i.tm.regmem
2998 fields. If no form of this instruction supports a memory
2999 destination operand, then we assume the source operand may
3000 sometimes be a memory operand and so we need to store the
3001 destination in the i.rm.reg field. */
3002 if ((i.tm.operand_types[dest] & AnyMem) == 0)
3004 i.rm.reg = i.op[dest].regs->reg_num;
3005 i.rm.regmem = i.op[source].regs->reg_num;
3006 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
3007 i.rex |= REX_EXTX;
3008 if ((i.op[source].regs->reg_flags & RegRex) != 0)
3009 i.rex |= REX_EXTZ;
3011 else
3013 i.rm.reg = i.op[source].regs->reg_num;
3014 i.rm.regmem = i.op[dest].regs->reg_num;
3015 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
3016 i.rex |= REX_EXTZ;
3017 if ((i.op[source].regs->reg_flags & RegRex) != 0)
3018 i.rex |= REX_EXTX;
3020 if (flag_code != CODE_64BIT && (i.rex & (REX_EXTX | REX_EXTZ)))
3022 if (!((i.types[0] | i.types[1]) & Control))
3023 abort ();
3024 i.rex &= ~(REX_EXTX | REX_EXTZ);
3025 add_prefix (LOCK_PREFIX_OPCODE);
3028 else
3029 { /* If it's not 2 reg operands... */
3030 if (i.mem_operands)
3032 unsigned int fake_zero_displacement = 0;
3033 unsigned int op = ((i.types[0] & AnyMem)
3035 : (i.types[1] & AnyMem) ? 1 : 2);
3037 default_seg = &ds;
3039 if (i.base_reg == 0)
3041 i.rm.mode = 0;
3042 if (!i.disp_operands)
3043 fake_zero_displacement = 1;
3044 if (i.index_reg == 0)
3046 /* Operand is just <disp> */
3047 if (flag_code == CODE_64BIT)
3049 /* 64bit mode overwrites the 32bit absolute
3050 addressing by RIP relative addressing and
3051 absolute addressing is encoded by one of the
3052 redundant SIB forms. */
3053 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3054 i.sib.base = NO_BASE_REGISTER;
3055 i.sib.index = NO_INDEX_REGISTER;
3056 i.types[op] = ((i.prefix[ADDR_PREFIX] == 0) ? Disp32S : Disp32);
3058 else if ((flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0))
3060 i.rm.regmem = NO_BASE_REGISTER_16;
3061 i.types[op] = Disp16;
3063 else
3065 i.rm.regmem = NO_BASE_REGISTER;
3066 i.types[op] = Disp32;
3069 else /* !i.base_reg && i.index_reg */
3071 i.sib.index = i.index_reg->reg_num;
3072 i.sib.base = NO_BASE_REGISTER;
3073 i.sib.scale = i.log2_scale_factor;
3074 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3075 i.types[op] &= ~Disp;
3076 if (flag_code != CODE_64BIT)
3077 i.types[op] |= Disp32; /* Must be 32 bit */
3078 else
3079 i.types[op] |= Disp32S;
3080 if ((i.index_reg->reg_flags & RegRex) != 0)
3081 i.rex |= REX_EXTY;
3084 /* RIP addressing for 64bit mode. */
3085 else if (i.base_reg->reg_type == BaseIndex)
3087 i.rm.regmem = NO_BASE_REGISTER;
3088 i.types[op] &= ~ Disp;
3089 i.types[op] |= Disp32S;
3090 i.flags[op] = Operand_PCrel;
3091 if (! i.disp_operands)
3092 fake_zero_displacement = 1;
3094 else if (i.base_reg->reg_type & Reg16)
3096 switch (i.base_reg->reg_num)
3098 case 3: /* (%bx) */
3099 if (i.index_reg == 0)
3100 i.rm.regmem = 7;
3101 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
3102 i.rm.regmem = i.index_reg->reg_num - 6;
3103 break;
3104 case 5: /* (%bp) */
3105 default_seg = &ss;
3106 if (i.index_reg == 0)
3108 i.rm.regmem = 6;
3109 if ((i.types[op] & Disp) == 0)
3111 /* fake (%bp) into 0(%bp) */
3112 i.types[op] |= Disp8;
3113 fake_zero_displacement = 1;
3116 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
3117 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
3118 break;
3119 default: /* (%si) -> 4 or (%di) -> 5 */
3120 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
3122 i.rm.mode = mode_from_disp_size (i.types[op]);
3124 else /* i.base_reg and 32/64 bit mode */
3126 if (flag_code == CODE_64BIT
3127 && (i.types[op] & Disp))
3128 i.types[op] = (i.types[op] & Disp8) | (i.prefix[ADDR_PREFIX] == 0 ? Disp32S : Disp32);
3130 i.rm.regmem = i.base_reg->reg_num;
3131 if ((i.base_reg->reg_flags & RegRex) != 0)
3132 i.rex |= REX_EXTZ;
3133 i.sib.base = i.base_reg->reg_num;
3134 /* x86-64 ignores REX prefix bit here to avoid decoder
3135 complications. */
3136 if ((i.base_reg->reg_num & 7) == EBP_REG_NUM)
3138 default_seg = &ss;
3139 if (i.disp_operands == 0)
3141 fake_zero_displacement = 1;
3142 i.types[op] |= Disp8;
3145 else if (i.base_reg->reg_num == ESP_REG_NUM)
3147 default_seg = &ss;
3149 i.sib.scale = i.log2_scale_factor;
3150 if (i.index_reg == 0)
3152 /* <disp>(%esp) becomes two byte modrm with no index
3153 register. We've already stored the code for esp
3154 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
3155 Any base register besides %esp will not use the
3156 extra modrm byte. */
3157 i.sib.index = NO_INDEX_REGISTER;
3158 #if !SCALE1_WHEN_NO_INDEX
3159 /* Another case where we force the second modrm byte. */
3160 if (i.log2_scale_factor)
3161 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3162 #endif
3164 else
3166 i.sib.index = i.index_reg->reg_num;
3167 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
3168 if ((i.index_reg->reg_flags & RegRex) != 0)
3169 i.rex |= REX_EXTY;
3172 if (i.disp_operands
3173 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
3174 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
3175 i.rm.mode = 0;
3176 else
3177 i.rm.mode = mode_from_disp_size (i.types[op]);
3180 if (fake_zero_displacement)
3182 /* Fakes a zero displacement assuming that i.types[op]
3183 holds the correct displacement size. */
3184 expressionS *exp;
3186 assert (i.op[op].disps == 0);
3187 exp = &disp_expressions[i.disp_operands++];
3188 i.op[op].disps = exp;
3189 exp->X_op = O_constant;
3190 exp->X_add_number = 0;
3191 exp->X_add_symbol = (symbolS *) 0;
3192 exp->X_op_symbol = (symbolS *) 0;
3196 /* Fill in i.rm.reg or i.rm.regmem field with register operand
3197 (if any) based on i.tm.extension_opcode. Again, we must be
3198 careful to make sure that segment/control/debug/test/MMX
3199 registers are coded into the i.rm.reg field. */
3200 if (i.reg_operands)
3202 unsigned int op =
3203 ((i.types[0]
3204 & (Reg | RegMMX | RegXMM
3205 | SReg2 | SReg3
3206 | Control | Debug | Test))
3208 : ((i.types[1]
3209 & (Reg | RegMMX | RegXMM
3210 | SReg2 | SReg3
3211 | Control | Debug | Test))
3213 : 2));
3214 /* If there is an extension opcode to put here, the register
3215 number must be put into the regmem field. */
3216 if (i.tm.extension_opcode != None)
3218 i.rm.regmem = i.op[op].regs->reg_num;
3219 if ((i.op[op].regs->reg_flags & RegRex) != 0)
3220 i.rex |= REX_EXTZ;
3222 else
3224 i.rm.reg = i.op[op].regs->reg_num;
3225 if ((i.op[op].regs->reg_flags & RegRex) != 0)
3226 i.rex |= REX_EXTX;
3229 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
3230 must set it to 3 to indicate this is a register operand
3231 in the regmem field. */
3232 if (!i.mem_operands)
3233 i.rm.mode = 3;
3236 /* Fill in i.rm.reg field with extension opcode (if any). */
3237 if (i.tm.extension_opcode != None)
3238 i.rm.reg = i.tm.extension_opcode;
3240 return default_seg;
3243 static void
3244 output_branch ()
3246 char *p;
3247 int code16;
3248 int prefix;
3249 relax_substateT subtype;
3250 symbolS *sym;
3251 offsetT off;
3253 code16 = 0;
3254 if (flag_code == CODE_16BIT)
3255 code16 = CODE16;
3257 prefix = 0;
3258 if (i.prefix[DATA_PREFIX] != 0)
3260 prefix = 1;
3261 i.prefixes -= 1;
3262 code16 ^= CODE16;
3264 /* Pentium4 branch hints. */
3265 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
3266 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
3268 prefix++;
3269 i.prefixes--;
3271 if (i.prefix[REX_PREFIX] != 0)
3273 prefix++;
3274 i.prefixes--;
3277 if (i.prefixes != 0 && !intel_syntax)
3278 as_warn (_("skipping prefixes on this instruction"));
3280 /* It's always a symbol; End frag & setup for relax.
3281 Make sure there is enough room in this frag for the largest
3282 instruction we may generate in md_convert_frag. This is 2
3283 bytes for the opcode and room for the prefix and largest
3284 displacement. */
3285 frag_grow (prefix + 2 + 4);
3286 /* Prefix and 1 opcode byte go in fr_fix. */
3287 p = frag_more (prefix + 1);
3288 if (i.prefix[DATA_PREFIX] != 0)
3289 *p++ = DATA_PREFIX_OPCODE;
3290 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
3291 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
3292 *p++ = i.prefix[SEG_PREFIX];
3293 if (i.prefix[REX_PREFIX] != 0)
3294 *p++ = i.prefix[REX_PREFIX];
3295 *p = i.tm.base_opcode;
3297 if ((unsigned char) *p == JUMP_PC_RELATIVE)
3298 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, SMALL);
3299 else if ((cpu_arch_flags & Cpu386) != 0)
3300 subtype = ENCODE_RELAX_STATE (COND_JUMP, SMALL);
3301 else
3302 subtype = ENCODE_RELAX_STATE (COND_JUMP86, SMALL);
3303 subtype |= code16;
3305 sym = i.op[0].disps->X_add_symbol;
3306 off = i.op[0].disps->X_add_number;
3308 if (i.op[0].disps->X_op != O_constant
3309 && i.op[0].disps->X_op != O_symbol)
3311 /* Handle complex expressions. */
3312 sym = make_expr_symbol (i.op[0].disps);
3313 off = 0;
3316 /* 1 possible extra opcode + 4 byte displacement go in var part.
3317 Pass reloc in fr_var. */
3318 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
3321 static void
3322 output_jump ()
3324 char *p;
3325 int size;
3326 fixS *fixP;
3328 if (i.tm.opcode_modifier & JumpByte)
3330 /* This is a loop or jecxz type instruction. */
3331 size = 1;
3332 if (i.prefix[ADDR_PREFIX] != 0)
3334 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
3335 i.prefixes -= 1;
3337 /* Pentium4 branch hints. */
3338 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
3339 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
3341 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
3342 i.prefixes--;
3345 else
3347 int code16;
3349 code16 = 0;
3350 if (flag_code == CODE_16BIT)
3351 code16 = CODE16;
3353 if (i.prefix[DATA_PREFIX] != 0)
3355 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
3356 i.prefixes -= 1;
3357 code16 ^= CODE16;
3360 size = 4;
3361 if (code16)
3362 size = 2;
3365 if (i.prefix[REX_PREFIX] != 0)
3367 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
3368 i.prefixes -= 1;
3371 if (i.prefixes != 0 && !intel_syntax)
3372 as_warn (_("skipping prefixes on this instruction"));
3374 p = frag_more (1 + size);
3375 *p++ = i.tm.base_opcode;
3377 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3378 i.op[0].disps, 1, reloc (size, 1, 1, i.reloc[0]));
3380 /* All jumps handled here are signed, but don't use a signed limit
3381 check for 32 and 16 bit jumps as we want to allow wrap around at
3382 4G and 64k respectively. */
3383 if (size == 1)
3384 fixP->fx_signed = 1;
3387 static void
3388 output_interseg_jump ()
3390 char *p;
3391 int size;
3392 int prefix;
3393 int code16;
3395 code16 = 0;
3396 if (flag_code == CODE_16BIT)
3397 code16 = CODE16;
3399 prefix = 0;
3400 if (i.prefix[DATA_PREFIX] != 0)
3402 prefix = 1;
3403 i.prefixes -= 1;
3404 code16 ^= CODE16;
3406 if (i.prefix[REX_PREFIX] != 0)
3408 prefix++;
3409 i.prefixes -= 1;
3412 size = 4;
3413 if (code16)
3414 size = 2;
3416 if (i.prefixes != 0 && !intel_syntax)
3417 as_warn (_("skipping prefixes on this instruction"));
3419 /* 1 opcode; 2 segment; offset */
3420 p = frag_more (prefix + 1 + 2 + size);
3422 if (i.prefix[DATA_PREFIX] != 0)
3423 *p++ = DATA_PREFIX_OPCODE;
3425 if (i.prefix[REX_PREFIX] != 0)
3426 *p++ = i.prefix[REX_PREFIX];
3428 *p++ = i.tm.base_opcode;
3429 if (i.op[1].imms->X_op == O_constant)
3431 offsetT n = i.op[1].imms->X_add_number;
3433 if (size == 2
3434 && !fits_in_unsigned_word (n)
3435 && !fits_in_signed_word (n))
3437 as_bad (_("16-bit jump out of range"));
3438 return;
3440 md_number_to_chars (p, n, size);
3442 else
3443 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3444 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
3445 if (i.op[0].imms->X_op != O_constant)
3446 as_bad (_("can't handle non absolute segment in `%s'"),
3447 i.tm.name);
3448 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
3451 static void
3452 output_insn ()
3454 fragS *insn_start_frag;
3455 offsetT insn_start_off;
3457 /* Tie dwarf2 debug info to the address at the start of the insn.
3458 We can't do this after the insn has been output as the current
3459 frag may have been closed off. eg. by frag_var. */
3460 dwarf2_emit_insn (0);
3462 insn_start_frag = frag_now;
3463 insn_start_off = frag_now_fix ();
3465 /* Output jumps. */
3466 if (i.tm.opcode_modifier & Jump)
3467 output_branch ();
3468 else if (i.tm.opcode_modifier & (JumpByte | JumpDword))
3469 output_jump ();
3470 else if (i.tm.opcode_modifier & JumpInterSegment)
3471 output_interseg_jump ();
3472 else
3474 /* Output normal instructions here. */
3475 char *p;
3476 unsigned char *q;
3477 unsigned int prefix;
3479 /* All opcodes on i386 have either 1 or 2 bytes. Merom New
3480 Instructions have 3 bytes. We may use one more higher byte
3481 to specify a prefix the instruction requires. */
3482 if ((i.tm.cpu_flags & CpuMNI) != 0)
3484 if (i.tm.base_opcode & 0xff000000)
3486 prefix = (i.tm.base_opcode >> 24) & 0xff;
3487 goto check_prefix;
3490 else if ((i.tm.base_opcode & 0xff0000) != 0)
3492 prefix = (i.tm.base_opcode >> 16) & 0xff;
3493 if ((i.tm.cpu_flags & CpuPadLock) != 0)
3495 check_prefix:
3496 if (prefix != REPE_PREFIX_OPCODE
3497 || i.prefix[LOCKREP_PREFIX] != REPE_PREFIX_OPCODE)
3498 add_prefix (prefix);
3500 else
3501 add_prefix (prefix);
3504 /* The prefix bytes. */
3505 for (q = i.prefix;
3506 q < i.prefix + sizeof (i.prefix) / sizeof (i.prefix[0]);
3507 q++)
3509 if (*q)
3511 p = frag_more (1);
3512 md_number_to_chars (p, (valueT) *q, 1);
3516 /* Now the opcode; be careful about word order here! */
3517 if (fits_in_unsigned_byte (i.tm.base_opcode))
3519 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
3521 else
3523 if ((i.tm.cpu_flags & CpuMNI) != 0)
3525 p = frag_more (3);
3526 *p++ = (i.tm.base_opcode >> 16) & 0xff;
3528 else
3529 p = frag_more (2);
3531 /* Put out high byte first: can't use md_number_to_chars! */
3532 *p++ = (i.tm.base_opcode >> 8) & 0xff;
3533 *p = i.tm.base_opcode & 0xff;
3536 /* Now the modrm byte and sib byte (if present). */
3537 if (i.tm.opcode_modifier & Modrm)
3539 p = frag_more (1);
3540 md_number_to_chars (p,
3541 (valueT) (i.rm.regmem << 0
3542 | i.rm.reg << 3
3543 | i.rm.mode << 6),
3545 /* If i.rm.regmem == ESP (4)
3546 && i.rm.mode != (Register mode)
3547 && not 16 bit
3548 ==> need second modrm byte. */
3549 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
3550 && i.rm.mode != 3
3551 && !(i.base_reg && (i.base_reg->reg_type & Reg16) != 0))
3553 p = frag_more (1);
3554 md_number_to_chars (p,
3555 (valueT) (i.sib.base << 0
3556 | i.sib.index << 3
3557 | i.sib.scale << 6),
3562 if (i.disp_operands)
3563 output_disp (insn_start_frag, insn_start_off);
3565 if (i.imm_operands)
3566 output_imm (insn_start_frag, insn_start_off);
3569 #ifdef DEBUG386
3570 if (flag_debug)
3572 pi (line, &i);
3574 #endif /* DEBUG386 */
3577 static void
3578 output_disp (insn_start_frag, insn_start_off)
3579 fragS *insn_start_frag;
3580 offsetT insn_start_off;
3582 char *p;
3583 unsigned int n;
3585 for (n = 0; n < i.operands; n++)
3587 if (i.types[n] & Disp)
3589 if (i.op[n].disps->X_op == O_constant)
3591 int size;
3592 offsetT val;
3594 size = 4;
3595 if (i.types[n] & (Disp8 | Disp16 | Disp64))
3597 size = 2;
3598 if (i.types[n] & Disp8)
3599 size = 1;
3600 if (i.types[n] & Disp64)
3601 size = 8;
3603 val = offset_in_range (i.op[n].disps->X_add_number,
3604 size);
3605 p = frag_more (size);
3606 md_number_to_chars (p, val, size);
3608 else
3610 enum bfd_reloc_code_real reloc_type;
3611 int size = 4;
3612 int sign = 0;
3613 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
3615 /* The PC relative address is computed relative
3616 to the instruction boundary, so in case immediate
3617 fields follows, we need to adjust the value. */
3618 if (pcrel && i.imm_operands)
3620 int imm_size = 4;
3621 unsigned int n1;
3623 for (n1 = 0; n1 < i.operands; n1++)
3624 if (i.types[n1] & Imm)
3626 if (i.types[n1] & (Imm8 | Imm8S | Imm16 | Imm64))
3628 imm_size = 2;
3629 if (i.types[n1] & (Imm8 | Imm8S))
3630 imm_size = 1;
3631 if (i.types[n1] & Imm64)
3632 imm_size = 8;
3634 break;
3636 /* We should find the immediate. */
3637 if (n1 == i.operands)
3638 abort ();
3639 i.op[n].disps->X_add_number -= imm_size;
3642 if (i.types[n] & Disp32S)
3643 sign = 1;
3645 if (i.types[n] & (Disp16 | Disp64))
3647 size = 2;
3648 if (i.types[n] & Disp64)
3649 size = 8;
3652 p = frag_more (size);
3653 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
3654 if (GOT_symbol
3655 && GOT_symbol == i.op[n].disps->X_add_symbol
3656 && (((reloc_type == BFD_RELOC_32
3657 || reloc_type == BFD_RELOC_X86_64_32S)
3658 && (i.op[n].disps->X_op == O_symbol
3659 || (i.op[n].disps->X_op == O_add
3660 && ((symbol_get_value_expression
3661 (i.op[n].disps->X_op_symbol)->X_op)
3662 == O_subtract))))
3663 || reloc_type == BFD_RELOC_32_PCREL))
3665 offsetT add;
3667 if (insn_start_frag == frag_now)
3668 add = (p - frag_now->fr_literal) - insn_start_off;
3669 else
3671 fragS *fr;
3673 add = insn_start_frag->fr_fix - insn_start_off;
3674 for (fr = insn_start_frag->fr_next;
3675 fr && fr != frag_now; fr = fr->fr_next)
3676 add += fr->fr_fix;
3677 add += p - frag_now->fr_literal;
3680 if (!object_64bit)
3681 reloc_type = BFD_RELOC_386_GOTPC;
3682 else
3683 reloc_type = BFD_RELOC_X86_64_GOTPC32;
3684 i.op[n].disps->X_add_number += add;
3686 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3687 i.op[n].disps, pcrel, reloc_type);
3693 static void
3694 output_imm (insn_start_frag, insn_start_off)
3695 fragS *insn_start_frag;
3696 offsetT insn_start_off;
3698 char *p;
3699 unsigned int n;
3701 for (n = 0; n < i.operands; n++)
3703 if (i.types[n] & Imm)
3705 if (i.op[n].imms->X_op == O_constant)
3707 int size;
3708 offsetT val;
3710 size = 4;
3711 if (i.types[n] & (Imm8 | Imm8S | Imm16 | Imm64))
3713 size = 2;
3714 if (i.types[n] & (Imm8 | Imm8S))
3715 size = 1;
3716 else if (i.types[n] & Imm64)
3717 size = 8;
3719 val = offset_in_range (i.op[n].imms->X_add_number,
3720 size);
3721 p = frag_more (size);
3722 md_number_to_chars (p, val, size);
3724 else
3726 /* Not absolute_section.
3727 Need a 32-bit fixup (don't support 8bit
3728 non-absolute imms). Try to support other
3729 sizes ... */
3730 enum bfd_reloc_code_real reloc_type;
3731 int size = 4;
3732 int sign = 0;
3734 if ((i.types[n] & (Imm32S))
3735 && (i.suffix == QWORD_MNEM_SUFFIX
3736 || (!i.suffix && (i.tm.opcode_modifier & No_lSuf))))
3737 sign = 1;
3738 if (i.types[n] & (Imm8 | Imm8S | Imm16 | Imm64))
3740 size = 2;
3741 if (i.types[n] & (Imm8 | Imm8S))
3742 size = 1;
3743 if (i.types[n] & Imm64)
3744 size = 8;
3747 p = frag_more (size);
3748 reloc_type = reloc (size, 0, sign, i.reloc[n]);
3750 /* This is tough to explain. We end up with this one if we
3751 * have operands that look like
3752 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
3753 * obtain the absolute address of the GOT, and it is strongly
3754 * preferable from a performance point of view to avoid using
3755 * a runtime relocation for this. The actual sequence of
3756 * instructions often look something like:
3758 * call .L66
3759 * .L66:
3760 * popl %ebx
3761 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
3763 * The call and pop essentially return the absolute address
3764 * of the label .L66 and store it in %ebx. The linker itself
3765 * will ultimately change the first operand of the addl so
3766 * that %ebx points to the GOT, but to keep things simple, the
3767 * .o file must have this operand set so that it generates not
3768 * the absolute address of .L66, but the absolute address of
3769 * itself. This allows the linker itself simply treat a GOTPC
3770 * relocation as asking for a pcrel offset to the GOT to be
3771 * added in, and the addend of the relocation is stored in the
3772 * operand field for the instruction itself.
3774 * Our job here is to fix the operand so that it would add
3775 * the correct offset so that %ebx would point to itself. The
3776 * thing that is tricky is that .-.L66 will point to the
3777 * beginning of the instruction, so we need to further modify
3778 * the operand so that it will point to itself. There are
3779 * other cases where you have something like:
3781 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
3783 * and here no correction would be required. Internally in
3784 * the assembler we treat operands of this form as not being
3785 * pcrel since the '.' is explicitly mentioned, and I wonder
3786 * whether it would simplify matters to do it this way. Who
3787 * knows. In earlier versions of the PIC patches, the
3788 * pcrel_adjust field was used to store the correction, but
3789 * since the expression is not pcrel, I felt it would be
3790 * confusing to do it this way. */
3792 if ((reloc_type == BFD_RELOC_32
3793 || reloc_type == BFD_RELOC_X86_64_32S)
3794 && GOT_symbol
3795 && GOT_symbol == i.op[n].imms->X_add_symbol
3796 && (i.op[n].imms->X_op == O_symbol
3797 || (i.op[n].imms->X_op == O_add
3798 && ((symbol_get_value_expression
3799 (i.op[n].imms->X_op_symbol)->X_op)
3800 == O_subtract))))
3802 offsetT add;
3804 if (insn_start_frag == frag_now)
3805 add = (p - frag_now->fr_literal) - insn_start_off;
3806 else
3808 fragS *fr;
3810 add = insn_start_frag->fr_fix - insn_start_off;
3811 for (fr = insn_start_frag->fr_next;
3812 fr && fr != frag_now; fr = fr->fr_next)
3813 add += fr->fr_fix;
3814 add += p - frag_now->fr_literal;
3817 if (!object_64bit)
3818 reloc_type = BFD_RELOC_386_GOTPC;
3819 else
3820 reloc_type = BFD_RELOC_X86_64_GOTPC32;
3821 i.op[n].imms->X_add_number += add;
3823 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
3824 i.op[n].imms, 0, reloc_type);
3830 /* x86_cons_fix_new is called via the expression parsing code when a
3831 reloc is needed. We use this hook to get the correct .got reloc. */
3832 static enum bfd_reloc_code_real got_reloc = NO_RELOC;
3833 static int cons_sign = -1;
3835 void
3836 x86_cons_fix_new (fragS *frag,
3837 unsigned int off,
3838 unsigned int len,
3839 expressionS *exp)
3841 enum bfd_reloc_code_real r = reloc (len, 0, cons_sign, got_reloc);
3843 got_reloc = NO_RELOC;
3845 #ifdef TE_PE
3846 if (exp->X_op == O_secrel)
3848 exp->X_op = O_symbol;
3849 r = BFD_RELOC_32_SECREL;
3851 #endif
3853 fix_new_exp (frag, off, len, exp, 0, r);
3856 #if (!defined (OBJ_ELF) && !defined (OBJ_MAYBE_ELF)) || defined (LEX_AT)
3857 # define lex_got(reloc, adjust, types) NULL
3858 #else
3859 /* Parse operands of the form
3860 <symbol>@GOTOFF+<nnn>
3861 and similar .plt or .got references.
3863 If we find one, set up the correct relocation in RELOC and copy the
3864 input string, minus the `@GOTOFF' into a malloc'd buffer for
3865 parsing by the calling routine. Return this buffer, and if ADJUST
3866 is non-null set it to the length of the string we removed from the
3867 input line. Otherwise return NULL. */
3868 static char *
3869 lex_got (enum bfd_reloc_code_real *reloc,
3870 int *adjust,
3871 unsigned int *types)
3873 static const struct {
3874 const char *str;
3875 const enum bfd_reloc_code_real rel[2];
3876 const unsigned int types64;
3877 } gotrel[] = {
3878 { "PLT", { BFD_RELOC_386_PLT32, BFD_RELOC_X86_64_PLT32 }, Imm32|Imm32S|Disp32 },
3879 { "GOTOFF", { BFD_RELOC_386_GOTOFF, BFD_RELOC_X86_64_GOTOFF64 }, Imm64|Disp64 },
3880 { "GOTPCREL", { 0, BFD_RELOC_X86_64_GOTPCREL }, Imm32|Imm32S|Disp32 },
3881 { "TLSGD", { BFD_RELOC_386_TLS_GD, BFD_RELOC_X86_64_TLSGD }, Imm32|Imm32S|Disp32 },
3882 { "TLSLDM", { BFD_RELOC_386_TLS_LDM, 0 }, 0 },
3883 { "TLSLD", { 0, BFD_RELOC_X86_64_TLSLD }, Imm32|Imm32S|Disp32 },
3884 { "GOTTPOFF", { BFD_RELOC_386_TLS_IE_32, BFD_RELOC_X86_64_GOTTPOFF }, Imm32|Imm32S|Disp32 },
3885 { "TPOFF", { BFD_RELOC_386_TLS_LE_32, BFD_RELOC_X86_64_TPOFF32 }, Imm32|Imm32S|Imm64|Disp32|Disp64 },
3886 { "NTPOFF", { BFD_RELOC_386_TLS_LE, 0 }, 0 },
3887 { "DTPOFF", { BFD_RELOC_386_TLS_LDO_32, BFD_RELOC_X86_64_DTPOFF32 }, Imm32|Imm32S|Imm64|Disp32|Disp64 },
3888 { "GOTNTPOFF",{ BFD_RELOC_386_TLS_GOTIE, 0 }, 0 },
3889 { "INDNTPOFF",{ BFD_RELOC_386_TLS_IE, 0 }, 0 },
3890 { "GOT", { BFD_RELOC_386_GOT32, BFD_RELOC_X86_64_GOT32 }, Imm32|Imm32S|Disp32 },
3891 { "TLSDESC", { BFD_RELOC_386_TLS_GOTDESC, BFD_RELOC_X86_64_GOTPC32_TLSDESC }, Imm32|Imm32S|Disp32 },
3892 { "TLSCALL", { BFD_RELOC_386_TLS_DESC_CALL, BFD_RELOC_X86_64_TLSDESC_CALL }, Imm32|Imm32S|Disp32 }
3894 char *cp;
3895 unsigned int j;
3897 if (!IS_ELF)
3898 return NULL;
3900 for (cp = input_line_pointer; *cp != '@'; cp++)
3901 if (is_end_of_line[(unsigned char) *cp])
3902 return NULL;
3904 for (j = 0; j < sizeof (gotrel) / sizeof (gotrel[0]); j++)
3906 int len;
3908 len = strlen (gotrel[j].str);
3909 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
3911 if (gotrel[j].rel[object_64bit] != 0)
3913 int first, second;
3914 char *tmpbuf, *past_reloc;
3916 *reloc = gotrel[j].rel[object_64bit];
3917 if (adjust)
3918 *adjust = len;
3920 if (types)
3922 if (flag_code != CODE_64BIT)
3923 *types = Imm32|Disp32;
3924 else
3925 *types = gotrel[j].types64;
3928 if (GOT_symbol == NULL)
3929 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
3931 /* Replace the relocation token with ' ', so that
3932 errors like foo@GOTOFF1 will be detected. */
3934 /* The length of the first part of our input line. */
3935 first = cp - input_line_pointer;
3937 /* The second part goes from after the reloc token until
3938 (and including) an end_of_line char. Don't use strlen
3939 here as the end_of_line char may not be a NUL. */
3940 past_reloc = cp + 1 + len;
3941 for (cp = past_reloc; !is_end_of_line[(unsigned char) *cp++]; )
3943 second = cp - past_reloc;
3945 /* Allocate and copy string. The trailing NUL shouldn't
3946 be necessary, but be safe. */
3947 tmpbuf = xmalloc (first + second + 2);
3948 memcpy (tmpbuf, input_line_pointer, first);
3949 tmpbuf[first] = ' ';
3950 memcpy (tmpbuf + first + 1, past_reloc, second);
3951 tmpbuf[first + second + 1] = '\0';
3952 return tmpbuf;
3955 as_bad (_("@%s reloc is not supported with %d-bit output format"),
3956 gotrel[j].str, 1 << (5 + object_64bit));
3957 return NULL;
3961 /* Might be a symbol version string. Don't as_bad here. */
3962 return NULL;
3965 void
3966 x86_cons (exp, size)
3967 expressionS *exp;
3968 int size;
3970 if (size == 4 || (object_64bit && size == 8))
3972 /* Handle @GOTOFF and the like in an expression. */
3973 char *save;
3974 char *gotfree_input_line;
3975 int adjust;
3977 save = input_line_pointer;
3978 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
3979 if (gotfree_input_line)
3980 input_line_pointer = gotfree_input_line;
3982 expression (exp);
3984 if (gotfree_input_line)
3986 /* expression () has merrily parsed up to the end of line,
3987 or a comma - in the wrong buffer. Transfer how far
3988 input_line_pointer has moved to the right buffer. */
3989 input_line_pointer = (save
3990 + (input_line_pointer - gotfree_input_line)
3991 + adjust);
3992 free (gotfree_input_line);
3995 else
3996 expression (exp);
3998 #endif
4000 static void signed_cons (int size)
4002 if (flag_code == CODE_64BIT)
4003 cons_sign = 1;
4004 cons (size);
4005 cons_sign = -1;
4008 #ifdef TE_PE
4009 static void
4010 pe_directive_secrel (dummy)
4011 int dummy ATTRIBUTE_UNUSED;
4013 expressionS exp;
4017 expression (&exp);
4018 if (exp.X_op == O_symbol)
4019 exp.X_op = O_secrel;
4021 emit_expr (&exp, 4);
4023 while (*input_line_pointer++ == ',');
4025 input_line_pointer--;
4026 demand_empty_rest_of_line ();
4028 #endif
4030 static int i386_immediate PARAMS ((char *));
4032 static int
4033 i386_immediate (imm_start)
4034 char *imm_start;
4036 char *save_input_line_pointer;
4037 char *gotfree_input_line;
4038 segT exp_seg = 0;
4039 expressionS *exp;
4040 unsigned int types = ~0U;
4042 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
4044 as_bad (_("only 1 or 2 immediate operands are allowed"));
4045 return 0;
4048 exp = &im_expressions[i.imm_operands++];
4049 i.op[this_operand].imms = exp;
4051 if (is_space_char (*imm_start))
4052 ++imm_start;
4054 save_input_line_pointer = input_line_pointer;
4055 input_line_pointer = imm_start;
4057 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
4058 if (gotfree_input_line)
4059 input_line_pointer = gotfree_input_line;
4061 exp_seg = expression (exp);
4063 SKIP_WHITESPACE ();
4064 if (*input_line_pointer)
4065 as_bad (_("junk `%s' after expression"), input_line_pointer);
4067 input_line_pointer = save_input_line_pointer;
4068 if (gotfree_input_line)
4069 free (gotfree_input_line);
4071 if (exp->X_op == O_absent || exp->X_op == O_big)
4073 /* Missing or bad expr becomes absolute 0. */
4074 as_bad (_("missing or invalid immediate expression `%s' taken as 0"),
4075 imm_start);
4076 exp->X_op = O_constant;
4077 exp->X_add_number = 0;
4078 exp->X_add_symbol = (symbolS *) 0;
4079 exp->X_op_symbol = (symbolS *) 0;
4081 else if (exp->X_op == O_constant)
4083 /* Size it properly later. */
4084 i.types[this_operand] |= Imm64;
4085 /* If BFD64, sign extend val. */
4086 if (!use_rela_relocations)
4087 if ((exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
4088 exp->X_add_number = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
4090 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
4091 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
4092 && exp_seg != absolute_section
4093 && exp_seg != text_section
4094 && exp_seg != data_section
4095 && exp_seg != bss_section
4096 && exp_seg != undefined_section
4097 && !bfd_is_com_section (exp_seg))
4099 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
4100 return 0;
4102 #endif
4103 else
4105 /* This is an address. The size of the address will be
4106 determined later, depending on destination register,
4107 suffix, or the default for the section. */
4108 i.types[this_operand] |= Imm8 | Imm16 | Imm32 | Imm32S | Imm64;
4109 i.types[this_operand] &= types;
4112 return 1;
4115 static char *i386_scale PARAMS ((char *));
4117 static char *
4118 i386_scale (scale)
4119 char *scale;
4121 offsetT val;
4122 char *save = input_line_pointer;
4124 input_line_pointer = scale;
4125 val = get_absolute_expression ();
4127 switch (val)
4129 case 1:
4130 i.log2_scale_factor = 0;
4131 break;
4132 case 2:
4133 i.log2_scale_factor = 1;
4134 break;
4135 case 4:
4136 i.log2_scale_factor = 2;
4137 break;
4138 case 8:
4139 i.log2_scale_factor = 3;
4140 break;
4141 default:
4143 char sep = *input_line_pointer;
4145 *input_line_pointer = '\0';
4146 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
4147 scale);
4148 *input_line_pointer = sep;
4149 input_line_pointer = save;
4150 return NULL;
4153 if (i.log2_scale_factor != 0 && i.index_reg == 0)
4155 as_warn (_("scale factor of %d without an index register"),
4156 1 << i.log2_scale_factor);
4157 #if SCALE1_WHEN_NO_INDEX
4158 i.log2_scale_factor = 0;
4159 #endif
4161 scale = input_line_pointer;
4162 input_line_pointer = save;
4163 return scale;
4166 static int i386_displacement PARAMS ((char *, char *));
4168 static int
4169 i386_displacement (disp_start, disp_end)
4170 char *disp_start;
4171 char *disp_end;
4173 expressionS *exp;
4174 segT exp_seg = 0;
4175 char *save_input_line_pointer;
4176 char *gotfree_input_line;
4177 int bigdisp, override;
4178 unsigned int types = Disp;
4180 if ((i.types[this_operand] & JumpAbsolute)
4181 || !(current_templates->start->opcode_modifier & (Jump | JumpDword)))
4183 bigdisp = Disp32;
4184 override = (i.prefix[ADDR_PREFIX] != 0);
4186 else
4188 /* For PC-relative branches, the width of the displacement
4189 is dependent upon data size, not address size. */
4190 bigdisp = 0;
4191 override = (i.prefix[DATA_PREFIX] != 0);
4193 if (flag_code == CODE_64BIT)
4195 if (!bigdisp)
4196 bigdisp = (override || i.suffix == WORD_MNEM_SUFFIX)
4197 ? Disp16
4198 : Disp32S | Disp32;
4199 else if (!override)
4200 bigdisp = Disp64 | Disp32S | Disp32;
4202 else
4204 if (!bigdisp)
4206 if (!override)
4207 override = (i.suffix == (flag_code != CODE_16BIT
4208 ? WORD_MNEM_SUFFIX
4209 : LONG_MNEM_SUFFIX));
4210 bigdisp = Disp32;
4212 if ((flag_code == CODE_16BIT) ^ override)
4213 bigdisp = Disp16;
4215 i.types[this_operand] |= bigdisp;
4217 exp = &disp_expressions[i.disp_operands];
4218 i.op[this_operand].disps = exp;
4219 i.disp_operands++;
4220 save_input_line_pointer = input_line_pointer;
4221 input_line_pointer = disp_start;
4222 END_STRING_AND_SAVE (disp_end);
4224 #ifndef GCC_ASM_O_HACK
4225 #define GCC_ASM_O_HACK 0
4226 #endif
4227 #if GCC_ASM_O_HACK
4228 END_STRING_AND_SAVE (disp_end + 1);
4229 if ((i.types[this_operand] & BaseIndex) != 0
4230 && displacement_string_end[-1] == '+')
4232 /* This hack is to avoid a warning when using the "o"
4233 constraint within gcc asm statements.
4234 For instance:
4236 #define _set_tssldt_desc(n,addr,limit,type) \
4237 __asm__ __volatile__ ( \
4238 "movw %w2,%0\n\t" \
4239 "movw %w1,2+%0\n\t" \
4240 "rorl $16,%1\n\t" \
4241 "movb %b1,4+%0\n\t" \
4242 "movb %4,5+%0\n\t" \
4243 "movb $0,6+%0\n\t" \
4244 "movb %h1,7+%0\n\t" \
4245 "rorl $16,%1" \
4246 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
4248 This works great except that the output assembler ends
4249 up looking a bit weird if it turns out that there is
4250 no offset. You end up producing code that looks like:
4252 #APP
4253 movw $235,(%eax)
4254 movw %dx,2+(%eax)
4255 rorl $16,%edx
4256 movb %dl,4+(%eax)
4257 movb $137,5+(%eax)
4258 movb $0,6+(%eax)
4259 movb %dh,7+(%eax)
4260 rorl $16,%edx
4261 #NO_APP
4263 So here we provide the missing zero. */
4265 *displacement_string_end = '0';
4267 #endif
4268 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
4269 if (gotfree_input_line)
4270 input_line_pointer = gotfree_input_line;
4272 exp_seg = expression (exp);
4274 SKIP_WHITESPACE ();
4275 if (*input_line_pointer)
4276 as_bad (_("junk `%s' after expression"), input_line_pointer);
4277 #if GCC_ASM_O_HACK
4278 RESTORE_END_STRING (disp_end + 1);
4279 #endif
4280 RESTORE_END_STRING (disp_end);
4281 input_line_pointer = save_input_line_pointer;
4282 if (gotfree_input_line)
4283 free (gotfree_input_line);
4285 /* We do this to make sure that the section symbol is in
4286 the symbol table. We will ultimately change the relocation
4287 to be relative to the beginning of the section. */
4288 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
4289 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
4290 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
4292 if (exp->X_op != O_symbol)
4294 as_bad (_("bad expression used with @%s"),
4295 (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
4296 ? "GOTPCREL"
4297 : "GOTOFF"));
4298 return 0;
4301 if (S_IS_LOCAL (exp->X_add_symbol)
4302 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section)
4303 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
4304 exp->X_op = O_subtract;
4305 exp->X_op_symbol = GOT_symbol;
4306 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
4307 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
4308 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
4309 i.reloc[this_operand] = BFD_RELOC_64;
4310 else
4311 i.reloc[this_operand] = BFD_RELOC_32;
4314 if (exp->X_op == O_absent || exp->X_op == O_big)
4316 /* Missing or bad expr becomes absolute 0. */
4317 as_bad (_("missing or invalid displacement expression `%s' taken as 0"),
4318 disp_start);
4319 exp->X_op = O_constant;
4320 exp->X_add_number = 0;
4321 exp->X_add_symbol = (symbolS *) 0;
4322 exp->X_op_symbol = (symbolS *) 0;
4325 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
4326 if (exp->X_op != O_constant
4327 && OUTPUT_FLAVOR == bfd_target_aout_flavour
4328 && exp_seg != absolute_section
4329 && exp_seg != text_section
4330 && exp_seg != data_section
4331 && exp_seg != bss_section
4332 && exp_seg != undefined_section
4333 && !bfd_is_com_section (exp_seg))
4335 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
4336 return 0;
4338 #endif
4340 if (!(i.types[this_operand] & ~Disp))
4341 i.types[this_operand] &= types;
4343 return 1;
4346 static int i386_index_check PARAMS ((const char *));
4348 /* Make sure the memory operand we've been dealt is valid.
4349 Return 1 on success, 0 on a failure. */
4351 static int
4352 i386_index_check (operand_string)
4353 const char *operand_string;
4355 int ok;
4356 #if INFER_ADDR_PREFIX
4357 int fudged = 0;
4359 tryprefix:
4360 #endif
4361 ok = 1;
4362 if ((current_templates->start->cpu_flags & CpuSVME)
4363 && current_templates->end[-1].operand_types[0] == AnyMem)
4365 /* Memory operands of SVME insns are special in that they only allow
4366 rAX as their memory address and ignore any segment override. */
4367 unsigned RegXX;
4369 /* SKINIT is even more restrictive: it always requires EAX. */
4370 if (strcmp (current_templates->start->name, "skinit") == 0)
4371 RegXX = Reg32;
4372 else if (flag_code == CODE_64BIT)
4373 RegXX = i.prefix[ADDR_PREFIX] == 0 ? Reg64 : Reg32;
4374 else
4375 RegXX = (flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0)
4376 ? Reg16
4377 : Reg32;
4378 if (!i.base_reg
4379 || !(i.base_reg->reg_type & Acc)
4380 || !(i.base_reg->reg_type & RegXX)
4381 || i.index_reg
4382 || (i.types[0] & Disp))
4383 ok = 0;
4385 else if (flag_code == CODE_64BIT)
4387 unsigned RegXX = (i.prefix[ADDR_PREFIX] == 0 ? Reg64 : Reg32);
4389 if ((i.base_reg
4390 && ((i.base_reg->reg_type & RegXX) == 0)
4391 && (i.base_reg->reg_type != BaseIndex
4392 || i.index_reg))
4393 || (i.index_reg
4394 && ((i.index_reg->reg_type & (RegXX | BaseIndex))
4395 != (RegXX | BaseIndex))))
4396 ok = 0;
4398 else
4400 if ((flag_code == CODE_16BIT) ^ (i.prefix[ADDR_PREFIX] != 0))
4402 /* 16bit checks. */
4403 if ((i.base_reg
4404 && ((i.base_reg->reg_type & (Reg16 | BaseIndex | RegRex))
4405 != (Reg16 | BaseIndex)))
4406 || (i.index_reg
4407 && (((i.index_reg->reg_type & (Reg16 | BaseIndex))
4408 != (Reg16 | BaseIndex))
4409 || !(i.base_reg
4410 && i.base_reg->reg_num < 6
4411 && i.index_reg->reg_num >= 6
4412 && i.log2_scale_factor == 0))))
4413 ok = 0;
4415 else
4417 /* 32bit checks. */
4418 if ((i.base_reg
4419 && (i.base_reg->reg_type & (Reg32 | RegRex)) != Reg32)
4420 || (i.index_reg
4421 && ((i.index_reg->reg_type & (Reg32 | BaseIndex | RegRex))
4422 != (Reg32 | BaseIndex))))
4423 ok = 0;
4426 if (!ok)
4428 #if INFER_ADDR_PREFIX
4429 if (i.prefix[ADDR_PREFIX] == 0)
4431 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
4432 i.prefixes += 1;
4433 /* Change the size of any displacement too. At most one of
4434 Disp16 or Disp32 is set.
4435 FIXME. There doesn't seem to be any real need for separate
4436 Disp16 and Disp32 flags. The same goes for Imm16 and Imm32.
4437 Removing them would probably clean up the code quite a lot. */
4438 if (flag_code != CODE_64BIT && (i.types[this_operand] & (Disp16 | Disp32)))
4439 i.types[this_operand] ^= (Disp16 | Disp32);
4440 fudged = 1;
4441 goto tryprefix;
4443 if (fudged)
4444 as_bad (_("`%s' is not a valid base/index expression"),
4445 operand_string);
4446 else
4447 #endif
4448 as_bad (_("`%s' is not a valid %s bit base/index expression"),
4449 operand_string,
4450 flag_code_names[flag_code]);
4452 return ok;
4455 /* Parse OPERAND_STRING into the i386_insn structure I. Returns non-zero
4456 on error. */
4458 static int
4459 i386_operand (operand_string)
4460 char *operand_string;
4462 const reg_entry *r;
4463 char *end_op;
4464 char *op_string = operand_string;
4466 if (is_space_char (*op_string))
4467 ++op_string;
4469 /* We check for an absolute prefix (differentiating,
4470 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
4471 if (*op_string == ABSOLUTE_PREFIX)
4473 ++op_string;
4474 if (is_space_char (*op_string))
4475 ++op_string;
4476 i.types[this_operand] |= JumpAbsolute;
4479 /* Check if operand is a register. */
4480 if ((r = parse_register (op_string, &end_op)) != NULL)
4482 /* Check for a segment override by searching for ':' after a
4483 segment register. */
4484 op_string = end_op;
4485 if (is_space_char (*op_string))
4486 ++op_string;
4487 if (*op_string == ':' && (r->reg_type & (SReg2 | SReg3)))
4489 switch (r->reg_num)
4491 case 0:
4492 i.seg[i.mem_operands] = &es;
4493 break;
4494 case 1:
4495 i.seg[i.mem_operands] = &cs;
4496 break;
4497 case 2:
4498 i.seg[i.mem_operands] = &ss;
4499 break;
4500 case 3:
4501 i.seg[i.mem_operands] = &ds;
4502 break;
4503 case 4:
4504 i.seg[i.mem_operands] = &fs;
4505 break;
4506 case 5:
4507 i.seg[i.mem_operands] = &gs;
4508 break;
4511 /* Skip the ':' and whitespace. */
4512 ++op_string;
4513 if (is_space_char (*op_string))
4514 ++op_string;
4516 if (!is_digit_char (*op_string)
4517 && !is_identifier_char (*op_string)
4518 && *op_string != '('
4519 && *op_string != ABSOLUTE_PREFIX)
4521 as_bad (_("bad memory operand `%s'"), op_string);
4522 return 0;
4524 /* Handle case of %es:*foo. */
4525 if (*op_string == ABSOLUTE_PREFIX)
4527 ++op_string;
4528 if (is_space_char (*op_string))
4529 ++op_string;
4530 i.types[this_operand] |= JumpAbsolute;
4532 goto do_memory_reference;
4534 if (*op_string)
4536 as_bad (_("junk `%s' after register"), op_string);
4537 return 0;
4539 i.types[this_operand] |= r->reg_type & ~BaseIndex;
4540 i.op[this_operand].regs = r;
4541 i.reg_operands++;
4543 else if (*op_string == REGISTER_PREFIX)
4545 as_bad (_("bad register name `%s'"), op_string);
4546 return 0;
4548 else if (*op_string == IMMEDIATE_PREFIX)
4550 ++op_string;
4551 if (i.types[this_operand] & JumpAbsolute)
4553 as_bad (_("immediate operand illegal with absolute jump"));
4554 return 0;
4556 if (!i386_immediate (op_string))
4557 return 0;
4559 else if (is_digit_char (*op_string)
4560 || is_identifier_char (*op_string)
4561 || *op_string == '(')
4563 /* This is a memory reference of some sort. */
4564 char *base_string;
4566 /* Start and end of displacement string expression (if found). */
4567 char *displacement_string_start;
4568 char *displacement_string_end;
4570 do_memory_reference:
4571 if ((i.mem_operands == 1
4572 && (current_templates->start->opcode_modifier & IsString) == 0)
4573 || i.mem_operands == 2)
4575 as_bad (_("too many memory references for `%s'"),
4576 current_templates->start->name);
4577 return 0;
4580 /* Check for base index form. We detect the base index form by
4581 looking for an ')' at the end of the operand, searching
4582 for the '(' matching it, and finding a REGISTER_PREFIX or ','
4583 after the '('. */
4584 base_string = op_string + strlen (op_string);
4586 --base_string;
4587 if (is_space_char (*base_string))
4588 --base_string;
4590 /* If we only have a displacement, set-up for it to be parsed later. */
4591 displacement_string_start = op_string;
4592 displacement_string_end = base_string + 1;
4594 if (*base_string == ')')
4596 char *temp_string;
4597 unsigned int parens_balanced = 1;
4598 /* We've already checked that the number of left & right ()'s are
4599 equal, so this loop will not be infinite. */
4602 base_string--;
4603 if (*base_string == ')')
4604 parens_balanced++;
4605 if (*base_string == '(')
4606 parens_balanced--;
4608 while (parens_balanced);
4610 temp_string = base_string;
4612 /* Skip past '(' and whitespace. */
4613 ++base_string;
4614 if (is_space_char (*base_string))
4615 ++base_string;
4617 if (*base_string == ','
4618 || ((i.base_reg = parse_register (base_string, &end_op)) != NULL))
4620 displacement_string_end = temp_string;
4622 i.types[this_operand] |= BaseIndex;
4624 if (i.base_reg)
4626 base_string = end_op;
4627 if (is_space_char (*base_string))
4628 ++base_string;
4631 /* There may be an index reg or scale factor here. */
4632 if (*base_string == ',')
4634 ++base_string;
4635 if (is_space_char (*base_string))
4636 ++base_string;
4638 if ((i.index_reg = parse_register (base_string, &end_op)) != NULL)
4640 base_string = end_op;
4641 if (is_space_char (*base_string))
4642 ++base_string;
4643 if (*base_string == ',')
4645 ++base_string;
4646 if (is_space_char (*base_string))
4647 ++base_string;
4649 else if (*base_string != ')')
4651 as_bad (_("expecting `,' or `)' after index register in `%s'"),
4652 operand_string);
4653 return 0;
4656 else if (*base_string == REGISTER_PREFIX)
4658 as_bad (_("bad register name `%s'"), base_string);
4659 return 0;
4662 /* Check for scale factor. */
4663 if (*base_string != ')')
4665 char *end_scale = i386_scale (base_string);
4667 if (!end_scale)
4668 return 0;
4670 base_string = end_scale;
4671 if (is_space_char (*base_string))
4672 ++base_string;
4673 if (*base_string != ')')
4675 as_bad (_("expecting `)' after scale factor in `%s'"),
4676 operand_string);
4677 return 0;
4680 else if (!i.index_reg)
4682 as_bad (_("expecting index register or scale factor after `,'; got '%c'"),
4683 *base_string);
4684 return 0;
4687 else if (*base_string != ')')
4689 as_bad (_("expecting `,' or `)' after base register in `%s'"),
4690 operand_string);
4691 return 0;
4694 else if (*base_string == REGISTER_PREFIX)
4696 as_bad (_("bad register name `%s'"), base_string);
4697 return 0;
4701 /* If there's an expression beginning the operand, parse it,
4702 assuming displacement_string_start and
4703 displacement_string_end are meaningful. */
4704 if (displacement_string_start != displacement_string_end)
4706 if (!i386_displacement (displacement_string_start,
4707 displacement_string_end))
4708 return 0;
4711 /* Special case for (%dx) while doing input/output op. */
4712 if (i.base_reg
4713 && i.base_reg->reg_type == (Reg16 | InOutPortReg)
4714 && i.index_reg == 0
4715 && i.log2_scale_factor == 0
4716 && i.seg[i.mem_operands] == 0
4717 && (i.types[this_operand] & Disp) == 0)
4719 i.types[this_operand] = InOutPortReg;
4720 return 1;
4723 if (i386_index_check (operand_string) == 0)
4724 return 0;
4725 i.mem_operands++;
4727 else
4729 /* It's not a memory operand; argh! */
4730 as_bad (_("invalid char %s beginning operand %d `%s'"),
4731 output_invalid (*op_string),
4732 this_operand + 1,
4733 op_string);
4734 return 0;
4736 return 1; /* Normal return. */
4739 /* md_estimate_size_before_relax()
4741 Called just before relax() for rs_machine_dependent frags. The x86
4742 assembler uses these frags to handle variable size jump
4743 instructions.
4745 Any symbol that is now undefined will not become defined.
4746 Return the correct fr_subtype in the frag.
4747 Return the initial "guess for variable size of frag" to caller.
4748 The guess is actually the growth beyond the fixed part. Whatever
4749 we do to grow the fixed or variable part contributes to our
4750 returned value. */
4753 md_estimate_size_before_relax (fragP, segment)
4754 fragS *fragP;
4755 segT segment;
4757 /* We've already got fragP->fr_subtype right; all we have to do is
4758 check for un-relaxable symbols. On an ELF system, we can't relax
4759 an externally visible symbol, because it may be overridden by a
4760 shared library. */
4761 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
4762 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
4763 || (IS_ELF
4764 && (S_IS_EXTERNAL (fragP->fr_symbol)
4765 || S_IS_WEAK (fragP->fr_symbol)))
4766 #endif
4769 /* Symbol is undefined in this segment, or we need to keep a
4770 reloc so that weak symbols can be overridden. */
4771 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
4772 enum bfd_reloc_code_real reloc_type;
4773 unsigned char *opcode;
4774 int old_fr_fix;
4776 if (fragP->fr_var != NO_RELOC)
4777 reloc_type = fragP->fr_var;
4778 else if (size == 2)
4779 reloc_type = BFD_RELOC_16_PCREL;
4780 else
4781 reloc_type = BFD_RELOC_32_PCREL;
4783 old_fr_fix = fragP->fr_fix;
4784 opcode = (unsigned char *) fragP->fr_opcode;
4786 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
4788 case UNCOND_JUMP:
4789 /* Make jmp (0xeb) a (d)word displacement jump. */
4790 opcode[0] = 0xe9;
4791 fragP->fr_fix += size;
4792 fix_new (fragP, old_fr_fix, size,
4793 fragP->fr_symbol,
4794 fragP->fr_offset, 1,
4795 reloc_type);
4796 break;
4798 case COND_JUMP86:
4799 if (size == 2
4800 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
4802 /* Negate the condition, and branch past an
4803 unconditional jump. */
4804 opcode[0] ^= 1;
4805 opcode[1] = 3;
4806 /* Insert an unconditional jump. */
4807 opcode[2] = 0xe9;
4808 /* We added two extra opcode bytes, and have a two byte
4809 offset. */
4810 fragP->fr_fix += 2 + 2;
4811 fix_new (fragP, old_fr_fix + 2, 2,
4812 fragP->fr_symbol,
4813 fragP->fr_offset, 1,
4814 reloc_type);
4815 break;
4817 /* Fall through. */
4819 case COND_JUMP:
4820 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
4822 fixS *fixP;
4824 fragP->fr_fix += 1;
4825 fixP = fix_new (fragP, old_fr_fix, 1,
4826 fragP->fr_symbol,
4827 fragP->fr_offset, 1,
4828 BFD_RELOC_8_PCREL);
4829 fixP->fx_signed = 1;
4830 break;
4833 /* This changes the byte-displacement jump 0x7N
4834 to the (d)word-displacement jump 0x0f,0x8N. */
4835 opcode[1] = opcode[0] + 0x10;
4836 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4837 /* We've added an opcode byte. */
4838 fragP->fr_fix += 1 + size;
4839 fix_new (fragP, old_fr_fix + 1, size,
4840 fragP->fr_symbol,
4841 fragP->fr_offset, 1,
4842 reloc_type);
4843 break;
4845 default:
4846 BAD_CASE (fragP->fr_subtype);
4847 break;
4849 frag_wane (fragP);
4850 return fragP->fr_fix - old_fr_fix;
4853 /* Guess size depending on current relax state. Initially the relax
4854 state will correspond to a short jump and we return 1, because
4855 the variable part of the frag (the branch offset) is one byte
4856 long. However, we can relax a section more than once and in that
4857 case we must either set fr_subtype back to the unrelaxed state,
4858 or return the value for the appropriate branch. */
4859 return md_relax_table[fragP->fr_subtype].rlx_length;
4862 /* Called after relax() is finished.
4864 In: Address of frag.
4865 fr_type == rs_machine_dependent.
4866 fr_subtype is what the address relaxed to.
4868 Out: Any fixSs and constants are set up.
4869 Caller will turn frag into a ".space 0". */
4871 void
4872 md_convert_frag (abfd, sec, fragP)
4873 bfd *abfd ATTRIBUTE_UNUSED;
4874 segT sec ATTRIBUTE_UNUSED;
4875 fragS *fragP;
4877 unsigned char *opcode;
4878 unsigned char *where_to_put_displacement = NULL;
4879 offsetT target_address;
4880 offsetT opcode_address;
4881 unsigned int extension = 0;
4882 offsetT displacement_from_opcode_start;
4884 opcode = (unsigned char *) fragP->fr_opcode;
4886 /* Address we want to reach in file space. */
4887 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
4889 /* Address opcode resides at in file space. */
4890 opcode_address = fragP->fr_address + fragP->fr_fix;
4892 /* Displacement from opcode start to fill into instruction. */
4893 displacement_from_opcode_start = target_address - opcode_address;
4895 if ((fragP->fr_subtype & BIG) == 0)
4897 /* Don't have to change opcode. */
4898 extension = 1; /* 1 opcode + 1 displacement */
4899 where_to_put_displacement = &opcode[1];
4901 else
4903 if (no_cond_jump_promotion
4904 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
4905 as_warn_where (fragP->fr_file, fragP->fr_line, _("long jump required"));
4907 switch (fragP->fr_subtype)
4909 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
4910 extension = 4; /* 1 opcode + 4 displacement */
4911 opcode[0] = 0xe9;
4912 where_to_put_displacement = &opcode[1];
4913 break;
4915 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
4916 extension = 2; /* 1 opcode + 2 displacement */
4917 opcode[0] = 0xe9;
4918 where_to_put_displacement = &opcode[1];
4919 break;
4921 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
4922 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
4923 extension = 5; /* 2 opcode + 4 displacement */
4924 opcode[1] = opcode[0] + 0x10;
4925 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4926 where_to_put_displacement = &opcode[2];
4927 break;
4929 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
4930 extension = 3; /* 2 opcode + 2 displacement */
4931 opcode[1] = opcode[0] + 0x10;
4932 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
4933 where_to_put_displacement = &opcode[2];
4934 break;
4936 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
4937 extension = 4;
4938 opcode[0] ^= 1;
4939 opcode[1] = 3;
4940 opcode[2] = 0xe9;
4941 where_to_put_displacement = &opcode[3];
4942 break;
4944 default:
4945 BAD_CASE (fragP->fr_subtype);
4946 break;
4950 /* Now put displacement after opcode. */
4951 md_number_to_chars ((char *) where_to_put_displacement,
4952 (valueT) (displacement_from_opcode_start - extension),
4953 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
4954 fragP->fr_fix += extension;
4957 /* Size of byte displacement jmp. */
4958 int md_short_jump_size = 2;
4960 /* Size of dword displacement jmp. */
4961 int md_long_jump_size = 5;
4963 void
4964 md_create_short_jump (ptr, from_addr, to_addr, frag, to_symbol)
4965 char *ptr;
4966 addressT from_addr, to_addr;
4967 fragS *frag ATTRIBUTE_UNUSED;
4968 symbolS *to_symbol ATTRIBUTE_UNUSED;
4970 offsetT offset;
4972 offset = to_addr - (from_addr + 2);
4973 /* Opcode for byte-disp jump. */
4974 md_number_to_chars (ptr, (valueT) 0xeb, 1);
4975 md_number_to_chars (ptr + 1, (valueT) offset, 1);
4978 void
4979 md_create_long_jump (ptr, from_addr, to_addr, frag, to_symbol)
4980 char *ptr;
4981 addressT from_addr, to_addr;
4982 fragS *frag ATTRIBUTE_UNUSED;
4983 symbolS *to_symbol ATTRIBUTE_UNUSED;
4985 offsetT offset;
4987 offset = to_addr - (from_addr + 5);
4988 md_number_to_chars (ptr, (valueT) 0xe9, 1);
4989 md_number_to_chars (ptr + 1, (valueT) offset, 4);
4992 /* Apply a fixup (fixS) to segment data, once it has been determined
4993 by our caller that we have all the info we need to fix it up.
4995 On the 386, immediates, displacements, and data pointers are all in
4996 the same (little-endian) format, so we don't need to care about which
4997 we are handling. */
4999 void
5000 md_apply_fix (fixP, valP, seg)
5001 /* The fix we're to put in. */
5002 fixS *fixP;
5003 /* Pointer to the value of the bits. */
5004 valueT *valP;
5005 /* Segment fix is from. */
5006 segT seg ATTRIBUTE_UNUSED;
5008 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
5009 valueT value = *valP;
5011 #if !defined (TE_Mach)
5012 if (fixP->fx_pcrel)
5014 switch (fixP->fx_r_type)
5016 default:
5017 break;
5019 case BFD_RELOC_64:
5020 fixP->fx_r_type = BFD_RELOC_64_PCREL;
5021 break;
5022 case BFD_RELOC_32:
5023 case BFD_RELOC_X86_64_32S:
5024 fixP->fx_r_type = BFD_RELOC_32_PCREL;
5025 break;
5026 case BFD_RELOC_16:
5027 fixP->fx_r_type = BFD_RELOC_16_PCREL;
5028 break;
5029 case BFD_RELOC_8:
5030 fixP->fx_r_type = BFD_RELOC_8_PCREL;
5031 break;
5035 if (fixP->fx_addsy != NULL
5036 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
5037 || fixP->fx_r_type == BFD_RELOC_64_PCREL
5038 || fixP->fx_r_type == BFD_RELOC_16_PCREL
5039 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
5040 && !use_rela_relocations)
5042 /* This is a hack. There should be a better way to handle this.
5043 This covers for the fact that bfd_install_relocation will
5044 subtract the current location (for partial_inplace, PC relative
5045 relocations); see more below. */
5046 #ifndef OBJ_AOUT
5047 if (IS_ELF
5048 #ifdef TE_PE
5049 || OUTPUT_FLAVOR == bfd_target_coff_flavour
5050 #endif
5052 value += fixP->fx_where + fixP->fx_frag->fr_address;
5053 #endif
5054 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5055 if (IS_ELF)
5057 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
5059 if ((sym_seg == seg
5060 || (symbol_section_p (fixP->fx_addsy)
5061 && sym_seg != absolute_section))
5062 && !generic_force_reloc (fixP))
5064 /* Yes, we add the values in twice. This is because
5065 bfd_install_relocation subtracts them out again. I think
5066 bfd_install_relocation is broken, but I don't dare change
5067 it. FIXME. */
5068 value += fixP->fx_where + fixP->fx_frag->fr_address;
5071 #endif
5072 #if defined (OBJ_COFF) && defined (TE_PE)
5073 /* For some reason, the PE format does not store a
5074 section address offset for a PC relative symbol. */
5075 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
5076 || S_IS_WEAK (fixP->fx_addsy))
5077 value += md_pcrel_from (fixP);
5078 #endif
5081 /* Fix a few things - the dynamic linker expects certain values here,
5082 and we must not disappoint it. */
5083 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5084 if (IS_ELF && fixP->fx_addsy)
5085 switch (fixP->fx_r_type)
5087 case BFD_RELOC_386_PLT32:
5088 case BFD_RELOC_X86_64_PLT32:
5089 /* Make the jump instruction point to the address of the operand. At
5090 runtime we merely add the offset to the actual PLT entry. */
5091 value = -4;
5092 break;
5094 case BFD_RELOC_386_TLS_GD:
5095 case BFD_RELOC_386_TLS_LDM:
5096 case BFD_RELOC_386_TLS_IE_32:
5097 case BFD_RELOC_386_TLS_IE:
5098 case BFD_RELOC_386_TLS_GOTIE:
5099 case BFD_RELOC_386_TLS_GOTDESC:
5100 case BFD_RELOC_X86_64_TLSGD:
5101 case BFD_RELOC_X86_64_TLSLD:
5102 case BFD_RELOC_X86_64_GOTTPOFF:
5103 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
5104 value = 0; /* Fully resolved at runtime. No addend. */
5105 /* Fallthrough */
5106 case BFD_RELOC_386_TLS_LE:
5107 case BFD_RELOC_386_TLS_LDO_32:
5108 case BFD_RELOC_386_TLS_LE_32:
5109 case BFD_RELOC_X86_64_DTPOFF32:
5110 case BFD_RELOC_X86_64_DTPOFF64:
5111 case BFD_RELOC_X86_64_TPOFF32:
5112 case BFD_RELOC_X86_64_TPOFF64:
5113 S_SET_THREAD_LOCAL (fixP->fx_addsy);
5114 break;
5116 case BFD_RELOC_386_TLS_DESC_CALL:
5117 case BFD_RELOC_X86_64_TLSDESC_CALL:
5118 value = 0; /* Fully resolved at runtime. No addend. */
5119 S_SET_THREAD_LOCAL (fixP->fx_addsy);
5120 fixP->fx_done = 0;
5121 return;
5123 case BFD_RELOC_386_GOT32:
5124 case BFD_RELOC_X86_64_GOT32:
5125 value = 0; /* Fully resolved at runtime. No addend. */
5126 break;
5128 case BFD_RELOC_VTABLE_INHERIT:
5129 case BFD_RELOC_VTABLE_ENTRY:
5130 fixP->fx_done = 0;
5131 return;
5133 default:
5134 break;
5136 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
5137 *valP = value;
5138 #endif /* !defined (TE_Mach) */
5140 /* Are we finished with this relocation now? */
5141 if (fixP->fx_addsy == NULL)
5142 fixP->fx_done = 1;
5143 else if (use_rela_relocations)
5145 fixP->fx_no_overflow = 1;
5146 /* Remember value for tc_gen_reloc. */
5147 fixP->fx_addnumber = value;
5148 value = 0;
5151 md_number_to_chars (p, value, fixP->fx_size);
5154 #define MAX_LITTLENUMS 6
5156 /* Turn the string pointed to by litP into a floating point constant
5157 of type TYPE, and emit the appropriate bytes. The number of
5158 LITTLENUMS emitted is stored in *SIZEP. An error message is
5159 returned, or NULL on OK. */
5161 char *
5162 md_atof (type, litP, sizeP)
5163 int type;
5164 char *litP;
5165 int *sizeP;
5167 int prec;
5168 LITTLENUM_TYPE words[MAX_LITTLENUMS];
5169 LITTLENUM_TYPE *wordP;
5170 char *t;
5172 switch (type)
5174 case 'f':
5175 case 'F':
5176 prec = 2;
5177 break;
5179 case 'd':
5180 case 'D':
5181 prec = 4;
5182 break;
5184 case 'x':
5185 case 'X':
5186 prec = 5;
5187 break;
5189 default:
5190 *sizeP = 0;
5191 return _("Bad call to md_atof ()");
5193 t = atof_ieee (input_line_pointer, type, words);
5194 if (t)
5195 input_line_pointer = t;
5197 *sizeP = prec * sizeof (LITTLENUM_TYPE);
5198 /* This loops outputs the LITTLENUMs in REVERSE order; in accord with
5199 the bigendian 386. */
5200 for (wordP = words + prec - 1; prec--;)
5202 md_number_to_chars (litP, (valueT) (*wordP--), sizeof (LITTLENUM_TYPE));
5203 litP += sizeof (LITTLENUM_TYPE);
5205 return 0;
5208 static char output_invalid_buf[8];
5210 static char *
5211 output_invalid (c)
5212 int c;
5214 if (ISPRINT (c))
5215 sprintf (output_invalid_buf, "'%c'", c);
5216 else
5217 sprintf (output_invalid_buf, "(0x%x)", (unsigned) c);
5218 return output_invalid_buf;
5221 /* REG_STRING starts *before* REGISTER_PREFIX. */
5223 static const reg_entry *
5224 parse_real_register (char *reg_string, char **end_op)
5226 char *s = reg_string;
5227 char *p;
5228 char reg_name_given[MAX_REG_NAME_SIZE + 1];
5229 const reg_entry *r;
5231 /* Skip possible REGISTER_PREFIX and possible whitespace. */
5232 if (*s == REGISTER_PREFIX)
5233 ++s;
5235 if (is_space_char (*s))
5236 ++s;
5238 p = reg_name_given;
5239 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
5241 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
5242 return (const reg_entry *) NULL;
5243 s++;
5246 /* For naked regs, make sure that we are not dealing with an identifier.
5247 This prevents confusing an identifier like `eax_var' with register
5248 `eax'. */
5249 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
5250 return (const reg_entry *) NULL;
5252 *end_op = s;
5254 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
5256 /* Handle floating point regs, allowing spaces in the (i) part. */
5257 if (r == i386_regtab /* %st is first entry of table */)
5259 if (is_space_char (*s))
5260 ++s;
5261 if (*s == '(')
5263 ++s;
5264 if (is_space_char (*s))
5265 ++s;
5266 if (*s >= '0' && *s <= '7')
5268 r = &i386_float_regtab[*s - '0'];
5269 ++s;
5270 if (is_space_char (*s))
5271 ++s;
5272 if (*s == ')')
5274 *end_op = s + 1;
5275 return r;
5278 /* We have "%st(" then garbage. */
5279 return (const reg_entry *) NULL;
5283 if (r != NULL
5284 && ((r->reg_flags & (RegRex64 | RegRex)) | (r->reg_type & Reg64)) != 0
5285 && (r->reg_type != Control || !(cpu_arch_flags & CpuSledgehammer))
5286 && flag_code != CODE_64BIT)
5287 return (const reg_entry *) NULL;
5289 return r;
5292 /* REG_STRING starts *before* REGISTER_PREFIX. */
5294 static const reg_entry *
5295 parse_register (char *reg_string, char **end_op)
5297 const reg_entry *r;
5299 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
5300 r = parse_real_register (reg_string, end_op);
5301 else
5302 r = NULL;
5303 if (!r)
5305 char *save = input_line_pointer;
5306 char c;
5307 symbolS *symbolP;
5309 input_line_pointer = reg_string;
5310 c = get_symbol_end ();
5311 symbolP = symbol_find (reg_string);
5312 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
5314 const expressionS *e = symbol_get_value_expression (symbolP);
5316 know (e->X_op == O_register);
5317 know (e->X_add_number >= 0 && (valueT) e->X_add_number < ARRAY_SIZE (i386_regtab));
5318 r = i386_regtab + e->X_add_number;
5319 *end_op = input_line_pointer;
5321 *input_line_pointer = c;
5322 input_line_pointer = save;
5324 return r;
5328 i386_parse_name (char *name, expressionS *e, char *nextcharP)
5330 const reg_entry *r;
5331 char *end = input_line_pointer;
5333 *end = *nextcharP;
5334 r = parse_register (name, &input_line_pointer);
5335 if (r && end <= input_line_pointer)
5337 *nextcharP = *input_line_pointer;
5338 *input_line_pointer = 0;
5339 e->X_op = O_register;
5340 e->X_add_number = r - i386_regtab;
5341 return 1;
5343 input_line_pointer = end;
5344 *end = 0;
5345 return 0;
5348 void
5349 md_operand (expressionS *e)
5351 if (*input_line_pointer == REGISTER_PREFIX)
5353 char *end;
5354 const reg_entry *r = parse_real_register (input_line_pointer, &end);
5356 if (r)
5358 e->X_op = O_register;
5359 e->X_add_number = r - i386_regtab;
5360 input_line_pointer = end;
5366 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5367 const char *md_shortopts = "kVQ:sqn";
5368 #else
5369 const char *md_shortopts = "qn";
5370 #endif
5372 #define OPTION_32 (OPTION_MD_BASE + 0)
5373 #define OPTION_64 (OPTION_MD_BASE + 1)
5374 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
5376 struct option md_longopts[] = {
5377 {"32", no_argument, NULL, OPTION_32},
5378 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5379 {"64", no_argument, NULL, OPTION_64},
5380 #endif
5381 {"divide", no_argument, NULL, OPTION_DIVIDE},
5382 {NULL, no_argument, NULL, 0}
5384 size_t md_longopts_size = sizeof (md_longopts);
5387 md_parse_option (c, arg)
5388 int c;
5389 char *arg ATTRIBUTE_UNUSED;
5391 switch (c)
5393 case 'n':
5394 optimize_align_code = 0;
5395 break;
5397 case 'q':
5398 quiet_warnings = 1;
5399 break;
5401 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5402 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
5403 should be emitted or not. FIXME: Not implemented. */
5404 case 'Q':
5405 break;
5407 /* -V: SVR4 argument to print version ID. */
5408 case 'V':
5409 print_version_id ();
5410 break;
5412 /* -k: Ignore for FreeBSD compatibility. */
5413 case 'k':
5414 break;
5416 case 's':
5417 /* -s: On i386 Solaris, this tells the native assembler to use
5418 .stab instead of .stab.excl. We always use .stab anyhow. */
5419 break;
5421 case OPTION_64:
5423 const char **list, **l;
5425 list = bfd_target_list ();
5426 for (l = list; *l != NULL; l++)
5427 if (strcmp (*l, "elf64-x86-64") == 0)
5429 default_arch = "x86_64";
5430 break;
5432 if (*l == NULL)
5433 as_fatal (_("No compiled in support for x86_64"));
5434 free (list);
5436 break;
5437 #endif
5439 case OPTION_32:
5440 default_arch = "i386";
5441 break;
5443 case OPTION_DIVIDE:
5444 #ifdef SVR4_COMMENT_CHARS
5446 char *n, *t;
5447 const char *s;
5449 n = (char *) xmalloc (strlen (i386_comment_chars) + 1);
5450 t = n;
5451 for (s = i386_comment_chars; *s != '\0'; s++)
5452 if (*s != '/')
5453 *t++ = *s;
5454 *t = '\0';
5455 i386_comment_chars = n;
5457 #endif
5458 break;
5460 default:
5461 return 0;
5463 return 1;
5466 void
5467 md_show_usage (stream)
5468 FILE *stream;
5470 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5471 fprintf (stream, _("\
5472 -Q ignored\n\
5473 -V print assembler version number\n\
5474 -k ignored\n"));
5475 #endif
5476 fprintf (stream, _("\
5477 -n Do not optimize code alignment\n\
5478 -q quieten some warnings\n"));
5479 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5480 fprintf (stream, _("\
5481 -s ignored\n"));
5482 #endif
5483 #ifdef SVR4_COMMENT_CHARS
5484 fprintf (stream, _("\
5485 --divide do not treat `/' as a comment character\n"));
5486 #else
5487 fprintf (stream, _("\
5488 --divide ignored\n"));
5489 #endif
5492 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
5493 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))
5495 /* Pick the target format to use. */
5497 const char *
5498 i386_target_format ()
5500 if (!strcmp (default_arch, "x86_64"))
5501 set_code_flag (CODE_64BIT);
5502 else if (!strcmp (default_arch, "i386"))
5503 set_code_flag (CODE_32BIT);
5504 else
5505 as_fatal (_("Unknown architecture"));
5506 switch (OUTPUT_FLAVOR)
5508 #ifdef OBJ_MAYBE_AOUT
5509 case bfd_target_aout_flavour:
5510 return AOUT_TARGET_FORMAT;
5511 #endif
5512 #ifdef OBJ_MAYBE_COFF
5513 case bfd_target_coff_flavour:
5514 return "coff-i386";
5515 #endif
5516 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
5517 case bfd_target_elf_flavour:
5519 if (flag_code == CODE_64BIT)
5521 object_64bit = 1;
5522 use_rela_relocations = 1;
5524 return flag_code == CODE_64BIT ? "elf64-x86-64" : ELF_TARGET_FORMAT;
5526 #endif
5527 default:
5528 abort ();
5529 return NULL;
5533 #endif /* OBJ_MAYBE_ more than one */
5535 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))
5536 void i386_elf_emit_arch_note ()
5538 if (IS_ELF && cpu_arch_name != NULL)
5540 char *p;
5541 asection *seg = now_seg;
5542 subsegT subseg = now_subseg;
5543 Elf_Internal_Note i_note;
5544 Elf_External_Note e_note;
5545 asection *note_secp;
5546 int len;
5548 /* Create the .note section. */
5549 note_secp = subseg_new (".note", 0);
5550 bfd_set_section_flags (stdoutput,
5551 note_secp,
5552 SEC_HAS_CONTENTS | SEC_READONLY);
5554 /* Process the arch string. */
5555 len = strlen (cpu_arch_name);
5557 i_note.namesz = len + 1;
5558 i_note.descsz = 0;
5559 i_note.type = NT_ARCH;
5560 p = frag_more (sizeof (e_note.namesz));
5561 md_number_to_chars (p, (valueT) i_note.namesz, sizeof (e_note.namesz));
5562 p = frag_more (sizeof (e_note.descsz));
5563 md_number_to_chars (p, (valueT) i_note.descsz, sizeof (e_note.descsz));
5564 p = frag_more (sizeof (e_note.type));
5565 md_number_to_chars (p, (valueT) i_note.type, sizeof (e_note.type));
5566 p = frag_more (len + 1);
5567 strcpy (p, cpu_arch_name);
5569 frag_align (2, 0, 0);
5571 subseg_set (seg, subseg);
5574 #endif
5576 symbolS *
5577 md_undefined_symbol (name)
5578 char *name;
5580 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
5581 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
5582 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
5583 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
5585 if (!GOT_symbol)
5587 if (symbol_find (name))
5588 as_bad (_("GOT already in symbol table"));
5589 GOT_symbol = symbol_new (name, undefined_section,
5590 (valueT) 0, &zero_address_frag);
5592 return GOT_symbol;
5594 return 0;
5597 /* Round up a section size to the appropriate boundary. */
5599 valueT
5600 md_section_align (segment, size)
5601 segT segment ATTRIBUTE_UNUSED;
5602 valueT size;
5604 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
5605 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
5607 /* For a.out, force the section size to be aligned. If we don't do
5608 this, BFD will align it for us, but it will not write out the
5609 final bytes of the section. This may be a bug in BFD, but it is
5610 easier to fix it here since that is how the other a.out targets
5611 work. */
5612 int align;
5614 align = bfd_get_section_alignment (stdoutput, segment);
5615 size = ((size + (1 << align) - 1) & ((valueT) -1 << align));
5617 #endif
5619 return size;
5622 /* On the i386, PC-relative offsets are relative to the start of the
5623 next instruction. That is, the address of the offset, plus its
5624 size, since the offset is always the last part of the insn. */
5626 long
5627 md_pcrel_from (fixP)
5628 fixS *fixP;
5630 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
5633 #ifndef I386COFF
5635 static void
5636 s_bss (ignore)
5637 int ignore ATTRIBUTE_UNUSED;
5639 int temp;
5641 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
5642 if (IS_ELF)
5643 obj_elf_section_change_hook ();
5644 #endif
5645 temp = get_absolute_expression ();
5646 subseg_set (bss_section, (subsegT) temp);
5647 demand_empty_rest_of_line ();
5650 #endif
5652 void
5653 i386_validate_fix (fixp)
5654 fixS *fixp;
5656 if (fixp->fx_subsy && fixp->fx_subsy == GOT_symbol)
5658 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
5660 if (!object_64bit)
5661 abort ();
5662 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
5664 else
5666 if (!object_64bit)
5667 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
5668 else
5669 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
5671 fixp->fx_subsy = 0;
5675 arelent *
5676 tc_gen_reloc (section, fixp)
5677 asection *section ATTRIBUTE_UNUSED;
5678 fixS *fixp;
5680 arelent *rel;
5681 bfd_reloc_code_real_type code;
5683 switch (fixp->fx_r_type)
5685 case BFD_RELOC_X86_64_PLT32:
5686 case BFD_RELOC_X86_64_GOT32:
5687 case BFD_RELOC_X86_64_GOTPCREL:
5688 case BFD_RELOC_386_PLT32:
5689 case BFD_RELOC_386_GOT32:
5690 case BFD_RELOC_386_GOTOFF:
5691 case BFD_RELOC_386_GOTPC:
5692 case BFD_RELOC_386_TLS_GD:
5693 case BFD_RELOC_386_TLS_LDM:
5694 case BFD_RELOC_386_TLS_LDO_32:
5695 case BFD_RELOC_386_TLS_IE_32:
5696 case BFD_RELOC_386_TLS_IE:
5697 case BFD_RELOC_386_TLS_GOTIE:
5698 case BFD_RELOC_386_TLS_LE_32:
5699 case BFD_RELOC_386_TLS_LE:
5700 case BFD_RELOC_386_TLS_GOTDESC:
5701 case BFD_RELOC_386_TLS_DESC_CALL:
5702 case BFD_RELOC_X86_64_TLSGD:
5703 case BFD_RELOC_X86_64_TLSLD:
5704 case BFD_RELOC_X86_64_DTPOFF32:
5705 case BFD_RELOC_X86_64_DTPOFF64:
5706 case BFD_RELOC_X86_64_GOTTPOFF:
5707 case BFD_RELOC_X86_64_TPOFF32:
5708 case BFD_RELOC_X86_64_TPOFF64:
5709 case BFD_RELOC_X86_64_GOTOFF64:
5710 case BFD_RELOC_X86_64_GOTPC32:
5711 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
5712 case BFD_RELOC_X86_64_TLSDESC_CALL:
5713 case BFD_RELOC_RVA:
5714 case BFD_RELOC_VTABLE_ENTRY:
5715 case BFD_RELOC_VTABLE_INHERIT:
5716 #ifdef TE_PE
5717 case BFD_RELOC_32_SECREL:
5718 #endif
5719 code = fixp->fx_r_type;
5720 break;
5721 case BFD_RELOC_X86_64_32S:
5722 if (!fixp->fx_pcrel)
5724 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
5725 code = fixp->fx_r_type;
5726 break;
5728 default:
5729 if (fixp->fx_pcrel)
5731 switch (fixp->fx_size)
5733 default:
5734 as_bad_where (fixp->fx_file, fixp->fx_line,
5735 _("can not do %d byte pc-relative relocation"),
5736 fixp->fx_size);
5737 code = BFD_RELOC_32_PCREL;
5738 break;
5739 case 1: code = BFD_RELOC_8_PCREL; break;
5740 case 2: code = BFD_RELOC_16_PCREL; break;
5741 case 4: code = BFD_RELOC_32_PCREL; break;
5742 #ifdef BFD64
5743 case 8: code = BFD_RELOC_64_PCREL; break;
5744 #endif
5747 else
5749 switch (fixp->fx_size)
5751 default:
5752 as_bad_where (fixp->fx_file, fixp->fx_line,
5753 _("can not do %d byte relocation"),
5754 fixp->fx_size);
5755 code = BFD_RELOC_32;
5756 break;
5757 case 1: code = BFD_RELOC_8; break;
5758 case 2: code = BFD_RELOC_16; break;
5759 case 4: code = BFD_RELOC_32; break;
5760 #ifdef BFD64
5761 case 8: code = BFD_RELOC_64; break;
5762 #endif
5765 break;
5768 if ((code == BFD_RELOC_32
5769 || code == BFD_RELOC_32_PCREL
5770 || code == BFD_RELOC_X86_64_32S)
5771 && GOT_symbol
5772 && fixp->fx_addsy == GOT_symbol)
5774 if (!object_64bit)
5775 code = BFD_RELOC_386_GOTPC;
5776 else
5777 code = BFD_RELOC_X86_64_GOTPC32;
5780 rel = (arelent *) xmalloc (sizeof (arelent));
5781 rel->sym_ptr_ptr = (asymbol **) xmalloc (sizeof (asymbol *));
5782 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
5784 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
5786 if (!use_rela_relocations)
5788 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
5789 vtable entry to be used in the relocation's section offset. */
5790 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
5791 rel->address = fixp->fx_offset;
5793 rel->addend = 0;
5795 /* Use the rela in 64bit mode. */
5796 else
5798 if (!fixp->fx_pcrel)
5799 rel->addend = fixp->fx_offset;
5800 else
5801 switch (code)
5803 case BFD_RELOC_X86_64_PLT32:
5804 case BFD_RELOC_X86_64_GOT32:
5805 case BFD_RELOC_X86_64_GOTPCREL:
5806 case BFD_RELOC_X86_64_TLSGD:
5807 case BFD_RELOC_X86_64_TLSLD:
5808 case BFD_RELOC_X86_64_GOTTPOFF:
5809 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
5810 case BFD_RELOC_X86_64_TLSDESC_CALL:
5811 rel->addend = fixp->fx_offset - fixp->fx_size;
5812 break;
5813 default:
5814 rel->addend = (section->vma
5815 - fixp->fx_size
5816 + fixp->fx_addnumber
5817 + md_pcrel_from (fixp));
5818 break;
5822 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
5823 if (rel->howto == NULL)
5825 as_bad_where (fixp->fx_file, fixp->fx_line,
5826 _("cannot represent relocation type %s"),
5827 bfd_get_reloc_code_name (code));
5828 /* Set howto to a garbage value so that we can keep going. */
5829 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
5830 assert (rel->howto != NULL);
5833 return rel;
5837 /* Parse operands using Intel syntax. This implements a recursive descent
5838 parser based on the BNF grammar published in Appendix B of the MASM 6.1
5839 Programmer's Guide.
5841 FIXME: We do not recognize the full operand grammar defined in the MASM
5842 documentation. In particular, all the structure/union and
5843 high-level macro operands are missing.
5845 Uppercase words are terminals, lower case words are non-terminals.
5846 Objects surrounded by double brackets '[[' ']]' are optional. Vertical
5847 bars '|' denote choices. Most grammar productions are implemented in
5848 functions called 'intel_<production>'.
5850 Initial production is 'expr'.
5852 addOp + | -
5854 alpha [a-zA-Z]
5856 binOp & | AND | \| | OR | ^ | XOR
5858 byteRegister AL | AH | BL | BH | CL | CH | DL | DH
5860 constant digits [[ radixOverride ]]
5862 dataType BYTE | WORD | DWORD | FWORD | QWORD | TBYTE | OWORD | XMMWORD
5864 digits decdigit
5865 | digits decdigit
5866 | digits hexdigit
5868 decdigit [0-9]
5870 e04 e04 addOp e05
5871 | e05
5873 e05 e05 binOp e06
5874 | e06
5876 e06 e06 mulOp e09
5877 | e09
5879 e09 OFFSET e10
5880 | SHORT e10
5881 | + e10
5882 | - e10
5883 | ~ e10
5884 | NOT e10
5885 | e09 PTR e10
5886 | e09 : e10
5887 | e10
5889 e10 e10 [ expr ]
5890 | e11
5892 e11 ( expr )
5893 | [ expr ]
5894 | constant
5895 | dataType
5896 | id
5898 | register
5900 => expr expr cmpOp e04
5901 | e04
5903 gpRegister AX | EAX | BX | EBX | CX | ECX | DX | EDX
5904 | BP | EBP | SP | ESP | DI | EDI | SI | ESI
5906 hexdigit a | b | c | d | e | f
5907 | A | B | C | D | E | F
5909 id alpha
5910 | id alpha
5911 | id decdigit
5913 mulOp * | / | % | MOD | << | SHL | >> | SHR
5915 quote " | '
5917 register specialRegister
5918 | gpRegister
5919 | byteRegister
5921 segmentRegister CS | DS | ES | FS | GS | SS
5923 specialRegister CR0 | CR2 | CR3 | CR4
5924 | DR0 | DR1 | DR2 | DR3 | DR6 | DR7
5925 | TR3 | TR4 | TR5 | TR6 | TR7
5927 We simplify the grammar in obvious places (e.g., register parsing is
5928 done by calling parse_register) and eliminate immediate left recursion
5929 to implement a recursive-descent parser.
5931 expr e04 expr'
5933 expr' cmpOp e04 expr'
5934 | Empty
5936 e04 e05 e04'
5938 e04' addOp e05 e04'
5939 | Empty
5941 e05 e06 e05'
5943 e05' binOp e06 e05'
5944 | Empty
5946 e06 e09 e06'
5948 e06' mulOp e09 e06'
5949 | Empty
5951 e09 OFFSET e10 e09'
5952 | SHORT e10'
5953 | + e10'
5954 | - e10'
5955 | ~ e10'
5956 | NOT e10'
5957 | e10 e09'
5959 e09' PTR e10 e09'
5960 | : e10 e09'
5961 | Empty
5963 e10 e11 e10'
5965 e10' [ expr ] e10'
5966 | Empty
5968 e11 ( expr )
5969 | [ expr ]
5970 | BYTE
5971 | WORD
5972 | DWORD
5973 | FWORD
5974 | QWORD
5975 | TBYTE
5976 | OWORD
5977 | XMMWORD
5980 | register
5981 | id
5982 | constant */
5984 /* Parsing structure for the intel syntax parser. Used to implement the
5985 semantic actions for the operand grammar. */
5986 struct intel_parser_s
5988 char *op_string; /* The string being parsed. */
5989 int got_a_float; /* Whether the operand is a float. */
5990 int op_modifier; /* Operand modifier. */
5991 int is_mem; /* 1 if operand is memory reference. */
5992 int in_offset; /* >=1 if parsing operand of offset. */
5993 int in_bracket; /* >=1 if parsing operand in brackets. */
5994 const reg_entry *reg; /* Last register reference found. */
5995 char *disp; /* Displacement string being built. */
5996 char *next_operand; /* Resume point when splitting operands. */
5999 static struct intel_parser_s intel_parser;
6001 /* Token structure for parsing intel syntax. */
6002 struct intel_token
6004 int code; /* Token code. */
6005 const reg_entry *reg; /* Register entry for register tokens. */
6006 char *str; /* String representation. */
6009 static struct intel_token cur_token, prev_token;
6011 /* Token codes for the intel parser. Since T_SHORT is already used
6012 by COFF, undefine it first to prevent a warning. */
6013 #define T_NIL -1
6014 #define T_CONST 1
6015 #define T_REG 2
6016 #define T_BYTE 3
6017 #define T_WORD 4
6018 #define T_DWORD 5
6019 #define T_FWORD 6
6020 #define T_QWORD 7
6021 #define T_TBYTE 8
6022 #define T_XMMWORD 9
6023 #undef T_SHORT
6024 #define T_SHORT 10
6025 #define T_OFFSET 11
6026 #define T_PTR 12
6027 #define T_ID 13
6028 #define T_SHL 14
6029 #define T_SHR 15
6031 /* Prototypes for intel parser functions. */
6032 static int intel_match_token PARAMS ((int code));
6033 static void intel_get_token PARAMS ((void));
6034 static void intel_putback_token PARAMS ((void));
6035 static int intel_expr PARAMS ((void));
6036 static int intel_e04 PARAMS ((void));
6037 static int intel_e05 PARAMS ((void));
6038 static int intel_e06 PARAMS ((void));
6039 static int intel_e09 PARAMS ((void));
6040 static int intel_bracket_expr PARAMS ((void));
6041 static int intel_e10 PARAMS ((void));
6042 static int intel_e11 PARAMS ((void));
6044 static int
6045 i386_intel_operand (operand_string, got_a_float)
6046 char *operand_string;
6047 int got_a_float;
6049 int ret;
6050 char *p;
6052 p = intel_parser.op_string = xstrdup (operand_string);
6053 intel_parser.disp = (char *) xmalloc (strlen (operand_string) + 1);
6055 for (;;)
6057 /* Initialize token holders. */
6058 cur_token.code = prev_token.code = T_NIL;
6059 cur_token.reg = prev_token.reg = NULL;
6060 cur_token.str = prev_token.str = NULL;
6062 /* Initialize parser structure. */
6063 intel_parser.got_a_float = got_a_float;
6064 intel_parser.op_modifier = 0;
6065 intel_parser.is_mem = 0;
6066 intel_parser.in_offset = 0;
6067 intel_parser.in_bracket = 0;
6068 intel_parser.reg = NULL;
6069 intel_parser.disp[0] = '\0';
6070 intel_parser.next_operand = NULL;
6072 /* Read the first token and start the parser. */
6073 intel_get_token ();
6074 ret = intel_expr ();
6076 if (!ret)
6077 break;
6079 if (cur_token.code != T_NIL)
6081 as_bad (_("invalid operand for '%s' ('%s' unexpected)"),
6082 current_templates->start->name, cur_token.str);
6083 ret = 0;
6085 /* If we found a memory reference, hand it over to i386_displacement
6086 to fill in the rest of the operand fields. */
6087 else if (intel_parser.is_mem)
6089 if ((i.mem_operands == 1
6090 && (current_templates->start->opcode_modifier & IsString) == 0)
6091 || i.mem_operands == 2)
6093 as_bad (_("too many memory references for '%s'"),
6094 current_templates->start->name);
6095 ret = 0;
6097 else
6099 char *s = intel_parser.disp;
6100 i.mem_operands++;
6102 if (!quiet_warnings && intel_parser.is_mem < 0)
6103 /* See the comments in intel_bracket_expr. */
6104 as_warn (_("Treating `%s' as memory reference"), operand_string);
6106 /* Add the displacement expression. */
6107 if (*s != '\0')
6108 ret = i386_displacement (s, s + strlen (s));
6109 if (ret)
6111 /* Swap base and index in 16-bit memory operands like
6112 [si+bx]. Since i386_index_check is also used in AT&T
6113 mode we have to do that here. */
6114 if (i.base_reg
6115 && i.index_reg
6116 && (i.base_reg->reg_type & Reg16)
6117 && (i.index_reg->reg_type & Reg16)
6118 && i.base_reg->reg_num >= 6
6119 && i.index_reg->reg_num < 6)
6121 const reg_entry *base = i.index_reg;
6123 i.index_reg = i.base_reg;
6124 i.base_reg = base;
6126 ret = i386_index_check (operand_string);
6131 /* Constant and OFFSET expressions are handled by i386_immediate. */
6132 else if ((intel_parser.op_modifier & (1 << T_OFFSET))
6133 || intel_parser.reg == NULL)
6134 ret = i386_immediate (intel_parser.disp);
6136 if (intel_parser.next_operand && this_operand >= MAX_OPERANDS - 1)
6137 ret = 0;
6138 if (!ret || !intel_parser.next_operand)
6139 break;
6140 intel_parser.op_string = intel_parser.next_operand;
6141 this_operand = i.operands++;
6144 free (p);
6145 free (intel_parser.disp);
6147 return ret;
6150 #define NUM_ADDRESS_REGS (!!i.base_reg + !!i.index_reg)
6152 /* expr e04 expr'
6154 expr' cmpOp e04 expr'
6155 | Empty */
6156 static int
6157 intel_expr ()
6159 /* XXX Implement the comparison operators. */
6160 return intel_e04 ();
6163 /* e04 e05 e04'
6165 e04' addOp e05 e04'
6166 | Empty */
6167 static int
6168 intel_e04 ()
6170 int nregs = -1;
6172 for (;;)
6174 if (!intel_e05())
6175 return 0;
6177 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6178 i.base_reg = i386_regtab + REGNAM_AL; /* al is invalid as base */
6180 if (cur_token.code == '+')
6181 nregs = -1;
6182 else if (cur_token.code == '-')
6183 nregs = NUM_ADDRESS_REGS;
6184 else
6185 return 1;
6187 strcat (intel_parser.disp, cur_token.str);
6188 intel_match_token (cur_token.code);
6192 /* e05 e06 e05'
6194 e05' binOp e06 e05'
6195 | Empty */
6196 static int
6197 intel_e05 ()
6199 int nregs = ~NUM_ADDRESS_REGS;
6201 for (;;)
6203 if (!intel_e06())
6204 return 0;
6206 if (cur_token.code == '&' || cur_token.code == '|' || cur_token.code == '^')
6208 char str[2];
6210 str[0] = cur_token.code;
6211 str[1] = 0;
6212 strcat (intel_parser.disp, str);
6214 else
6215 break;
6217 intel_match_token (cur_token.code);
6219 if (nregs < 0)
6220 nregs = ~nregs;
6222 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6223 i.base_reg = i386_regtab + REGNAM_AL + 1; /* cl is invalid as base */
6224 return 1;
6227 /* e06 e09 e06'
6229 e06' mulOp e09 e06'
6230 | Empty */
6231 static int
6232 intel_e06 ()
6234 int nregs = ~NUM_ADDRESS_REGS;
6236 for (;;)
6238 if (!intel_e09())
6239 return 0;
6241 if (cur_token.code == '*' || cur_token.code == '/' || cur_token.code == '%')
6243 char str[2];
6245 str[0] = cur_token.code;
6246 str[1] = 0;
6247 strcat (intel_parser.disp, str);
6249 else if (cur_token.code == T_SHL)
6250 strcat (intel_parser.disp, "<<");
6251 else if (cur_token.code == T_SHR)
6252 strcat (intel_parser.disp, ">>");
6253 else
6254 break;
6256 intel_match_token (cur_token.code);
6258 if (nregs < 0)
6259 nregs = ~nregs;
6261 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6262 i.base_reg = i386_regtab + REGNAM_AL + 2; /* dl is invalid as base */
6263 return 1;
6266 /* e09 OFFSET e09
6267 | SHORT e09
6268 | + e09
6269 | - e09
6270 | ~ e09
6271 | NOT e09
6272 | e10 e09'
6274 e09' PTR e10 e09'
6275 | : e10 e09'
6276 | Empty */
6277 static int
6278 intel_e09 ()
6280 int nregs = ~NUM_ADDRESS_REGS;
6281 int in_offset = 0;
6283 for (;;)
6285 /* Don't consume constants here. */
6286 if (cur_token.code == '+' || cur_token.code == '-')
6288 /* Need to look one token ahead - if the next token
6289 is a constant, the current token is its sign. */
6290 int next_code;
6292 intel_match_token (cur_token.code);
6293 next_code = cur_token.code;
6294 intel_putback_token ();
6295 if (next_code == T_CONST)
6296 break;
6299 /* e09 OFFSET e09 */
6300 if (cur_token.code == T_OFFSET)
6302 if (!in_offset++)
6303 ++intel_parser.in_offset;
6306 /* e09 SHORT e09 */
6307 else if (cur_token.code == T_SHORT)
6308 intel_parser.op_modifier |= 1 << T_SHORT;
6310 /* e09 + e09 */
6311 else if (cur_token.code == '+')
6312 strcat (intel_parser.disp, "+");
6314 /* e09 - e09
6315 | ~ e09
6316 | NOT e09 */
6317 else if (cur_token.code == '-' || cur_token.code == '~')
6319 char str[2];
6321 if (nregs < 0)
6322 nregs = ~nregs;
6323 str[0] = cur_token.code;
6324 str[1] = 0;
6325 strcat (intel_parser.disp, str);
6328 /* e09 e10 e09' */
6329 else
6330 break;
6332 intel_match_token (cur_token.code);
6335 for (;;)
6337 if (!intel_e10 ())
6338 return 0;
6340 /* e09' PTR e10 e09' */
6341 if (cur_token.code == T_PTR)
6343 char suffix;
6345 if (prev_token.code == T_BYTE)
6346 suffix = BYTE_MNEM_SUFFIX;
6348 else if (prev_token.code == T_WORD)
6350 if (current_templates->start->name[0] == 'l'
6351 && current_templates->start->name[2] == 's'
6352 && current_templates->start->name[3] == 0)
6353 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6354 else if (intel_parser.got_a_float == 2) /* "fi..." */
6355 suffix = SHORT_MNEM_SUFFIX;
6356 else
6357 suffix = WORD_MNEM_SUFFIX;
6360 else if (prev_token.code == T_DWORD)
6362 if (current_templates->start->name[0] == 'l'
6363 && current_templates->start->name[2] == 's'
6364 && current_templates->start->name[3] == 0)
6365 suffix = WORD_MNEM_SUFFIX;
6366 else if (flag_code == CODE_16BIT
6367 && (current_templates->start->opcode_modifier
6368 & (Jump | JumpDword)))
6369 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6370 else if (intel_parser.got_a_float == 1) /* "f..." */
6371 suffix = SHORT_MNEM_SUFFIX;
6372 else
6373 suffix = LONG_MNEM_SUFFIX;
6376 else if (prev_token.code == T_FWORD)
6378 if (current_templates->start->name[0] == 'l'
6379 && current_templates->start->name[2] == 's'
6380 && current_templates->start->name[3] == 0)
6381 suffix = LONG_MNEM_SUFFIX;
6382 else if (!intel_parser.got_a_float)
6384 if (flag_code == CODE_16BIT)
6385 add_prefix (DATA_PREFIX_OPCODE);
6386 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6388 else
6389 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6392 else if (prev_token.code == T_QWORD)
6394 if (intel_parser.got_a_float == 1) /* "f..." */
6395 suffix = LONG_MNEM_SUFFIX;
6396 else
6397 suffix = QWORD_MNEM_SUFFIX;
6400 else if (prev_token.code == T_TBYTE)
6402 if (intel_parser.got_a_float == 1)
6403 suffix = LONG_DOUBLE_MNEM_SUFFIX;
6404 else
6405 suffix = BYTE_MNEM_SUFFIX; /* so it will cause an error */
6408 else if (prev_token.code == T_XMMWORD)
6410 /* XXX ignored for now, but accepted since gcc uses it */
6411 suffix = 0;
6414 else
6416 as_bad (_("Unknown operand modifier `%s'"), prev_token.str);
6417 return 0;
6420 /* Operands for jump/call using 'ptr' notation denote absolute
6421 addresses. */
6422 if (current_templates->start->opcode_modifier & (Jump | JumpDword))
6423 i.types[this_operand] |= JumpAbsolute;
6425 if (current_templates->start->base_opcode == 0x8d /* lea */)
6427 else if (!i.suffix)
6428 i.suffix = suffix;
6429 else if (i.suffix != suffix)
6431 as_bad (_("Conflicting operand modifiers"));
6432 return 0;
6437 /* e09' : e10 e09' */
6438 else if (cur_token.code == ':')
6440 if (prev_token.code != T_REG)
6442 /* While {call,jmp} SSSS:OOOO is MASM syntax only when SSSS is a
6443 segment/group identifier (which we don't have), using comma
6444 as the operand separator there is even less consistent, since
6445 there all branches only have a single operand. */
6446 if (this_operand != 0
6447 || intel_parser.in_offset
6448 || intel_parser.in_bracket
6449 || (!(current_templates->start->opcode_modifier
6450 & (Jump|JumpDword|JumpInterSegment))
6451 && !(current_templates->start->operand_types[0]
6452 & JumpAbsolute)))
6453 return intel_match_token (T_NIL);
6454 /* Remember the start of the 2nd operand and terminate 1st
6455 operand here.
6456 XXX This isn't right, yet (when SSSS:OOOO is right operand of
6457 another expression), but it gets at least the simplest case
6458 (a plain number or symbol on the left side) right. */
6459 intel_parser.next_operand = intel_parser.op_string;
6460 *--intel_parser.op_string = '\0';
6461 return intel_match_token (':');
6465 /* e09' Empty */
6466 else
6467 break;
6469 intel_match_token (cur_token.code);
6473 if (in_offset)
6475 --intel_parser.in_offset;
6476 if (nregs < 0)
6477 nregs = ~nregs;
6478 if (NUM_ADDRESS_REGS > nregs)
6480 as_bad (_("Invalid operand to `OFFSET'"));
6481 return 0;
6483 intel_parser.op_modifier |= 1 << T_OFFSET;
6486 if (nregs >= 0 && NUM_ADDRESS_REGS > nregs)
6487 i.base_reg = i386_regtab + REGNAM_AL + 3; /* bl is invalid as base */
6488 return 1;
6491 static int
6492 intel_bracket_expr ()
6494 int was_offset = intel_parser.op_modifier & (1 << T_OFFSET);
6495 const char *start = intel_parser.op_string;
6496 int len;
6498 if (i.op[this_operand].regs)
6499 return intel_match_token (T_NIL);
6501 intel_match_token ('[');
6503 /* Mark as a memory operand only if it's not already known to be an
6504 offset expression. If it's an offset expression, we need to keep
6505 the brace in. */
6506 if (!intel_parser.in_offset)
6508 ++intel_parser.in_bracket;
6510 /* Operands for jump/call inside brackets denote absolute addresses. */
6511 if (current_templates->start->opcode_modifier & (Jump | JumpDword))
6512 i.types[this_operand] |= JumpAbsolute;
6514 /* Unfortunately gas always diverged from MASM in a respect that can't
6515 be easily fixed without risking to break code sequences likely to be
6516 encountered (the testsuite even check for this): MASM doesn't consider
6517 an expression inside brackets unconditionally as a memory reference.
6518 When that is e.g. a constant, an offset expression, or the sum of the
6519 two, this is still taken as a constant load. gas, however, always
6520 treated these as memory references. As a compromise, we'll try to make
6521 offset expressions inside brackets work the MASM way (since that's
6522 less likely to be found in real world code), but make constants alone
6523 continue to work the traditional gas way. In either case, issue a
6524 warning. */
6525 intel_parser.op_modifier &= ~was_offset;
6527 else
6528 strcat (intel_parser.disp, "[");
6530 /* Add a '+' to the displacement string if necessary. */
6531 if (*intel_parser.disp != '\0'
6532 && *(intel_parser.disp + strlen (intel_parser.disp) - 1) != '+')
6533 strcat (intel_parser.disp, "+");
6535 if (intel_expr ()
6536 && (len = intel_parser.op_string - start - 1,
6537 intel_match_token (']')))
6539 /* Preserve brackets when the operand is an offset expression. */
6540 if (intel_parser.in_offset)
6541 strcat (intel_parser.disp, "]");
6542 else
6544 --intel_parser.in_bracket;
6545 if (i.base_reg || i.index_reg)
6546 intel_parser.is_mem = 1;
6547 if (!intel_parser.is_mem)
6549 if (!(intel_parser.op_modifier & (1 << T_OFFSET)))
6550 /* Defer the warning until all of the operand was parsed. */
6551 intel_parser.is_mem = -1;
6552 else if (!quiet_warnings)
6553 as_warn (_("`[%.*s]' taken to mean just `%.*s'"), len, start, len, start);
6556 intel_parser.op_modifier |= was_offset;
6558 return 1;
6560 return 0;
6563 /* e10 e11 e10'
6565 e10' [ expr ] e10'
6566 | Empty */
6567 static int
6568 intel_e10 ()
6570 if (!intel_e11 ())
6571 return 0;
6573 while (cur_token.code == '[')
6575 if (!intel_bracket_expr ())
6576 return 0;
6579 return 1;
6582 /* e11 ( expr )
6583 | [ expr ]
6584 | BYTE
6585 | WORD
6586 | DWORD
6587 | FWORD
6588 | QWORD
6589 | TBYTE
6590 | OWORD
6591 | XMMWORD
6594 | register
6595 | id
6596 | constant */
6597 static int
6598 intel_e11 ()
6600 switch (cur_token.code)
6602 /* e11 ( expr ) */
6603 case '(':
6604 intel_match_token ('(');
6605 strcat (intel_parser.disp, "(");
6607 if (intel_expr () && intel_match_token (')'))
6609 strcat (intel_parser.disp, ")");
6610 return 1;
6612 return 0;
6614 /* e11 [ expr ] */
6615 case '[':
6616 return intel_bracket_expr ();
6618 /* e11 $
6619 | . */
6620 case '.':
6621 strcat (intel_parser.disp, cur_token.str);
6622 intel_match_token (cur_token.code);
6624 /* Mark as a memory operand only if it's not already known to be an
6625 offset expression. */
6626 if (!intel_parser.in_offset)
6627 intel_parser.is_mem = 1;
6629 return 1;
6631 /* e11 register */
6632 case T_REG:
6634 const reg_entry *reg = intel_parser.reg = cur_token.reg;
6636 intel_match_token (T_REG);
6638 /* Check for segment change. */
6639 if (cur_token.code == ':')
6641 if (!(reg->reg_type & (SReg2 | SReg3)))
6643 as_bad (_("`%s' is not a valid segment register"), reg->reg_name);
6644 return 0;
6646 else if (i.seg[i.mem_operands])
6647 as_warn (_("Extra segment override ignored"));
6648 else
6650 if (!intel_parser.in_offset)
6651 intel_parser.is_mem = 1;
6652 switch (reg->reg_num)
6654 case 0:
6655 i.seg[i.mem_operands] = &es;
6656 break;
6657 case 1:
6658 i.seg[i.mem_operands] = &cs;
6659 break;
6660 case 2:
6661 i.seg[i.mem_operands] = &ss;
6662 break;
6663 case 3:
6664 i.seg[i.mem_operands] = &ds;
6665 break;
6666 case 4:
6667 i.seg[i.mem_operands] = &fs;
6668 break;
6669 case 5:
6670 i.seg[i.mem_operands] = &gs;
6671 break;
6676 /* Not a segment register. Check for register scaling. */
6677 else if (cur_token.code == '*')
6679 if (!intel_parser.in_bracket)
6681 as_bad (_("Register scaling only allowed in memory operands"));
6682 return 0;
6685 if (reg->reg_type & Reg16) /* Disallow things like [si*1]. */
6686 reg = i386_regtab + REGNAM_AX + 4; /* sp is invalid as index */
6687 else if (i.index_reg)
6688 reg = i386_regtab + REGNAM_EAX + 4; /* esp is invalid as index */
6690 /* What follows must be a valid scale. */
6691 intel_match_token ('*');
6692 i.index_reg = reg;
6693 i.types[this_operand] |= BaseIndex;
6695 /* Set the scale after setting the register (otherwise,
6696 i386_scale will complain) */
6697 if (cur_token.code == '+' || cur_token.code == '-')
6699 char *str, sign = cur_token.code;
6700 intel_match_token (cur_token.code);
6701 if (cur_token.code != T_CONST)
6703 as_bad (_("Syntax error: Expecting a constant, got `%s'"),
6704 cur_token.str);
6705 return 0;
6707 str = (char *) xmalloc (strlen (cur_token.str) + 2);
6708 strcpy (str + 1, cur_token.str);
6709 *str = sign;
6710 if (!i386_scale (str))
6711 return 0;
6712 free (str);
6714 else if (!i386_scale (cur_token.str))
6715 return 0;
6716 intel_match_token (cur_token.code);
6719 /* No scaling. If this is a memory operand, the register is either a
6720 base register (first occurrence) or an index register (second
6721 occurrence). */
6722 else if (intel_parser.in_bracket)
6725 if (!i.base_reg)
6726 i.base_reg = reg;
6727 else if (!i.index_reg)
6728 i.index_reg = reg;
6729 else
6731 as_bad (_("Too many register references in memory operand"));
6732 return 0;
6735 i.types[this_operand] |= BaseIndex;
6738 /* It's neither base nor index. */
6739 else if (!intel_parser.in_offset && !intel_parser.is_mem)
6741 i.types[this_operand] |= reg->reg_type & ~BaseIndex;
6742 i.op[this_operand].regs = reg;
6743 i.reg_operands++;
6745 else
6747 as_bad (_("Invalid use of register"));
6748 return 0;
6751 /* Since registers are not part of the displacement string (except
6752 when we're parsing offset operands), we may need to remove any
6753 preceding '+' from the displacement string. */
6754 if (*intel_parser.disp != '\0'
6755 && !intel_parser.in_offset)
6757 char *s = intel_parser.disp;
6758 s += strlen (s) - 1;
6759 if (*s == '+')
6760 *s = '\0';
6763 return 1;
6766 /* e11 BYTE
6767 | WORD
6768 | DWORD
6769 | FWORD
6770 | QWORD
6771 | TBYTE
6772 | OWORD
6773 | XMMWORD */
6774 case T_BYTE:
6775 case T_WORD:
6776 case T_DWORD:
6777 case T_FWORD:
6778 case T_QWORD:
6779 case T_TBYTE:
6780 case T_XMMWORD:
6781 intel_match_token (cur_token.code);
6783 if (cur_token.code == T_PTR)
6784 return 1;
6786 /* It must have been an identifier. */
6787 intel_putback_token ();
6788 cur_token.code = T_ID;
6789 /* FALLTHRU */
6791 /* e11 id
6792 | constant */
6793 case T_ID:
6794 if (!intel_parser.in_offset && intel_parser.is_mem <= 0)
6796 symbolS *symbolP;
6798 /* The identifier represents a memory reference only if it's not
6799 preceded by an offset modifier and if it's not an equate. */
6800 symbolP = symbol_find(cur_token.str);
6801 if (!symbolP || S_GET_SEGMENT(symbolP) != absolute_section)
6802 intel_parser.is_mem = 1;
6804 /* FALLTHRU */
6806 case T_CONST:
6807 case '-':
6808 case '+':
6810 char *save_str, sign = 0;
6812 /* Allow constants that start with `+' or `-'. */
6813 if (cur_token.code == '-' || cur_token.code == '+')
6815 sign = cur_token.code;
6816 intel_match_token (cur_token.code);
6817 if (cur_token.code != T_CONST)
6819 as_bad (_("Syntax error: Expecting a constant, got `%s'"),
6820 cur_token.str);
6821 return 0;
6825 save_str = (char *) xmalloc (strlen (cur_token.str) + 2);
6826 strcpy (save_str + !!sign, cur_token.str);
6827 if (sign)
6828 *save_str = sign;
6830 /* Get the next token to check for register scaling. */
6831 intel_match_token (cur_token.code);
6833 /* Check if this constant is a scaling factor for an index register. */
6834 if (cur_token.code == '*')
6836 if (intel_match_token ('*') && cur_token.code == T_REG)
6838 const reg_entry *reg = cur_token.reg;
6840 if (!intel_parser.in_bracket)
6842 as_bad (_("Register scaling only allowed in memory operands"));
6843 return 0;
6846 if (reg->reg_type & Reg16) /* Disallow things like [1*si]. */
6847 reg = i386_regtab + REGNAM_AX + 4; /* sp is invalid as index */
6848 else if (i.index_reg)
6849 reg = i386_regtab + REGNAM_EAX + 4; /* esp is invalid as index */
6851 /* The constant is followed by `* reg', so it must be
6852 a valid scale. */
6853 i.index_reg = reg;
6854 i.types[this_operand] |= BaseIndex;
6856 /* Set the scale after setting the register (otherwise,
6857 i386_scale will complain) */
6858 if (!i386_scale (save_str))
6859 return 0;
6860 intel_match_token (T_REG);
6862 /* Since registers are not part of the displacement
6863 string, we may need to remove any preceding '+' from
6864 the displacement string. */
6865 if (*intel_parser.disp != '\0')
6867 char *s = intel_parser.disp;
6868 s += strlen (s) - 1;
6869 if (*s == '+')
6870 *s = '\0';
6873 free (save_str);
6875 return 1;
6878 /* The constant was not used for register scaling. Since we have
6879 already consumed the token following `*' we now need to put it
6880 back in the stream. */
6881 intel_putback_token ();
6884 /* Add the constant to the displacement string. */
6885 strcat (intel_parser.disp, save_str);
6886 free (save_str);
6888 return 1;
6892 as_bad (_("Unrecognized token '%s'"), cur_token.str);
6893 return 0;
6896 /* Match the given token against cur_token. If they match, read the next
6897 token from the operand string. */
6898 static int
6899 intel_match_token (code)
6900 int code;
6902 if (cur_token.code == code)
6904 intel_get_token ();
6905 return 1;
6907 else
6909 as_bad (_("Unexpected token `%s'"), cur_token.str);
6910 return 0;
6914 /* Read a new token from intel_parser.op_string and store it in cur_token. */
6915 static void
6916 intel_get_token ()
6918 char *end_op;
6919 const reg_entry *reg;
6920 struct intel_token new_token;
6922 new_token.code = T_NIL;
6923 new_token.reg = NULL;
6924 new_token.str = NULL;
6926 /* Free the memory allocated to the previous token and move
6927 cur_token to prev_token. */
6928 if (prev_token.str)
6929 free (prev_token.str);
6931 prev_token = cur_token;
6933 /* Skip whitespace. */
6934 while (is_space_char (*intel_parser.op_string))
6935 intel_parser.op_string++;
6937 /* Return an empty token if we find nothing else on the line. */
6938 if (*intel_parser.op_string == '\0')
6940 cur_token = new_token;
6941 return;
6944 /* The new token cannot be larger than the remainder of the operand
6945 string. */
6946 new_token.str = (char *) xmalloc (strlen (intel_parser.op_string) + 1);
6947 new_token.str[0] = '\0';
6949 if (strchr ("0123456789", *intel_parser.op_string))
6951 char *p = new_token.str;
6952 char *q = intel_parser.op_string;
6953 new_token.code = T_CONST;
6955 /* Allow any kind of identifier char to encompass floating point and
6956 hexadecimal numbers. */
6957 while (is_identifier_char (*q))
6958 *p++ = *q++;
6959 *p = '\0';
6961 /* Recognize special symbol names [0-9][bf]. */
6962 if (strlen (intel_parser.op_string) == 2
6963 && (intel_parser.op_string[1] == 'b'
6964 || intel_parser.op_string[1] == 'f'))
6965 new_token.code = T_ID;
6968 else if ((reg = parse_register (intel_parser.op_string, &end_op)) != NULL)
6970 size_t len = end_op - intel_parser.op_string;
6972 new_token.code = T_REG;
6973 new_token.reg = reg;
6975 memcpy (new_token.str, intel_parser.op_string, len);
6976 new_token.str[len] = '\0';
6979 else if (is_identifier_char (*intel_parser.op_string))
6981 char *p = new_token.str;
6982 char *q = intel_parser.op_string;
6984 /* A '.' or '$' followed by an identifier char is an identifier.
6985 Otherwise, it's operator '.' followed by an expression. */
6986 if ((*q == '.' || *q == '$') && !is_identifier_char (*(q + 1)))
6988 new_token.code = '.';
6989 new_token.str[0] = '.';
6990 new_token.str[1] = '\0';
6992 else
6994 while (is_identifier_char (*q) || *q == '@')
6995 *p++ = *q++;
6996 *p = '\0';
6998 if (strcasecmp (new_token.str, "NOT") == 0)
6999 new_token.code = '~';
7001 else if (strcasecmp (new_token.str, "MOD") == 0)
7002 new_token.code = '%';
7004 else if (strcasecmp (new_token.str, "AND") == 0)
7005 new_token.code = '&';
7007 else if (strcasecmp (new_token.str, "OR") == 0)
7008 new_token.code = '|';
7010 else if (strcasecmp (new_token.str, "XOR") == 0)
7011 new_token.code = '^';
7013 else if (strcasecmp (new_token.str, "SHL") == 0)
7014 new_token.code = T_SHL;
7016 else if (strcasecmp (new_token.str, "SHR") == 0)
7017 new_token.code = T_SHR;
7019 else if (strcasecmp (new_token.str, "BYTE") == 0)
7020 new_token.code = T_BYTE;
7022 else if (strcasecmp (new_token.str, "WORD") == 0)
7023 new_token.code = T_WORD;
7025 else if (strcasecmp (new_token.str, "DWORD") == 0)
7026 new_token.code = T_DWORD;
7028 else if (strcasecmp (new_token.str, "FWORD") == 0)
7029 new_token.code = T_FWORD;
7031 else if (strcasecmp (new_token.str, "QWORD") == 0)
7032 new_token.code = T_QWORD;
7034 else if (strcasecmp (new_token.str, "TBYTE") == 0
7035 /* XXX remove (gcc still uses it) */
7036 || strcasecmp (new_token.str, "XWORD") == 0)
7037 new_token.code = T_TBYTE;
7039 else if (strcasecmp (new_token.str, "XMMWORD") == 0
7040 || strcasecmp (new_token.str, "OWORD") == 0)
7041 new_token.code = T_XMMWORD;
7043 else if (strcasecmp (new_token.str, "PTR") == 0)
7044 new_token.code = T_PTR;
7046 else if (strcasecmp (new_token.str, "SHORT") == 0)
7047 new_token.code = T_SHORT;
7049 else if (strcasecmp (new_token.str, "OFFSET") == 0)
7051 new_token.code = T_OFFSET;
7053 /* ??? This is not mentioned in the MASM grammar but gcc
7054 makes use of it with -mintel-syntax. OFFSET may be
7055 followed by FLAT: */
7056 if (strncasecmp (q, " FLAT:", 6) == 0)
7057 strcat (new_token.str, " FLAT:");
7060 /* ??? This is not mentioned in the MASM grammar. */
7061 else if (strcasecmp (new_token.str, "FLAT") == 0)
7063 new_token.code = T_OFFSET;
7064 if (*q == ':')
7065 strcat (new_token.str, ":");
7066 else
7067 as_bad (_("`:' expected"));
7070 else
7071 new_token.code = T_ID;
7075 else if (strchr ("+-/*%|&^:[]()~", *intel_parser.op_string))
7077 new_token.code = *intel_parser.op_string;
7078 new_token.str[0] = *intel_parser.op_string;
7079 new_token.str[1] = '\0';
7082 else if (strchr ("<>", *intel_parser.op_string)
7083 && *intel_parser.op_string == *(intel_parser.op_string + 1))
7085 new_token.code = *intel_parser.op_string == '<' ? T_SHL : T_SHR;
7086 new_token.str[0] = *intel_parser.op_string;
7087 new_token.str[1] = *intel_parser.op_string;
7088 new_token.str[2] = '\0';
7091 else
7092 as_bad (_("Unrecognized token `%s'"), intel_parser.op_string);
7094 intel_parser.op_string += strlen (new_token.str);
7095 cur_token = new_token;
7098 /* Put cur_token back into the token stream and make cur_token point to
7099 prev_token. */
7100 static void
7101 intel_putback_token ()
7103 if (cur_token.code != T_NIL)
7105 intel_parser.op_string -= strlen (cur_token.str);
7106 free (cur_token.str);
7108 cur_token = prev_token;
7110 /* Forget prev_token. */
7111 prev_token.code = T_NIL;
7112 prev_token.reg = NULL;
7113 prev_token.str = NULL;
7117 tc_x86_regname_to_dw2regnum (const char *regname)
7119 unsigned int regnum;
7120 unsigned int regnames_count;
7121 static const char *const regnames_32[] =
7123 "eax", "ecx", "edx", "ebx",
7124 "esp", "ebp", "esi", "edi",
7125 "eip", "eflags", NULL,
7126 "st0", "st1", "st2", "st3",
7127 "st4", "st5", "st6", "st7",
7128 NULL, NULL,
7129 "xmm0", "xmm1", "xmm2", "xmm3",
7130 "xmm4", "xmm5", "xmm6", "xmm7",
7131 "mm0", "mm1", "mm2", "mm3",
7132 "mm4", "mm5", "mm6", "mm7",
7133 "fcw", "fsw", "mxcsr",
7134 "es", "cs", "ss", "ds", "fs", "gs", NULL, NULL,
7135 "tr", "ldtr"
7137 static const char *const regnames_64[] =
7139 "rax", "rdx", "rcx", "rbx",
7140 "rsi", "rdi", "rbp", "rsp",
7141 "r8", "r9", "r10", "r11",
7142 "r12", "r13", "r14", "r15",
7143 "rip",
7144 "xmm0", "xmm1", "xmm2", "xmm3",
7145 "xmm4", "xmm5", "xmm6", "xmm7",
7146 "xmm8", "xmm9", "xmm10", "xmm11",
7147 "xmm12", "xmm13", "xmm14", "xmm15",
7148 "st0", "st1", "st2", "st3",
7149 "st4", "st5", "st6", "st7",
7150 "mm0", "mm1", "mm2", "mm3",
7151 "mm4", "mm5", "mm6", "mm7",
7152 "rflags",
7153 "es", "cs", "ss", "ds", "fs", "gs", NULL, NULL,
7154 "fs.base", "gs.base", NULL, NULL,
7155 "tr", "ldtr",
7156 "mxcsr", "fcw", "fsw"
7158 const char *const *regnames;
7160 if (flag_code == CODE_64BIT)
7162 regnames = regnames_64;
7163 regnames_count = ARRAY_SIZE (regnames_64);
7165 else
7167 regnames = regnames_32;
7168 regnames_count = ARRAY_SIZE (regnames_32);
7171 for (regnum = 0; regnum < regnames_count; regnum++)
7172 if (regnames[regnum] != NULL
7173 && strcmp (regname, regnames[regnum]) == 0)
7174 return regnum;
7176 return -1;
7179 void
7180 tc_x86_frame_initial_instructions (void)
7182 static unsigned int sp_regno;
7184 if (!sp_regno)
7185 sp_regno = tc_x86_regname_to_dw2regnum (flag_code == CODE_64BIT
7186 ? "rsp" : "esp");
7188 cfi_add_CFA_def_cfa (sp_regno, -x86_cie_data_alignment);
7189 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
7193 i386_elf_section_type (const char *str, size_t len)
7195 if (flag_code == CODE_64BIT
7196 && len == sizeof ("unwind") - 1
7197 && strncmp (str, "unwind", 6) == 0)
7198 return SHT_X86_64_UNWIND;
7200 return -1;
7203 #ifdef TE_PE
7204 void
7205 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
7207 expressionS expr;
7209 expr.X_op = O_secrel;
7210 expr.X_add_symbol = symbol;
7211 expr.X_add_number = 0;
7212 emit_expr (&expr, size);
7214 #endif
7216 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7217 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
7220 x86_64_section_letter (int letter, char **ptr_msg)
7222 if (flag_code == CODE_64BIT)
7224 if (letter == 'l')
7225 return SHF_X86_64_LARGE;
7227 *ptr_msg = _("Bad .section directive: want a,l,w,x,M,S,G,T in string");
7229 else
7230 *ptr_msg = _("Bad .section directive: want a,w,x,M,S,G,T in string");
7231 return -1;
7235 x86_64_section_word (char *str, size_t len)
7237 if (len == 5 && flag_code == CODE_64BIT && strncmp (str, "large", 5) == 0)
7238 return SHF_X86_64_LARGE;
7240 return -1;
7243 static void
7244 handle_large_common (int small ATTRIBUTE_UNUSED)
7246 if (flag_code != CODE_64BIT)
7248 s_comm_internal (0, elf_common_parse);
7249 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
7251 else
7253 static segT lbss_section;
7254 asection *saved_com_section_ptr = elf_com_section_ptr;
7255 asection *saved_bss_section = bss_section;
7257 if (lbss_section == NULL)
7259 flagword applicable;
7260 segT seg = now_seg;
7261 subsegT subseg = now_subseg;
7263 /* The .lbss section is for local .largecomm symbols. */
7264 lbss_section = subseg_new (".lbss", 0);
7265 applicable = bfd_applicable_section_flags (stdoutput);
7266 bfd_set_section_flags (stdoutput, lbss_section,
7267 applicable & SEC_ALLOC);
7268 seg_info (lbss_section)->bss = 1;
7270 subseg_set (seg, subseg);
7273 elf_com_section_ptr = &_bfd_elf_large_com_section;
7274 bss_section = lbss_section;
7276 s_comm_internal (0, elf_common_parse);
7278 elf_com_section_ptr = saved_com_section_ptr;
7279 bss_section = saved_bss_section;
7282 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */