1 /* ----------------------------------------------------------------------- *
3 * Copyright 1996-2010 The NASM Authors - All Rights Reserved
4 * See the file AUTHORS included with the NASM distribution for
5 * the specific copyright holders.
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following
11 * * Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * * Redistributions in binary form must reproduce the above
14 * copyright notice, this list of conditions and the following
15 * disclaimer in the documentation and/or other materials provided
16 * with the distribution.
18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
19 * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
20 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
21 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
22 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
23 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
24 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
25 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
26 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
28 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
29 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
30 * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32 * ----------------------------------------------------------------------- */
35 * assemble.c code generation for the Netwide Assembler
37 * the actual codes (C syntax, i.e. octal):
38 * \0 - terminates the code. (Unless it's a literal of course.)
39 * \1..\4 - that many literal bytes follow in the code stream
40 * \5 - add 4 to the primary operand number (b, low octdigit)
41 * \6 - add 4 to the secondary operand number (a, middle octdigit)
42 * \7 - add 4 to both the primary and the secondary operand number
43 * \10..\13 - a literal byte follows in the code stream, to be added
44 * to the register value of operand 0..3
45 * \14..\17 - a signed byte immediate operand, from operand 0..3
46 * \20..\23 - a byte immediate operand, from operand 0..3
47 * \24..\27 - an unsigned byte immediate operand, from operand 0..3
48 * \30..\33 - a word immediate operand, from operand 0..3
49 * \34..\37 - select between \3[0-3] and \4[0-3] depending on 16/32 bit
50 * assembly mode or the operand-size override on the operand
51 * \40..\43 - a long immediate operand, from operand 0..3
52 * \44..\47 - select between \3[0-3], \4[0-3] and \5[4-7]
53 * depending on the address size of the instruction.
54 * \50..\53 - a byte relative operand, from operand 0..3
55 * \54..\57 - a qword immediate operand, from operand 0..3
56 * \60..\63 - a word relative operand, from operand 0..3
57 * \64..\67 - select between \6[0-3] and \7[0-3] depending on 16/32 bit
58 * assembly mode or the operand-size override on the operand
59 * \70..\73 - a long relative operand, from operand 0..3
60 * \74..\77 - a word constant, from the _segment_ part of operand 0..3
61 * \1ab - a ModRM, calculated on EA in operand a, with the spare
62 * field the register value of operand b.
63 * \140..\143 - an immediate word or signed byte for operand 0..3
64 * \144..\147 - or 2 (s-field) into opcode byte if operand 0..3
65 * is a signed byte rather than a word. Opcode byte follows.
66 * \150..\153 - an immediate dword or signed byte for operand 0..3
67 * \154..\157 - or 2 (s-field) into opcode byte if operand 0..3
68 * is a signed byte rather than a dword. Opcode byte follows.
69 * \160..\163 - this instruction uses DREX rather than REX, with the
70 * OC0 field set to 0, and the dest field taken from
72 * \164..\167 - this instruction uses DREX rather than REX, with the
73 * OC0 field set to 1, and the dest field taken from
75 * \171 - placement of DREX suffix in the absence of an EA
76 * \172\ab - the register number from operand a in bits 7..4, with
77 * the 4-bit immediate from operand b in bits 3..0.
78 * \173\xab - the register number from operand a in bits 7..4, with
79 * the value b in bits 3..0.
80 * \174\a - the register number from operand a in bits 7..4, and
81 * an arbitrary value in bits 3..0 (assembled as zero.)
82 * \2ab - a ModRM, calculated on EA in operand a, with the spare
83 * field equal to digit b.
84 * \250..\253 - same as \150..\153, except warn if the 64-bit operand
85 * is not equal to the truncated and sign-extended 32-bit
86 * operand; used for 32-bit immediates in 64-bit mode.
87 * \254..\257 - a signed 32-bit operand to be extended to 64 bits.
88 * \260..\263 - this instruction uses VEX/XOP rather than REX, with the
89 * V field taken from operand 0..3.
90 * \270 - this instruction uses VEX/XOP rather than REX, with the
91 * V field set to 1111b.
93 * VEX/XOP prefixes are followed by the sequence:
94 * \tmm\wlp where mm is the M field; and wlp is:
96 * [l0] ll = 0 for L = 0 (.128, .lz)
97 * [l1] ll = 1 for L = 1 (.256)
98 * [lig] ll = 2 for L don't care (always assembled as 0)
100 * [w0] ww = 0 for W = 0
101 * [w1 ] ww = 1 for W = 1
102 * [wig] ww = 2 for W don't care (always assembled as 0)
103 * [ww] ww = 3 for W used as REX.W
105 * t = 0 for VEX (C4/C5), t = 1 for XOP (8F).
107 * \274..\277 - a signed byte immediate operand, from operand 0..3,
108 * which is to be extended to the operand size.
109 * \310 - indicates fixed 16-bit address size, i.e. optional 0x67.
110 * \311 - indicates fixed 32-bit address size, i.e. optional 0x67.
111 * \312 - (disassembler only) invalid with non-default address size.
112 * \313 - indicates fixed 64-bit address size, 0x67 invalid.
113 * \314 - (disassembler only) invalid with REX.B
114 * \315 - (disassembler only) invalid with REX.X
115 * \316 - (disassembler only) invalid with REX.R
116 * \317 - (disassembler only) invalid with REX.W
117 * \320 - indicates fixed 16-bit operand size, i.e. optional 0x66.
118 * \321 - indicates fixed 32-bit operand size, i.e. optional 0x66.
119 * \322 - indicates that this instruction is only valid when the
120 * operand size is the default (instruction to disassembler,
121 * generates no code in the assembler)
122 * \323 - indicates fixed 64-bit operand size, REX on extensions only.
123 * \324 - indicates 64-bit operand size requiring REX prefix.
124 * \325 - instruction which always uses spl/bpl/sil/dil
125 * \330 - a literal byte follows in the code stream, to be added
126 * to the condition code value of the instruction.
127 * \331 - instruction not valid with REP prefix. Hint for
128 * disassembler only; for SSE instructions.
129 * \332 - REP prefix (0xF2 byte) used as opcode extension.
130 * \333 - REP prefix (0xF3 byte) used as opcode extension.
131 * \334 - LOCK prefix used as REX.R (used in non-64-bit mode)
132 * \335 - disassemble a rep (0xF3 byte) prefix as repe not rep.
133 * \336 - force a REP(E) prefix (0xF2) even if not specified.
134 * \337 - force a REPNE prefix (0xF3) even if not specified.
135 * \336-\337 are still listed as prefixes in the disassembler.
136 * \340 - reserve <operand 0> bytes of uninitialized storage.
137 * Operand 0 had better be a segmentless constant.
138 * \341 - this instruction needs a WAIT "prefix"
139 * \344,\345 - the PUSH/POP (respectively) codes for CS, DS, ES, SS
140 * (POP is never used for CS) depending on operand 0
141 * \346,\347 - the second byte of PUSH/POP codes for FS, GS, depending
143 * \360 - no SSE prefix (== \364\331)
144 * \361 - 66 SSE prefix (== \366\331)
145 * \362 - F2 SSE prefix (== \364\332)
146 * \363 - F3 SSE prefix (== \364\333)
147 * \364 - operand-size prefix (0x66) not permitted
148 * \365 - address-size prefix (0x67) not permitted
149 * \366 - operand-size prefix (0x66) used as opcode extension
150 * \367 - address-size prefix (0x67) used as opcode extension
151 * \370,\371,\372 - match only if operand 0 meets byte jump criteria.
152 * 370 is used for Jcc, 371 is used for JMP.
153 * \373 - assemble 0x03 if bits==16, 0x05 if bits==32;
154 * used for conditional jump over longer jump
157 #include "compiler.h"
161 #include <inttypes.h>
165 #include "assemble.h"
171 * Matching errors. These should be sorted so that more specific
172 * errors come later in the sequence.
180 * Matching success; the conditional ones first
182 MOK_JUMP
, /* Matching OK but needs jmp_match() */
183 MOK_GOOD
/* Matching unconditionally OK */
187 int sib_present
; /* is a SIB byte necessary? */
188 int bytes
; /* # of bytes of offset needed */
189 int size
; /* lazy - this is sib+bytes+1 */
190 uint8_t modrm
, sib
, rex
, rip
; /* the bytes themselves */
193 static uint32_t cpu
; /* cpu level received from nasm.c */
194 static efunc errfunc
;
195 static struct ofmt
*outfmt
;
196 static ListGen
*list
;
198 static int64_t calcsize(int32_t, int64_t, int, insn
*, const uint8_t *);
199 static void gencode(int32_t segment
, int64_t offset
, int bits
,
200 insn
* ins
, const struct itemplate
*temp
,
202 static enum match_result
find_match(const struct itemplate
**tempp
,
204 int32_t segment
, int64_t offset
, int bits
);
205 static enum match_result
matches(const struct itemplate
*, insn
*, int bits
);
206 static opflags_t
regflag(const operand
*);
207 static int32_t regval(const operand
*);
208 static int rexflags(int, opflags_t
, int);
209 static int op_rexflags(const operand
*, int);
210 static ea
*process_ea(operand
*, ea
*, int, int, int, opflags_t
);
211 static void add_asp(insn
*, int);
213 static int has_prefix(insn
* ins
, enum prefix_pos pos
, enum prefixes prefix
)
215 return ins
->prefixes
[pos
] == prefix
;
218 static void assert_no_prefix(insn
* ins
, enum prefix_pos pos
)
220 if (ins
->prefixes
[pos
])
221 errfunc(ERR_NONFATAL
, "invalid %s prefix",
222 prefix_name(ins
->prefixes
[pos
]));
225 static const char *size_name(int size
)
247 static void warn_overflow(int pass
, int size
)
249 errfunc(ERR_WARNING
| pass
| ERR_WARN_NOV
,
250 "%s data exceeds bounds", size_name(size
));
253 static void warn_overflow_const(int64_t data
, int size
)
255 if (overflow_general(data
, size
))
256 warn_overflow(ERR_PASS1
, size
);
259 static void warn_overflow_opd(const struct operand
*o
, int size
)
261 if (o
->wrt
== NO_SEG
&& o
->segment
== NO_SEG
) {
262 if (overflow_general(o
->offset
, size
))
263 warn_overflow(ERR_PASS2
, size
);
268 * This routine wrappers the real output format's output routine,
269 * in order to pass a copy of the data off to the listing file
270 * generator at the same time.
272 static void out(int64_t offset
, int32_t segto
, const void *data
,
273 enum out_type type
, uint64_t size
,
274 int32_t segment
, int32_t wrt
)
276 static int32_t lineno
= 0; /* static!!! */
277 static char *lnfname
= NULL
;
280 if (type
== OUT_ADDRESS
&& segment
== NO_SEG
&& wrt
== NO_SEG
) {
282 * This is a non-relocated address, and we're going to
283 * convert it into RAWDATA format.
288 errfunc(ERR_PANIC
, "OUT_ADDRESS with size > 8");
292 WRITEADDR(q
, *(int64_t *)data
, size
);
297 list
->output(offset
, data
, type
, size
);
300 * this call to src_get determines when we call the
301 * debug-format-specific "linenum" function
302 * it updates lineno and lnfname to the current values
303 * returning 0 if "same as last time", -2 if lnfname
304 * changed, and the amount by which lineno changed,
305 * if it did. thus, these variables must be static
308 if (src_get(&lineno
, &lnfname
))
309 outfmt
->current_dfmt
->linenum(lnfname
, lineno
, segto
);
311 outfmt
->output(segto
, data
, type
, size
, segment
, wrt
);
314 static bool jmp_match(int32_t segment
, int64_t offset
, int bits
,
315 insn
* ins
, const uint8_t *code
)
320 if ((c
!= 0370 && c
!= 0371) || (ins
->oprs
[0].type
& STRICT
))
324 if (optimizing
< 0 && c
== 0371)
327 isize
= calcsize(segment
, offset
, bits
, ins
, code
);
329 if (ins
->oprs
[0].opflags
& OPFLAG_UNKNOWN
)
330 /* Be optimistic in pass 1 */
333 if (ins
->oprs
[0].segment
!= segment
)
336 isize
= ins
->oprs
[0].offset
- offset
- isize
; /* isize is delta */
337 return (isize
>= -128 && isize
<= 127); /* is it byte size? */
340 int64_t assemble(int32_t segment
, int64_t offset
, int bits
, uint32_t cp
,
341 insn
* instruction
, struct ofmt
*output
, efunc error
,
344 const struct itemplate
*temp
;
349 int64_t start
= offset
;
350 int64_t wsize
; /* size for DB etc. */
352 errfunc
= error
; /* to pass to other functions */
354 outfmt
= output
; /* likewise */
355 list
= listgen
; /* and again */
357 wsize
= idata_bytes(instruction
->opcode
);
363 int32_t t
= instruction
->times
;
366 "instruction->times < 0 (%ld) in assemble()", t
);
368 while (t
--) { /* repeat TIMES times */
369 list_for_each(e
, instruction
->eops
) {
370 if (e
->type
== EOT_DB_NUMBER
) {
372 errfunc(ERR_NONFATAL
,
373 "integer supplied to a DT, DO or DY"
376 out(offset
, segment
, &e
->offset
,
377 OUT_ADDRESS
, wsize
, e
->segment
, e
->wrt
);
380 } else if (e
->type
== EOT_DB_STRING
||
381 e
->type
== EOT_DB_STRING_FREE
) {
384 out(offset
, segment
, e
->stringval
,
385 OUT_RAWDATA
, e
->stringlen
, NO_SEG
, NO_SEG
);
386 align
= e
->stringlen
% wsize
;
389 align
= wsize
- align
;
390 out(offset
, segment
, zero_buffer
,
391 OUT_RAWDATA
, align
, NO_SEG
, NO_SEG
);
393 offset
+= e
->stringlen
+ align
;
396 if (t
> 0 && t
== instruction
->times
- 1) {
398 * Dummy call to list->output to give the offset to the
401 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
402 list
->uplevel(LIST_TIMES
);
405 if (instruction
->times
> 1)
406 list
->downlevel(LIST_TIMES
);
407 return offset
- start
;
410 if (instruction
->opcode
== I_INCBIN
) {
411 const char *fname
= instruction
->eops
->stringval
;
414 fp
= fopen(fname
, "rb");
416 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
418 } else if (fseek(fp
, 0L, SEEK_END
) < 0) {
419 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
422 static char buf
[4096];
423 size_t t
= instruction
->times
;
428 if (instruction
->eops
->next
) {
429 base
= instruction
->eops
->next
->offset
;
431 if (instruction
->eops
->next
->next
&&
432 len
> (size_t)instruction
->eops
->next
->next
->offset
)
433 len
= (size_t)instruction
->eops
->next
->next
->offset
;
436 * Dummy call to list->output to give the offset to the
439 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
440 list
->uplevel(LIST_INCBIN
);
444 fseek(fp
, base
, SEEK_SET
);
448 m
= fread(buf
, 1, l
> sizeof(buf
) ? sizeof(buf
) : l
, fp
);
451 * This shouldn't happen unless the file
452 * actually changes while we are reading
456 "`incbin': unexpected EOF while"
457 " reading file `%s'", fname
);
458 t
= 0; /* Try to exit cleanly */
461 out(offset
, segment
, buf
, OUT_RAWDATA
, m
,
466 list
->downlevel(LIST_INCBIN
);
467 if (instruction
->times
> 1) {
469 * Dummy call to list->output to give the offset to the
472 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
473 list
->uplevel(LIST_TIMES
);
474 list
->downlevel(LIST_TIMES
);
477 return instruction
->times
* len
;
479 return 0; /* if we're here, there's an error */
482 /* Check to see if we need an address-size prefix */
483 add_asp(instruction
, bits
);
485 m
= find_match(&temp
, instruction
, segment
, offset
, bits
);
489 int64_t insn_size
= calcsize(segment
, offset
, bits
,
490 instruction
, temp
->code
);
491 itimes
= instruction
->times
;
492 if (insn_size
< 0) /* shouldn't be, on pass two */
493 error(ERR_PANIC
, "errors made it through from pass one");
496 for (j
= 0; j
< MAXPREFIX
; j
++) {
498 switch (instruction
->prefixes
[j
]) {
516 error(ERR_WARNING
| ERR_PASS2
,
517 "cs segment base generated, but will be ignored in 64-bit mode");
523 error(ERR_WARNING
| ERR_PASS2
,
524 "ds segment base generated, but will be ignored in 64-bit mode");
530 error(ERR_WARNING
| ERR_PASS2
,
531 "es segment base generated, but will be ignored in 64-bit mode");
543 error(ERR_WARNING
| ERR_PASS2
,
544 "ss segment base generated, but will be ignored in 64-bit mode");
551 "segr6 and segr7 cannot be used as prefixes");
556 "16-bit addressing is not supported "
558 } else if (bits
!= 16)
568 "64-bit addressing is only supported "
592 error(ERR_PANIC
, "invalid instruction prefix");
595 out(offset
, segment
, &c
, OUT_RAWDATA
, 1,
600 insn_end
= offset
+ insn_size
;
601 gencode(segment
, offset
, bits
, instruction
,
604 if (itimes
> 0 && itimes
== instruction
->times
- 1) {
606 * Dummy call to list->output to give the offset to the
609 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
610 list
->uplevel(LIST_TIMES
);
613 if (instruction
->times
> 1)
614 list
->downlevel(LIST_TIMES
);
615 return offset
- start
;
619 case MERR_OPSIZEMISSING
:
620 error(ERR_NONFATAL
, "operation size not specified");
622 case MERR_OPSIZEMISMATCH
:
623 error(ERR_NONFATAL
, "mismatch in operand sizes");
626 error(ERR_NONFATAL
, "no instruction for this cpu level");
629 error(ERR_NONFATAL
, "instruction not supported in %d-bit mode",
634 "invalid combination of opcode and operands");
641 int64_t insn_size(int32_t segment
, int64_t offset
, int bits
, uint32_t cp
,
642 insn
* instruction
, efunc error
)
644 const struct itemplate
*temp
;
647 errfunc
= error
; /* to pass to other functions */
650 if (instruction
->opcode
== I_none
)
653 if (instruction
->opcode
== I_DB
|| instruction
->opcode
== I_DW
||
654 instruction
->opcode
== I_DD
|| instruction
->opcode
== I_DQ
||
655 instruction
->opcode
== I_DT
|| instruction
->opcode
== I_DO
||
656 instruction
->opcode
== I_DY
) {
658 int32_t isize
, osize
, wsize
;
661 wsize
= idata_bytes(instruction
->opcode
);
663 list_for_each(e
, instruction
->eops
) {
667 if (e
->type
== EOT_DB_NUMBER
) {
669 warn_overflow_const(e
->offset
, wsize
);
670 } else if (e
->type
== EOT_DB_STRING
||
671 e
->type
== EOT_DB_STRING_FREE
)
672 osize
= e
->stringlen
;
674 align
= (-osize
) % wsize
;
677 isize
+= osize
+ align
;
679 return isize
* instruction
->times
;
682 if (instruction
->opcode
== I_INCBIN
) {
683 const char *fname
= instruction
->eops
->stringval
;
688 fp
= fopen(fname
, "rb");
690 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
692 else if (fseek(fp
, 0L, SEEK_END
) < 0)
693 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
697 if (instruction
->eops
->next
) {
698 len
-= instruction
->eops
->next
->offset
;
699 if (instruction
->eops
->next
->next
&&
700 len
> (size_t)instruction
->eops
->next
->next
->offset
) {
701 len
= (size_t)instruction
->eops
->next
->next
->offset
;
704 val
= instruction
->times
* len
;
711 /* Check to see if we need an address-size prefix */
712 add_asp(instruction
, bits
);
714 m
= find_match(&temp
, instruction
, segment
, offset
, bits
);
716 /* we've matched an instruction. */
718 const uint8_t *codes
= temp
->code
;
721 isize
= calcsize(segment
, offset
, bits
, instruction
, codes
);
724 for (j
= 0; j
< MAXPREFIX
; j
++) {
725 switch (instruction
->prefixes
[j
]) {
751 return isize
* instruction
->times
;
753 return -1; /* didn't match any instruction */
757 static bool possible_sbyte(operand
*o
)
759 return o
->wrt
== NO_SEG
&& o
->segment
== NO_SEG
&&
760 !(o
->opflags
& OPFLAG_UNKNOWN
) &&
761 optimizing
>= 0 && !(o
->type
& STRICT
);
764 /* check that opn[op] is a signed byte of size 16 or 32 */
765 static bool is_sbyte16(operand
*o
)
769 if (!possible_sbyte(o
))
773 return v
>= -128 && v
<= 127;
776 static bool is_sbyte32(operand
*o
)
780 if (!possible_sbyte(o
))
784 return v
>= -128 && v
<= 127;
787 /* Common construct */
788 #define case4(x) case (x): case (x)+1: case (x)+2: case (x)+3
790 static int64_t calcsize(int32_t segment
, int64_t offset
, int bits
,
791 insn
* ins
, const uint8_t *codes
)
800 ins
->rex
= 0; /* Ensure REX is reset */
802 if (ins
->prefixes
[PPS_OSIZE
] == P_O64
)
805 (void)segment
; /* Don't warn that this parameter is unused */
806 (void)offset
; /* Don't warn that this parameter is unused */
810 op1
= (c
& 3) + ((opex
& 1) << 2);
811 op2
= ((c
>> 3) & 3) + ((opex
& 2) << 1);
812 opx
= &ins
->oprs
[op1
];
813 opex
= 0; /* For the next iteration */
820 codes
+= c
, length
+= c
;
831 op_rexflags(opx
, REX_B
|REX_H
|REX_P
|REX_W
);
846 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
847 length
+= (opx
->type
& BITS16
) ? 2 : 4;
849 length
+= (bits
== 16) ? 2 : 4;
857 length
+= ins
->addr_size
>> 3;
865 length
+= 8; /* MOV reg64/imm */
873 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
874 length
+= (opx
->type
& BITS16
) ? 2 : 4;
876 length
+= (bits
== 16) ? 2 : 4;
888 length
+= is_sbyte16(opx
) ? 1 : 2;
897 length
+= is_sbyte32(opx
) ? 1 : 4;
908 ins
->drexdst
= regval(opx
);
913 ins
->rex
|= REX_D
|REX_OC
;
914 ins
->drexdst
= regval(opx
);
928 length
+= is_sbyte32(opx
) ? 1 : 4;
937 ins
->drexdst
= regval(opx
);
938 ins
->vex_cm
= *codes
++;
939 ins
->vex_wlp
= *codes
++;
945 ins
->vex_cm
= *codes
++;
946 ins
->vex_wlp
= *codes
++;
959 length
+= (bits
!= 16) && !has_prefix(ins
, PPS_ASIZE
, P_A16
);
963 length
+= (bits
!= 32) && !has_prefix(ins
, PPS_ASIZE
, P_A32
);
970 if (bits
!= 64 || has_prefix(ins
, PPS_ASIZE
, P_A16
) ||
971 has_prefix(ins
, PPS_ASIZE
, P_A32
))
980 enum prefixes pfx
= ins
->prefixes
[PPS_OSIZE
];
984 errfunc(ERR_WARNING
| ERR_PASS2
, "invalid operand size prefix");
986 ins
->prefixes
[PPS_OSIZE
] = P_O16
;
992 enum prefixes pfx
= ins
->prefixes
[PPS_OSIZE
];
996 errfunc(ERR_WARNING
| ERR_PASS2
, "invalid operand size prefix");
998 ins
->prefixes
[PPS_OSIZE
] = P_O32
;
1037 if (!ins
->prefixes
[PPS_LREP
])
1038 ins
->prefixes
[PPS_LREP
] = P_REP
;
1042 if (!ins
->prefixes
[PPS_LREP
])
1043 ins
->prefixes
[PPS_LREP
] = P_REPNE
;
1047 if (ins
->oprs
[0].segment
!= NO_SEG
)
1048 errfunc(ERR_NONFATAL
, "attempt to reserve non-constant"
1049 " quantity of BSS space");
1051 length
+= ins
->oprs
[0].offset
;
1055 if (!ins
->prefixes
[PPS_WAIT
])
1056 ins
->prefixes
[PPS_WAIT
] = P_WAIT
;
1106 struct operand
*opy
= &ins
->oprs
[op2
];
1108 ea_data
.rex
= 0; /* Ensure ea.REX is initially 0 */
1111 /* pick rfield from operand b (opx) */
1112 rflags
= regflag(opx
);
1113 rfield
= nasm_regvals
[opx
->basereg
];
1118 if (!process_ea(opy
, &ea_data
, bits
,
1119 ins
->addr_size
, rfield
, rflags
)) {
1120 errfunc(ERR_NONFATAL
, "invalid effective address");
1123 ins
->rex
|= ea_data
.rex
;
1124 length
+= ea_data
.size
;
1130 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1131 ": instruction code \\%o (0x%02X) given", c
, c
);
1136 ins
->rex
&= rex_mask
;
1138 if (ins
->rex
& REX_NH
) {
1139 if (ins
->rex
& REX_H
) {
1140 errfunc(ERR_NONFATAL
, "instruction cannot use high registers");
1143 ins
->rex
&= ~REX_P
; /* Don't force REX prefix due to high reg */
1146 if (ins
->rex
& REX_V
) {
1147 int bad32
= REX_R
|REX_W
|REX_X
|REX_B
;
1149 if (ins
->rex
& REX_H
) {
1150 errfunc(ERR_NONFATAL
, "cannot use high register in vex instruction");
1153 switch (ins
->vex_wlp
& 060) {
1167 if (bits
!= 64 && ((ins
->rex
& bad32
) || ins
->drexdst
> 7)) {
1168 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1171 if (ins
->vex_cm
!= 1 || (ins
->rex
& (REX_W
|REX_X
|REX_B
)))
1175 } else if (ins
->rex
& REX_D
) {
1176 if (ins
->rex
& REX_H
) {
1177 errfunc(ERR_NONFATAL
, "cannot use high register in drex instruction");
1180 if (bits
!= 64 && ((ins
->rex
& (REX_R
|REX_W
|REX_X
|REX_B
)) ||
1181 ins
->drexdst
> 7)) {
1182 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1186 } else if (ins
->rex
& REX_REAL
) {
1187 if (ins
->rex
& REX_H
) {
1188 errfunc(ERR_NONFATAL
, "cannot use high register in rex instruction");
1190 } else if (bits
== 64) {
1192 } else if ((ins
->rex
& REX_L
) &&
1193 !(ins
->rex
& (REX_P
|REX_W
|REX_X
|REX_B
)) &&
1196 assert_no_prefix(ins
, PPS_LREP
);
1199 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1207 #define EMIT_REX() \
1208 if (!(ins->rex & (REX_D|REX_V)) && (ins->rex & REX_REAL) && (bits == 64)) { \
1209 ins->rex = (ins->rex & REX_REAL)|REX_P; \
1210 out(offset, segment, &ins->rex, OUT_RAWDATA, 1, NO_SEG, NO_SEG); \
1215 static void gencode(int32_t segment
, int64_t offset
, int bits
,
1216 insn
* ins
, const struct itemplate
*temp
,
1219 static char condval
[] = { /* conditional opcodes */
1220 0x7, 0x3, 0x2, 0x6, 0x2, 0x4, 0xF, 0xD, 0xC, 0xE, 0x6, 0x2,
1221 0x3, 0x7, 0x3, 0x5, 0xE, 0xC, 0xD, 0xF, 0x1, 0xB, 0x9, 0x5,
1222 0x0, 0xA, 0xA, 0xB, 0x8, 0x4
1229 struct operand
*opx
;
1230 const uint8_t *codes
= temp
->code
;
1235 op1
= (c
& 3) + ((opex
& 1) << 2);
1236 op2
= ((c
>> 3) & 3) + ((opex
& 2) << 1);
1237 opx
= &ins
->oprs
[op1
];
1238 opex
= 0; /* For the next iteration */
1246 out(offset
, segment
, codes
, OUT_RAWDATA
, c
, NO_SEG
, NO_SEG
);
1259 bytes
[0] = *codes
++ + (regval(opx
) & 7);
1260 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1266 * The test for BITS8 and SBYTE here is intended to avoid
1267 * warning on optimizer actions due to SBYTE, while still
1268 * warn on explicit BYTE directives. Also warn, obviously,
1269 * if the optimizer isn't enabled.
1271 if (((opx
->type
& BITS8
) ||
1272 !(opx
->type
& temp
->opd
[op1
] & BYTENESS
)) &&
1273 (opx
->offset
< -128 || opx
->offset
> 127)) {
1274 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1275 "signed byte value exceeds bounds");
1277 if (opx
->segment
!= NO_SEG
) {
1279 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1280 opx
->segment
, opx
->wrt
);
1282 bytes
[0] = opx
->offset
;
1283 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1290 if (opx
->offset
< -256 || opx
->offset
> 255) {
1291 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1292 "byte value exceeds bounds");
1294 if (opx
->segment
!= NO_SEG
) {
1296 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1297 opx
->segment
, opx
->wrt
);
1299 bytes
[0] = opx
->offset
;
1300 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1307 if (opx
->offset
< 0 || opx
->offset
> 255)
1308 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1309 "unsigned byte value exceeds bounds");
1310 if (opx
->segment
!= NO_SEG
) {
1312 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1313 opx
->segment
, opx
->wrt
);
1315 bytes
[0] = opx
->offset
;
1316 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1323 warn_overflow_opd(opx
, 2);
1325 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1326 opx
->segment
, opx
->wrt
);
1331 if (opx
->type
& (BITS16
| BITS32
))
1332 size
= (opx
->type
& BITS16
) ? 2 : 4;
1334 size
= (bits
== 16) ? 2 : 4;
1335 warn_overflow_opd(opx
, size
);
1337 out(offset
, segment
, &data
, OUT_ADDRESS
, size
,
1338 opx
->segment
, opx
->wrt
);
1343 warn_overflow_opd(opx
, 4);
1345 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1346 opx
->segment
, opx
->wrt
);
1352 size
= ins
->addr_size
>> 3;
1353 warn_overflow_opd(opx
, size
);
1354 out(offset
, segment
, &data
, OUT_ADDRESS
, size
,
1355 opx
->segment
, opx
->wrt
);
1360 if (opx
->segment
!= segment
) {
1362 out(offset
, segment
, &data
,
1363 OUT_REL1ADR
, insn_end
- offset
,
1364 opx
->segment
, opx
->wrt
);
1366 data
= opx
->offset
- insn_end
;
1367 if (data
> 127 || data
< -128)
1368 errfunc(ERR_NONFATAL
, "short jump is out of range");
1369 out(offset
, segment
, &data
,
1370 OUT_ADDRESS
, 1, NO_SEG
, NO_SEG
);
1376 data
= (int64_t)opx
->offset
;
1377 out(offset
, segment
, &data
, OUT_ADDRESS
, 8,
1378 opx
->segment
, opx
->wrt
);
1383 if (opx
->segment
!= segment
) {
1385 out(offset
, segment
, &data
,
1386 OUT_REL2ADR
, insn_end
- offset
,
1387 opx
->segment
, opx
->wrt
);
1389 data
= opx
->offset
- insn_end
;
1390 out(offset
, segment
, &data
,
1391 OUT_ADDRESS
, 2, NO_SEG
, NO_SEG
);
1397 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
1398 size
= (opx
->type
& BITS16
) ? 2 : 4;
1400 size
= (bits
== 16) ? 2 : 4;
1401 if (opx
->segment
!= segment
) {
1403 out(offset
, segment
, &data
,
1404 size
== 2 ? OUT_REL2ADR
: OUT_REL4ADR
,
1405 insn_end
- offset
, opx
->segment
, opx
->wrt
);
1407 data
= opx
->offset
- insn_end
;
1408 out(offset
, segment
, &data
,
1409 OUT_ADDRESS
, size
, NO_SEG
, NO_SEG
);
1415 if (opx
->segment
!= segment
) {
1417 out(offset
, segment
, &data
,
1418 OUT_REL4ADR
, insn_end
- offset
,
1419 opx
->segment
, opx
->wrt
);
1421 data
= opx
->offset
- insn_end
;
1422 out(offset
, segment
, &data
,
1423 OUT_ADDRESS
, 4, NO_SEG
, NO_SEG
);
1429 if (opx
->segment
== NO_SEG
)
1430 errfunc(ERR_NONFATAL
, "value referenced by FAR is not"
1433 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1434 outfmt
->segbase(1 + opx
->segment
),
1441 warn_overflow_opd(opx
, 2);
1442 if (is_sbyte16(opx
)) {
1444 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1448 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1449 opx
->segment
, opx
->wrt
);
1456 bytes
[0] = *codes
++;
1457 if (is_sbyte16(opx
))
1458 bytes
[0] |= 2; /* s-bit */
1459 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1465 warn_overflow_opd(opx
, 4);
1466 if (is_sbyte32(opx
)) {
1468 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1472 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1473 opx
->segment
, opx
->wrt
);
1480 bytes
[0] = *codes
++;
1481 if (is_sbyte32(opx
))
1482 bytes
[0] |= 2; /* s-bit */
1483 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1493 (ins
->drexdst
<< 4) |
1494 (ins
->rex
& REX_OC
? 0x08 : 0) |
1495 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1497 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1503 opx
= &ins
->oprs
[c
>> 3];
1504 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1505 opx
= &ins
->oprs
[c
& 7];
1506 if (opx
->segment
!= NO_SEG
|| opx
->wrt
!= NO_SEG
) {
1507 errfunc(ERR_NONFATAL
,
1508 "non-absolute expression not permitted as argument %d",
1511 if (opx
->offset
& ~15) {
1512 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1513 "four-bit argument exceeds bounds");
1515 bytes
[0] |= opx
->offset
& 15;
1517 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1523 opx
= &ins
->oprs
[c
>> 4];
1524 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1526 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1532 opx
= &ins
->oprs
[c
];
1533 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1534 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1540 if (opx
->wrt
== NO_SEG
&& opx
->segment
== NO_SEG
&&
1541 (int32_t)data
!= (int64_t)data
) {
1542 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1543 "signed dword immediate exceeds bounds");
1545 if (is_sbyte32(opx
)) {
1547 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1551 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1552 opx
->segment
, opx
->wrt
);
1559 if (opx
->wrt
== NO_SEG
&& opx
->segment
== NO_SEG
&&
1560 (int32_t)data
!= (int64_t)data
) {
1561 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1562 "signed dword immediate exceeds bounds");
1564 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1565 opx
->segment
, opx
->wrt
);
1572 if (ins
->vex_cm
!= 1 || (ins
->rex
& (REX_W
|REX_X
|REX_B
))) {
1573 bytes
[0] = (ins
->vex_cm
>> 6) ? 0x8f : 0xc4;
1574 bytes
[1] = (ins
->vex_cm
& 31) | ((~ins
->rex
& 7) << 5);
1575 bytes
[2] = ((ins
->rex
& REX_W
) << (7-3)) |
1576 ((~ins
->drexdst
& 15)<< 3) | (ins
->vex_wlp
& 07);
1577 out(offset
, segment
, &bytes
, OUT_RAWDATA
, 3, NO_SEG
, NO_SEG
);
1581 bytes
[1] = ((~ins
->rex
& REX_R
) << (7-2)) |
1582 ((~ins
->drexdst
& 15) << 3) | (ins
->vex_wlp
& 07);
1583 out(offset
, segment
, &bytes
, OUT_RAWDATA
, 2, NO_SEG
, NO_SEG
);
1593 if (ins
->rex
& REX_W
)
1595 else if (ins
->prefixes
[PPS_OSIZE
] == P_O16
)
1597 else if (ins
->prefixes
[PPS_OSIZE
] == P_O32
)
1602 um
= (uint64_t)2 << (s
-1);
1605 if (uv
> 127 && uv
< (uint64_t)-128 &&
1606 (uv
< um
-128 || uv
> um
-1)) {
1607 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1608 "signed byte value exceeds bounds");
1610 if (opx
->segment
!= NO_SEG
) {
1612 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1613 opx
->segment
, opx
->wrt
);
1616 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1627 if (bits
== 32 && !has_prefix(ins
, PPS_ASIZE
, P_A16
)) {
1629 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1636 if (bits
!= 32 && !has_prefix(ins
, PPS_ASIZE
, P_A32
)) {
1638 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1670 *bytes
= *codes
++ ^ condval
[ins
->condition
];
1671 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1680 *bytes
= c
- 0332 + 0xF2;
1681 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1686 if (ins
->rex
& REX_R
) {
1688 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1691 ins
->rex
&= ~(REX_L
|REX_R
);
1702 if (ins
->oprs
[0].segment
!= NO_SEG
)
1703 errfunc(ERR_PANIC
, "non-constant BSS size in pass two");
1705 int64_t size
= ins
->oprs
[0].offset
;
1707 out(offset
, segment
, NULL
,
1708 OUT_RESERVE
, size
, NO_SEG
, NO_SEG
);
1719 switch (ins
->oprs
[0].basereg
) {
1734 "bizarre 8086 segment register received");
1736 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1743 switch (ins
->oprs
[0].basereg
) {
1752 "bizarre 386 segment register received");
1754 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1763 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1769 bytes
[0] = c
- 0362 + 0xf2;
1770 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1780 *bytes
= c
- 0366 + 0x66;
1781 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1791 *bytes
= bits
== 16 ? 3 : 5;
1792 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1815 struct operand
*opy
= &ins
->oprs
[op2
];
1818 /* pick rfield from operand b (opx) */
1819 rflags
= regflag(opx
);
1820 rfield
= nasm_regvals
[opx
->basereg
];
1822 /* rfield is constant */
1827 if (!process_ea(opy
, &ea_data
, bits
, ins
->addr_size
,
1829 errfunc(ERR_NONFATAL
, "invalid effective address");
1834 *p
++ = ea_data
.modrm
;
1835 if (ea_data
.sib_present
)
1838 /* DREX suffixes come between the SIB and the displacement */
1839 if (ins
->rex
& REX_D
) {
1840 *p
++ = (ins
->drexdst
<< 4) |
1841 (ins
->rex
& REX_OC
? 0x08 : 0) |
1842 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1847 out(offset
, segment
, bytes
, OUT_RAWDATA
, s
, NO_SEG
, NO_SEG
);
1850 * Make sure the address gets the right offset in case
1851 * the line breaks in the .lst file (BR 1197827)
1856 switch (ea_data
.bytes
) {
1866 if (opy
->segment
== segment
) {
1868 if (overflow_signed(data
, ea_data
.bytes
))
1869 warn_overflow(ERR_PASS2
, ea_data
.bytes
);
1870 out(offset
, segment
, &data
, OUT_ADDRESS
,
1871 ea_data
.bytes
, NO_SEG
, NO_SEG
);
1873 /* overflow check in output/linker? */
1874 out(offset
, segment
, &data
, OUT_REL4ADR
,
1875 insn_end
- offset
, opy
->segment
, opy
->wrt
);
1878 if (overflow_general(opy
->offset
, ins
->addr_size
>> 3) ||
1879 signed_bits(opy
->offset
, ins
->addr_size
) !=
1880 signed_bits(opy
->offset
, ea_data
.bytes
* 8))
1881 warn_overflow(ERR_PASS2
, ea_data
.bytes
);
1884 out(offset
, segment
, &data
, OUT_ADDRESS
,
1885 ea_data
.bytes
, opy
->segment
, opy
->wrt
);
1891 "Invalid amount of bytes (%d) for offset?!",
1900 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1901 ": instruction code \\%o (0x%02X) given", c
, c
);
1907 static opflags_t
regflag(const operand
* o
)
1909 if (!is_register(o
->basereg
))
1910 errfunc(ERR_PANIC
, "invalid operand passed to regflag()");
1911 return nasm_reg_flags
[o
->basereg
];
1914 static int32_t regval(const operand
* o
)
1916 if (!is_register(o
->basereg
))
1917 errfunc(ERR_PANIC
, "invalid operand passed to regval()");
1918 return nasm_regvals
[o
->basereg
];
1921 static int op_rexflags(const operand
* o
, int mask
)
1926 if (!is_register(o
->basereg
))
1927 errfunc(ERR_PANIC
, "invalid operand passed to op_rexflags()");
1929 flags
= nasm_reg_flags
[o
->basereg
];
1930 val
= nasm_regvals
[o
->basereg
];
1932 return rexflags(val
, flags
, mask
);
1935 static int rexflags(int val
, opflags_t flags
, int mask
)
1940 rex
|= REX_B
|REX_X
|REX_R
;
1943 if (!(REG_HIGH
& ~flags
)) /* AH, CH, DH, BH */
1945 else if (!(REG8
& ~flags
) && val
>= 4) /* SPL, BPL, SIL, DIL */
1951 static enum match_result
find_match(const struct itemplate
**tempp
,
1953 int32_t segment
, int64_t offset
, int bits
)
1955 const struct itemplate
*temp
;
1956 enum match_result m
, merr
;
1957 opflags_t xsizeflags
[MAX_OPERANDS
];
1958 bool opsizemissing
= false;
1961 for (i
= 0; i
< instruction
->operands
; i
++)
1962 xsizeflags
[i
] = instruction
->oprs
[i
].type
& SIZE_MASK
;
1964 merr
= MERR_INVALOP
;
1966 for (temp
= nasm_instructions
[instruction
->opcode
];
1967 temp
->opcode
!= I_none
; temp
++) {
1968 m
= matches(temp
, instruction
, bits
);
1969 if (m
== MOK_JUMP
) {
1970 if (jmp_match(segment
, offset
, bits
, instruction
, temp
->code
))
1974 } else if (m
== MERR_OPSIZEMISSING
&&
1975 (temp
->flags
& IF_SMASK
) != IF_SX
) {
1977 * Missing operand size and a candidate for fuzzy matching...
1979 for (i
= 0; i
< temp
->operands
; i
++) {
1980 if ((temp
->opd
[i
] & SAME_AS
) == 0)
1981 xsizeflags
[i
] |= temp
->opd
[i
] & SIZE_MASK
;
1983 opsizemissing
= true;
1987 if (merr
== MOK_GOOD
)
1991 /* No match, but see if we can get a fuzzy operand size match... */
1995 for (i
= 0; i
< instruction
->operands
; i
++) {
1997 * We ignore extrinsic operand sizes on registers, so we should
1998 * never try to fuzzy-match on them. This also resolves the case
1999 * when we have e.g. "xmmrm128" in two different positions.
2001 if (is_class(REGISTER
, instruction
->oprs
[i
].type
))
2004 /* This tests if xsizeflags[i] has more than one bit set */
2005 if ((xsizeflags
[i
] & (xsizeflags
[i
]-1)))
2006 goto done
; /* No luck */
2008 instruction
->oprs
[i
].type
|= xsizeflags
[i
]; /* Set the size */
2011 /* Try matching again... */
2012 for (temp
= nasm_instructions
[instruction
->opcode
];
2013 temp
->opcode
!= I_none
; temp
++) {
2014 m
= matches(temp
, instruction
, bits
);
2015 if (m
== MOK_JUMP
) {
2016 if (jmp_match(segment
, offset
, bits
, instruction
, temp
->code
))
2023 if (merr
== MOK_GOOD
)
2032 static enum match_result
matches(const struct itemplate
*itemp
,
2033 insn
*instruction
, int bits
)
2035 int i
, size
[MAX_OPERANDS
], asize
, oprs
;
2036 bool opsizemissing
= false;
2041 if (itemp
->opcode
!= instruction
->opcode
)
2042 return MERR_INVALOP
;
2045 * Count the operands
2047 if (itemp
->operands
!= instruction
->operands
)
2048 return MERR_INVALOP
;
2053 if (!(optimizing
> 0) && (itemp
->flags
& IF_OPT
))
2054 return MERR_INVALOP
;
2057 * Check that no spurious colons or TOs are present
2059 for (i
= 0; i
< itemp
->operands
; i
++)
2060 if (instruction
->oprs
[i
].type
& ~itemp
->opd
[i
] & (COLON
| TO
))
2061 return MERR_INVALOP
;
2064 * Process size flags
2066 switch (itemp
->flags
& IF_SMASK
) {
2106 if (itemp
->flags
& IF_ARMASK
) {
2107 /* S- flags only apply to a specific operand */
2108 i
= ((itemp
->flags
& IF_ARMASK
) >> IF_ARSHFT
) - 1;
2109 memset(size
, 0, sizeof size
);
2112 /* S- flags apply to all operands */
2113 for (i
= 0; i
< MAX_OPERANDS
; i
++)
2118 * Check that the operand flags all match up,
2119 * it's a bit tricky so lets be verbose:
2121 * 1) Find out the size of operand. If instruction
2122 * doesn't have one specified -- we're trying to
2123 * guess it either from template (IF_S* flag) or
2126 * 2) If template operand (i) has SAME_AS flag [used for registers only]
2127 * (ie the same operand as was specified somewhere in template, and
2128 * this referred operand index is being achieved via ~SAME_AS)
2129 * we are to be sure that both registers (in template and instruction)
2132 * 3) If template operand do not match the instruction OR
2133 * template has an operand size specified AND this size differ
2134 * from which instruction has (perhaps we got it from code bits)
2136 * a) Check that only size of instruction and operand is differ
2137 * other characteristics do match
2138 * b) Perhaps it's a register specified in instruction so
2139 * for such a case we just mark that operand as "size
2140 * missing" and this will turn on fuzzy operand size
2141 * logic facility (handled by a caller)
2143 for (i
= 0; i
< itemp
->operands
; i
++) {
2144 opflags_t type
= instruction
->oprs
[i
].type
;
2145 if (!(type
& SIZE_MASK
))
2148 if (itemp
->opd
[i
] & SAME_AS
) {
2149 int j
= itemp
->opd
[i
] & ~SAME_AS
;
2150 if (type
!= instruction
->oprs
[j
].type
||
2151 instruction
->oprs
[i
].basereg
!= instruction
->oprs
[j
].basereg
)
2152 return MERR_INVALOP
;
2153 } else if (itemp
->opd
[i
] & ~type
||
2154 ((itemp
->opd
[i
] & SIZE_MASK
) &&
2155 ((itemp
->opd
[i
] ^ type
) & SIZE_MASK
))) {
2156 if ((itemp
->opd
[i
] & ~type
& ~SIZE_MASK
) || (type
& SIZE_MASK
)) {
2157 return MERR_INVALOP
;
2158 } else if (!is_class(REGISTER
, type
)) {
2160 * Note: we don't honor extrinsic operand sizes for registers,
2161 * so "missing operand size" for a register should be
2162 * considered a wildcard match rather than an error.
2164 opsizemissing
= true;
2170 return MERR_OPSIZEMISSING
;
2173 * Check operand sizes
2175 if (itemp
->flags
& (IF_SM
| IF_SM2
)) {
2176 oprs
= (itemp
->flags
& IF_SM2
? 2 : itemp
->operands
);
2177 for (i
= 0; i
< oprs
; i
++) {
2178 asize
= itemp
->opd
[i
] & SIZE_MASK
;
2180 for (i
= 0; i
< oprs
; i
++)
2186 oprs
= itemp
->operands
;
2189 for (i
= 0; i
< itemp
->operands
; i
++) {
2190 if (!(itemp
->opd
[i
] & SIZE_MASK
) &&
2191 (instruction
->oprs
[i
].type
& SIZE_MASK
& ~size
[i
]))
2192 return MERR_OPSIZEMISMATCH
;
2196 * Check template is okay at the set cpu level
2198 if (((itemp
->flags
& IF_PLEVEL
) > cpu
))
2202 * Verify the appropriate long mode flag.
2204 if ((itemp
->flags
& (bits
== 64 ? IF_NOLONG
: IF_LONG
)))
2205 return MERR_BADMODE
;
2208 * Check if special handling needed for Jumps
2210 if ((itemp
->code
[0] & 0374) == 0370)
2216 static ea
*process_ea(operand
* input
, ea
* output
, int bits
,
2217 int addrbits
, int rfield
, opflags_t rflags
)
2219 bool forw_ref
= !!(input
->opflags
& OPFLAG_UNKNOWN
);
2221 output
->rip
= false;
2223 /* REX flags for the rfield operand */
2224 output
->rex
|= rexflags(rfield
, rflags
, REX_R
| REX_P
| REX_W
| REX_H
);
2226 if (is_class(REGISTER
, input
->type
)) { /* register direct */
2230 if (!is_register(input
->basereg
))
2233 i
= nasm_regvals
[input
->basereg
];
2236 return NULL
; /* Invalid EA register */
2238 output
->rex
|= op_rexflags(input
, REX_B
| REX_P
| REX_W
| REX_H
);
2240 output
->sib_present
= false; /* no SIB necessary */
2241 output
->bytes
= 0; /* no offset necessary either */
2242 output
->modrm
= 0xC0 | ((rfield
& 7) << 3) | (i
& 7);
2243 } else { /* it's a memory reference */
2244 if (input
->basereg
== -1 &&
2245 (input
->indexreg
== -1 || input
->scale
== 0)) {
2246 /* it's a pure offset */
2248 if (bits
== 64 && ((input
->type
& IP_REL
) == IP_REL
) &&
2249 input
->segment
== NO_SEG
) {
2250 nasm_error(ERR_WARNING
| ERR_PASS1
, "absolute address can not be RIP-relative");
2251 input
->type
&= ~IP_REL
;
2252 input
->type
|= MEMORY
;
2255 if (input
->eaflags
& EAF_BYTEOFFS
||
2256 (input
->eaflags
& EAF_WORDOFFS
&&
2257 input
->disp_size
!= (addrbits
!= 16 ? 32 : 16))) {
2258 nasm_error(ERR_WARNING
| ERR_PASS1
, "displacement size ignored on absolute address");
2261 if (bits
== 64 && (~input
->type
& IP_REL
)) {
2262 int scale
, index
, base
;
2263 output
->sib_present
= true;
2267 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
2269 output
->modrm
= 4 | ((rfield
& 7) << 3);
2270 output
->rip
= false;
2272 output
->sib_present
= false;
2273 output
->bytes
= (addrbits
!= 16 ? 4 : 2);
2274 output
->modrm
= (addrbits
!= 16 ? 5 : 6) | ((rfield
& 7) << 3);
2275 output
->rip
= bits
== 64;
2277 } else { /* it's an indirection */
2278 int i
= input
->indexreg
, b
= input
->basereg
, s
= input
->scale
;
2279 int32_t seg
= input
->segment
;
2280 int hb
= input
->hintbase
, ht
= input
->hinttype
;
2281 int t
, it
, bt
; /* register numbers */
2282 opflags_t x
, ix
, bx
; /* register flags */
2285 i
= -1; /* make this easy, at least */
2287 if (is_register(i
)) {
2288 it
= nasm_regvals
[i
];
2289 ix
= nasm_reg_flags
[i
];
2295 if (is_register(b
)) {
2296 bt
= nasm_regvals
[b
];
2297 bx
= nasm_reg_flags
[b
];
2303 /* check for a 32/64-bit memory reference... */
2304 if ((ix
|bx
) & (BITS32
|BITS64
)) {
2306 * it must be a 32/64-bit memory reference. Firstly we have
2307 * to check that all registers involved are type E/Rxx.
2309 int32_t sok
= BITS32
| BITS64
, o
= input
->offset
;
2312 if (!(REG64
& ~ix
) || !(REG32
& ~ix
))
2320 return NULL
; /* Invalid register */
2321 if (~sok
& bx
& SIZE_MASK
)
2322 return NULL
; /* Invalid size */
2327 * While we're here, ensure the user didn't specify
2330 if (input
->disp_size
== 16 || input
->disp_size
== 64)
2333 if (addrbits
== 16 ||
2334 (addrbits
== 32 && !(sok
& BITS32
)) ||
2335 (addrbits
== 64 && !(sok
& BITS64
)))
2338 /* now reorganize base/index */
2339 if (s
== 1 && bt
!= it
&& bt
!= -1 && it
!= -1 &&
2340 ((hb
== b
&& ht
== EAH_NOTBASE
) ||
2341 (hb
== i
&& ht
== EAH_MAKEBASE
))) {
2342 /* swap if hints say so */
2343 t
= bt
, bt
= it
, it
= t
;
2344 x
= bx
, bx
= ix
, ix
= x
;
2346 if (bt
== it
) /* convert EAX+2*EAX to 3*EAX */
2347 bt
= -1, bx
= 0, s
++;
2348 if (bt
== -1 && s
== 1 && !(hb
== it
&& ht
== EAH_NOTBASE
)) {
2349 /* make single reg base, unless hint */
2350 bt
= it
, bx
= ix
, it
= -1, ix
= 0;
2352 if (((s
== 2 && it
!= REG_NUM_ESP
&& !(input
->eaflags
& EAF_TIMESTWO
)) ||
2353 s
== 3 || s
== 5 || s
== 9) && bt
== -1)
2354 bt
= it
, bx
= ix
, s
--; /* convert 3*EAX to EAX+2*EAX */
2355 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
&&
2356 (input
->eaflags
& EAF_TIMESTWO
))
2357 it
= bt
, ix
= bx
, bt
= -1, bx
= 0, s
= 1;
2358 /* convert [NOSPLIT EAX] to sib format with 0x0 displacement */
2359 if (s
== 1 && it
== REG_NUM_ESP
) {
2360 /* swap ESP into base if scale is 1 */
2361 t
= it
, it
= bt
, bt
= t
;
2362 x
= ix
, ix
= bx
, bx
= x
;
2364 if (it
== REG_NUM_ESP
||
2365 (s
!= 1 && s
!= 2 && s
!= 4 && s
!= 8 && it
!= -1))
2366 return NULL
; /* wrong, for various reasons */
2368 output
->rex
|= rexflags(it
, ix
, REX_X
);
2369 output
->rex
|= rexflags(bt
, bx
, REX_B
);
2371 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
) {
2380 if (rm
!= REG_NUM_EBP
&& o
== 0 &&
2381 seg
== NO_SEG
&& !forw_ref
&&
2382 !(input
->eaflags
& (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2384 else if (input
->eaflags
& EAF_BYTEOFFS
||
2385 (o
>= -128 && o
<= 127 &&
2386 seg
== NO_SEG
&& !forw_ref
&&
2387 !(input
->eaflags
& EAF_WORDOFFS
)))
2393 output
->sib_present
= false;
2394 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2395 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2398 int mod
, scale
, index
, base
;
2418 default: /* then what the smeg is it? */
2419 return NULL
; /* panic */
2427 if (base
!= REG_NUM_EBP
&& o
== 0 &&
2428 seg
== NO_SEG
&& !forw_ref
&&
2429 !(input
->eaflags
& (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2431 else if (input
->eaflags
& EAF_BYTEOFFS
||
2432 (o
>= -128 && o
<= 127 &&
2433 seg
== NO_SEG
&& !forw_ref
&&
2434 !(input
->eaflags
& EAF_WORDOFFS
)))
2440 output
->sib_present
= true;
2441 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2442 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | 4;
2443 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
2445 } else { /* it's 16-bit */
2447 int16_t o
= input
->offset
;
2449 /* check for 64-bit long mode */
2453 /* check all registers are BX, BP, SI or DI */
2454 if ((b
!= -1 && b
!= R_BP
&& b
!= R_BX
&& b
!= R_SI
&& b
!= R_DI
) ||
2455 (i
!= -1 && i
!= R_BP
&& i
!= R_BX
&& i
!= R_SI
&& i
!= R_DI
))
2458 /* ensure the user didn't specify DWORD/QWORD */
2459 if (input
->disp_size
== 32 || input
->disp_size
== 64)
2462 if (s
!= 1 && i
!= -1)
2463 return NULL
; /* no can do, in 16-bit EA */
2464 if (b
== -1 && i
!= -1) {
2469 if ((b
== R_SI
|| b
== R_DI
) && i
!= -1) {
2474 /* have BX/BP as base, SI/DI index */
2476 return NULL
; /* shouldn't ever happen, in theory */
2477 if (i
!= -1 && b
!= -1 &&
2478 (i
== R_BP
|| i
== R_BX
|| b
== R_SI
|| b
== R_DI
))
2479 return NULL
; /* invalid combinations */
2480 if (b
== -1) /* pure offset: handled above */
2481 return NULL
; /* so if it gets to here, panic! */
2485 switch (i
* 256 + b
) {
2486 case R_SI
* 256 + R_BX
:
2489 case R_DI
* 256 + R_BX
:
2492 case R_SI
* 256 + R_BP
:
2495 case R_DI
* 256 + R_BP
:
2513 if (rm
== -1) /* can't happen, in theory */
2514 return NULL
; /* so panic if it does */
2516 if (o
== 0 && seg
== NO_SEG
&& !forw_ref
&& rm
!= 6 &&
2517 !(input
->eaflags
& (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2519 else if (input
->eaflags
& EAF_BYTEOFFS
||
2520 (o
>= -128 && o
<= 127 && seg
== NO_SEG
&&
2521 !forw_ref
&& !(input
->eaflags
& EAF_WORDOFFS
)))
2526 output
->sib_present
= false; /* no SIB - it's 16-bit */
2527 output
->bytes
= mod
; /* bytes of offset needed */
2528 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2533 output
->size
= 1 + output
->sib_present
+ output
->bytes
;
2537 static void add_asp(insn
*ins
, int addrbits
)
2542 valid
= (addrbits
== 64) ? 64|32 : 32|16;
2544 switch (ins
->prefixes
[PPS_ASIZE
]) {
2555 valid
&= (addrbits
== 32) ? 16 : 32;
2561 for (j
= 0; j
< ins
->operands
; j
++) {
2562 if (is_class(MEMORY
, ins
->oprs
[j
].type
)) {
2565 /* Verify as Register */
2566 if (!is_register(ins
->oprs
[j
].indexreg
))
2569 i
= nasm_reg_flags
[ins
->oprs
[j
].indexreg
];
2571 /* Verify as Register */
2572 if (!is_register(ins
->oprs
[j
].basereg
))
2575 b
= nasm_reg_flags
[ins
->oprs
[j
].basereg
];
2577 if (ins
->oprs
[j
].scale
== 0)
2581 int ds
= ins
->oprs
[j
].disp_size
;
2582 if ((addrbits
!= 64 && ds
> 8) ||
2583 (addrbits
== 64 && ds
== 16))
2603 if (valid
& addrbits
) {
2604 ins
->addr_size
= addrbits
;
2605 } else if (valid
& ((addrbits
== 32) ? 16 : 32)) {
2606 /* Add an address size prefix */
2607 enum prefixes pref
= (addrbits
== 32) ? P_A16
: P_A32
;
2608 ins
->prefixes
[PPS_ASIZE
] = pref
;
2609 ins
->addr_size
= (addrbits
== 32) ? 16 : 32;
2612 errfunc(ERR_NONFATAL
, "impossible combination of address sizes");
2613 ins
->addr_size
= addrbits
; /* Error recovery */
2616 defdisp
= ins
->addr_size
== 16 ? 16 : 32;
2618 for (j
= 0; j
< ins
->operands
; j
++) {
2619 if (!(MEM_OFFS
& ~ins
->oprs
[j
].type
) &&
2620 (ins
->oprs
[j
].disp_size
? ins
->oprs
[j
].disp_size
: defdisp
) != ins
->addr_size
) {
2622 * mem_offs sizes must match the address size; if not,
2623 * strip the MEM_OFFS bit and match only EA instructions
2625 ins
->oprs
[j
].type
&= ~(MEM_OFFS
& ~MEMORY
);