1 /* assemble.c code generation for the Netwide Assembler
3 * The Netwide Assembler is copyright (C) 1996 Simon Tatham and
4 * Julian Hall. All rights reserved. The software is
5 * redistributable under the license given in the file "LICENSE"
6 * distributed in the NASM archive.
8 * the actual codes (C syntax, i.e. octal):
9 * \0 - terminates the code. (Unless it's a literal of course.)
10 * \1..\4 - that many literal bytes follow in the code stream
11 * \5 - add 4 to the primary operand number (b, low octdigit)
12 * \6 - add 4 to the secondary operand number (a, middle octdigit)
13 * \7 - add 4 to both the primary and the secondary operand number
14 * \10..\13 - a literal byte follows in the code stream, to be added
15 * to the register value of operand 0..3
16 * \14..\17 - a signed byte immediate operand, from operand 0..3
17 * \20..\23 - a byte immediate operand, from operand 0..3
18 * \24..\27 - an unsigned byte immediate operand, from operand 0..3
19 * \30..\33 - a word immediate operand, from operand 0..3
20 * \34..\37 - select between \3[0-3] and \4[0-3] depending on 16/32 bit
21 * assembly mode or the operand-size override on the operand
22 * \40..\43 - a long immediate operand, from operand 0..3
23 * \44..\47 - select between \3[0-3], \4[0-3] and \5[4-7]
24 * depending on the address size of the instruction.
25 * \50..\53 - a byte relative operand, from operand 0..3
26 * \54..\57 - a qword immediate operand, from operand 0..3
27 * \60..\63 - a word relative operand, from operand 0..3
28 * \64..\67 - select between \6[0-3] and \7[0-3] depending on 16/32 bit
29 * assembly mode or the operand-size override on the operand
30 * \70..\73 - a long relative operand, from operand 0..3
31 * \74..\77 - a word constant, from the _segment_ part of operand 0..3
32 * \1ab - a ModRM, calculated on EA in operand a, with the spare
33 * field the register value of operand b.
34 * \140..\143 - an immediate word or signed byte for operand 0..3
35 * \144..\147 - or 2 (s-field) into opcode byte if operand 0..3
36 * is a signed byte rather than a word. Opcode byte follows.
37 * \150..\153 - an immediate dword or signed byte for operand 0..3
38 * \154..\157 - or 2 (s-field) into opcode byte if operand 0..3
39 * is a signed byte rather than a dword. Opcode byte follows.
40 * \160..\163 - this instruction uses DREX rather than REX, with the
41 * OC0 field set to 0, and the dest field taken from
43 * \164..\167 - this instruction uses DREX rather than REX, with the
44 * OC0 field set to 1, and the dest field taken from
46 * \171 - placement of DREX suffix in the absence of an EA
47 * \172\ab - the register number from operand a in bits 7..4, with
48 * the 4-bit immediate from operand b in bits 3..0.
49 * \173\xab - the register number from operand a in bits 7..4, with
50 * the value b in bits 3..0.
51 * \174\a - the register number from operand a in bits 7..4, and
52 * an arbitrary value in bits 3..0 (assembled as zero.)
53 * \2ab - a ModRM, calculated on EA in operand a, with the spare
54 * field equal to digit b.
55 * \250..\253 - same as \150..\153, except warn if the 64-bit operand
56 * is not equal to the truncated and sign-extended 32-bit
57 * operand; used for 32-bit immediates in 64-bit mode.
58 * \254..\257 - a signed 32-bit operand to be extended to 64 bits.
59 * \260..\263 - this instruction uses VEX rather than REX, with the
60 * V field taken from operand 0..3.
61 * \270 - this instruction uses VEX rather than REX, with the
62 * V field set to 1111b.
64 * VEX prefixes are followed by the sequence:
65 * \mm\wlp where mm is the M field; and wlp is:
67 * [w0] ww = 0 for W = 0
68 * [w1] ww = 1 for W = 1
69 * [wx] ww = 2 for W don't care (always assembled as 0)
70 * [ww] ww = 3 for W used as REX.W
73 * \274..\277 - a signed byte immediate operand, from operand 0..3,
74 * which is to be extended to the operand size.
75 * \310 - indicates fixed 16-bit address size, i.e. optional 0x67.
76 * \311 - indicates fixed 32-bit address size, i.e. optional 0x67.
77 * \312 - (disassembler only) marker on LOOP, LOOPxx instructions.
78 * \313 - indicates fixed 64-bit address size, 0x67 invalid.
79 * \314 - (disassembler only) invalid with REX.B
80 * \315 - (disassembler only) invalid with REX.X
81 * \316 - (disassembler only) invalid with REX.R
82 * \317 - (disassembler only) invalid with REX.W
83 * \320 - indicates fixed 16-bit operand size, i.e. optional 0x66.
84 * \321 - indicates fixed 32-bit operand size, i.e. optional 0x66.
85 * \322 - indicates that this instruction is only valid when the
86 * operand size is the default (instruction to disassembler,
87 * generates no code in the assembler)
88 * \323 - indicates fixed 64-bit operand size, REX on extensions only.
89 * \324 - indicates 64-bit operand size requiring REX prefix.
90 * \330 - a literal byte follows in the code stream, to be added
91 * to the condition code value of the instruction.
92 * \331 - instruction not valid with REP prefix. Hint for
93 * disassembler only; for SSE instructions.
94 * \332 - REP prefix (0xF2 byte) used as opcode extension.
95 * \333 - REP prefix (0xF3 byte) used as opcode extension.
96 * \334 - LOCK prefix used instead of REX.R
97 * \335 - disassemble a rep (0xF3 byte) prefix as repe not rep.
98 * \336 - force a REP(E) prefix (0xF2) even if not specified.
99 * \337 - force a REPNE prefix (0xF3) even if not specified.
100 * \336-\337 are still listed as prefixes in the disassembler.
101 * \340 - reserve <operand 0> bytes of uninitialized storage.
102 * Operand 0 had better be a segmentless constant.
103 * \344,\345 - the PUSH/POP (respectively) codes for CS, DS, ES, SS
104 * (POP is never used for CS) depending on operand 0
105 * \346,\347 - the second byte of PUSH/POP codes for FS, GS, depending
107 * \360 - no SSE prefix (== \364\331)
108 * \361 - 66 SSE prefix (== \366\331)
109 * \362 - F2 SSE prefix (== \364\332)
110 * \363 - F3 SSE prefix (== \364\333)
111 * \364 - operand-size prefix (0x66) not permitted
112 * \365 - address-size prefix (0x67) not permitted
113 * \366 - operand-size prefix (0x66) used as opcode extension
114 * \367 - address-size prefix (0x67) used as opcode extension
115 * \370,\371,\372 - match only if operand 0 meets byte jump criteria.
116 * 370 is used for Jcc, 371 is used for JMP.
117 * \373 - assemble 0x03 if bits==16, 0x05 if bits==32;
118 * used for conditional jump over longer jump
121 #include "compiler.h"
125 #include <inttypes.h>
129 #include "assemble.h"
134 int sib_present
; /* is a SIB byte necessary? */
135 int bytes
; /* # of bytes of offset needed */
136 int size
; /* lazy - this is sib+bytes+1 */
137 uint8_t modrm
, sib
, rex
, rip
; /* the bytes themselves */
140 static uint32_t cpu
; /* cpu level received from nasm.c */
141 static efunc errfunc
;
142 static struct ofmt
*outfmt
;
143 static ListGen
*list
;
145 static int64_t calcsize(int32_t, int64_t, int, insn
*, const uint8_t *);
146 static void gencode(int32_t segment
, int64_t offset
, int bits
,
147 insn
* ins
, const struct itemplate
*temp
,
149 static int matches(const struct itemplate
*, insn
*, int bits
);
150 static int32_t regflag(const operand
*);
151 static int32_t regval(const operand
*);
152 static int rexflags(int, int32_t, int);
153 static int op_rexflags(const operand
*, int);
154 static ea
*process_ea(operand
*, ea
*, int, int, int, int32_t);
155 static void add_asp(insn
*, int);
157 static int has_prefix(insn
* ins
, enum prefix_pos pos
, enum prefixes prefix
)
159 return ins
->prefixes
[pos
] == prefix
;
162 static void assert_no_prefix(insn
* ins
, enum prefix_pos pos
)
164 if (ins
->prefixes
[pos
])
165 errfunc(ERR_NONFATAL
, "invalid %s prefix",
166 prefix_name(ins
->prefixes
[pos
]));
169 static const char *size_name(int size
)
191 static void warn_overflow(int size
, const struct operand
*o
)
193 if (size
< 8 && o
->wrt
== NO_SEG
&& o
->segment
== NO_SEG
) {
194 int64_t lim
= ((int64_t)1 << (size
*8))-1;
195 int64_t data
= o
->offset
;
197 if (data
< ~lim
|| data
> lim
)
198 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
199 "%s data exceeds bounds", size_name(size
));
203 * This routine wrappers the real output format's output routine,
204 * in order to pass a copy of the data off to the listing file
205 * generator at the same time.
207 static void out(int64_t offset
, int32_t segto
, const void *data
,
208 enum out_type type
, uint64_t size
,
209 int32_t segment
, int32_t wrt
)
211 static int32_t lineno
= 0; /* static!!! */
212 static char *lnfname
= NULL
;
215 if (type
== OUT_ADDRESS
&& segment
== NO_SEG
&& wrt
== NO_SEG
) {
217 * This is a non-relocated address, and we're going to
218 * convert it into RAWDATA format.
223 errfunc(ERR_PANIC
, "OUT_ADDRESS with size > 8");
227 WRITEADDR(q
, *(int64_t *)data
, size
);
232 list
->output(offset
, data
, type
, size
);
235 * this call to src_get determines when we call the
236 * debug-format-specific "linenum" function
237 * it updates lineno and lnfname to the current values
238 * returning 0 if "same as last time", -2 if lnfname
239 * changed, and the amount by which lineno changed,
240 * if it did. thus, these variables must be static
243 if (src_get(&lineno
, &lnfname
)) {
244 outfmt
->current_dfmt
->linenum(lnfname
, lineno
, segto
);
247 outfmt
->output(segto
, data
, type
, size
, segment
, wrt
);
250 static bool jmp_match(int32_t segment
, int64_t offset
, int bits
,
251 insn
* ins
, const uint8_t *code
)
256 if ((c
!= 0370 && c
!= 0371) || (ins
->oprs
[0].type
& STRICT
))
260 if (optimizing
< 0 && c
== 0371)
263 isize
= calcsize(segment
, offset
, bits
, ins
, code
);
264 if (ins
->oprs
[0].segment
!= segment
)
267 isize
= ins
->oprs
[0].offset
- offset
- isize
; /* isize is delta */
268 return (isize
>= -128 && isize
<= 127); /* is it byte size? */
271 int64_t assemble(int32_t segment
, int64_t offset
, int bits
, uint32_t cp
,
272 insn
* instruction
, struct ofmt
*output
, efunc error
,
275 const struct itemplate
*temp
;
280 int64_t start
= offset
;
281 int64_t wsize
= 0; /* size for DB etc. */
283 errfunc
= error
; /* to pass to other functions */
285 outfmt
= output
; /* likewise */
286 list
= listgen
; /* and again */
288 switch (instruction
->opcode
) {
318 int32_t t
= instruction
->times
;
321 "instruction->times < 0 (%ld) in assemble()", t
);
323 while (t
--) { /* repeat TIMES times */
324 for (e
= instruction
->eops
; e
; e
= e
->next
) {
325 if (e
->type
== EOT_DB_NUMBER
) {
327 if (e
->segment
!= NO_SEG
)
328 errfunc(ERR_NONFATAL
,
329 "one-byte relocation attempted");
331 uint8_t out_byte
= e
->offset
;
332 out(offset
, segment
, &out_byte
,
333 OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
335 } else if (wsize
> 8) {
336 errfunc(ERR_NONFATAL
,
337 "integer supplied to a DT, DO or DY"
340 out(offset
, segment
, &e
->offset
,
341 OUT_ADDRESS
, wsize
, e
->segment
, e
->wrt
);
343 } else if (e
->type
== EOT_DB_STRING
||
344 e
->type
== EOT_DB_STRING_FREE
) {
347 out(offset
, segment
, e
->stringval
,
348 OUT_RAWDATA
, e
->stringlen
, NO_SEG
, NO_SEG
);
349 align
= e
->stringlen
% wsize
;
352 align
= wsize
- align
;
353 out(offset
, segment
, zero_buffer
,
354 OUT_RAWDATA
, align
, NO_SEG
, NO_SEG
);
356 offset
+= e
->stringlen
+ align
;
359 if (t
> 0 && t
== instruction
->times
- 1) {
361 * Dummy call to list->output to give the offset to the
364 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
365 list
->uplevel(LIST_TIMES
);
368 if (instruction
->times
> 1)
369 list
->downlevel(LIST_TIMES
);
370 return offset
- start
;
373 if (instruction
->opcode
== I_INCBIN
) {
374 const char *fname
= instruction
->eops
->stringval
;
377 fp
= fopen(fname
, "rb");
379 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
381 } else if (fseek(fp
, 0L, SEEK_END
) < 0) {
382 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
385 static char buf
[4096];
386 size_t t
= instruction
->times
;
391 if (instruction
->eops
->next
) {
392 base
= instruction
->eops
->next
->offset
;
394 if (instruction
->eops
->next
->next
&&
395 len
> (size_t)instruction
->eops
->next
->next
->offset
)
396 len
= (size_t)instruction
->eops
->next
->next
->offset
;
399 * Dummy call to list->output to give the offset to the
402 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
403 list
->uplevel(LIST_INCBIN
);
407 fseek(fp
, base
, SEEK_SET
);
411 fread(buf
, 1, (l
> (int32_t) sizeof(buf
) ? (int32_t) sizeof(buf
) : l
),
415 * This shouldn't happen unless the file
416 * actually changes while we are reading
420 "`incbin': unexpected EOF while"
421 " reading file `%s'", fname
);
422 t
= 0; /* Try to exit cleanly */
425 out(offset
, segment
, buf
, OUT_RAWDATA
, m
,
430 list
->downlevel(LIST_INCBIN
);
431 if (instruction
->times
> 1) {
433 * Dummy call to list->output to give the offset to the
436 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
437 list
->uplevel(LIST_TIMES
);
438 list
->downlevel(LIST_TIMES
);
441 return instruction
->times
* len
;
443 return 0; /* if we're here, there's an error */
446 /* Check to see if we need an address-size prefix */
447 add_asp(instruction
, bits
);
451 for (temp
= nasm_instructions
[instruction
->opcode
]; temp
->opcode
!= -1; temp
++){
452 int m
= matches(temp
, instruction
, bits
);
454 (m
== 99 && jmp_match(segment
, offset
, bits
,
455 instruction
, temp
->code
))) {
457 int64_t insn_size
= calcsize(segment
, offset
, bits
,
458 instruction
, temp
->code
);
459 itimes
= instruction
->times
;
460 if (insn_size
< 0) /* shouldn't be, on pass two */
461 error(ERR_PANIC
, "errors made it through from pass one");
464 for (j
= 0; j
< MAXPREFIX
; j
++) {
466 switch (instruction
->prefixes
[j
]) {
481 error(ERR_WARNING
| ERR_PASS2
,
482 "cs segment base generated, but will be ignored in 64-bit mode");
488 error(ERR_WARNING
| ERR_PASS2
,
489 "ds segment base generated, but will be ignored in 64-bit mode");
495 error(ERR_WARNING
| ERR_PASS2
,
496 "es segment base generated, but will be ignored in 64-bit mode");
508 error(ERR_WARNING
| ERR_PASS2
,
509 "ss segment base generated, but will be ignored in 64-bit mode");
516 "segr6 and segr7 cannot be used as prefixes");
521 "16-bit addressing is not supported "
523 } else if (bits
!= 16)
533 "64-bit addressing is only supported "
557 error(ERR_PANIC
, "invalid instruction prefix");
560 out(offset
, segment
, &c
, OUT_RAWDATA
, 1,
565 insn_end
= offset
+ insn_size
;
566 gencode(segment
, offset
, bits
, instruction
,
569 if (itimes
> 0 && itimes
== instruction
->times
- 1) {
571 * Dummy call to list->output to give the offset to the
574 list
->output(offset
, NULL
, OUT_RAWDATA
, 0);
575 list
->uplevel(LIST_TIMES
);
578 if (instruction
->times
> 1)
579 list
->downlevel(LIST_TIMES
);
580 return offset
- start
;
581 } else if (m
> 0 && m
> size_prob
) {
586 if (temp
->opcode
== -1) { /* didn't match any instruction */
589 error(ERR_NONFATAL
, "operation size not specified");
592 error(ERR_NONFATAL
, "mismatch in operand sizes");
595 error(ERR_NONFATAL
, "no instruction for this cpu level");
598 error(ERR_NONFATAL
, "instruction not supported in %d-bit mode",
603 "invalid combination of opcode and operands");
610 int64_t insn_size(int32_t segment
, int64_t offset
, int bits
, uint32_t cp
,
611 insn
* instruction
, efunc error
)
613 const struct itemplate
*temp
;
615 errfunc
= error
; /* to pass to other functions */
618 if (instruction
->opcode
== -1)
621 if (instruction
->opcode
== I_DB
|| instruction
->opcode
== I_DW
||
622 instruction
->opcode
== I_DD
|| instruction
->opcode
== I_DQ
||
623 instruction
->opcode
== I_DT
|| instruction
->opcode
== I_DO
||
624 instruction
->opcode
== I_DY
) {
626 int32_t isize
, osize
, wsize
= 0; /* placate gcc */
629 switch (instruction
->opcode
) {
655 for (e
= instruction
->eops
; e
; e
= e
->next
) {
659 if (e
->type
== EOT_DB_NUMBER
)
661 else if (e
->type
== EOT_DB_STRING
||
662 e
->type
== EOT_DB_STRING_FREE
)
663 osize
= e
->stringlen
;
665 align
= (-osize
) % wsize
;
668 isize
+= osize
+ align
;
670 return isize
* instruction
->times
;
673 if (instruction
->opcode
== I_INCBIN
) {
674 const char *fname
= instruction
->eops
->stringval
;
678 fp
= fopen(fname
, "rb");
680 error(ERR_NONFATAL
, "`incbin': unable to open file `%s'",
682 else if (fseek(fp
, 0L, SEEK_END
) < 0)
683 error(ERR_NONFATAL
, "`incbin': unable to seek on file `%s'",
688 if (instruction
->eops
->next
) {
689 len
-= instruction
->eops
->next
->offset
;
690 if (instruction
->eops
->next
->next
&&
691 len
> (size_t)instruction
->eops
->next
->next
->offset
) {
692 len
= (size_t)instruction
->eops
->next
->next
->offset
;
695 return instruction
->times
* len
;
697 return 0; /* if we're here, there's an error */
700 /* Check to see if we need an address-size prefix */
701 add_asp(instruction
, bits
);
703 for (temp
= nasm_instructions
[instruction
->opcode
]; temp
->opcode
!= -1; temp
++) {
704 int m
= matches(temp
, instruction
, bits
);
706 (m
== 99 && jmp_match(segment
, offset
, bits
,
707 instruction
, temp
->code
))) {
708 /* we've matched an instruction. */
710 const uint8_t *codes
= temp
->code
;
713 isize
= calcsize(segment
, offset
, bits
, instruction
, codes
);
716 for (j
= 0; j
< MAXPREFIX
; j
++) {
717 switch (instruction
->prefixes
[j
]) {
743 return isize
* instruction
->times
;
746 return -1; /* didn't match any instruction */
749 static bool possible_sbyte(operand
*o
)
751 return o
->wrt
== NO_SEG
&& o
->segment
== NO_SEG
&&
752 !(o
->opflags
& OPFLAG_FORWARD
) &&
753 optimizing
>= 0 && !(o
->type
& STRICT
);
756 /* check that opn[op] is a signed byte of size 16 or 32 */
757 static bool is_sbyte16(operand
*o
)
761 if (!possible_sbyte(o
))
765 return v
>= -128 && v
<= 127;
768 static bool is_sbyte32(operand
*o
)
772 if (!possible_sbyte(o
))
776 return v
>= -128 && v
<= 127;
779 /* Common construct */
780 #define case4(x) case (x): case (x)+1: case (x)+2: case (x)+3
782 static int64_t calcsize(int32_t segment
, int64_t offset
, int bits
,
783 insn
* ins
, const uint8_t *codes
)
792 ins
->rex
= 0; /* Ensure REX is reset */
794 if (ins
->prefixes
[PPS_OSIZE
] == P_O64
)
797 (void)segment
; /* Don't warn that this parameter is unused */
798 (void)offset
; /* Don't warn that this parameter is unused */
802 op1
= (c
& 3) + ((opex
& 1) << 2);
803 op2
= ((c
>> 3) & 3) + ((opex
& 2) << 1);
804 opx
= &ins
->oprs
[op1
];
805 opex
= 0; /* For the next iteration */
812 codes
+= c
, length
+= c
;
823 op_rexflags(opx
, REX_B
|REX_H
|REX_P
|REX_W
);
838 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
839 length
+= (opx
->type
& BITS16
) ? 2 : 4;
841 length
+= (bits
== 16) ? 2 : 4;
849 length
+= ins
->addr_size
>> 3;
857 length
+= 8; /* MOV reg64/imm */
865 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
866 length
+= (opx
->type
& BITS16
) ? 2 : 4;
868 length
+= (bits
== 16) ? 2 : 4;
880 length
+= is_sbyte16(opx
) ? 1 : 2;
889 length
+= is_sbyte32(opx
) ? 1 : 4;
900 ins
->drexdst
= regval(opx
);
905 ins
->rex
|= REX_D
|REX_OC
;
906 ins
->drexdst
= regval(opx
);
920 length
+= is_sbyte32(opx
) ? 1 : 4;
929 ins
->drexdst
= regval(opx
);
930 ins
->vex_m
= *codes
++;
931 ins
->vex_wlp
= *codes
++;
937 ins
->vex_m
= *codes
++;
938 ins
->vex_wlp
= *codes
++;
951 length
+= (bits
!= 16) && !has_prefix(ins
, PPS_ASIZE
, P_A16
);
955 length
+= (bits
!= 32) && !has_prefix(ins
, PPS_ASIZE
, P_A32
);
962 if (bits
!= 64 || has_prefix(ins
, PPS_ASIZE
, P_A16
) ||
963 has_prefix(ins
, PPS_ASIZE
, P_A32
))
971 length
+= (bits
!= 16);
975 length
+= (bits
== 16);
1009 if (!ins
->prefixes
[PPS_LREP
])
1010 ins
->prefixes
[PPS_LREP
] = P_REP
;
1014 if (!ins
->prefixes
[PPS_LREP
])
1015 ins
->prefixes
[PPS_LREP
] = P_REPNE
;
1019 if (ins
->oprs
[0].segment
!= NO_SEG
)
1020 errfunc(ERR_NONFATAL
, "attempt to reserve non-constant"
1021 " quantity of BSS space");
1023 length
+= ins
->oprs
[0].offset
;
1073 struct operand
*opy
= &ins
->oprs
[op2
];
1075 ea_data
.rex
= 0; /* Ensure ea.REX is initially 0 */
1078 /* pick rfield from operand b (opx) */
1079 rflags
= regflag(opx
);
1080 rfield
= nasm_regvals
[opx
->basereg
];
1085 if (!process_ea(opy
, &ea_data
, bits
,
1086 ins
->addr_size
, rfield
, rflags
)) {
1087 errfunc(ERR_NONFATAL
, "invalid effective address");
1090 ins
->rex
|= ea_data
.rex
;
1091 length
+= ea_data
.size
;
1097 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1098 ": instruction code 0x%02X given", c
);
1103 ins
->rex
&= rex_mask
;
1105 if (ins
->rex
& REX_V
) {
1106 int bad32
= REX_R
|REX_W
|REX_X
|REX_B
;
1108 if (ins
->rex
& REX_H
) {
1109 errfunc(ERR_NONFATAL
, "cannot use high register in vex instruction");
1112 switch (ins
->vex_wlp
& 030) {
1126 if (bits
!= 64 && ((ins
->rex
& bad32
) || ins
->drexdst
> 7)) {
1127 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1130 if (ins
->vex_m
!= 1 || (ins
->rex
& (REX_W
|REX_R
|REX_B
)))
1134 } else if (ins
->rex
& REX_D
) {
1135 if (ins
->rex
& REX_H
) {
1136 errfunc(ERR_NONFATAL
, "cannot use high register in drex instruction");
1139 if (bits
!= 64 && ((ins
->rex
& (REX_R
|REX_W
|REX_X
|REX_B
)) ||
1140 ins
->drexdst
> 7)) {
1141 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1145 } else if (ins
->rex
& REX_REAL
) {
1146 if (ins
->rex
& REX_H
) {
1147 errfunc(ERR_NONFATAL
, "cannot use high register in rex instruction");
1149 } else if (bits
== 64) {
1151 } else if ((ins
->rex
& REX_L
) &&
1152 !(ins
->rex
& (REX_P
|REX_W
|REX_X
|REX_B
)) &&
1155 assert_no_prefix(ins
, PPS_LREP
);
1158 errfunc(ERR_NONFATAL
, "invalid operands in non-64-bit mode");
1166 #define EMIT_REX() \
1167 if (!(ins->rex & (REX_D|REX_V)) && (ins->rex & REX_REAL) && (bits == 64)) { \
1168 ins->rex = (ins->rex & REX_REAL)|REX_P; \
1169 out(offset, segment, &ins->rex, OUT_RAWDATA, 1, NO_SEG, NO_SEG); \
1174 static void gencode(int32_t segment
, int64_t offset
, int bits
,
1175 insn
* ins
, const struct itemplate
*temp
,
1178 static char condval
[] = { /* conditional opcodes */
1179 0x7, 0x3, 0x2, 0x6, 0x2, 0x4, 0xF, 0xD, 0xC, 0xE, 0x6, 0x2,
1180 0x3, 0x7, 0x3, 0x5, 0xE, 0xC, 0xD, 0xF, 0x1, 0xB, 0x9, 0x5,
1181 0x0, 0xA, 0xA, 0xB, 0x8, 0x4
1188 struct operand
*opx
;
1189 const uint8_t *codes
= temp
->code
;
1194 op1
= (c
& 3) + ((opex
& 1) << 2);
1195 op2
= ((c
>> 3) & 3) + ((opex
& 2) << 1);
1196 opx
= &ins
->oprs
[op1
];
1197 opex
= 0; /* For the next iteration */
1205 out(offset
, segment
, codes
, OUT_RAWDATA
, c
, NO_SEG
, NO_SEG
);
1218 bytes
[0] = *codes
++ + (regval(opx
) & 7);
1219 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1224 /* The test for BITS8 and SBYTE here is intended to avoid
1225 warning on optimizer actions due to SBYTE, while still
1226 warn on explicit BYTE directives. Also warn, obviously,
1227 if the optimizer isn't enabled. */
1228 if (((opx
->type
& BITS8
) ||
1229 !(opx
->type
& temp
->opd
[op1
] & BYTENESS
)) &&
1230 (opx
->offset
< -128 || opx
->offset
> 127)) {
1231 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1232 "signed byte value exceeds bounds");
1234 if (opx
->segment
!= NO_SEG
) {
1236 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1237 opx
->segment
, opx
->wrt
);
1239 bytes
[0] = opx
->offset
;
1240 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1247 if (opx
->offset
< -256 || opx
->offset
> 255) {
1248 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1249 "byte value exceeds bounds");
1251 if (opx
->segment
!= NO_SEG
) {
1253 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1254 opx
->segment
, opx
->wrt
);
1256 bytes
[0] = opx
->offset
;
1257 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1264 if (opx
->offset
< 0 || opx
->offset
> 255)
1265 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1266 "unsigned byte value exceeds bounds");
1267 if (opx
->segment
!= NO_SEG
) {
1269 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1270 opx
->segment
, opx
->wrt
);
1272 bytes
[0] = opx
->offset
;
1273 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1280 warn_overflow(2, opx
);
1282 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1283 opx
->segment
, opx
->wrt
);
1288 if (opx
->type
& (BITS16
| BITS32
))
1289 size
= (opx
->type
& BITS16
) ? 2 : 4;
1291 size
= (bits
== 16) ? 2 : 4;
1292 warn_overflow(size
, opx
);
1294 out(offset
, segment
, &data
, OUT_ADDRESS
, size
,
1295 opx
->segment
, opx
->wrt
);
1300 warn_overflow(4, opx
);
1302 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1303 opx
->segment
, opx
->wrt
);
1309 size
= ins
->addr_size
>> 3;
1310 warn_overflow(size
, opx
);
1311 out(offset
, segment
, &data
, OUT_ADDRESS
, size
,
1312 opx
->segment
, opx
->wrt
);
1317 if (opx
->segment
!= segment
)
1318 errfunc(ERR_NONFATAL
,
1319 "short relative jump outside segment");
1320 data
= opx
->offset
- insn_end
;
1321 if (data
> 127 || data
< -128)
1322 errfunc(ERR_NONFATAL
, "short jump is out of range");
1324 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1329 data
= (int64_t)opx
->offset
;
1330 out(offset
, segment
, &data
, OUT_ADDRESS
, 8,
1331 opx
->segment
, opx
->wrt
);
1336 if (opx
->segment
!= segment
) {
1338 out(offset
, segment
, &data
,
1339 OUT_REL2ADR
, insn_end
- offset
,
1340 opx
->segment
, opx
->wrt
);
1342 data
= opx
->offset
- insn_end
;
1343 out(offset
, segment
, &data
,
1344 OUT_ADDRESS
, 2, NO_SEG
, NO_SEG
);
1350 if (opx
->type
& (BITS16
| BITS32
| BITS64
))
1351 size
= (opx
->type
& BITS16
) ? 2 : 4;
1353 size
= (bits
== 16) ? 2 : 4;
1354 if (opx
->segment
!= segment
) {
1356 out(offset
, segment
, &data
,
1357 size
== 2 ? OUT_REL2ADR
: OUT_REL4ADR
,
1358 insn_end
- offset
, opx
->segment
, opx
->wrt
);
1360 data
= opx
->offset
- insn_end
;
1361 out(offset
, segment
, &data
,
1362 OUT_ADDRESS
, size
, NO_SEG
, NO_SEG
);
1368 if (opx
->segment
!= segment
) {
1370 out(offset
, segment
, &data
,
1371 OUT_REL4ADR
, insn_end
- offset
,
1372 opx
->segment
, opx
->wrt
);
1374 data
= opx
->offset
- insn_end
;
1375 out(offset
, segment
, &data
,
1376 OUT_ADDRESS
, 4, NO_SEG
, NO_SEG
);
1382 if (opx
->segment
== NO_SEG
)
1383 errfunc(ERR_NONFATAL
, "value referenced by FAR is not"
1386 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1387 outfmt
->segbase(1 + opx
->segment
),
1394 warn_overflow(2, opx
);
1395 if (is_sbyte16(opx
)) {
1397 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1401 out(offset
, segment
, &data
, OUT_ADDRESS
, 2,
1402 opx
->segment
, opx
->wrt
);
1409 bytes
[0] = *codes
++;
1410 if (is_sbyte16(opx
))
1411 bytes
[0] |= 2; /* s-bit */
1412 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1418 warn_overflow(4, opx
);
1419 if (is_sbyte32(opx
)) {
1421 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1425 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1426 opx
->segment
, opx
->wrt
);
1433 bytes
[0] = *codes
++;
1434 if (is_sbyte32(opx
))
1435 bytes
[0] |= 2; /* s-bit */
1436 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1446 (ins
->drexdst
<< 4) |
1447 (ins
->rex
& REX_OC
? 0x08 : 0) |
1448 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1450 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1456 opx
= &ins
->oprs
[c
>> 3];
1457 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1458 opx
= &ins
->oprs
[c
& 7];
1459 if (opx
->segment
!= NO_SEG
|| opx
->wrt
!= NO_SEG
) {
1460 errfunc(ERR_NONFATAL
,
1461 "non-absolute expression not permitted as argument %d",
1464 if (opx
->offset
& ~15) {
1465 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1466 "four-bit argument exceeds bounds");
1468 bytes
[0] |= opx
->offset
& 15;
1470 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1476 opx
= &ins
->oprs
[c
>> 4];
1477 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1479 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1485 opx
= &ins
->oprs
[c
];
1486 bytes
[0] = nasm_regvals
[opx
->basereg
] << 4;
1487 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1493 if (opx
->wrt
== NO_SEG
&& opx
->segment
== NO_SEG
&&
1494 (int32_t)data
!= (int64_t)data
) {
1495 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1496 "signed dword immediate exceeds bounds");
1498 if (is_sbyte32(opx
)) {
1500 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1504 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1505 opx
->segment
, opx
->wrt
);
1512 if (opx
->wrt
== NO_SEG
&& opx
->segment
== NO_SEG
&&
1513 (int32_t)data
!= (int64_t)data
) {
1514 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1515 "signed dword immediate exceeds bounds");
1517 out(offset
, segment
, &data
, OUT_ADDRESS
, 4,
1518 opx
->segment
, opx
->wrt
);
1525 if (ins
->vex_m
!= 1 || (ins
->rex
& (REX_W
|REX_X
|REX_B
))) {
1527 bytes
[1] = ins
->vex_m
| ((~ins
->rex
& 7) << 5);
1528 bytes
[2] = ((ins
->rex
& REX_W
) << (7-3)) |
1529 ((~ins
->drexdst
& 15)<< 3) | (ins
->vex_wlp
& 07);
1530 out(offset
, segment
, &bytes
, OUT_RAWDATA
, 3, NO_SEG
, NO_SEG
);
1534 bytes
[1] = ((~ins
->rex
& REX_R
) << (7-2)) |
1535 ((~ins
->drexdst
& 15) << 3) | (ins
->vex_wlp
& 07);
1536 out(offset
, segment
, &bytes
, OUT_RAWDATA
, 2, NO_SEG
, NO_SEG
);
1546 if (ins
->rex
& REX_W
)
1548 else if (ins
->prefixes
[PPS_OSIZE
] == P_O16
)
1550 else if (ins
->prefixes
[PPS_OSIZE
] == P_O32
)
1555 um
= (uint64_t)2 << (s
-1);
1558 if (uv
> 127 && uv
< (uint64_t)-128 &&
1559 (uv
< um
-128 || uv
> um
-1)) {
1560 errfunc(ERR_WARNING
| ERR_PASS2
| ERR_WARN_NOV
,
1561 "signed byte value exceeds bounds");
1563 if (opx
->segment
!= NO_SEG
) {
1565 out(offset
, segment
, &data
, OUT_ADDRESS
, 1,
1566 opx
->segment
, opx
->wrt
);
1569 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
,
1580 if (bits
== 32 && !has_prefix(ins
, PPS_ASIZE
, P_A16
)) {
1582 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1589 if (bits
!= 32 && !has_prefix(ins
, PPS_ASIZE
, P_A32
)) {
1591 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1610 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1619 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1634 *bytes
= *codes
++ ^ condval
[ins
->condition
];
1635 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1644 *bytes
= c
- 0332 + 0xF2;
1645 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1650 if (ins
->rex
& REX_R
) {
1652 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1655 ins
->rex
&= ~(REX_L
|REX_R
);
1666 if (ins
->oprs
[0].segment
!= NO_SEG
)
1667 errfunc(ERR_PANIC
, "non-constant BSS size in pass two");
1669 int64_t size
= ins
->oprs
[0].offset
;
1671 out(offset
, segment
, NULL
,
1672 OUT_RESERVE
, size
, NO_SEG
, NO_SEG
);
1680 switch (ins
->oprs
[0].basereg
) {
1695 "bizarre 8086 segment register received");
1697 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1704 switch (ins
->oprs
[0].basereg
) {
1713 "bizarre 386 segment register received");
1715 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1724 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1730 bytes
[0] = c
- 0362 + 0xf2;
1731 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1741 *bytes
= c
- 0366 + 0x66;
1742 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1752 *bytes
= bits
== 16 ? 3 : 5;
1753 out(offset
, segment
, bytes
, OUT_RAWDATA
, 1, NO_SEG
, NO_SEG
);
1776 struct operand
*opy
= &ins
->oprs
[op2
];
1779 /* pick rfield from operand b (opx) */
1780 rflags
= regflag(opx
);
1781 rfield
= nasm_regvals
[opx
->basereg
];
1783 /* rfield is constant */
1788 if (!process_ea(opy
, &ea_data
, bits
, ins
->addr_size
,
1790 errfunc(ERR_NONFATAL
, "invalid effective address");
1795 *p
++ = ea_data
.modrm
;
1796 if (ea_data
.sib_present
)
1799 /* DREX suffixes come between the SIB and the displacement */
1800 if (ins
->rex
& REX_D
) {
1801 *p
++ = (ins
->drexdst
<< 4) |
1802 (ins
->rex
& REX_OC
? 0x08 : 0) |
1803 (ins
->rex
& (REX_R
|REX_X
|REX_B
));
1808 out(offset
, segment
, bytes
, OUT_RAWDATA
, s
, NO_SEG
, NO_SEG
);
1811 * Make sure the address gets the right offset in case
1812 * the line breaks in the .lst file (BR 1197827)
1817 switch (ea_data
.bytes
) {
1825 warn_overflow(ea_data
.bytes
, opy
);
1828 if (opy
->segment
== segment
) {
1830 out(offset
, segment
, &data
, OUT_ADDRESS
,
1831 ea_data
.bytes
, NO_SEG
, NO_SEG
);
1833 out(offset
, segment
, &data
, OUT_REL4ADR
,
1834 insn_end
- offset
, opy
->segment
, opy
->wrt
);
1838 out(offset
, segment
, &data
, OUT_ADDRESS
,
1839 ea_data
.bytes
, opy
->segment
, opy
->wrt
);
1845 "Invalid amount of bytes (%d) for offset?!",
1854 errfunc(ERR_PANIC
, "internal instruction table corrupt"
1855 ": instruction code 0x%02X given", c
);
1861 static int32_t regflag(const operand
* o
)
1863 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1864 errfunc(ERR_PANIC
, "invalid operand passed to regflag()");
1866 return nasm_reg_flags
[o
->basereg
];
1869 static int32_t regval(const operand
* o
)
1871 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1872 errfunc(ERR_PANIC
, "invalid operand passed to regval()");
1874 return nasm_regvals
[o
->basereg
];
1877 static int op_rexflags(const operand
* o
, int mask
)
1882 if (o
->basereg
< EXPR_REG_START
|| o
->basereg
>= REG_ENUM_LIMIT
) {
1883 errfunc(ERR_PANIC
, "invalid operand passed to op_rexflags()");
1886 flags
= nasm_reg_flags
[o
->basereg
];
1887 val
= nasm_regvals
[o
->basereg
];
1889 return rexflags(val
, flags
, mask
);
1892 static int rexflags(int val
, int32_t flags
, int mask
)
1897 rex
|= REX_B
|REX_X
|REX_R
;
1900 if (!(REG_HIGH
& ~flags
)) /* AH, CH, DH, BH */
1902 else if (!(REG8
& ~flags
) && val
>= 4) /* SPL, BPL, SIL, DIL */
1908 static int matches(const struct itemplate
*itemp
, insn
* instruction
, int bits
)
1910 int i
, size
[MAX_OPERANDS
], asize
, oprs
, ret
;
1917 if (itemp
->opcode
!= instruction
->opcode
)
1921 * Count the operands
1923 if (itemp
->operands
!= instruction
->operands
)
1927 * Check that no spurious colons or TOs are present
1929 for (i
= 0; i
< itemp
->operands
; i
++)
1930 if (instruction
->oprs
[i
].type
& ~itemp
->opd
[i
] & (COLON
| TO
))
1934 * Process size flags
1936 if (itemp
->flags
& IF_ARMASK
) {
1937 memset(size
, 0, sizeof size
);
1939 i
= ((itemp
->flags
& IF_ARMASK
) >> IF_ARSHFT
) - 1;
1941 switch (itemp
->flags
& IF_SMASK
) {
1978 switch (itemp
->flags
& IF_SMASK
) {
2013 for (i
= 0; i
< MAX_OPERANDS
; i
++)
2018 * Check that the operand flags all match up
2020 for (i
= 0; i
< itemp
->operands
; i
++) {
2021 int32_t type
= instruction
->oprs
[i
].type
;
2022 if (!(type
& SIZE_MASK
))
2025 if (itemp
->opd
[i
] & SAME_AS
) {
2026 int j
= itemp
->opd
[i
] & ~SAME_AS
;
2027 if (type
!= instruction
->oprs
[j
].type
||
2028 instruction
->oprs
[i
].basereg
!= instruction
->oprs
[j
].basereg
)
2030 } else if (itemp
->opd
[i
] & ~type
||
2031 ((itemp
->opd
[i
] & SIZE_MASK
) &&
2032 ((itemp
->opd
[i
] ^ type
) & SIZE_MASK
))) {
2033 if ((itemp
->opd
[i
] & ~type
& ~SIZE_MASK
) ||
2042 * Check operand sizes
2044 if (itemp
->flags
& (IF_SM
| IF_SM2
)) {
2045 oprs
= (itemp
->flags
& IF_SM2
? 2 : itemp
->operands
);
2047 for (i
= 0; i
< oprs
; i
++) {
2048 if ((asize
= itemp
->opd
[i
] & SIZE_MASK
) != 0) {
2050 for (j
= 0; j
< oprs
; j
++)
2056 oprs
= itemp
->operands
;
2059 for (i
= 0; i
< itemp
->operands
; i
++) {
2060 if (!(itemp
->opd
[i
] & SIZE_MASK
) &&
2061 (instruction
->oprs
[i
].type
& SIZE_MASK
& ~size
[i
]))
2066 * Check template is okay at the set cpu level
2068 if (((itemp
->flags
& IF_PLEVEL
) > cpu
))
2072 * Verify the appropriate long mode flag.
2074 if ((itemp
->flags
& (bits
== 64 ? IF_NOLONG
: IF_LONG
)))
2078 * Check if special handling needed for Jumps
2080 if ((uint8_t)(itemp
->code
[0]) >= 0370)
2086 static ea
*process_ea(operand
* input
, ea
* output
, int bits
,
2087 int addrbits
, int rfield
, int32_t rflags
)
2089 bool forw_ref
= !!(input
->opflags
& OPFLAG_FORWARD
);
2091 output
->rip
= false;
2093 /* REX flags for the rfield operand */
2094 output
->rex
|= rexflags(rfield
, rflags
, REX_R
|REX_P
|REX_W
|REX_H
);
2096 if (!(REGISTER
& ~input
->type
)) { /* register direct */
2100 if (input
->basereg
< EXPR_REG_START
/* Verify as Register */
2101 || input
->basereg
>= REG_ENUM_LIMIT
)
2104 i
= nasm_regvals
[input
->basereg
];
2107 return NULL
; /* Invalid EA register */
2109 output
->rex
|= op_rexflags(input
, REX_B
|REX_P
|REX_W
|REX_H
);
2111 output
->sib_present
= false; /* no SIB necessary */
2112 output
->bytes
= 0; /* no offset necessary either */
2113 output
->modrm
= 0xC0 | ((rfield
& 7) << 3) | (i
& 7);
2114 } else { /* it's a memory reference */
2115 if (input
->basereg
== -1
2116 && (input
->indexreg
== -1 || input
->scale
== 0)) {
2117 /* it's a pure offset */
2118 if (bits
== 64 && (~input
->type
& IP_REL
)) {
2119 int scale
, index
, base
;
2120 output
->sib_present
= true;
2124 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
2126 output
->modrm
= 4 | ((rfield
& 7) << 3);
2127 output
->rip
= false;
2129 output
->sib_present
= false;
2130 output
->bytes
= (addrbits
!= 16 ? 4 : 2);
2131 output
->modrm
= (addrbits
!= 16 ? 5 : 6) | ((rfield
& 7) << 3);
2132 output
->rip
= bits
== 64;
2134 } else { /* it's an indirection */
2135 int i
= input
->indexreg
, b
= input
->basereg
, s
= input
->scale
;
2136 int32_t o
= input
->offset
, seg
= input
->segment
;
2137 int hb
= input
->hintbase
, ht
= input
->hinttype
;
2140 int32_t ix
, bx
; /* register flags */
2143 i
= -1; /* make this easy, at least */
2145 if (i
>= EXPR_REG_START
&& i
< REG_ENUM_LIMIT
) {
2146 it
= nasm_regvals
[i
];
2147 ix
= nasm_reg_flags
[i
];
2153 if (b
>= EXPR_REG_START
&& b
< REG_ENUM_LIMIT
) {
2154 bt
= nasm_regvals
[b
];
2155 bx
= nasm_reg_flags
[b
];
2161 /* check for a 32/64-bit memory reference... */
2162 if ((ix
|bx
) & (BITS32
|BITS64
)) {
2163 /* it must be a 32/64-bit memory reference. Firstly we have
2164 * to check that all registers involved are type E/Rxx. */
2165 int32_t sok
= BITS32
|BITS64
;
2168 if (!(REG64
& ~ix
) || !(REG32
& ~ix
))
2176 return NULL
; /* Invalid register */
2177 if (~sok
& bx
& SIZE_MASK
)
2178 return NULL
; /* Invalid size */
2182 /* While we're here, ensure the user didn't specify
2184 if (input
->disp_size
== 16 || input
->disp_size
== 64)
2187 if (addrbits
== 16 ||
2188 (addrbits
== 32 && !(sok
& BITS32
)) ||
2189 (addrbits
== 64 && !(sok
& BITS64
)))
2192 /* now reorganize base/index */
2193 if (s
== 1 && bt
!= it
&& bt
!= -1 && it
!= -1 &&
2194 ((hb
== b
&& ht
== EAH_NOTBASE
)
2195 || (hb
== i
&& ht
== EAH_MAKEBASE
))) {
2196 /* swap if hints say so */
2197 t
= bt
, bt
= it
, it
= t
;
2198 t
= bx
, bx
= ix
, ix
= t
;
2200 if (bt
== it
) /* convert EAX+2*EAX to 3*EAX */
2201 bt
= -1, bx
= 0, s
++;
2202 if (bt
== -1 && s
== 1 && !(hb
== it
&& ht
== EAH_NOTBASE
)) {
2203 /* make single reg base, unless hint */
2204 bt
= it
, bx
= ix
, it
= -1, ix
= 0;
2206 if (((s
== 2 && it
!= REG_NUM_ESP
2207 && !(input
->eaflags
& EAF_TIMESTWO
)) || s
== 3
2208 || s
== 5 || s
== 9) && bt
== -1)
2209 bt
= it
, bx
= ix
, s
--; /* convert 3*EAX to EAX+2*EAX */
2210 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
2211 && (input
->eaflags
& EAF_TIMESTWO
))
2212 it
= bt
, ix
= bx
, bt
= -1, bx
= 0, s
= 1;
2213 /* convert [NOSPLIT EAX] to sib format with 0x0 displacement */
2214 if (s
== 1 && it
== REG_NUM_ESP
) {
2215 /* swap ESP into base if scale is 1 */
2216 t
= it
, it
= bt
, bt
= t
;
2217 t
= ix
, ix
= bx
, bx
= t
;
2219 if (it
== REG_NUM_ESP
2220 || (s
!= 1 && s
!= 2 && s
!= 4 && s
!= 8 && it
!= -1))
2221 return NULL
; /* wrong, for various reasons */
2223 output
->rex
|= rexflags(it
, ix
, REX_X
);
2224 output
->rex
|= rexflags(bt
, bx
, REX_B
);
2226 if (it
== -1 && (bt
& 7) != REG_NUM_ESP
) {
2235 if (rm
!= REG_NUM_EBP
&& o
== 0 &&
2236 seg
== NO_SEG
&& !forw_ref
&&
2238 (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2240 else if (input
->eaflags
& EAF_BYTEOFFS
||
2241 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2243 && !(input
->eaflags
& EAF_WORDOFFS
)))
2249 output
->sib_present
= false;
2250 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2251 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2254 int mod
, scale
, index
, base
;
2274 default: /* then what the smeg is it? */
2275 return NULL
; /* panic */
2283 if (base
!= REG_NUM_EBP
&& o
== 0 &&
2284 seg
== NO_SEG
&& !forw_ref
&&
2286 (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2288 else if (input
->eaflags
& EAF_BYTEOFFS
||
2289 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2291 && !(input
->eaflags
& EAF_WORDOFFS
)))
2297 output
->sib_present
= true;
2298 output
->bytes
= (bt
== -1 || mod
== 2 ? 4 : mod
);
2299 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | 4;
2300 output
->sib
= (scale
<< 6) | (index
<< 3) | base
;
2302 } else { /* it's 16-bit */
2305 /* check for 64-bit long mode */
2309 /* check all registers are BX, BP, SI or DI */
2310 if ((b
!= -1 && b
!= R_BP
&& b
!= R_BX
&& b
!= R_SI
2311 && b
!= R_DI
) || (i
!= -1 && i
!= R_BP
&& i
!= R_BX
2312 && i
!= R_SI
&& i
!= R_DI
))
2315 /* ensure the user didn't specify DWORD/QWORD */
2316 if (input
->disp_size
== 32 || input
->disp_size
== 64)
2319 if (s
!= 1 && i
!= -1)
2320 return NULL
; /* no can do, in 16-bit EA */
2321 if (b
== -1 && i
!= -1) {
2326 if ((b
== R_SI
|| b
== R_DI
) && i
!= -1) {
2331 /* have BX/BP as base, SI/DI index */
2333 return NULL
; /* shouldn't ever happen, in theory */
2334 if (i
!= -1 && b
!= -1 &&
2335 (i
== R_BP
|| i
== R_BX
|| b
== R_SI
|| b
== R_DI
))
2336 return NULL
; /* invalid combinations */
2337 if (b
== -1) /* pure offset: handled above */
2338 return NULL
; /* so if it gets to here, panic! */
2342 switch (i
* 256 + b
) {
2343 case R_SI
* 256 + R_BX
:
2346 case R_DI
* 256 + R_BX
:
2349 case R_SI
* 256 + R_BP
:
2352 case R_DI
* 256 + R_BP
:
2370 if (rm
== -1) /* can't happen, in theory */
2371 return NULL
; /* so panic if it does */
2373 if (o
== 0 && seg
== NO_SEG
&& !forw_ref
&& rm
!= 6 &&
2374 !(input
->eaflags
& (EAF_BYTEOFFS
| EAF_WORDOFFS
)))
2376 else if (input
->eaflags
& EAF_BYTEOFFS
||
2377 (o
>= -128 && o
<= 127 && seg
== NO_SEG
2379 && !(input
->eaflags
& EAF_WORDOFFS
)))
2384 output
->sib_present
= false; /* no SIB - it's 16-bit */
2385 output
->bytes
= mod
; /* bytes of offset needed */
2386 output
->modrm
= (mod
<< 6) | ((rfield
& 7) << 3) | rm
;
2391 output
->size
= 1 + output
->sib_present
+ output
->bytes
;
2395 static void add_asp(insn
*ins
, int addrbits
)
2400 valid
= (addrbits
== 64) ? 64|32 : 32|16;
2402 switch (ins
->prefixes
[PPS_ASIZE
]) {
2413 valid
&= (addrbits
== 32) ? 16 : 32;
2419 for (j
= 0; j
< ins
->operands
; j
++) {
2420 if (!(MEMORY
& ~ins
->oprs
[j
].type
)) {
2423 /* Verify as Register */
2424 if (ins
->oprs
[j
].indexreg
< EXPR_REG_START
2425 || ins
->oprs
[j
].indexreg
>= REG_ENUM_LIMIT
)
2428 i
= nasm_reg_flags
[ins
->oprs
[j
].indexreg
];
2430 /* Verify as Register */
2431 if (ins
->oprs
[j
].basereg
< EXPR_REG_START
2432 || ins
->oprs
[j
].basereg
>= REG_ENUM_LIMIT
)
2435 b
= nasm_reg_flags
[ins
->oprs
[j
].basereg
];
2437 if (ins
->oprs
[j
].scale
== 0)
2441 int ds
= ins
->oprs
[j
].disp_size
;
2442 if ((addrbits
!= 64 && ds
> 8) ||
2443 (addrbits
== 64 && ds
== 16))
2463 if (valid
& addrbits
) {
2464 ins
->addr_size
= addrbits
;
2465 } else if (valid
& ((addrbits
== 32) ? 16 : 32)) {
2466 /* Add an address size prefix */
2467 enum prefixes pref
= (addrbits
== 32) ? P_A16
: P_A32
;
2468 ins
->prefixes
[PPS_ASIZE
] = pref
;
2469 ins
->addr_size
= (addrbits
== 32) ? 16 : 32;
2472 errfunc(ERR_NONFATAL
, "impossible combination of address sizes");
2473 ins
->addr_size
= addrbits
; /* Error recovery */
2476 defdisp
= ins
->addr_size
== 16 ? 16 : 32;
2478 for (j
= 0; j
< ins
->operands
; j
++) {
2479 if (!(MEM_OFFS
& ~ins
->oprs
[j
].type
) &&
2480 (ins
->oprs
[j
].disp_size
? ins
->oprs
[j
].disp_size
: defdisp
)
2481 != ins
->addr_size
) {
2482 /* mem_offs sizes must match the address size; if not,
2483 strip the MEM_OFFS bit and match only EA instructions */
2484 ins
->oprs
[j
].type
&= ~(MEM_OFFS
& ~MEMORY
);