1 //===-- X86MCCodeEmitter.cpp - Convert X86 code to machine code -----------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 // This file implements the X86MCCodeEmitter class.
11 //===----------------------------------------------------------------------===//
13 #include "MCTargetDesc/X86BaseInfo.h"
14 #include "MCTargetDesc/X86FixupKinds.h"
15 #include "MCTargetDesc/X86MCTargetDesc.h"
16 #include "llvm/ADT/SmallVector.h"
17 #include "llvm/MC/MCCodeEmitter.h"
18 #include "llvm/MC/MCContext.h"
19 #include "llvm/MC/MCExpr.h"
20 #include "llvm/MC/MCFixup.h"
21 #include "llvm/MC/MCInst.h"
22 #include "llvm/MC/MCInstrDesc.h"
23 #include "llvm/MC/MCInstrInfo.h"
24 #include "llvm/MC/MCRegisterInfo.h"
25 #include "llvm/MC/MCSubtargetInfo.h"
26 #include "llvm/MC/MCSymbol.h"
27 #include "llvm/Support/ErrorHandling.h"
28 #include "llvm/Support/raw_ostream.h"
35 #define DEBUG_TYPE "mccodeemitter"
39 class X86MCCodeEmitter
: public MCCodeEmitter
{
40 const MCInstrInfo
&MCII
;
44 X86MCCodeEmitter(const MCInstrInfo
&mcii
, MCContext
&ctx
)
45 : MCII(mcii
), Ctx(ctx
) {
47 X86MCCodeEmitter(const X86MCCodeEmitter
&) = delete;
48 X86MCCodeEmitter
&operator=(const X86MCCodeEmitter
&) = delete;
49 ~X86MCCodeEmitter() override
= default;
51 bool is64BitMode(const MCSubtargetInfo
&STI
) const {
52 return STI
.getFeatureBits()[X86::Mode64Bit
];
55 bool is32BitMode(const MCSubtargetInfo
&STI
) const {
56 return STI
.getFeatureBits()[X86::Mode32Bit
];
59 bool is16BitMode(const MCSubtargetInfo
&STI
) const {
60 return STI
.getFeatureBits()[X86::Mode16Bit
];
63 /// Is16BitMemOperand - Return true if the specified instruction has
64 /// a 16-bit memory operand. Op specifies the operand # of the memoperand.
65 bool Is16BitMemOperand(const MCInst
&MI
, unsigned Op
,
66 const MCSubtargetInfo
&STI
) const {
67 const MCOperand
&BaseReg
= MI
.getOperand(Op
+X86::AddrBaseReg
);
68 const MCOperand
&IndexReg
= MI
.getOperand(Op
+X86::AddrIndexReg
);
69 const MCOperand
&Disp
= MI
.getOperand(Op
+X86::AddrDisp
);
71 if (is16BitMode(STI
) && BaseReg
.getReg() == 0 &&
72 Disp
.isImm() && Disp
.getImm() < 0x10000)
74 if ((BaseReg
.getReg() != 0 &&
75 X86MCRegisterClasses
[X86::GR16RegClassID
].contains(BaseReg
.getReg())) ||
76 (IndexReg
.getReg() != 0 &&
77 X86MCRegisterClasses
[X86::GR16RegClassID
].contains(IndexReg
.getReg())))
82 unsigned GetX86RegNum(const MCOperand
&MO
) const {
83 return Ctx
.getRegisterInfo()->getEncodingValue(MO
.getReg()) & 0x7;
86 unsigned getX86RegEncoding(const MCInst
&MI
, unsigned OpNum
) const {
87 return Ctx
.getRegisterInfo()->getEncodingValue(
88 MI
.getOperand(OpNum
).getReg());
91 // Does this register require a bit to be set in REX prefix.
92 bool isREXExtendedReg(const MCInst
&MI
, unsigned OpNum
) const {
93 return (getX86RegEncoding(MI
, OpNum
) >> 3) & 1;
96 void EmitByte(uint8_t C
, unsigned &CurByte
, raw_ostream
&OS
) const {
101 void EmitConstant(uint64_t Val
, unsigned Size
, unsigned &CurByte
,
102 raw_ostream
&OS
) const {
103 // Output the constant in little endian byte order.
104 for (unsigned i
= 0; i
!= Size
; ++i
) {
105 EmitByte(Val
& 255, CurByte
, OS
);
110 void EmitImmediate(const MCOperand
&Disp
, SMLoc Loc
,
111 unsigned ImmSize
, MCFixupKind FixupKind
,
112 unsigned &CurByte
, raw_ostream
&OS
,
113 SmallVectorImpl
<MCFixup
> &Fixups
,
114 int ImmOffset
= 0) const;
116 static uint8_t ModRMByte(unsigned Mod
, unsigned RegOpcode
, unsigned RM
) {
117 assert(Mod
< 4 && RegOpcode
< 8 && RM
< 8 && "ModRM Fields out of range!");
118 return RM
| (RegOpcode
<< 3) | (Mod
<< 6);
121 void EmitRegModRMByte(const MCOperand
&ModRMReg
, unsigned RegOpcodeFld
,
122 unsigned &CurByte
, raw_ostream
&OS
) const {
123 EmitByte(ModRMByte(3, RegOpcodeFld
, GetX86RegNum(ModRMReg
)), CurByte
, OS
);
126 void EmitSIBByte(unsigned SS
, unsigned Index
, unsigned Base
,
127 unsigned &CurByte
, raw_ostream
&OS
) const {
128 // SIB byte is in the same format as the ModRMByte.
129 EmitByte(ModRMByte(SS
, Index
, Base
), CurByte
, OS
);
132 void emitMemModRMByte(const MCInst
&MI
, unsigned Op
, unsigned RegOpcodeField
,
133 uint64_t TSFlags
, bool Rex
, unsigned &CurByte
,
134 raw_ostream
&OS
, SmallVectorImpl
<MCFixup
> &Fixups
,
135 const MCSubtargetInfo
&STI
) const;
137 void encodeInstruction(const MCInst
&MI
, raw_ostream
&OS
,
138 SmallVectorImpl
<MCFixup
> &Fixups
,
139 const MCSubtargetInfo
&STI
) const override
;
141 void EmitVEXOpcodePrefix(uint64_t TSFlags
, unsigned &CurByte
, int MemOperand
,
142 const MCInst
&MI
, const MCInstrDesc
&Desc
,
143 raw_ostream
&OS
) const;
145 void EmitSegmentOverridePrefix(unsigned &CurByte
, unsigned SegOperand
,
146 const MCInst
&MI
, raw_ostream
&OS
) const;
148 bool emitOpcodePrefix(uint64_t TSFlags
, unsigned &CurByte
, int MemOperand
,
149 const MCInst
&MI
, const MCInstrDesc
&Desc
,
150 const MCSubtargetInfo
&STI
, raw_ostream
&OS
) const;
152 uint8_t DetermineREXPrefix(const MCInst
&MI
, uint64_t TSFlags
,
153 int MemOperand
, const MCInstrDesc
&Desc
) const;
155 bool isPCRel32Branch(const MCInst
&MI
) const;
158 } // end anonymous namespace
160 /// isDisp8 - Return true if this signed displacement fits in a 8-bit
161 /// sign-extended field.
162 static bool isDisp8(int Value
) {
163 return Value
== (int8_t)Value
;
166 /// isCDisp8 - Return true if this signed displacement fits in a 8-bit
167 /// compressed dispacement field.
168 static bool isCDisp8(uint64_t TSFlags
, int Value
, int& CValue
) {
169 assert(((TSFlags
& X86II::EncodingMask
) == X86II::EVEX
) &&
170 "Compressed 8-bit displacement is only valid for EVEX inst.");
173 (TSFlags
& X86II::CD8_Scale_Mask
) >> X86II::CD8_Scale_Shift
;
174 if (CD8_Scale
== 0) {
176 return isDisp8(Value
);
179 unsigned Mask
= CD8_Scale
- 1;
180 assert((CD8_Scale
& Mask
) == 0 && "Invalid memory object size.");
181 if (Value
& Mask
) // Unaligned offset
183 Value
/= (int)CD8_Scale
;
184 bool Ret
= (Value
== (int8_t)Value
);
191 /// getImmFixupKind - Return the appropriate fixup kind to use for an immediate
192 /// in an instruction with the specified TSFlags.
193 static MCFixupKind
getImmFixupKind(uint64_t TSFlags
) {
194 unsigned Size
= X86II::getSizeOfImm(TSFlags
);
195 bool isPCRel
= X86II::isImmPCRel(TSFlags
);
197 if (X86II::isImmSigned(TSFlags
)) {
199 default: llvm_unreachable("Unsupported signed fixup size!");
200 case 4: return MCFixupKind(X86::reloc_signed_4byte
);
203 return MCFixup::getKindForSize(Size
, isPCRel
);
206 /// Is32BitMemOperand - Return true if the specified instruction has
207 /// a 32-bit memory operand. Op specifies the operand # of the memoperand.
208 static bool Is32BitMemOperand(const MCInst
&MI
, unsigned Op
) {
209 const MCOperand
&BaseReg
= MI
.getOperand(Op
+X86::AddrBaseReg
);
210 const MCOperand
&IndexReg
= MI
.getOperand(Op
+X86::AddrIndexReg
);
212 if ((BaseReg
.getReg() != 0 &&
213 X86MCRegisterClasses
[X86::GR32RegClassID
].contains(BaseReg
.getReg())) ||
214 (IndexReg
.getReg() != 0 &&
215 X86MCRegisterClasses
[X86::GR32RegClassID
].contains(IndexReg
.getReg())))
217 if (BaseReg
.getReg() == X86::EIP
) {
218 assert(IndexReg
.getReg() == 0 && "Invalid eip-based address.");
221 if (IndexReg
.getReg() == X86::EIZ
)
226 /// Is64BitMemOperand - Return true if the specified instruction has
227 /// a 64-bit memory operand. Op specifies the operand # of the memoperand.
229 static bool Is64BitMemOperand(const MCInst
&MI
, unsigned Op
) {
230 const MCOperand
&BaseReg
= MI
.getOperand(Op
+X86::AddrBaseReg
);
231 const MCOperand
&IndexReg
= MI
.getOperand(Op
+X86::AddrIndexReg
);
233 if ((BaseReg
.getReg() != 0 &&
234 X86MCRegisterClasses
[X86::GR64RegClassID
].contains(BaseReg
.getReg())) ||
235 (IndexReg
.getReg() != 0 &&
236 X86MCRegisterClasses
[X86::GR64RegClassID
].contains(IndexReg
.getReg())))
242 /// StartsWithGlobalOffsetTable - Check if this expression starts with
243 /// _GLOBAL_OFFSET_TABLE_ and if it is of the form
244 /// _GLOBAL_OFFSET_TABLE_-symbol. This is needed to support PIC on ELF
245 /// i386 as _GLOBAL_OFFSET_TABLE_ is magical. We check only simple case that
246 /// are know to be used: _GLOBAL_OFFSET_TABLE_ by itself or at the start
247 /// of a binary expression.
248 enum GlobalOffsetTableExprKind
{
253 static GlobalOffsetTableExprKind
254 StartsWithGlobalOffsetTable(const MCExpr
*Expr
) {
255 const MCExpr
*RHS
= nullptr;
256 if (Expr
->getKind() == MCExpr::Binary
) {
257 const MCBinaryExpr
*BE
= static_cast<const MCBinaryExpr
*>(Expr
);
262 if (Expr
->getKind() != MCExpr::SymbolRef
)
265 const MCSymbolRefExpr
*Ref
= static_cast<const MCSymbolRefExpr
*>(Expr
);
266 const MCSymbol
&S
= Ref
->getSymbol();
267 if (S
.getName() != "_GLOBAL_OFFSET_TABLE_")
269 if (RHS
&& RHS
->getKind() == MCExpr::SymbolRef
)
274 static bool HasSecRelSymbolRef(const MCExpr
*Expr
) {
275 if (Expr
->getKind() == MCExpr::SymbolRef
) {
276 const MCSymbolRefExpr
*Ref
= static_cast<const MCSymbolRefExpr
*>(Expr
);
277 return Ref
->getKind() == MCSymbolRefExpr::VK_SECREL
;
282 bool X86MCCodeEmitter::isPCRel32Branch(const MCInst
&MI
) const {
283 unsigned Opcode
= MI
.getOpcode();
284 const MCInstrDesc
&Desc
= MCII
.get(Opcode
);
285 if ((Opcode
!= X86::CALL64pcrel32
&& Opcode
!= X86::JMP_4
) ||
286 getImmFixupKind(Desc
.TSFlags
) != FK_PCRel_4
)
289 unsigned CurOp
= X86II::getOperandBias(Desc
);
290 const MCOperand
&Op
= MI
.getOperand(CurOp
);
294 const MCSymbolRefExpr
*Ref
= dyn_cast
<MCSymbolRefExpr
>(Op
.getExpr());
295 return Ref
&& Ref
->getKind() == MCSymbolRefExpr::VK_None
;
298 void X86MCCodeEmitter::
299 EmitImmediate(const MCOperand
&DispOp
, SMLoc Loc
, unsigned Size
,
300 MCFixupKind FixupKind
, unsigned &CurByte
, raw_ostream
&OS
,
301 SmallVectorImpl
<MCFixup
> &Fixups
, int ImmOffset
) const {
302 const MCExpr
*Expr
= nullptr;
303 if (DispOp
.isImm()) {
304 // If this is a simple integer displacement that doesn't require a
305 // relocation, emit it now.
306 if (FixupKind
!= FK_PCRel_1
&&
307 FixupKind
!= FK_PCRel_2
&&
308 FixupKind
!= FK_PCRel_4
) {
309 EmitConstant(DispOp
.getImm()+ImmOffset
, Size
, CurByte
, OS
);
312 Expr
= MCConstantExpr::create(DispOp
.getImm(), Ctx
);
314 Expr
= DispOp
.getExpr();
317 // If we have an immoffset, add it to the expression.
318 if ((FixupKind
== FK_Data_4
||
319 FixupKind
== FK_Data_8
||
320 FixupKind
== MCFixupKind(X86::reloc_signed_4byte
))) {
321 GlobalOffsetTableExprKind Kind
= StartsWithGlobalOffsetTable(Expr
);
322 if (Kind
!= GOT_None
) {
323 assert(ImmOffset
== 0);
326 FixupKind
= MCFixupKind(X86::reloc_global_offset_table8
);
329 FixupKind
= MCFixupKind(X86::reloc_global_offset_table
);
332 if (Kind
== GOT_Normal
)
334 } else if (Expr
->getKind() == MCExpr::SymbolRef
) {
335 if (HasSecRelSymbolRef(Expr
)) {
336 FixupKind
= MCFixupKind(FK_SecRel_4
);
338 } else if (Expr
->getKind() == MCExpr::Binary
) {
339 const MCBinaryExpr
*Bin
= static_cast<const MCBinaryExpr
*>(Expr
);
340 if (HasSecRelSymbolRef(Bin
->getLHS())
341 || HasSecRelSymbolRef(Bin
->getRHS())) {
342 FixupKind
= MCFixupKind(FK_SecRel_4
);
347 // If the fixup is pc-relative, we need to bias the value to be relative to
348 // the start of the field, not the end of the field.
349 if (FixupKind
== FK_PCRel_4
||
350 FixupKind
== MCFixupKind(X86::reloc_riprel_4byte
) ||
351 FixupKind
== MCFixupKind(X86::reloc_riprel_4byte_movq_load
) ||
352 FixupKind
== MCFixupKind(X86::reloc_riprel_4byte_relax
) ||
353 FixupKind
== MCFixupKind(X86::reloc_riprel_4byte_relax_rex
) ||
354 FixupKind
== MCFixupKind(X86::reloc_branch_4byte_pcrel
)) {
356 // If this is a pc-relative load off _GLOBAL_OFFSET_TABLE_:
357 // leaq _GLOBAL_OFFSET_TABLE_(%rip), %r15
358 // this needs to be a GOTPC32 relocation.
359 if (StartsWithGlobalOffsetTable(Expr
) != GOT_None
)
360 FixupKind
= MCFixupKind(X86::reloc_global_offset_table
);
362 if (FixupKind
== FK_PCRel_2
)
364 if (FixupKind
== FK_PCRel_1
)
368 Expr
= MCBinaryExpr::createAdd(Expr
, MCConstantExpr::create(ImmOffset
, Ctx
),
371 // Emit a symbolic constant as a fixup and 4 zeros.
372 Fixups
.push_back(MCFixup::create(CurByte
, Expr
, FixupKind
, Loc
));
373 EmitConstant(0, Size
, CurByte
, OS
);
376 void X86MCCodeEmitter::emitMemModRMByte(const MCInst
&MI
, unsigned Op
,
377 unsigned RegOpcodeField
,
378 uint64_t TSFlags
, bool Rex
,
379 unsigned &CurByte
, raw_ostream
&OS
,
380 SmallVectorImpl
<MCFixup
> &Fixups
,
381 const MCSubtargetInfo
&STI
) const {
382 const MCOperand
&Disp
= MI
.getOperand(Op
+X86::AddrDisp
);
383 const MCOperand
&Base
= MI
.getOperand(Op
+X86::AddrBaseReg
);
384 const MCOperand
&Scale
= MI
.getOperand(Op
+X86::AddrScaleAmt
);
385 const MCOperand
&IndexReg
= MI
.getOperand(Op
+X86::AddrIndexReg
);
386 unsigned BaseReg
= Base
.getReg();
387 bool HasEVEX
= (TSFlags
& X86II::EncodingMask
) == X86II::EVEX
;
389 // Handle %rip relative addressing.
390 if (BaseReg
== X86::RIP
||
391 BaseReg
== X86::EIP
) { // [disp32+rIP] in X86-64 mode
392 assert(is64BitMode(STI
) && "Rip-relative addressing requires 64-bit mode");
393 assert(IndexReg
.getReg() == 0 && "Invalid rip-relative address");
394 EmitByte(ModRMByte(0, RegOpcodeField
, 5), CurByte
, OS
);
396 unsigned Opcode
= MI
.getOpcode();
397 // movq loads are handled with a special relocation form which allows the
398 // linker to eliminate some loads for GOT references which end up in the
399 // same linkage unit.
400 unsigned FixupKind
= [=]() {
403 return X86::reloc_riprel_4byte
;
406 return X86::reloc_riprel_4byte_movq_load
;
409 case X86::TAILJMPm64
:
419 return Rex
? X86::reloc_riprel_4byte_relax_rex
420 : X86::reloc_riprel_4byte_relax
;
424 // rip-relative addressing is actually relative to the *next* instruction.
425 // Since an immediate can follow the mod/rm byte for an instruction, this
426 // means that we need to bias the displacement field of the instruction with
427 // the size of the immediate field. If we have this case, add it into the
428 // expression to emit.
429 // Note: rip-relative addressing using immediate displacement values should
430 // not be adjusted, assuming it was the user's intent.
431 int ImmSize
= !Disp
.isImm() && X86II::hasImm(TSFlags
)
432 ? X86II::getSizeOfImm(TSFlags
)
435 EmitImmediate(Disp
, MI
.getLoc(), 4, MCFixupKind(FixupKind
),
436 CurByte
, OS
, Fixups
, -ImmSize
);
440 unsigned BaseRegNo
= BaseReg
? GetX86RegNum(Base
) : -1U;
442 // 16-bit addressing forms of the ModR/M byte have a different encoding for
443 // the R/M field and are far more limited in which registers can be used.
444 if (Is16BitMemOperand(MI
, Op
, STI
)) {
446 // For 32-bit addressing, the row and column values in Table 2-2 are
447 // basically the same. It's AX/CX/DX/BX/SP/BP/SI/DI in that order, with
448 // some special cases. And GetX86RegNum reflects that numbering.
449 // For 16-bit addressing it's more fun, as shown in the SDM Vol 2A,
450 // Table 2-1 "16-Bit Addressing Forms with the ModR/M byte". We can only
451 // use SI/DI/BP/BX, which have "row" values 4-7 in no particular order,
452 // while values 0-3 indicate the allowed combinations (base+index) of
453 // those: 0 for BX+SI, 1 for BX+DI, 2 for BP+SI, 3 for BP+DI.
455 // R16Table[] is a lookup from the normal RegNo, to the row values from
456 // Table 2-1 for 16-bit addressing modes. Where zero means disallowed.
457 static const unsigned R16Table
[] = { 0, 0, 0, 7, 0, 6, 4, 5 };
458 unsigned RMfield
= R16Table
[BaseRegNo
];
460 assert(RMfield
&& "invalid 16-bit base register");
462 if (IndexReg
.getReg()) {
463 unsigned IndexReg16
= R16Table
[GetX86RegNum(IndexReg
)];
465 assert(IndexReg16
&& "invalid 16-bit index register");
466 // We must have one of SI/DI (4,5), and one of BP/BX (6,7).
467 assert(((IndexReg16
^ RMfield
) & 2) &&
468 "invalid 16-bit base/index register combination");
469 assert(Scale
.getImm() == 1 &&
470 "invalid scale for 16-bit memory reference");
472 // Allow base/index to appear in either order (although GAS doesn't).
474 RMfield
= (RMfield
& 1) | ((7 - IndexReg16
) << 1);
476 RMfield
= (IndexReg16
& 1) | ((7 - RMfield
) << 1);
479 if (Disp
.isImm() && isDisp8(Disp
.getImm())) {
480 if (Disp
.getImm() == 0 && RMfield
!= 6) {
481 // There is no displacement; just the register.
482 EmitByte(ModRMByte(0, RegOpcodeField
, RMfield
), CurByte
, OS
);
485 // Use the [REG]+disp8 form, including for [BP] which cannot be encoded.
486 EmitByte(ModRMByte(1, RegOpcodeField
, RMfield
), CurByte
, OS
);
487 EmitImmediate(Disp
, MI
.getLoc(), 1, FK_Data_1
, CurByte
, OS
, Fixups
);
490 // This is the [REG]+disp16 case.
491 EmitByte(ModRMByte(2, RegOpcodeField
, RMfield
), CurByte
, OS
);
493 // There is no BaseReg; this is the plain [disp16] case.
494 EmitByte(ModRMByte(0, RegOpcodeField
, 6), CurByte
, OS
);
497 // Emit 16-bit displacement for plain disp16 or [REG]+disp16 cases.
498 EmitImmediate(Disp
, MI
.getLoc(), 2, FK_Data_2
, CurByte
, OS
, Fixups
);
502 // Determine whether a SIB byte is needed.
503 // If no BaseReg, issue a RIP relative instruction only if the MCE can
504 // resolve addresses on-the-fly, otherwise use SIB (Intel Manual 2A, table
505 // 2-7) and absolute references.
507 if (// The SIB byte must be used if there is an index register.
508 IndexReg
.getReg() == 0 &&
509 // The SIB byte must be used if the base is ESP/RSP/R12, all of which
510 // encode to an R/M value of 4, which indicates that a SIB byte is
512 BaseRegNo
!= N86::ESP
&&
513 // If there is no base register and we're in 64-bit mode, we need a SIB
514 // byte to emit an addr that is just 'disp32' (the non-RIP relative form).
515 (!is64BitMode(STI
) || BaseReg
!= 0)) {
517 if (BaseReg
== 0) { // [disp32] in X86-32 mode
518 EmitByte(ModRMByte(0, RegOpcodeField
, 5), CurByte
, OS
);
519 EmitImmediate(Disp
, MI
.getLoc(), 4, FK_Data_4
, CurByte
, OS
, Fixups
);
523 // If the base is not EBP/ESP and there is no displacement, use simple
524 // indirect register encoding, this handles addresses like [EAX]. The
525 // encoding for [EBP] with no displacement means [disp32] so we handle it
526 // by emitting a displacement of 0 below.
527 if (Disp
.isImm() && Disp
.getImm() == 0 && BaseRegNo
!= N86::EBP
) {
528 EmitByte(ModRMByte(0, RegOpcodeField
, BaseRegNo
), CurByte
, OS
);
532 // Otherwise, if the displacement fits in a byte, encode as [REG+disp8].
534 if (!HasEVEX
&& isDisp8(Disp
.getImm())) {
535 EmitByte(ModRMByte(1, RegOpcodeField
, BaseRegNo
), CurByte
, OS
);
536 EmitImmediate(Disp
, MI
.getLoc(), 1, FK_Data_1
, CurByte
, OS
, Fixups
);
539 // Try EVEX compressed 8-bit displacement first; if failed, fall back to
540 // 32-bit displacement.
542 if (HasEVEX
&& isCDisp8(TSFlags
, Disp
.getImm(), CDisp8
)) {
543 EmitByte(ModRMByte(1, RegOpcodeField
, BaseRegNo
), CurByte
, OS
);
544 EmitImmediate(Disp
, MI
.getLoc(), 1, FK_Data_1
, CurByte
, OS
, Fixups
,
545 CDisp8
- Disp
.getImm());
550 // Otherwise, emit the most general non-SIB encoding: [REG+disp32]
551 EmitByte(ModRMByte(2, RegOpcodeField
, BaseRegNo
), CurByte
, OS
);
552 unsigned Opcode
= MI
.getOpcode();
553 unsigned FixupKind
= Opcode
== X86::MOV32rm
? X86::reloc_signed_4byte_relax
554 : X86::reloc_signed_4byte
;
555 EmitImmediate(Disp
, MI
.getLoc(), 4, MCFixupKind(FixupKind
), CurByte
, OS
,
560 // We need a SIB byte, so start by outputting the ModR/M byte first
561 assert(IndexReg
.getReg() != X86::ESP
&&
562 IndexReg
.getReg() != X86::RSP
&& "Cannot use ESP as index reg!");
564 bool ForceDisp32
= false;
565 bool ForceDisp8
= false;
569 // If there is no base register, we emit the special case SIB byte with
570 // MOD=0, BASE=5, to JUST get the index, scale, and displacement.
571 EmitByte(ModRMByte(0, RegOpcodeField
, 4), CurByte
, OS
);
573 } else if (!Disp
.isImm()) {
574 // Emit the normal disp32 encoding.
575 EmitByte(ModRMByte(2, RegOpcodeField
, 4), CurByte
, OS
);
577 } else if (Disp
.getImm() == 0 &&
578 // Base reg can't be anything that ends up with '5' as the base
579 // reg, it is the magic [*] nomenclature that indicates no base.
580 BaseRegNo
!= N86::EBP
) {
581 // Emit no displacement ModR/M byte
582 EmitByte(ModRMByte(0, RegOpcodeField
, 4), CurByte
, OS
);
583 } else if (!HasEVEX
&& isDisp8(Disp
.getImm())) {
584 // Emit the disp8 encoding.
585 EmitByte(ModRMByte(1, RegOpcodeField
, 4), CurByte
, OS
);
586 ForceDisp8
= true; // Make sure to force 8 bit disp if Base=EBP
587 } else if (HasEVEX
&& isCDisp8(TSFlags
, Disp
.getImm(), CDisp8
)) {
588 // Emit the disp8 encoding.
589 EmitByte(ModRMByte(1, RegOpcodeField
, 4), CurByte
, OS
);
590 ForceDisp8
= true; // Make sure to force 8 bit disp if Base=EBP
591 ImmOffset
= CDisp8
- Disp
.getImm();
593 // Emit the normal disp32 encoding.
594 EmitByte(ModRMByte(2, RegOpcodeField
, 4), CurByte
, OS
);
597 // Calculate what the SS field value should be...
598 static const unsigned SSTable
[] = { ~0U, 0, 1, ~0U, 2, ~0U, ~0U, ~0U, 3 };
599 unsigned SS
= SSTable
[Scale
.getImm()];
602 // Handle the SIB byte for the case where there is no base, see Intel
603 // Manual 2A, table 2-7. The displacement has already been output.
605 if (IndexReg
.getReg())
606 IndexRegNo
= GetX86RegNum(IndexReg
);
607 else // Examples: [ESP+1*<noreg>+4] or [scaled idx]+disp32 (MOD=0,BASE=5)
609 EmitSIBByte(SS
, IndexRegNo
, 5, CurByte
, OS
);
612 if (IndexReg
.getReg())
613 IndexRegNo
= GetX86RegNum(IndexReg
);
615 IndexRegNo
= 4; // For example [ESP+1*<noreg>+4]
616 EmitSIBByte(SS
, IndexRegNo
, GetX86RegNum(Base
), CurByte
, OS
);
619 // Do we need to output a displacement?
621 EmitImmediate(Disp
, MI
.getLoc(), 1, FK_Data_1
, CurByte
, OS
, Fixups
, ImmOffset
);
622 else if (ForceDisp32
|| Disp
.getImm() != 0)
623 EmitImmediate(Disp
, MI
.getLoc(), 4, MCFixupKind(X86::reloc_signed_4byte
),
624 CurByte
, OS
, Fixups
);
627 /// EmitVEXOpcodePrefix - AVX instructions are encoded using a opcode prefix
629 void X86MCCodeEmitter::EmitVEXOpcodePrefix(uint64_t TSFlags
, unsigned &CurByte
,
630 int MemOperand
, const MCInst
&MI
,
631 const MCInstrDesc
&Desc
,
632 raw_ostream
&OS
) const {
633 assert(!(TSFlags
& X86II::LOCK
) && "Can't have LOCK VEX.");
635 uint64_t Encoding
= TSFlags
& X86II::EncodingMask
;
636 bool HasEVEX_K
= TSFlags
& X86II::EVEX_K
;
637 bool HasVEX_4V
= TSFlags
& X86II::VEX_4V
;
638 bool HasEVEX_RC
= TSFlags
& X86II::EVEX_RC
;
640 // VEX_R: opcode externsion equivalent to REX.R in
641 // 1's complement (inverted) form
643 // 1: Same as REX_R=0 (must be 1 in 32-bit mode)
644 // 0: Same as REX_R=1 (64 bit mode only)
647 uint8_t EVEX_R2
= 0x1;
649 // VEX_X: equivalent to REX.X, only used when a
650 // register is used for index in SIB Byte.
652 // 1: Same as REX.X=0 (must be 1 in 32-bit mode)
653 // 0: Same as REX.X=1 (64-bit mode only)
658 // 1: Same as REX_B=0 (ignored in 32-bit mode)
659 // 0: Same as REX_B=1 (64 bit mode only)
663 // VEX_W: opcode specific (use like REX.W, or used for
664 // opcode extension, or ignored, depending on the opcode byte)
665 uint8_t VEX_W
= (TSFlags
& X86II::VEX_W
) ? 1 : 0;
667 // VEX_5M (VEX m-mmmmm field):
669 // 0b00000: Reserved for future use
670 // 0b00001: implied 0F leading opcode
671 // 0b00010: implied 0F 38 leading opcode bytes
672 // 0b00011: implied 0F 3A leading opcode bytes
673 // 0b00100-0b11111: Reserved for future use
674 // 0b01000: XOP map select - 08h instructions with imm byte
675 // 0b01001: XOP map select - 09h instructions with no imm byte
676 // 0b01010: XOP map select - 0Ah instructions with imm dword
678 switch (TSFlags
& X86II::OpMapMask
) {
679 default: llvm_unreachable("Invalid prefix!");
680 case X86II::TB
: VEX_5M
= 0x1; break; // 0F
681 case X86II::T8
: VEX_5M
= 0x2; break; // 0F 38
682 case X86II::TA
: VEX_5M
= 0x3; break; // 0F 3A
683 case X86II::XOP8
: VEX_5M
= 0x8; break;
684 case X86II::XOP9
: VEX_5M
= 0x9; break;
685 case X86II::XOPA
: VEX_5M
= 0xA; break;
688 // VEX_4V (VEX vvvv field): a register specifier
689 // (in 1's complement form) or 1111 if unused.
690 uint8_t VEX_4V
= 0xf;
691 uint8_t EVEX_V2
= 0x1;
693 // EVEX_L2/VEX_L (Vector Length):
696 // 0 0: scalar or 128-bit vector
697 // 0 1: 256-bit vector
698 // 1 0: 512-bit vector
700 uint8_t VEX_L
= (TSFlags
& X86II::VEX_L
) ? 1 : 0;
701 uint8_t EVEX_L2
= (TSFlags
& X86II::EVEX_L2
) ? 1 : 0;
703 // VEX_PP: opcode extension providing equivalent
704 // functionality of a SIMD prefix
712 switch (TSFlags
& X86II::OpPrefixMask
) {
713 case X86II::PD
: VEX_PP
= 0x1; break; // 66
714 case X86II::XS
: VEX_PP
= 0x2; break; // F3
715 case X86II::XD
: VEX_PP
= 0x3; break; // F2
719 uint8_t EVEX_U
= 1; // Always '1' so far
722 uint8_t EVEX_z
= (HasEVEX_K
&& (TSFlags
& X86II::EVEX_Z
)) ? 1 : 0;
725 uint8_t EVEX_b
= (TSFlags
& X86II::EVEX_B
) ? 1 : 0;
731 uint8_t EVEX_aaa
= 0;
733 bool EncodeRC
= false;
735 // Classify VEX_B, VEX_4V, VEX_R, VEX_X
736 unsigned NumOps
= Desc
.getNumOperands();
737 unsigned CurOp
= X86II::getOperandBias(Desc
);
739 switch (TSFlags
& X86II::FormMask
) {
740 default: llvm_unreachable("Unexpected form in EmitVEXOpcodePrefix!");
743 case X86II::MRMDestMem
: {
744 // MRMDestMem instructions forms:
745 // MemAddr, src1(ModR/M)
746 // MemAddr, src1(VEX_4V), src2(ModR/M)
747 // MemAddr, src1(ModR/M), imm8
749 unsigned BaseRegEnc
= getX86RegEncoding(MI
, MemOperand
+ X86::AddrBaseReg
);
750 VEX_B
= ~(BaseRegEnc
>> 3) & 1;
751 unsigned IndexRegEnc
= getX86RegEncoding(MI
, MemOperand
+X86::AddrIndexReg
);
752 VEX_X
= ~(IndexRegEnc
>> 3) & 1;
753 if (!HasVEX_4V
) // Only needed with VSIB which don't use VVVV.
754 EVEX_V2
= ~(IndexRegEnc
>> 4) & 1;
756 CurOp
+= X86::AddrNumOperands
;
759 EVEX_aaa
= getX86RegEncoding(MI
, CurOp
++);
762 unsigned VRegEnc
= getX86RegEncoding(MI
, CurOp
++);
763 VEX_4V
= ~VRegEnc
& 0xf;
764 EVEX_V2
= ~(VRegEnc
>> 4) & 1;
767 unsigned RegEnc
= getX86RegEncoding(MI
, CurOp
++);
768 VEX_R
= ~(RegEnc
>> 3) & 1;
769 EVEX_R2
= ~(RegEnc
>> 4) & 1;
772 case X86II::MRMSrcMem
: {
773 // MRMSrcMem instructions forms:
774 // src1(ModR/M), MemAddr
775 // src1(ModR/M), src2(VEX_4V), MemAddr
776 // src1(ModR/M), MemAddr, imm8
777 // src1(ModR/M), MemAddr, src2(Imm[7:4])
780 // dst(ModR/M.reg), src1(VEX_4V), src2(ModR/M), src3(Imm[7:4])
781 unsigned RegEnc
= getX86RegEncoding(MI
, CurOp
++);
782 VEX_R
= ~(RegEnc
>> 3) & 1;
783 EVEX_R2
= ~(RegEnc
>> 4) & 1;
786 EVEX_aaa
= getX86RegEncoding(MI
, CurOp
++);
789 unsigned VRegEnc
= getX86RegEncoding(MI
, CurOp
++);
790 VEX_4V
= ~VRegEnc
& 0xf;
791 EVEX_V2
= ~(VRegEnc
>> 4) & 1;
794 unsigned BaseRegEnc
= getX86RegEncoding(MI
, MemOperand
+ X86::AddrBaseReg
);
795 VEX_B
= ~(BaseRegEnc
>> 3) & 1;
796 unsigned IndexRegEnc
= getX86RegEncoding(MI
, MemOperand
+X86::AddrIndexReg
);
797 VEX_X
= ~(IndexRegEnc
>> 3) & 1;
798 if (!HasVEX_4V
) // Only needed with VSIB which don't use VVVV.
799 EVEX_V2
= ~(IndexRegEnc
>> 4) & 1;
803 case X86II::MRMSrcMem4VOp3
: {
804 // Instruction format for 4VOp3:
805 // src1(ModR/M), MemAddr, src3(VEX_4V)
806 unsigned RegEnc
= getX86RegEncoding(MI
, CurOp
++);
807 VEX_R
= ~(RegEnc
>> 3) & 1;
809 unsigned BaseRegEnc
= getX86RegEncoding(MI
, MemOperand
+ X86::AddrBaseReg
);
810 VEX_B
= ~(BaseRegEnc
>> 3) & 1;
811 unsigned IndexRegEnc
= getX86RegEncoding(MI
, MemOperand
+X86::AddrIndexReg
);
812 VEX_X
= ~(IndexRegEnc
>> 3) & 1;
814 VEX_4V
= ~getX86RegEncoding(MI
, CurOp
+ X86::AddrNumOperands
) & 0xf;
817 case X86II::MRMSrcMemOp4
: {
818 // dst(ModR/M.reg), src1(VEX_4V), src2(Imm[7:4]), src3(ModR/M),
819 unsigned RegEnc
= getX86RegEncoding(MI
, CurOp
++);
820 VEX_R
= ~(RegEnc
>> 3) & 1;
822 unsigned VRegEnc
= getX86RegEncoding(MI
, CurOp
++);
823 VEX_4V
= ~VRegEnc
& 0xf;
825 unsigned BaseRegEnc
= getX86RegEncoding(MI
, MemOperand
+ X86::AddrBaseReg
);
826 VEX_B
= ~(BaseRegEnc
>> 3) & 1;
827 unsigned IndexRegEnc
= getX86RegEncoding(MI
, MemOperand
+X86::AddrIndexReg
);
828 VEX_X
= ~(IndexRegEnc
>> 3) & 1;
831 case X86II::MRM0m
: case X86II::MRM1m
:
832 case X86II::MRM2m
: case X86II::MRM3m
:
833 case X86II::MRM4m
: case X86II::MRM5m
:
834 case X86II::MRM6m
: case X86II::MRM7m
: {
835 // MRM[0-9]m instructions forms:
837 // src1(VEX_4V), MemAddr
839 unsigned VRegEnc
= getX86RegEncoding(MI
, CurOp
++);
840 VEX_4V
= ~VRegEnc
& 0xf;
841 EVEX_V2
= ~(VRegEnc
>> 4) & 1;
845 EVEX_aaa
= getX86RegEncoding(MI
, CurOp
++);
847 unsigned BaseRegEnc
= getX86RegEncoding(MI
, MemOperand
+ X86::AddrBaseReg
);
848 VEX_B
= ~(BaseRegEnc
>> 3) & 1;
849 unsigned IndexRegEnc
= getX86RegEncoding(MI
, MemOperand
+X86::AddrIndexReg
);
850 VEX_X
= ~(IndexRegEnc
>> 3) & 1;
853 case X86II::MRMSrcReg
: {
854 // MRMSrcReg instructions forms:
855 // dst(ModR/M), src1(VEX_4V), src2(ModR/M), src3(Imm[7:4])
856 // dst(ModR/M), src1(ModR/M)
857 // dst(ModR/M), src1(ModR/M), imm8
860 // dst(ModR/M.reg), src1(VEX_4V), src2(Imm[7:4]), src3(ModR/M),
861 unsigned RegEnc
= getX86RegEncoding(MI
, CurOp
++);
862 VEX_R
= ~(RegEnc
>> 3) & 1;
863 EVEX_R2
= ~(RegEnc
>> 4) & 1;
866 EVEX_aaa
= getX86RegEncoding(MI
, CurOp
++);
869 unsigned VRegEnc
= getX86RegEncoding(MI
, CurOp
++);
870 VEX_4V
= ~VRegEnc
& 0xf;
871 EVEX_V2
= ~(VRegEnc
>> 4) & 1;
874 RegEnc
= getX86RegEncoding(MI
, CurOp
++);
875 VEX_B
= ~(RegEnc
>> 3) & 1;
876 VEX_X
= ~(RegEnc
>> 4) & 1;
880 unsigned RcOperand
= NumOps
-1;
881 assert(RcOperand
>= CurOp
);
882 EVEX_rc
= MI
.getOperand(RcOperand
).getImm() & 0x3;
888 case X86II::MRMSrcReg4VOp3
: {
889 // Instruction format for 4VOp3:
890 // src1(ModR/M), src2(ModR/M), src3(VEX_4V)
891 unsigned RegEnc
= getX86RegEncoding(MI
, CurOp
++);
892 VEX_R
= ~(RegEnc
>> 3) & 1;
894 RegEnc
= getX86RegEncoding(MI
, CurOp
++);
895 VEX_B
= ~(RegEnc
>> 3) & 1;
897 VEX_4V
= ~getX86RegEncoding(MI
, CurOp
++) & 0xf;
900 case X86II::MRMSrcRegOp4
: {
901 // dst(ModR/M.reg), src1(VEX_4V), src2(Imm[7:4]), src3(ModR/M),
902 unsigned RegEnc
= getX86RegEncoding(MI
, CurOp
++);
903 VEX_R
= ~(RegEnc
>> 3) & 1;
905 unsigned VRegEnc
= getX86RegEncoding(MI
, CurOp
++);
906 VEX_4V
= ~VRegEnc
& 0xf;
908 // Skip second register source (encoded in Imm[7:4])
911 RegEnc
= getX86RegEncoding(MI
, CurOp
++);
912 VEX_B
= ~(RegEnc
>> 3) & 1;
913 VEX_X
= ~(RegEnc
>> 4) & 1;
916 case X86II::MRMDestReg
: {
917 // MRMDestReg instructions forms:
918 // dst(ModR/M), src(ModR/M)
919 // dst(ModR/M), src(ModR/M), imm8
920 // dst(ModR/M), src1(VEX_4V), src2(ModR/M)
921 unsigned RegEnc
= getX86RegEncoding(MI
, CurOp
++);
922 VEX_B
= ~(RegEnc
>> 3) & 1;
923 VEX_X
= ~(RegEnc
>> 4) & 1;
926 EVEX_aaa
= getX86RegEncoding(MI
, CurOp
++);
929 unsigned VRegEnc
= getX86RegEncoding(MI
, CurOp
++);
930 VEX_4V
= ~VRegEnc
& 0xf;
931 EVEX_V2
= ~(VRegEnc
>> 4) & 1;
934 RegEnc
= getX86RegEncoding(MI
, CurOp
++);
935 VEX_R
= ~(RegEnc
>> 3) & 1;
936 EVEX_R2
= ~(RegEnc
>> 4) & 1;
941 case X86II::MRM0r
: case X86II::MRM1r
:
942 case X86II::MRM2r
: case X86II::MRM3r
:
943 case X86II::MRM4r
: case X86II::MRM5r
:
944 case X86II::MRM6r
: case X86II::MRM7r
: {
945 // MRM0r-MRM7r instructions forms:
946 // dst(VEX_4V), src(ModR/M), imm8
948 unsigned VRegEnc
= getX86RegEncoding(MI
, CurOp
++);
949 VEX_4V
= ~VRegEnc
& 0xf;
950 EVEX_V2
= ~(VRegEnc
>> 4) & 1;
953 EVEX_aaa
= getX86RegEncoding(MI
, CurOp
++);
955 unsigned RegEnc
= getX86RegEncoding(MI
, CurOp
++);
956 VEX_B
= ~(RegEnc
>> 3) & 1;
957 VEX_X
= ~(RegEnc
>> 4) & 1;
962 if (Encoding
== X86II::VEX
|| Encoding
== X86II::XOP
) {
963 // VEX opcode prefix can have 2 or 3 bytes
966 // +-----+ +--------------+ +-------------------+
967 // | C4h | | RXB | m-mmmm | | W | vvvv | L | pp |
968 // +-----+ +--------------+ +-------------------+
970 // +-----+ +-------------------+
971 // | C5h | | R | vvvv | L | pp |
972 // +-----+ +-------------------+
974 // XOP uses a similar prefix:
975 // +-----+ +--------------+ +-------------------+
976 // | 8Fh | | RXB | m-mmmm | | W | vvvv | L | pp |
977 // +-----+ +--------------+ +-------------------+
978 uint8_t LastByte
= VEX_PP
| (VEX_L
<< 2) | (VEX_4V
<< 3);
980 // Can we use the 2 byte VEX prefix?
981 if (Encoding
== X86II::VEX
&& VEX_B
&& VEX_X
&& !VEX_W
&& (VEX_5M
== 1)) {
982 EmitByte(0xC5, CurByte
, OS
);
983 EmitByte(LastByte
| (VEX_R
<< 7), CurByte
, OS
);
988 EmitByte(Encoding
== X86II::XOP
? 0x8F : 0xC4, CurByte
, OS
);
989 EmitByte(VEX_R
<< 7 | VEX_X
<< 6 | VEX_B
<< 5 | VEX_5M
, CurByte
, OS
);
990 EmitByte(LastByte
| (VEX_W
<< 7), CurByte
, OS
);
992 assert(Encoding
== X86II::EVEX
&& "unknown encoding!");
993 // EVEX opcode prefix can have 4 bytes
995 // +-----+ +--------------+ +-------------------+ +------------------------+
996 // | 62h | | RXBR' | 00mm | | W | vvvv | U | pp | | z | L'L | b | v' | aaa |
997 // +-----+ +--------------+ +-------------------+ +------------------------+
998 assert((VEX_5M
& 0x3) == VEX_5M
999 && "More than 2 significant bits in VEX.m-mmmm fields for EVEX!");
1001 EmitByte(0x62, CurByte
, OS
);
1002 EmitByte((VEX_R
<< 7) |
1006 VEX_5M
, CurByte
, OS
);
1007 EmitByte((VEX_W
<< 7) |
1010 VEX_PP
, CurByte
, OS
);
1012 EmitByte((EVEX_z
<< 7) |
1016 EVEX_aaa
, CurByte
, OS
);
1018 EmitByte((EVEX_z
<< 7) |
1023 EVEX_aaa
, CurByte
, OS
);
1027 /// DetermineREXPrefix - Determine if the MCInst has to be encoded with a X86-64
1028 /// REX prefix which specifies 1) 64-bit instructions, 2) non-default operand
1029 /// size, and 3) use of X86-64 extended registers.
1030 uint8_t X86MCCodeEmitter::DetermineREXPrefix(const MCInst
&MI
, uint64_t TSFlags
,
1032 const MCInstrDesc
&Desc
) const {
1034 bool UsesHighByteReg
= false;
1036 if (TSFlags
& X86II::REX_W
)
1037 REX
|= 1 << 3; // set REX.W
1039 if (MI
.getNumOperands() == 0) return REX
;
1041 unsigned NumOps
= MI
.getNumOperands();
1042 unsigned CurOp
= X86II::getOperandBias(Desc
);
1044 // If it accesses SPL, BPL, SIL, or DIL, then it requires a 0x40 REX prefix.
1045 for (unsigned i
= CurOp
; i
!= NumOps
; ++i
) {
1046 const MCOperand
&MO
= MI
.getOperand(i
);
1047 if (!MO
.isReg()) continue;
1048 unsigned Reg
= MO
.getReg();
1049 if (Reg
== X86::AH
|| Reg
== X86::BH
|| Reg
== X86::CH
|| Reg
== X86::DH
)
1050 UsesHighByteReg
= true;
1051 if (X86II::isX86_64NonExtLowByteReg(Reg
))
1052 // FIXME: The caller of DetermineREXPrefix slaps this prefix onto anything
1053 // that returns non-zero.
1054 REX
|= 0x40; // REX fixed encoding prefix
1057 switch (TSFlags
& X86II::FormMask
) {
1058 case X86II::AddRegFrm
:
1059 REX
|= isREXExtendedReg(MI
, CurOp
++) << 0; // REX.B
1061 case X86II::MRMSrcReg
:
1062 REX
|= isREXExtendedReg(MI
, CurOp
++) << 2; // REX.R
1063 REX
|= isREXExtendedReg(MI
, CurOp
++) << 0; // REX.B
1065 case X86II::MRMSrcMem
: {
1066 REX
|= isREXExtendedReg(MI
, CurOp
++) << 2; // REX.R
1067 REX
|= isREXExtendedReg(MI
, MemOperand
+X86::AddrBaseReg
) << 0; // REX.B
1068 REX
|= isREXExtendedReg(MI
, MemOperand
+X86::AddrIndexReg
) << 1; // REX.X
1069 CurOp
+= X86::AddrNumOperands
;
1072 case X86II::MRMDestReg
:
1073 REX
|= isREXExtendedReg(MI
, CurOp
++) << 0; // REX.B
1074 REX
|= isREXExtendedReg(MI
, CurOp
++) << 2; // REX.R
1076 case X86II::MRMDestMem
:
1077 REX
|= isREXExtendedReg(MI
, MemOperand
+X86::AddrBaseReg
) << 0; // REX.B
1078 REX
|= isREXExtendedReg(MI
, MemOperand
+X86::AddrIndexReg
) << 1; // REX.X
1079 CurOp
+= X86::AddrNumOperands
;
1080 REX
|= isREXExtendedReg(MI
, CurOp
++) << 2; // REX.R
1083 case X86II::MRM0m
: case X86II::MRM1m
:
1084 case X86II::MRM2m
: case X86II::MRM3m
:
1085 case X86II::MRM4m
: case X86II::MRM5m
:
1086 case X86II::MRM6m
: case X86II::MRM7m
:
1087 REX
|= isREXExtendedReg(MI
, MemOperand
+X86::AddrBaseReg
) << 0; // REX.B
1088 REX
|= isREXExtendedReg(MI
, MemOperand
+X86::AddrIndexReg
) << 1; // REX.X
1091 case X86II::MRM0r
: case X86II::MRM1r
:
1092 case X86II::MRM2r
: case X86II::MRM3r
:
1093 case X86II::MRM4r
: case X86II::MRM5r
:
1094 case X86II::MRM6r
: case X86II::MRM7r
:
1095 REX
|= isREXExtendedReg(MI
, CurOp
++) << 0; // REX.B
1098 if (REX
&& UsesHighByteReg
)
1099 report_fatal_error("Cannot encode high byte register in REX-prefixed instruction");
1104 /// EmitSegmentOverridePrefix - Emit segment override opcode prefix as needed
1105 void X86MCCodeEmitter::EmitSegmentOverridePrefix(unsigned &CurByte
,
1106 unsigned SegOperand
,
1108 raw_ostream
&OS
) const {
1109 // Check for explicit segment override on memory operand.
1110 switch (MI
.getOperand(SegOperand
).getReg()) {
1111 default: llvm_unreachable("Unknown segment register!");
1113 case X86::CS
: EmitByte(0x2E, CurByte
, OS
); break;
1114 case X86::SS
: EmitByte(0x36, CurByte
, OS
); break;
1115 case X86::DS
: EmitByte(0x3E, CurByte
, OS
); break;
1116 case X86::ES
: EmitByte(0x26, CurByte
, OS
); break;
1117 case X86::FS
: EmitByte(0x64, CurByte
, OS
); break;
1118 case X86::GS
: EmitByte(0x65, CurByte
, OS
); break;
1122 /// Emit all instruction prefixes prior to the opcode.
1124 /// MemOperand is the operand # of the start of a memory operand if present. If
1125 /// Not present, it is -1.
1127 /// Returns true if a REX prefix was used.
1128 bool X86MCCodeEmitter::emitOpcodePrefix(uint64_t TSFlags
, unsigned &CurByte
,
1129 int MemOperand
, const MCInst
&MI
,
1130 const MCInstrDesc
&Desc
,
1131 const MCSubtargetInfo
&STI
,
1132 raw_ostream
&OS
) const {
1134 // Emit the operand size opcode prefix as needed.
1135 if ((TSFlags
& X86II::OpSizeMask
) == (is16BitMode(STI
) ? X86II::OpSize32
1137 EmitByte(0x66, CurByte
, OS
);
1139 // Emit the LOCK opcode prefix.
1140 if (TSFlags
& X86II::LOCK
|| MI
.getFlags() & X86::IP_HAS_LOCK
)
1141 EmitByte(0xF0, CurByte
, OS
);
1143 // Emit the NOTRACK opcode prefix.
1144 if (TSFlags
& X86II::NOTRACK
|| MI
.getFlags() & X86::IP_HAS_NOTRACK
)
1145 EmitByte(0x3E, CurByte
, OS
);
1147 switch (TSFlags
& X86II::OpPrefixMask
) {
1148 case X86II::PD
: // 66
1149 EmitByte(0x66, CurByte
, OS
);
1151 case X86II::XS
: // F3
1152 EmitByte(0xF3, CurByte
, OS
);
1154 case X86II::XD
: // F2
1155 EmitByte(0xF2, CurByte
, OS
);
1159 // Handle REX prefix.
1160 // FIXME: Can this come before F2 etc to simplify emission?
1161 if (is64BitMode(STI
)) {
1162 if (uint8_t REX
= DetermineREXPrefix(MI
, TSFlags
, MemOperand
, Desc
)) {
1163 EmitByte(0x40 | REX
, CurByte
, OS
);
1167 assert(!(TSFlags
& X86II::REX_W
) && "REX.W requires 64bit mode.");
1170 // 0x0F escape code must be emitted just before the opcode.
1171 switch (TSFlags
& X86II::OpMapMask
) {
1172 case X86II::TB
: // Two-byte opcode map
1173 case X86II::T8
: // 0F 38
1174 case X86II::TA
: // 0F 3A
1175 case X86II::ThreeDNow
: // 0F 0F, second 0F emitted by caller.
1176 EmitByte(0x0F, CurByte
, OS
);
1180 switch (TSFlags
& X86II::OpMapMask
) {
1181 case X86II::T8
: // 0F 38
1182 EmitByte(0x38, CurByte
, OS
);
1184 case X86II::TA
: // 0F 3A
1185 EmitByte(0x3A, CurByte
, OS
);
1191 void X86MCCodeEmitter::
1192 encodeInstruction(const MCInst
&MI
, raw_ostream
&OS
,
1193 SmallVectorImpl
<MCFixup
> &Fixups
,
1194 const MCSubtargetInfo
&STI
) const {
1195 unsigned Opcode
= MI
.getOpcode();
1196 const MCInstrDesc
&Desc
= MCII
.get(Opcode
);
1197 uint64_t TSFlags
= Desc
.TSFlags
;
1198 unsigned Flags
= MI
.getFlags();
1200 // Pseudo instructions don't get encoded.
1201 if ((TSFlags
& X86II::FormMask
) == X86II::Pseudo
)
1204 unsigned NumOps
= Desc
.getNumOperands();
1205 unsigned CurOp
= X86II::getOperandBias(Desc
);
1207 // Keep track of the current byte being emitted.
1208 unsigned CurByte
= 0;
1210 // Encoding type for this instruction.
1211 uint64_t Encoding
= TSFlags
& X86II::EncodingMask
;
1213 // It uses the VEX.VVVV field?
1214 bool HasVEX_4V
= TSFlags
& X86II::VEX_4V
;
1215 bool HasVEX_I8Reg
= (TSFlags
& X86II::ImmMask
) == X86II::Imm8Reg
;
1217 // It uses the EVEX.aaa field?
1218 bool HasEVEX_K
= TSFlags
& X86II::EVEX_K
;
1219 bool HasEVEX_RC
= TSFlags
& X86II::EVEX_RC
;
1221 // Used if a register is encoded in 7:4 of immediate.
1222 unsigned I8RegNum
= 0;
1224 // Determine where the memory operand starts, if present.
1225 int MemoryOperand
= X86II::getMemoryOperandNo(TSFlags
);
1226 if (MemoryOperand
!= -1) MemoryOperand
+= CurOp
;
1228 // Emit segment override opcode prefix as needed.
1229 if (MemoryOperand
>= 0)
1230 EmitSegmentOverridePrefix(CurByte
, MemoryOperand
+X86::AddrSegmentReg
,
1233 // Emit the repeat opcode prefix as needed.
1234 if (TSFlags
& X86II::REP
|| Flags
& X86::IP_HAS_REPEAT
)
1235 EmitByte(0xF3, CurByte
, OS
);
1236 if (Flags
& X86::IP_HAS_REPEAT_NE
)
1237 EmitByte(0xF2, CurByte
, OS
);
1239 // Emit the address size opcode prefix as needed.
1240 bool need_address_override
;
1241 uint64_t AdSize
= TSFlags
& X86II::AdSizeMask
;
1242 if ((is16BitMode(STI
) && AdSize
== X86II::AdSize32
) ||
1243 (is32BitMode(STI
) && AdSize
== X86II::AdSize16
) ||
1244 (is64BitMode(STI
) && AdSize
== X86II::AdSize32
)) {
1245 need_address_override
= true;
1246 } else if (MemoryOperand
< 0) {
1247 need_address_override
= false;
1248 } else if (is64BitMode(STI
)) {
1249 assert(!Is16BitMemOperand(MI
, MemoryOperand
, STI
));
1250 need_address_override
= Is32BitMemOperand(MI
, MemoryOperand
);
1251 } else if (is32BitMode(STI
)) {
1252 assert(!Is64BitMemOperand(MI
, MemoryOperand
));
1253 need_address_override
= Is16BitMemOperand(MI
, MemoryOperand
, STI
);
1255 assert(is16BitMode(STI
));
1256 assert(!Is64BitMemOperand(MI
, MemoryOperand
));
1257 need_address_override
= !Is16BitMemOperand(MI
, MemoryOperand
, STI
);
1260 if (need_address_override
)
1261 EmitByte(0x67, CurByte
, OS
);
1265 Rex
= emitOpcodePrefix(TSFlags
, CurByte
, MemoryOperand
, MI
, Desc
, STI
, OS
);
1267 EmitVEXOpcodePrefix(TSFlags
, CurByte
, MemoryOperand
, MI
, Desc
, OS
);
1269 uint8_t BaseOpcode
= X86II::getBaseOpcodeFor(TSFlags
);
1271 if ((TSFlags
& X86II::OpMapMask
) == X86II::ThreeDNow
)
1272 BaseOpcode
= 0x0F; // Weird 3DNow! encoding.
1274 uint64_t Form
= TSFlags
& X86II::FormMask
;
1276 default: errs() << "FORM: " << Form
<< "\n";
1277 llvm_unreachable("Unknown FormMask value in X86MCCodeEmitter!");
1279 llvm_unreachable("Pseudo instruction shouldn't be emitted");
1280 case X86II::RawFrmDstSrc
: {
1281 unsigned siReg
= MI
.getOperand(1).getReg();
1282 assert(((siReg
== X86::SI
&& MI
.getOperand(0).getReg() == X86::DI
) ||
1283 (siReg
== X86::ESI
&& MI
.getOperand(0).getReg() == X86::EDI
) ||
1284 (siReg
== X86::RSI
&& MI
.getOperand(0).getReg() == X86::RDI
)) &&
1285 "SI and DI register sizes do not match");
1286 // Emit segment override opcode prefix as needed (not for %ds).
1287 if (MI
.getOperand(2).getReg() != X86::DS
)
1288 EmitSegmentOverridePrefix(CurByte
, 2, MI
, OS
);
1289 // Emit AdSize prefix as needed.
1290 if ((!is32BitMode(STI
) && siReg
== X86::ESI
) ||
1291 (is32BitMode(STI
) && siReg
== X86::SI
))
1292 EmitByte(0x67, CurByte
, OS
);
1293 CurOp
+= 3; // Consume operands.
1294 EmitByte(BaseOpcode
, CurByte
, OS
);
1297 case X86II::RawFrmSrc
: {
1298 unsigned siReg
= MI
.getOperand(0).getReg();
1299 // Emit segment override opcode prefix as needed (not for %ds).
1300 if (MI
.getOperand(1).getReg() != X86::DS
)
1301 EmitSegmentOverridePrefix(CurByte
, 1, MI
, OS
);
1302 // Emit AdSize prefix as needed.
1303 if ((!is32BitMode(STI
) && siReg
== X86::ESI
) ||
1304 (is32BitMode(STI
) && siReg
== X86::SI
))
1305 EmitByte(0x67, CurByte
, OS
);
1306 CurOp
+= 2; // Consume operands.
1307 EmitByte(BaseOpcode
, CurByte
, OS
);
1310 case X86II::RawFrmDst
: {
1311 unsigned siReg
= MI
.getOperand(0).getReg();
1312 // Emit AdSize prefix as needed.
1313 if ((!is32BitMode(STI
) && siReg
== X86::EDI
) ||
1314 (is32BitMode(STI
) && siReg
== X86::DI
))
1315 EmitByte(0x67, CurByte
, OS
);
1316 ++CurOp
; // Consume operand.
1317 EmitByte(BaseOpcode
, CurByte
, OS
);
1320 case X86II::RawFrm
: {
1321 EmitByte(BaseOpcode
, CurByte
, OS
);
1323 if (!is64BitMode(STI
) || !isPCRel32Branch(MI
))
1326 const MCOperand
&Op
= MI
.getOperand(CurOp
++);
1327 EmitImmediate(Op
, MI
.getLoc(), X86II::getSizeOfImm(TSFlags
),
1328 MCFixupKind(X86::reloc_branch_4byte_pcrel
), CurByte
, OS
,
1332 case X86II::RawFrmMemOffs
:
1333 // Emit segment override opcode prefix as needed.
1334 EmitSegmentOverridePrefix(CurByte
, 1, MI
, OS
);
1335 EmitByte(BaseOpcode
, CurByte
, OS
);
1336 EmitImmediate(MI
.getOperand(CurOp
++), MI
.getLoc(),
1337 X86II::getSizeOfImm(TSFlags
), getImmFixupKind(TSFlags
),
1338 CurByte
, OS
, Fixups
);
1339 ++CurOp
; // skip segment operand
1341 case X86II::RawFrmImm8
:
1342 EmitByte(BaseOpcode
, CurByte
, OS
);
1343 EmitImmediate(MI
.getOperand(CurOp
++), MI
.getLoc(),
1344 X86II::getSizeOfImm(TSFlags
), getImmFixupKind(TSFlags
),
1345 CurByte
, OS
, Fixups
);
1346 EmitImmediate(MI
.getOperand(CurOp
++), MI
.getLoc(), 1, FK_Data_1
, CurByte
,
1349 case X86II::RawFrmImm16
:
1350 EmitByte(BaseOpcode
, CurByte
, OS
);
1351 EmitImmediate(MI
.getOperand(CurOp
++), MI
.getLoc(),
1352 X86II::getSizeOfImm(TSFlags
), getImmFixupKind(TSFlags
),
1353 CurByte
, OS
, Fixups
);
1354 EmitImmediate(MI
.getOperand(CurOp
++), MI
.getLoc(), 2, FK_Data_2
, CurByte
,
1358 case X86II::AddRegFrm
:
1359 EmitByte(BaseOpcode
+ GetX86RegNum(MI
.getOperand(CurOp
++)), CurByte
, OS
);
1362 case X86II::MRMDestReg
: {
1363 EmitByte(BaseOpcode
, CurByte
, OS
);
1364 unsigned SrcRegNum
= CurOp
+ 1;
1366 if (HasEVEX_K
) // Skip writemask
1369 if (HasVEX_4V
) // Skip 1st src (which is encoded in VEX_VVVV)
1372 EmitRegModRMByte(MI
.getOperand(CurOp
),
1373 GetX86RegNum(MI
.getOperand(SrcRegNum
)), CurByte
, OS
);
1374 CurOp
= SrcRegNum
+ 1;
1377 case X86II::MRMDestMem
: {
1378 EmitByte(BaseOpcode
, CurByte
, OS
);
1379 unsigned SrcRegNum
= CurOp
+ X86::AddrNumOperands
;
1381 if (HasEVEX_K
) // Skip writemask
1384 if (HasVEX_4V
) // Skip 1st src (which is encoded in VEX_VVVV)
1387 emitMemModRMByte(MI
, CurOp
, GetX86RegNum(MI
.getOperand(SrcRegNum
)), TSFlags
,
1388 Rex
, CurByte
, OS
, Fixups
, STI
);
1389 CurOp
= SrcRegNum
+ 1;
1392 case X86II::MRMSrcReg
: {
1393 EmitByte(BaseOpcode
, CurByte
, OS
);
1394 unsigned SrcRegNum
= CurOp
+ 1;
1396 if (HasEVEX_K
) // Skip writemask
1399 if (HasVEX_4V
) // Skip 1st src (which is encoded in VEX_VVVV)
1402 EmitRegModRMByte(MI
.getOperand(SrcRegNum
),
1403 GetX86RegNum(MI
.getOperand(CurOp
)), CurByte
, OS
);
1404 CurOp
= SrcRegNum
+ 1;
1406 I8RegNum
= getX86RegEncoding(MI
, CurOp
++);
1407 // do not count the rounding control operand
1412 case X86II::MRMSrcReg4VOp3
: {
1413 EmitByte(BaseOpcode
, CurByte
, OS
);
1414 unsigned SrcRegNum
= CurOp
+ 1;
1416 EmitRegModRMByte(MI
.getOperand(SrcRegNum
),
1417 GetX86RegNum(MI
.getOperand(CurOp
)), CurByte
, OS
);
1418 CurOp
= SrcRegNum
+ 1;
1419 ++CurOp
; // Encoded in VEX.VVVV
1422 case X86II::MRMSrcRegOp4
: {
1423 EmitByte(BaseOpcode
, CurByte
, OS
);
1424 unsigned SrcRegNum
= CurOp
+ 1;
1426 // Skip 1st src (which is encoded in VEX_VVVV)
1429 // Capture 2nd src (which is encoded in Imm[7:4])
1430 assert(HasVEX_I8Reg
&& "MRMSrcRegOp4 should imply VEX_I8Reg");
1431 I8RegNum
= getX86RegEncoding(MI
, SrcRegNum
++);
1433 EmitRegModRMByte(MI
.getOperand(SrcRegNum
),
1434 GetX86RegNum(MI
.getOperand(CurOp
)), CurByte
, OS
);
1435 CurOp
= SrcRegNum
+ 1;
1438 case X86II::MRMSrcMem
: {
1439 unsigned FirstMemOp
= CurOp
+1;
1441 if (HasEVEX_K
) // Skip writemask
1445 ++FirstMemOp
; // Skip the register source (which is encoded in VEX_VVVV).
1447 EmitByte(BaseOpcode
, CurByte
, OS
);
1449 emitMemModRMByte(MI
, FirstMemOp
, GetX86RegNum(MI
.getOperand(CurOp
)),
1450 TSFlags
, Rex
, CurByte
, OS
, Fixups
, STI
);
1451 CurOp
= FirstMemOp
+ X86::AddrNumOperands
;
1453 I8RegNum
= getX86RegEncoding(MI
, CurOp
++);
1456 case X86II::MRMSrcMem4VOp3
: {
1457 unsigned FirstMemOp
= CurOp
+1;
1459 EmitByte(BaseOpcode
, CurByte
, OS
);
1461 emitMemModRMByte(MI
, FirstMemOp
, GetX86RegNum(MI
.getOperand(CurOp
)),
1462 TSFlags
, Rex
, CurByte
, OS
, Fixups
, STI
);
1463 CurOp
= FirstMemOp
+ X86::AddrNumOperands
;
1464 ++CurOp
; // Encoded in VEX.VVVV.
1467 case X86II::MRMSrcMemOp4
: {
1468 unsigned FirstMemOp
= CurOp
+1;
1470 ++FirstMemOp
; // Skip the register source (which is encoded in VEX_VVVV).
1472 // Capture second register source (encoded in Imm[7:4])
1473 assert(HasVEX_I8Reg
&& "MRMSrcRegOp4 should imply VEX_I8Reg");
1474 I8RegNum
= getX86RegEncoding(MI
, FirstMemOp
++);
1476 EmitByte(BaseOpcode
, CurByte
, OS
);
1478 emitMemModRMByte(MI
, FirstMemOp
, GetX86RegNum(MI
.getOperand(CurOp
)),
1479 TSFlags
, Rex
, CurByte
, OS
, Fixups
, STI
);
1480 CurOp
= FirstMemOp
+ X86::AddrNumOperands
;
1485 case X86II::MRM0r
: case X86II::MRM1r
:
1486 case X86II::MRM2r
: case X86II::MRM3r
:
1487 case X86II::MRM4r
: case X86II::MRM5r
:
1488 case X86II::MRM6r
: case X86II::MRM7r
:
1489 if (HasVEX_4V
) // Skip the register dst (which is encoded in VEX_VVVV).
1491 if (HasEVEX_K
) // Skip writemask
1493 EmitByte(BaseOpcode
, CurByte
, OS
);
1494 EmitRegModRMByte(MI
.getOperand(CurOp
++),
1495 (Form
== X86II::MRMXr
) ? 0 : Form
-X86II::MRM0r
,
1500 case X86II::MRM0m
: case X86II::MRM1m
:
1501 case X86II::MRM2m
: case X86II::MRM3m
:
1502 case X86II::MRM4m
: case X86II::MRM5m
:
1503 case X86II::MRM6m
: case X86II::MRM7m
:
1504 if (HasVEX_4V
) // Skip the register dst (which is encoded in VEX_VVVV).
1506 if (HasEVEX_K
) // Skip writemask
1508 EmitByte(BaseOpcode
, CurByte
, OS
);
1509 emitMemModRMByte(MI
, CurOp
,
1510 (Form
== X86II::MRMXm
) ? 0 : Form
- X86II::MRM0m
, TSFlags
,
1511 Rex
, CurByte
, OS
, Fixups
, STI
);
1512 CurOp
+= X86::AddrNumOperands
;
1515 case X86II::MRM_C0
: case X86II::MRM_C1
: case X86II::MRM_C2
:
1516 case X86II::MRM_C3
: case X86II::MRM_C4
: case X86II::MRM_C5
:
1517 case X86II::MRM_C6
: case X86II::MRM_C7
: case X86II::MRM_C8
:
1518 case X86II::MRM_C9
: case X86II::MRM_CA
: case X86II::MRM_CB
:
1519 case X86II::MRM_CC
: case X86II::MRM_CD
: case X86II::MRM_CE
:
1520 case X86II::MRM_CF
: case X86II::MRM_D0
: case X86II::MRM_D1
:
1521 case X86II::MRM_D2
: case X86II::MRM_D3
: case X86II::MRM_D4
:
1522 case X86II::MRM_D5
: case X86II::MRM_D6
: case X86II::MRM_D7
:
1523 case X86II::MRM_D8
: case X86II::MRM_D9
: case X86II::MRM_DA
:
1524 case X86II::MRM_DB
: case X86II::MRM_DC
: case X86II::MRM_DD
:
1525 case X86II::MRM_DE
: case X86II::MRM_DF
: case X86II::MRM_E0
:
1526 case X86II::MRM_E1
: case X86II::MRM_E2
: case X86II::MRM_E3
:
1527 case X86II::MRM_E4
: case X86II::MRM_E5
: case X86II::MRM_E6
:
1528 case X86II::MRM_E7
: case X86II::MRM_E8
: case X86II::MRM_E9
:
1529 case X86II::MRM_EA
: case X86II::MRM_EB
: case X86II::MRM_EC
:
1530 case X86II::MRM_ED
: case X86II::MRM_EE
: case X86II::MRM_EF
:
1531 case X86II::MRM_F0
: case X86II::MRM_F1
: case X86II::MRM_F2
:
1532 case X86II::MRM_F3
: case X86II::MRM_F4
: case X86II::MRM_F5
:
1533 case X86II::MRM_F6
: case X86II::MRM_F7
: case X86II::MRM_F8
:
1534 case X86II::MRM_F9
: case X86II::MRM_FA
: case X86II::MRM_FB
:
1535 case X86II::MRM_FC
: case X86II::MRM_FD
: case X86II::MRM_FE
:
1537 EmitByte(BaseOpcode
, CurByte
, OS
);
1538 EmitByte(0xC0 + Form
- X86II::MRM_C0
, CurByte
, OS
);
1543 // The last source register of a 4 operand instruction in AVX is encoded
1544 // in bits[7:4] of a immediate byte.
1545 assert(I8RegNum
< 16 && "Register encoding out of range");
1547 if (CurOp
!= NumOps
) {
1548 unsigned Val
= MI
.getOperand(CurOp
++).getImm();
1549 assert(Val
< 16 && "Immediate operand value out of range");
1552 EmitImmediate(MCOperand::createImm(I8RegNum
), MI
.getLoc(), 1, FK_Data_1
,
1553 CurByte
, OS
, Fixups
);
1555 // If there is a remaining operand, it must be a trailing immediate. Emit it
1556 // according to the right size for the instruction. Some instructions
1557 // (SSE4a extrq and insertq) have two trailing immediates.
1558 while (CurOp
!= NumOps
&& NumOps
- CurOp
<= 2) {
1559 EmitImmediate(MI
.getOperand(CurOp
++), MI
.getLoc(),
1560 X86II::getSizeOfImm(TSFlags
), getImmFixupKind(TSFlags
),
1561 CurByte
, OS
, Fixups
);
1565 if ((TSFlags
& X86II::OpMapMask
) == X86II::ThreeDNow
)
1566 EmitByte(X86II::getBaseOpcodeFor(TSFlags
), CurByte
, OS
);
1570 if (/*!Desc.isVariadic() &&*/ CurOp
!= NumOps
) {
1571 errs() << "Cannot encode all operands of: ";
1579 MCCodeEmitter
*llvm::createX86MCCodeEmitter(const MCInstrInfo
&MCII
,
1580 const MCRegisterInfo
&MRI
,
1582 return new X86MCCodeEmitter(MCII
, Ctx
);