//===-- AsmPrinterInlineAsm.cpp - AsmPrinter Inline Asm Handling ----------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file implements the inline assembler pieces of the AsmPrinter class.
//
//===----------------------------------------------------------------------===//

#include "llvm/ADT/SmallString.h"
#include "llvm/ADT/SmallVector.h"
#include "llvm/ADT/StringExtras.h"
#include "llvm/ADT/Twine.h"
#include "llvm/CodeGen/AsmPrinter.h"
#include "llvm/CodeGen/MachineBasicBlock.h"
#include "llvm/CodeGen/MachineFunction.h"
#include "llvm/CodeGen/MachineModuleInfo.h"
#include "llvm/CodeGen/TargetRegisterInfo.h"
#include "llvm/CodeGen/TargetSubtargetInfo.h"
#include "llvm/IR/Constants.h"
#include "llvm/IR/DataLayout.h"
#include "llvm/IR/DiagnosticInfo.h"
#include "llvm/IR/InlineAsm.h"
#include "llvm/IR/LLVMContext.h"
#include "llvm/IR/Module.h"
#include "llvm/MC/MCAsmInfo.h"
#include "llvm/MC/MCInstrInfo.h"
#include "llvm/MC/MCParser/MCAsmLexer.h"
#include "llvm/MC/MCParser/MCTargetAsmParser.h"
#include "llvm/MC/MCStreamer.h"
#include "llvm/MC/MCSymbol.h"
#include "llvm/MC/TargetRegistry.h"
#include "llvm/Support/ErrorHandling.h"
#include "llvm/Support/MemoryBuffer.h"
#include "llvm/Support/SourceMgr.h"
#include "llvm/Support/raw_ostream.h"
#include "llvm/Target/TargetMachine.h"
#include <cstring>
#include <memory>
#include <optional>
#include <string>
#include <vector>
using namespace llvm;

#define DEBUG_TYPE "asm-printer"

45 unsigned AsmPrinter::addInlineAsmDiagBuffer(StringRef AsmStr
,
46 const MDNode
*LocMDNode
) const {
47 MCContext
&Context
= MMI
->getContext();
48 Context
.initInlineSourceManager();
49 SourceMgr
&SrcMgr
= *Context
.getInlineSourceManager();
50 std::vector
<const MDNode
*> &LocInfos
= Context
.getLocInfos();
52 std::unique_ptr
<MemoryBuffer
> Buffer
;
53 // The inline asm source manager will outlive AsmStr, so make a copy of the
54 // string for SourceMgr to own.
55 Buffer
= MemoryBuffer::getMemBufferCopy(AsmStr
, "<inline asm>");
57 // Tell SrcMgr about this buffer, it takes ownership of the buffer.
58 unsigned BufNum
= SrcMgr
.AddNewSourceBuffer(std::move(Buffer
), SMLoc());
60 // Store LocMDNode in DiagInfo, using BufNum as an identifier.
62 LocInfos
.resize(BufNum
);
63 LocInfos
[BufNum
- 1] = LocMDNode
;
70 /// EmitInlineAsm - Emit a blob of inline asm to the output streamer.
71 void AsmPrinter::emitInlineAsm(StringRef Str
, const MCSubtargetInfo
&STI
,
72 const MCTargetOptions
&MCOptions
,
73 const MDNode
*LocMDNode
,
74 InlineAsm::AsmDialect Dialect
) const {
75 assert(!Str
.empty() && "Can't emit empty inline asm block");
77 // Remember if the buffer is nul terminated or not so we can avoid a copy.
78 bool isNullTerminated
= Str
.back() == 0;
80 Str
= Str
.substr(0, Str
.size()-1);
82 // If the output streamer does not have mature MC support or the integrated
83 // assembler has been disabled or not required, just emit the blob textually.
84 // Otherwise parse the asm and emit it via MC support.
85 // This is useful in case the asm parser doesn't handle something but the
86 // system assembler does.
87 const MCAsmInfo
*MCAI
= TM
.getMCAsmInfo();
88 assert(MCAI
&& "No MCAsmInfo");
89 if (!MCAI
->useIntegratedAssembler() &&
90 !MCAI
->parseInlineAsmUsingAsmParser() &&
91 !OutStreamer
->isIntegratedAssemblerRequired()) {
93 OutStreamer
->emitRawText(Str
);
94 emitInlineAsmEnd(STI
, nullptr);
98 unsigned BufNum
= addInlineAsmDiagBuffer(Str
, LocMDNode
);
99 SourceMgr
&SrcMgr
= *MMI
->getContext().getInlineSourceManager();
100 SrcMgr
.setIncludeDirs(MCOptions
.IASSearchPaths
);
102 std::unique_ptr
<MCAsmParser
> Parser(
103 createMCAsmParser(SrcMgr
, OutContext
, *OutStreamer
, *MAI
, BufNum
));
105 // We create a new MCInstrInfo here since we might be at the module level
106 // and not have a MachineFunction to initialize the TargetInstrInfo from and
107 // we only need MCInstrInfo for asm parsing. We create one unconditionally
108 // because it's not subtarget dependent.
109 std::unique_ptr
<MCInstrInfo
> MII(TM
.getTarget().createMCInstrInfo());
110 assert(MII
&& "Failed to create instruction info");
111 std::unique_ptr
<MCTargetAsmParser
> TAP(TM
.getTarget().createMCAsmParser(
112 STI
, *Parser
, *MII
, MCOptions
));
114 report_fatal_error("Inline asm not supported by this streamer because"
115 " we don't have an asm parser for this target\n");
117 // Respect inlineasm dialect on X86 targets only
118 if (TM
.getTargetTriple().isX86()) {
119 Parser
->setAssemblerDialect(Dialect
);
120 // Enable lexing Masm binary and hex integer literals in intel inline
122 if (Dialect
== InlineAsm::AD_Intel
)
123 Parser
->getLexer().setLexMasmIntegers(true);
125 Parser
->setTargetParser(*TAP
);
127 emitInlineAsmStart();
128 // Don't implicitly switch to the text section before the asm.
129 (void)Parser
->Run(/*NoInitialTextSection*/ true,
130 /*NoFinalize*/ true);
131 emitInlineAsmEnd(STI
, &TAP
->getSTI());
134 static void EmitInlineAsmStr(const char *AsmStr
, const MachineInstr
*MI
,
135 MachineModuleInfo
*MMI
, const MCAsmInfo
*MAI
,
136 AsmPrinter
*AP
, uint64_t LocCookie
,
138 bool InputIsIntelDialect
= MI
->getInlineAsmDialect() == InlineAsm::AD_Intel
;
140 if (InputIsIntelDialect
) {
141 // Switch to the inline assembly variant.
142 OS
<< "\t.intel_syntax\n\t";
145 int CurVariant
= -1; // The number of the {.|.|.} region we are in.
146 const char *LastEmitted
= AsmStr
; // One past the last character emitted.
147 unsigned NumOperands
= MI
->getNumOperands();
149 int AsmPrinterVariant
;
150 if (InputIsIntelDialect
)
151 AsmPrinterVariant
= 1; // X86MCAsmInfo.cpp's AsmWriterFlavorTy::Intel.
153 AsmPrinterVariant
= MMI
->getTarget().unqualifiedInlineAsmVariant();
155 // FIXME: Should this happen for `asm inteldialect` as well?
156 if (!InputIsIntelDialect
&& MAI
->getEmitGNUAsmStartIndentationMarker())
159 while (*LastEmitted
) {
160 switch (*LastEmitted
) {
162 // Not a special case, emit the string section literally.
163 const char *LiteralEnd
= LastEmitted
+1;
164 while (*LiteralEnd
&& *LiteralEnd
!= '{' && *LiteralEnd
!= '|' &&
165 *LiteralEnd
!= '}' && *LiteralEnd
!= '$' && *LiteralEnd
!= '\n')
167 if (CurVariant
== -1 || CurVariant
== AsmPrinterVariant
)
168 OS
.write(LastEmitted
, LiteralEnd
- LastEmitted
);
169 LastEmitted
= LiteralEnd
;
173 ++LastEmitted
; // Consume newline character.
174 OS
<< '\n'; // Indent code with newline.
177 ++LastEmitted
; // Consume '$' character.
181 switch (*LastEmitted
) {
182 default: Done
= false; break;
184 if (!InputIsIntelDialect
)
185 if (CurVariant
== -1 || CurVariant
== AsmPrinterVariant
)
187 ++LastEmitted
; // Consume second '$' character.
189 case '(': // $( -> same as GCC's { character.
190 ++LastEmitted
; // Consume '(' character.
191 if (CurVariant
!= -1)
192 report_fatal_error("Nested variants found in inline asm string: '" +
193 Twine(AsmStr
) + "'");
194 CurVariant
= 0; // We're in the first variant now.
197 ++LastEmitted
; // Consume '|' character.
198 if (CurVariant
== -1)
199 OS
<< '|'; // This is gcc's behavior for | outside a variant.
201 ++CurVariant
; // We're in the next variant.
203 case ')': // $) -> same as GCC's } char.
204 ++LastEmitted
; // Consume ')' character.
205 if (CurVariant
== -1)
206 OS
<< '}'; // This is gcc's behavior for } outside a variant.
213 bool HasCurlyBraces
= false;
214 if (*LastEmitted
== '{') { // ${variable}
215 ++LastEmitted
; // Consume '{' character.
216 HasCurlyBraces
= true;
219 // If we have ${:foo}, then this is not a real operand reference, it is a
220 // "magic" string reference, just like in .td files. Arrange to call
222 if (HasCurlyBraces
&& *LastEmitted
== ':') {
224 const char *StrStart
= LastEmitted
;
225 const char *StrEnd
= strchr(StrStart
, '}');
227 report_fatal_error("Unterminated ${:foo} operand in inline asm"
228 " string: '" + Twine(AsmStr
) + "'");
229 if (CurVariant
== -1 || CurVariant
== AsmPrinterVariant
)
230 AP
->PrintSpecial(MI
, OS
, StringRef(StrStart
, StrEnd
- StrStart
));
231 LastEmitted
= StrEnd
+1;
235 const char *IDStart
= LastEmitted
;
236 const char *IDEnd
= IDStart
;
237 while (isDigit(*IDEnd
))
241 if (StringRef(IDStart
, IDEnd
-IDStart
).getAsInteger(10, Val
))
242 report_fatal_error("Bad $ operand number in inline asm string: '" +
243 Twine(AsmStr
) + "'");
246 if (Val
>= NumOperands
- 1)
247 report_fatal_error("Invalid $ operand number in inline asm string: '" +
248 Twine(AsmStr
) + "'");
250 char Modifier
[2] = { 0, 0 };
252 if (HasCurlyBraces
) {
253 // If we have curly braces, check for a modifier character. This
254 // supports syntax like ${0:u}, which correspond to "%u0" in GCC asm.
255 if (*LastEmitted
== ':') {
256 ++LastEmitted
; // Consume ':' character.
257 if (*LastEmitted
== 0)
258 report_fatal_error("Bad ${:} expression in inline asm string: '" +
259 Twine(AsmStr
) + "'");
261 Modifier
[0] = *LastEmitted
;
262 ++LastEmitted
; // Consume modifier character.
265 if (*LastEmitted
!= '}')
266 report_fatal_error("Bad ${} expression in inline asm string: '" +
267 Twine(AsmStr
) + "'");
268 ++LastEmitted
; // Consume '}' character.
271 // Okay, we finally have a value number. Ask the target to print this
273 if (CurVariant
== -1 || CurVariant
== AsmPrinterVariant
) {
274 unsigned OpNo
= InlineAsm::MIOp_FirstOperand
;
278 // Scan to find the machine operand number for the operand.
280 if (OpNo
>= MI
->getNumOperands())
282 const InlineAsm::Flag
F(MI
->getOperand(OpNo
).getImm());
283 OpNo
+= F
.getNumOperandRegisters() + 1;
286 // We may have a location metadata attached to the end of the
287 // instruction, and at no point should see metadata at any
288 // other point while processing. It's an error if so.
289 if (OpNo
>= MI
->getNumOperands() || MI
->getOperand(OpNo
).isMetadata()) {
292 const InlineAsm::Flag
F(MI
->getOperand(OpNo
).getImm());
293 ++OpNo
; // Skip over the ID number.
295 // FIXME: Shouldn't arch-independent output template handling go into
297 // Labels are target independent.
298 if (MI
->getOperand(OpNo
).isBlockAddress()) {
299 const BlockAddress
*BA
= MI
->getOperand(OpNo
).getBlockAddress();
300 MCSymbol
*Sym
= AP
->GetBlockAddressSymbol(BA
);
301 Sym
->print(OS
, AP
->MAI
);
302 MMI
->getContext().registerInlineAsmLabel(Sym
);
303 } else if (MI
->getOperand(OpNo
).isMBB()) {
304 const MCSymbol
*Sym
= MI
->getOperand(OpNo
).getMBB()->getSymbol();
305 Sym
->print(OS
, AP
->MAI
);
306 } else if (F
.isMemKind()) {
307 Error
= AP
->PrintAsmMemoryOperand(
308 MI
, OpNo
, Modifier
[0] ? Modifier
: nullptr, OS
);
310 Error
= AP
->PrintAsmOperand(MI
, OpNo
,
311 Modifier
[0] ? Modifier
: nullptr, OS
);
315 const Function
&Fn
= MI
->getMF()->getFunction();
316 Fn
.getContext().diagnose(DiagnosticInfoInlineAsm(
318 "invalid operand in inline asm: '" + Twine(AsmStr
) + "'"));
325 if (InputIsIntelDialect
)
326 OS
<< "\n\t.att_syntax";
327 OS
<< '\n' << (char)0; // null terminate string.
330 /// This method formats and emits the specified machine instruction that is an
332 void AsmPrinter::emitInlineAsm(const MachineInstr
*MI
) const {
333 assert(MI
->isInlineAsm() && "printInlineAsm only works on inline asms");
335 // Disassemble the AsmStr, printing out the literal pieces, the operands, etc.
336 const char *AsmStr
= MI
->getOperand(0).getSymbolName();
338 // If this asmstr is empty, just print the #APP/#NOAPP markers.
339 // These are useful to see where empty asm's wound up.
340 if (AsmStr
[0] == 0) {
341 OutStreamer
->emitRawComment(MAI
->getInlineAsmStart());
342 OutStreamer
->emitRawComment(MAI
->getInlineAsmEnd());
346 // Emit the #APP start marker. This has to happen even if verbose-asm isn't
347 // enabled, so we use emitRawComment.
348 OutStreamer
->emitRawComment(MAI
->getInlineAsmStart());
350 const MDNode
*LocMD
= MI
->getLocCookieMD();
353 ? mdconst::extract
<ConstantInt
>(LocMD
->getOperand(0))->getZExtValue()
356 // Emit the inline asm to a temporary string so we can emit it through
358 SmallString
<256> StringData
;
359 raw_svector_ostream
OS(StringData
);
361 AsmPrinter
*AP
= const_cast<AsmPrinter
*>(this);
362 EmitInlineAsmStr(AsmStr
, MI
, MMI
, MAI
, AP
, LocCookie
, OS
);
364 // Emit warnings if we use reserved registers on the clobber list, as
365 // that might lead to undefined behaviour.
366 SmallVector
<Register
, 8> RestrRegs
;
367 const TargetRegisterInfo
*TRI
= MF
->getSubtarget().getRegisterInfo();
368 // Start with the first operand descriptor, and iterate over them.
369 for (unsigned I
= InlineAsm::MIOp_FirstOperand
, NumOps
= MI
->getNumOperands();
371 const MachineOperand
&MO
= MI
->getOperand(I
);
374 const InlineAsm::Flag
F(MO
.getImm());
375 if (F
.isClobberKind()) {
376 Register Reg
= MI
->getOperand(I
+ 1).getReg();
377 if (!TRI
->isAsmClobberable(*MF
, Reg
))
378 RestrRegs
.push_back(Reg
);
380 // Skip to one before the next operand descriptor, if it exists.
381 I
+= F
.getNumOperandRegisters();
384 if (!RestrRegs
.empty()) {
385 std::string Msg
= "inline asm clobber list contains reserved registers: ";
387 for (const Register RR
: RestrRegs
) {
389 Msg
+= TRI
->getRegAsmName(RR
);
392 const Function
&Fn
= MF
->getFunction();
394 "Reserved registers on the clobber list may not be "
395 "preserved across the asm statement, and clobbering them may "
396 "lead to undefined behaviour.";
397 LLVMContext
&Ctx
= Fn
.getContext();
398 Ctx
.diagnose(DiagnosticInfoInlineAsm(LocCookie
, Msg
,
399 DiagnosticSeverity::DS_Warning
));
401 DiagnosticInfoInlineAsm(LocCookie
, Note
, DiagnosticSeverity::DS_Note
));
403 for (const Register RR
: RestrRegs
) {
404 if (std::optional
<std::string
> reason
=
405 TRI
->explainReservedReg(*MF
, RR
)) {
406 Ctx
.diagnose(DiagnosticInfoInlineAsm(LocCookie
, *reason
,
407 DiagnosticSeverity::DS_Note
));
412 emitInlineAsm(StringData
, getSubtargetInfo(), TM
.Options
.MCOptions
, LocMD
,
413 MI
->getInlineAsmDialect());
415 // Emit the #NOAPP end marker. This has to happen even if verbose-asm isn't
416 // enabled, so we use emitRawComment.
417 OutStreamer
->emitRawComment(MAI
->getInlineAsmEnd());
420 /// PrintSpecial - Print information related to the specified machine instr
421 /// that is independent of the operand, and may be independent of the instr
422 /// itself. This can be useful for portably encoding the comment character
423 /// or other bits of target-specific knowledge into the asmstrings. The
424 /// syntax used is ${:comment}. Targets can override this to add support
425 /// for their own strange codes.
426 void AsmPrinter::PrintSpecial(const MachineInstr
*MI
, raw_ostream
&OS
,
427 StringRef Code
) const {
428 if (Code
== "private") {
429 const DataLayout
&DL
= MF
->getDataLayout();
430 OS
<< DL
.getPrivateGlobalPrefix();
431 } else if (Code
== "comment") {
432 OS
<< MAI
->getCommentString();
433 } else if (Code
== "uid") {
434 // Comparing the address of MI isn't sufficient, because machineinstrs may
435 // be allocated to the same address across functions.
437 // If this is a new LastFn instruction, bump the counter.
438 if (LastMI
!= MI
|| LastFn
!= getFunctionNumber()) {
441 LastFn
= getFunctionNumber();
446 raw_string_ostream
Msg(msg
);
447 Msg
<< "Unknown special formatter '" << Code
448 << "' for machine instr: " << *MI
;
449 report_fatal_error(Twine(Msg
.str()));
453 void AsmPrinter::PrintSymbolOperand(const MachineOperand
&MO
, raw_ostream
&OS
) {
454 assert(MO
.isGlobal() && "caller should check MO.isGlobal");
455 getSymbolPreferLocal(*MO
.getGlobal())->print(OS
, MAI
);
456 printOffset(MO
.getOffset(), OS
);
459 /// PrintAsmOperand - Print the specified operand of MI, an INLINEASM
460 /// instruction, using the specified assembler variant. Targets should
461 /// override this to format as appropriate for machine specific ExtraCodes
462 /// or when the arch-independent handling would be too complex otherwise.
463 bool AsmPrinter::PrintAsmOperand(const MachineInstr
*MI
, unsigned OpNo
,
464 const char *ExtraCode
, raw_ostream
&O
) {
465 // Does this asm operand have a single letter operand modifier?
466 if (ExtraCode
&& ExtraCode
[0]) {
467 if (ExtraCode
[1] != 0) return true; // Unknown modifier.
469 // https://gcc.gnu.org/onlinedocs/gccint/Output-Template.html
470 const MachineOperand
&MO
= MI
->getOperand(OpNo
);
471 switch (ExtraCode
[0]) {
473 return true; // Unknown modifier.
474 case 'a': // Print as memory address.
476 PrintAsmMemoryOperand(MI
, OpNo
, nullptr, O
);
479 [[fallthrough
]]; // GCC allows '%a' to behave like '%c' with immediates.
480 case 'c': // Substitute immediate value without immediate syntax
486 PrintSymbolOperand(MO
, O
);
490 case 'n': // Negate the immediate constant.
495 case 's': // The GCC deprecated s modifier
498 O
<< ((32 - MO
.getImm()) & 31);
505 bool AsmPrinter::PrintAsmMemoryOperand(const MachineInstr
*MI
, unsigned OpNo
,
506 const char *ExtraCode
, raw_ostream
&O
) {
507 // Target doesn't support this yet!
511 void AsmPrinter::emitInlineAsmStart() const {}
513 void AsmPrinter::emitInlineAsmEnd(const MCSubtargetInfo
&StartInfo
,
514 const MCSubtargetInfo
*EndInfo
) const {}