1 //===-- llvm-mcmarkup.cpp - Parse the MC assembly markup tags -------------===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // Example simple parser implementation for the MC assembly markup language.
12 //===----------------------------------------------------------------------===//
14 #include "llvm/Support/CommandLine.h"
15 #include "llvm/Support/Format.h"
16 #include "llvm/Support/ManagedStatic.h"
17 #include "llvm/Support/MemoryBuffer.h"
18 #include "llvm/Support/PrettyStackTrace.h"
19 #include "llvm/Support/Signals.h"
20 #include "llvm/Support/SourceMgr.h"
21 #include "llvm/Support/raw_ostream.h"
22 #include <system_error>
25 static cl::list
<std::string
>
26 InputFilenames(cl::Positional
, cl::desc("<input files>"),
29 DumpTags("dump-tags", cl::desc("List all tags encountered in input"));
31 static StringRef ToolName
;
33 /// Trivial lexer for the markup parser. Input is always handled a character
34 /// at a time. The lexer just encapsulates EOF and lookahead handling.
36 StringRef::const_iterator Start
;
37 StringRef::const_iterator CurPtr
;
38 StringRef::const_iterator End
;
40 MarkupLexer(StringRef Source
)
41 : Start(Source
.begin()), CurPtr(Source
.begin()), End(Source
.end()) {}
42 // When processing non-markup, input is consumed a character at a time.
43 bool isEOF() { return CurPtr
== End
; }
45 if (CurPtr
== End
) return EOF
;
49 if (CurPtr
== End
) return EOF
;
52 StringRef::const_iterator
getPosition() const { return CurPtr
; }
55 /// A markup tag is a name and a (usually empty) list of modifiers.
61 MarkupTag(StringRef n
, StringRef m
, SMLoc Loc
)
62 : Name(n
), Modifiers(m
), StartLoc(Loc
) {}
63 StringRef
getName() const { return Name
; }
64 StringRef
getModifiers() const { return Modifiers
; }
65 SMLoc
getLoc() const { return StartLoc
; }
68 /// A simple parser implementation for creating MarkupTags from input text.
73 MarkupParser(MarkupLexer
&lex
, SourceMgr
&SrcMgr
) : Lex(lex
), SM(SrcMgr
) {}
74 /// Create a MarkupTag from the current position in the MarkupLexer.
75 /// The parseTag() method should be called when the lexer has processed
76 /// the opening '<' character. Input will be consumed up to and including
77 /// the ':' which terminates the tag open.
79 /// Issue a diagnostic and terminate program execution.
80 void FatalError(SMLoc Loc
, StringRef Msg
);
83 void MarkupParser::FatalError(SMLoc Loc
, StringRef Msg
) {
84 SM
.PrintMessage(Loc
, SourceMgr::DK_Error
, Msg
);
88 // Example handler for when a tag is recognized.
89 static void processStartTag(MarkupTag
&Tag
) {
90 // If we're just printing the tags, do that, otherwise do some simple
93 outs() << Tag
.getName();
94 if (Tag
.getModifiers().size())
95 outs() << " " << Tag
.getModifiers();
100 if (!outs().has_colors())
102 // Color registers as red and immediates as cyan. Those don't have nested
103 // tags, so don't bother keeping a stack of colors to reset to.
104 if (Tag
.getName() == "reg")
105 outs().changeColor(raw_ostream::RED
);
106 else if (Tag
.getName() == "imm")
107 outs().changeColor(raw_ostream::CYAN
);
110 // Example handler for when the end of a tag is recognized.
111 static void processEndTag(MarkupTag
&Tag
) {
112 // If we're printing the tags, there's nothing more to do here. Otherwise,
113 // set the color back the normal.
116 if (!outs().has_colors())
118 // Just reset to basic white.
119 outs().changeColor(raw_ostream::WHITE
, false);
122 MarkupTag
MarkupParser::parseTag() {
123 // First off, extract the tag into it's own StringRef so we can look at it
124 // outside of the context of consuming input.
125 StringRef::const_iterator Start
= Lex
.getPosition();
126 SMLoc Loc
= SMLoc::getFromPointer(Start
- 1);
127 while(Lex
.getNextChar() != ':') {
130 FatalError(SMLoc::getFromPointer(Start
), "unterminated markup tag");
132 StringRef
RawTag(Start
, Lex
.getPosition() - Start
- 1);
133 std::pair
<StringRef
, StringRef
> SplitTag
= RawTag
.split(' ');
134 return MarkupTag(SplitTag
.first
, SplitTag
.second
, Loc
);
137 static void parseMCMarkup(StringRef Filename
) {
138 ErrorOr
<std::unique_ptr
<MemoryBuffer
>> BufferPtr
=
139 MemoryBuffer::getFileOrSTDIN(Filename
);
140 if (std::error_code EC
= BufferPtr
.getError()) {
141 errs() << ToolName
<< ": " << EC
.message() << '\n';
144 std::unique_ptr
<MemoryBuffer
> &Buffer
= BufferPtr
.get();
148 StringRef InputSource
= Buffer
->getBuffer();
150 // Tell SrcMgr about this buffer, which is what the parser will pick up.
151 SrcMgr
.AddNewSourceBuffer(std::move(Buffer
), SMLoc());
153 MarkupLexer
Lex(InputSource
);
154 MarkupParser
Parser(Lex
, SrcMgr
);
156 SmallVector
<MarkupTag
, 4> TagStack
;
158 for (int CurChar
= Lex
.getNextChar();
160 CurChar
= Lex
.getNextChar()) {
163 // A "<<" is output as a literal '<' and does not start a markup tag.
164 if (Lex
.peekNextChar() == '<') {
165 (void)Lex
.getNextChar();
168 // Parse the markup entry.
169 TagStack
.push_back(Parser
.parseTag());
171 // Do any special handling for the start of a tag.
172 processStartTag(TagStack
.back());
176 SMLoc Loc
= SMLoc::getFromPointer(Lex
.getPosition() - 1);
177 // A ">>" is output as a literal '>' and does not end a markup tag.
178 if (Lex
.peekNextChar() == '>') {
179 (void)Lex
.getNextChar();
182 // Close out the innermost tag.
183 if (TagStack
.empty())
184 Parser
.FatalError(Loc
, "'>' without matching '<'");
186 // Do any special handling for the end of a tag.
187 processEndTag(TagStack
.back());
195 // For anything else, just echo the character back out.
196 if (!DumpTags
&& CurChar
!= EOF
)
197 outs() << (char)CurChar
;
200 // If there are any unterminated markup tags, issue diagnostics for them.
201 while (!TagStack
.empty()) {
202 MarkupTag
&Tag
= TagStack
.back();
203 SrcMgr
.PrintMessage(Tag
.getLoc(), SourceMgr::DK_Error
,
204 "unterminated markup tag");
209 int main(int argc
, char **argv
) {
210 // Print a stack trace if we signal out.
211 sys::PrintStackTraceOnErrorSignal(argv
[0]);
212 PrettyStackTraceProgram
X(argc
, argv
);
214 llvm_shutdown_obj Y
; // Call llvm_shutdown() on exit.
215 cl::ParseCommandLineOptions(argc
, argv
, "llvm MC markup parser\n");
219 // If no input files specified, read from stdin.
220 if (InputFilenames
.size() == 0)
221 InputFilenames
.push_back("-");
223 std::for_each(InputFilenames
.begin(), InputFilenames
.end(),