xref: /aosp_15_r20/external/llvm/tools/llvm-mcmarkup/llvm-mcmarkup.cpp (revision 9880d6810fe72a1726cb53787c6711e909410d58)
//===-- llvm-mcmarkup.cpp - Parse the MC assembly markup tags -------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// Example simple parser implementation for the MC assembly markup language.
//
//===----------------------------------------------------------------------===//
13*9880d681SAndroid Build Coastguard Worker 
14*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/CommandLine.h"
15*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/Format.h"
16*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/ManagedStatic.h"
17*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/MemoryBuffer.h"
18*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/PrettyStackTrace.h"
19*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/Signals.h"
20*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/SourceMgr.h"
21*9880d681SAndroid Build Coastguard Worker #include "llvm/Support/raw_ostream.h"
22*9880d681SAndroid Build Coastguard Worker #include <system_error>
23*9880d681SAndroid Build Coastguard Worker using namespace llvm;
24*9880d681SAndroid Build Coastguard Worker 
25*9880d681SAndroid Build Coastguard Worker static cl::list<std::string>
26*9880d681SAndroid Build Coastguard Worker        InputFilenames(cl::Positional, cl::desc("<input files>"),
27*9880d681SAndroid Build Coastguard Worker                       cl::ZeroOrMore);
28*9880d681SAndroid Build Coastguard Worker static cl::opt<bool>
29*9880d681SAndroid Build Coastguard Worker DumpTags("dump-tags", cl::desc("List all tags encountered in input"));
30*9880d681SAndroid Build Coastguard Worker 
31*9880d681SAndroid Build Coastguard Worker static StringRef ToolName;
32*9880d681SAndroid Build Coastguard Worker 
33*9880d681SAndroid Build Coastguard Worker /// Trivial lexer for the markup parser. Input is always handled a character
34*9880d681SAndroid Build Coastguard Worker /// at a time. The lexer just encapsulates EOF and lookahead handling.
35*9880d681SAndroid Build Coastguard Worker class MarkupLexer {
36*9880d681SAndroid Build Coastguard Worker   StringRef::const_iterator Start;
37*9880d681SAndroid Build Coastguard Worker   StringRef::const_iterator CurPtr;
38*9880d681SAndroid Build Coastguard Worker   StringRef::const_iterator End;
39*9880d681SAndroid Build Coastguard Worker public:
MarkupLexer(StringRef Source)40*9880d681SAndroid Build Coastguard Worker   MarkupLexer(StringRef Source)
41*9880d681SAndroid Build Coastguard Worker     : Start(Source.begin()), CurPtr(Source.begin()), End(Source.end()) {}
42*9880d681SAndroid Build Coastguard Worker   // When processing non-markup, input is consumed a character at a time.
isEOF()43*9880d681SAndroid Build Coastguard Worker   bool isEOF() { return CurPtr == End; }
getNextChar()44*9880d681SAndroid Build Coastguard Worker   int getNextChar() {
45*9880d681SAndroid Build Coastguard Worker     if (CurPtr == End) return EOF;
46*9880d681SAndroid Build Coastguard Worker     return *CurPtr++;
47*9880d681SAndroid Build Coastguard Worker   }
peekNextChar()48*9880d681SAndroid Build Coastguard Worker   int peekNextChar() {
49*9880d681SAndroid Build Coastguard Worker     if (CurPtr == End) return EOF;
50*9880d681SAndroid Build Coastguard Worker     return *CurPtr;
51*9880d681SAndroid Build Coastguard Worker   }
getPosition() const52*9880d681SAndroid Build Coastguard Worker   StringRef::const_iterator getPosition() const { return CurPtr; }
53*9880d681SAndroid Build Coastguard Worker };
54*9880d681SAndroid Build Coastguard Worker 
55*9880d681SAndroid Build Coastguard Worker /// A markup tag is a name and a (usually empty) list of modifiers.
56*9880d681SAndroid Build Coastguard Worker class MarkupTag {
57*9880d681SAndroid Build Coastguard Worker   StringRef Name;
58*9880d681SAndroid Build Coastguard Worker   StringRef Modifiers;
59*9880d681SAndroid Build Coastguard Worker   SMLoc StartLoc;
60*9880d681SAndroid Build Coastguard Worker public:
MarkupTag(StringRef n,StringRef m,SMLoc Loc)61*9880d681SAndroid Build Coastguard Worker   MarkupTag(StringRef n, StringRef m, SMLoc Loc)
62*9880d681SAndroid Build Coastguard Worker     : Name(n), Modifiers(m), StartLoc(Loc) {}
getName() const63*9880d681SAndroid Build Coastguard Worker   StringRef getName() const { return Name; }
getModifiers() const64*9880d681SAndroid Build Coastguard Worker   StringRef getModifiers() const { return Modifiers; }
getLoc() const65*9880d681SAndroid Build Coastguard Worker   SMLoc getLoc() const { return StartLoc; }
66*9880d681SAndroid Build Coastguard Worker };
67*9880d681SAndroid Build Coastguard Worker 
68*9880d681SAndroid Build Coastguard Worker /// A simple parser implementation for creating MarkupTags from input text.
69*9880d681SAndroid Build Coastguard Worker class MarkupParser {
70*9880d681SAndroid Build Coastguard Worker   MarkupLexer &Lex;
71*9880d681SAndroid Build Coastguard Worker   SourceMgr &SM;
72*9880d681SAndroid Build Coastguard Worker public:
MarkupParser(MarkupLexer & lex,SourceMgr & SrcMgr)73*9880d681SAndroid Build Coastguard Worker   MarkupParser(MarkupLexer &lex, SourceMgr &SrcMgr) : Lex(lex), SM(SrcMgr) {}
74*9880d681SAndroid Build Coastguard Worker   /// Create a MarkupTag from the current position in the MarkupLexer.
75*9880d681SAndroid Build Coastguard Worker   /// The parseTag() method should be called when the lexer has processed
76*9880d681SAndroid Build Coastguard Worker   /// the opening '<' character. Input will be consumed up to and including
77*9880d681SAndroid Build Coastguard Worker   /// the ':' which terminates the tag open.
78*9880d681SAndroid Build Coastguard Worker   MarkupTag parseTag();
79*9880d681SAndroid Build Coastguard Worker   /// Issue a diagnostic and terminate program execution.
80*9880d681SAndroid Build Coastguard Worker   void FatalError(SMLoc Loc, StringRef Msg);
81*9880d681SAndroid Build Coastguard Worker };
82*9880d681SAndroid Build Coastguard Worker 
FatalError(SMLoc Loc,StringRef Msg)83*9880d681SAndroid Build Coastguard Worker void MarkupParser::FatalError(SMLoc Loc, StringRef Msg) {
84*9880d681SAndroid Build Coastguard Worker   SM.PrintMessage(Loc, SourceMgr::DK_Error, Msg);
85*9880d681SAndroid Build Coastguard Worker   exit(1);
86*9880d681SAndroid Build Coastguard Worker }
87*9880d681SAndroid Build Coastguard Worker 
88*9880d681SAndroid Build Coastguard Worker // Example handler for when a tag is recognized.
processStartTag(MarkupTag & Tag)89*9880d681SAndroid Build Coastguard Worker static void processStartTag(MarkupTag &Tag) {
90*9880d681SAndroid Build Coastguard Worker   // If we're just printing the tags, do that, otherwise do some simple
91*9880d681SAndroid Build Coastguard Worker   // colorization.
92*9880d681SAndroid Build Coastguard Worker   if (DumpTags) {
93*9880d681SAndroid Build Coastguard Worker     outs() << Tag.getName();
94*9880d681SAndroid Build Coastguard Worker     if (Tag.getModifiers().size())
95*9880d681SAndroid Build Coastguard Worker       outs() << " " << Tag.getModifiers();
96*9880d681SAndroid Build Coastguard Worker     outs() << "\n";
97*9880d681SAndroid Build Coastguard Worker     return;
98*9880d681SAndroid Build Coastguard Worker   }
99*9880d681SAndroid Build Coastguard Worker 
100*9880d681SAndroid Build Coastguard Worker   if (!outs().has_colors())
101*9880d681SAndroid Build Coastguard Worker     return;
102*9880d681SAndroid Build Coastguard Worker   // Color registers as red and immediates as cyan. Those don't have nested
103*9880d681SAndroid Build Coastguard Worker   // tags, so don't bother keeping a stack of colors to reset to.
104*9880d681SAndroid Build Coastguard Worker   if (Tag.getName() == "reg")
105*9880d681SAndroid Build Coastguard Worker     outs().changeColor(raw_ostream::RED);
106*9880d681SAndroid Build Coastguard Worker   else if (Tag.getName() == "imm")
107*9880d681SAndroid Build Coastguard Worker     outs().changeColor(raw_ostream::CYAN);
108*9880d681SAndroid Build Coastguard Worker }
109*9880d681SAndroid Build Coastguard Worker 
110*9880d681SAndroid Build Coastguard Worker // Example handler for when the end of a tag is recognized.
processEndTag(MarkupTag & Tag)111*9880d681SAndroid Build Coastguard Worker static void processEndTag(MarkupTag &Tag) {
112*9880d681SAndroid Build Coastguard Worker   // If we're printing the tags, there's nothing more to do here. Otherwise,
113*9880d681SAndroid Build Coastguard Worker   // set the color back the normal.
114*9880d681SAndroid Build Coastguard Worker   if (DumpTags)
115*9880d681SAndroid Build Coastguard Worker     return;
116*9880d681SAndroid Build Coastguard Worker   if (!outs().has_colors())
117*9880d681SAndroid Build Coastguard Worker     return;
118*9880d681SAndroid Build Coastguard Worker   // Just reset to basic white.
119*9880d681SAndroid Build Coastguard Worker   outs().changeColor(raw_ostream::WHITE, false);
120*9880d681SAndroid Build Coastguard Worker }
121*9880d681SAndroid Build Coastguard Worker 
parseTag()122*9880d681SAndroid Build Coastguard Worker MarkupTag MarkupParser::parseTag() {
123*9880d681SAndroid Build Coastguard Worker   // First off, extract the tag into it's own StringRef so we can look at it
124*9880d681SAndroid Build Coastguard Worker   // outside of the context of consuming input.
125*9880d681SAndroid Build Coastguard Worker   StringRef::const_iterator Start = Lex.getPosition();
126*9880d681SAndroid Build Coastguard Worker   SMLoc Loc = SMLoc::getFromPointer(Start - 1);
127*9880d681SAndroid Build Coastguard Worker   while(Lex.getNextChar() != ':') {
128*9880d681SAndroid Build Coastguard Worker     // EOF is an error.
129*9880d681SAndroid Build Coastguard Worker     if (Lex.isEOF())
130*9880d681SAndroid Build Coastguard Worker       FatalError(SMLoc::getFromPointer(Start), "unterminated markup tag");
131*9880d681SAndroid Build Coastguard Worker   }
132*9880d681SAndroid Build Coastguard Worker   StringRef RawTag(Start, Lex.getPosition() - Start - 1);
133*9880d681SAndroid Build Coastguard Worker   std::pair<StringRef, StringRef> SplitTag = RawTag.split(' ');
134*9880d681SAndroid Build Coastguard Worker   return MarkupTag(SplitTag.first, SplitTag.second, Loc);
135*9880d681SAndroid Build Coastguard Worker }
136*9880d681SAndroid Build Coastguard Worker 
parseMCMarkup(StringRef Filename)137*9880d681SAndroid Build Coastguard Worker static void parseMCMarkup(StringRef Filename) {
138*9880d681SAndroid Build Coastguard Worker   ErrorOr<std::unique_ptr<MemoryBuffer>> BufferPtr =
139*9880d681SAndroid Build Coastguard Worker       MemoryBuffer::getFileOrSTDIN(Filename);
140*9880d681SAndroid Build Coastguard Worker   if (std::error_code EC = BufferPtr.getError()) {
141*9880d681SAndroid Build Coastguard Worker     errs() << ToolName << ": " << EC.message() << '\n';
142*9880d681SAndroid Build Coastguard Worker     return;
143*9880d681SAndroid Build Coastguard Worker   }
144*9880d681SAndroid Build Coastguard Worker   std::unique_ptr<MemoryBuffer> &Buffer = BufferPtr.get();
145*9880d681SAndroid Build Coastguard Worker 
146*9880d681SAndroid Build Coastguard Worker   SourceMgr SrcMgr;
147*9880d681SAndroid Build Coastguard Worker 
148*9880d681SAndroid Build Coastguard Worker   StringRef InputSource = Buffer->getBuffer();
149*9880d681SAndroid Build Coastguard Worker 
150*9880d681SAndroid Build Coastguard Worker   // Tell SrcMgr about this buffer, which is what the parser will pick up.
151*9880d681SAndroid Build Coastguard Worker   SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc());
152*9880d681SAndroid Build Coastguard Worker 
153*9880d681SAndroid Build Coastguard Worker   MarkupLexer Lex(InputSource);
154*9880d681SAndroid Build Coastguard Worker   MarkupParser Parser(Lex, SrcMgr);
155*9880d681SAndroid Build Coastguard Worker 
156*9880d681SAndroid Build Coastguard Worker   SmallVector<MarkupTag, 4> TagStack;
157*9880d681SAndroid Build Coastguard Worker 
158*9880d681SAndroid Build Coastguard Worker   for (int CurChar = Lex.getNextChar();
159*9880d681SAndroid Build Coastguard Worker        CurChar != EOF;
160*9880d681SAndroid Build Coastguard Worker        CurChar = Lex.getNextChar()) {
161*9880d681SAndroid Build Coastguard Worker     switch (CurChar) {
162*9880d681SAndroid Build Coastguard Worker     case '<': {
163*9880d681SAndroid Build Coastguard Worker       // A "<<" is output as a literal '<' and does not start a markup tag.
164*9880d681SAndroid Build Coastguard Worker       if (Lex.peekNextChar() == '<') {
165*9880d681SAndroid Build Coastguard Worker         (void)Lex.getNextChar();
166*9880d681SAndroid Build Coastguard Worker         break;
167*9880d681SAndroid Build Coastguard Worker       }
168*9880d681SAndroid Build Coastguard Worker       // Parse the markup entry.
169*9880d681SAndroid Build Coastguard Worker       TagStack.push_back(Parser.parseTag());
170*9880d681SAndroid Build Coastguard Worker 
171*9880d681SAndroid Build Coastguard Worker       // Do any special handling for the start of a tag.
172*9880d681SAndroid Build Coastguard Worker       processStartTag(TagStack.back());
173*9880d681SAndroid Build Coastguard Worker       continue;
174*9880d681SAndroid Build Coastguard Worker     }
175*9880d681SAndroid Build Coastguard Worker     case '>': {
176*9880d681SAndroid Build Coastguard Worker       SMLoc Loc = SMLoc::getFromPointer(Lex.getPosition() - 1);
177*9880d681SAndroid Build Coastguard Worker       // A ">>" is output as a literal '>' and does not end a markup tag.
178*9880d681SAndroid Build Coastguard Worker       if (Lex.peekNextChar() == '>') {
179*9880d681SAndroid Build Coastguard Worker         (void)Lex.getNextChar();
180*9880d681SAndroid Build Coastguard Worker         break;
181*9880d681SAndroid Build Coastguard Worker       }
182*9880d681SAndroid Build Coastguard Worker       // Close out the innermost tag.
183*9880d681SAndroid Build Coastguard Worker       if (TagStack.empty())
184*9880d681SAndroid Build Coastguard Worker         Parser.FatalError(Loc, "'>' without matching '<'");
185*9880d681SAndroid Build Coastguard Worker 
186*9880d681SAndroid Build Coastguard Worker       // Do any special handling for the end of a tag.
187*9880d681SAndroid Build Coastguard Worker       processEndTag(TagStack.back());
188*9880d681SAndroid Build Coastguard Worker 
189*9880d681SAndroid Build Coastguard Worker       TagStack.pop_back();
190*9880d681SAndroid Build Coastguard Worker       continue;
191*9880d681SAndroid Build Coastguard Worker     }
192*9880d681SAndroid Build Coastguard Worker     default:
193*9880d681SAndroid Build Coastguard Worker       break;
194*9880d681SAndroid Build Coastguard Worker     }
195*9880d681SAndroid Build Coastguard Worker     // For anything else, just echo the character back out.
196*9880d681SAndroid Build Coastguard Worker     if (!DumpTags && CurChar != EOF)
197*9880d681SAndroid Build Coastguard Worker       outs() << (char)CurChar;
198*9880d681SAndroid Build Coastguard Worker   }
199*9880d681SAndroid Build Coastguard Worker 
200*9880d681SAndroid Build Coastguard Worker   // If there are any unterminated markup tags, issue diagnostics for them.
201*9880d681SAndroid Build Coastguard Worker   while (!TagStack.empty()) {
202*9880d681SAndroid Build Coastguard Worker     MarkupTag &Tag = TagStack.back();
203*9880d681SAndroid Build Coastguard Worker     SrcMgr.PrintMessage(Tag.getLoc(), SourceMgr::DK_Error,
204*9880d681SAndroid Build Coastguard Worker                         "unterminated markup tag");
205*9880d681SAndroid Build Coastguard Worker     TagStack.pop_back();
206*9880d681SAndroid Build Coastguard Worker   }
207*9880d681SAndroid Build Coastguard Worker }
208*9880d681SAndroid Build Coastguard Worker 
main(int argc,char ** argv)209*9880d681SAndroid Build Coastguard Worker int main(int argc, char **argv) {
210*9880d681SAndroid Build Coastguard Worker   // Print a stack trace if we signal out.
211*9880d681SAndroid Build Coastguard Worker   sys::PrintStackTraceOnErrorSignal(argv[0]);
212*9880d681SAndroid Build Coastguard Worker   PrettyStackTraceProgram X(argc, argv);
213*9880d681SAndroid Build Coastguard Worker 
214*9880d681SAndroid Build Coastguard Worker   llvm_shutdown_obj Y;  // Call llvm_shutdown() on exit.
215*9880d681SAndroid Build Coastguard Worker   cl::ParseCommandLineOptions(argc, argv, "llvm MC markup parser\n");
216*9880d681SAndroid Build Coastguard Worker 
217*9880d681SAndroid Build Coastguard Worker   ToolName = argv[0];
218*9880d681SAndroid Build Coastguard Worker 
219*9880d681SAndroid Build Coastguard Worker   // If no input files specified, read from stdin.
220*9880d681SAndroid Build Coastguard Worker   if (InputFilenames.size() == 0)
221*9880d681SAndroid Build Coastguard Worker     InputFilenames.push_back("-");
222*9880d681SAndroid Build Coastguard Worker 
223*9880d681SAndroid Build Coastguard Worker   std::for_each(InputFilenames.begin(), InputFilenames.end(),
224*9880d681SAndroid Build Coastguard Worker                 parseMCMarkup);
225*9880d681SAndroid Build Coastguard Worker   return 0;
226*9880d681SAndroid Build Coastguard Worker }
227