1 //===- YAMLRemarkParser.cpp -----------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file provides utility methods used by clients that want to use the
10 // parser for remark diagnostics in LLVM.
11 //
12 //===----------------------------------------------------------------------===//
13
14 #include "YAMLRemarkParser.h"
15 #include "llvm/ADT/StringSwitch.h"
16 #include "llvm/Support/Endian.h"
17 #include "llvm/Support/Path.h"
18 #include <optional>
19
20 using namespace llvm;
21 using namespace llvm::remarks;
22
23 char YAMLParseError::ID = 0;
24
handleDiagnostic(const SMDiagnostic & Diag,void * Ctx)25 static void handleDiagnostic(const SMDiagnostic &Diag, void *Ctx) {
26 assert(Ctx && "Expected non-null Ctx in diagnostic handler.");
27 std::string &Message = *static_cast<std::string *>(Ctx);
28 assert(Message.empty() && "Expected an empty string.");
29 raw_string_ostream OS(Message);
30 Diag.print(/*ProgName=*/nullptr, OS, /*ShowColors*/ false,
31 /*ShowKindLabels*/ true);
32 OS << '\n';
33 OS.flush();
34 }
35
YAMLParseError(StringRef Msg,SourceMgr & SM,yaml::Stream & Stream,yaml::Node & Node)36 YAMLParseError::YAMLParseError(StringRef Msg, SourceMgr &SM,
37 yaml::Stream &Stream, yaml::Node &Node) {
38 // 1) Set up a diagnostic handler to avoid errors being printed out to
39 // stderr.
40 // 2) Use the stream to print the error with the associated node.
41 // 3) The stream will use the source manager to print the error, which will
42 // call the diagnostic handler.
43 // 4) The diagnostic handler will stream the error directly into this object's
44 // Message member, which is used when logging is asked for.
45 auto OldDiagHandler = SM.getDiagHandler();
46 auto OldDiagCtx = SM.getDiagContext();
47 SM.setDiagHandler(handleDiagnostic, &Message);
48 Stream.printError(&Node, Twine(Msg) + Twine('\n'));
49 // Restore the old handlers.
50 SM.setDiagHandler(OldDiagHandler, OldDiagCtx);
51 }
52
setupSM(std::string & LastErrorMessage)53 static SourceMgr setupSM(std::string &LastErrorMessage) {
54 SourceMgr SM;
55 SM.setDiagHandler(handleDiagnostic, &LastErrorMessage);
56 return SM;
57 }
58
59 // Parse the magic number. This function returns true if this represents remark
60 // metadata, false otherwise.
parseMagic(StringRef & Buf)61 static Expected<bool> parseMagic(StringRef &Buf) {
62 if (!Buf.consume_front(remarks::Magic))
63 return false;
64
65 if (Buf.size() < 1 || !Buf.consume_front(StringRef("\0", 1)))
66 return createStringError(std::errc::illegal_byte_sequence,
67 "Expecting \\0 after magic number.");
68 return true;
69 }
70
parseVersion(StringRef & Buf)71 static Expected<uint64_t> parseVersion(StringRef &Buf) {
72 if (Buf.size() < sizeof(uint64_t))
73 return createStringError(std::errc::illegal_byte_sequence,
74 "Expecting version number.");
75
76 uint64_t Version =
77 support::endian::read<uint64_t, support::little, support::unaligned>(
78 Buf.data());
79 if (Version != remarks::CurrentRemarkVersion)
80 return createStringError(std::errc::illegal_byte_sequence,
81 "Mismatching remark version. Got %" PRId64
82 ", expected %" PRId64 ".",
83 Version, remarks::CurrentRemarkVersion);
84 Buf = Buf.drop_front(sizeof(uint64_t));
85 return Version;
86 }
87
parseStrTabSize(StringRef & Buf)88 static Expected<uint64_t> parseStrTabSize(StringRef &Buf) {
89 if (Buf.size() < sizeof(uint64_t))
90 return createStringError(std::errc::illegal_byte_sequence,
91 "Expecting string table size.");
92 uint64_t StrTabSize =
93 support::endian::read<uint64_t, support::little, support::unaligned>(
94 Buf.data());
95 Buf = Buf.drop_front(sizeof(uint64_t));
96 return StrTabSize;
97 }
98
parseStrTab(StringRef & Buf,uint64_t StrTabSize)99 static Expected<ParsedStringTable> parseStrTab(StringRef &Buf,
100 uint64_t StrTabSize) {
101 if (Buf.size() < StrTabSize)
102 return createStringError(std::errc::illegal_byte_sequence,
103 "Expecting string table.");
104
105 // Attach the string table to the parser.
106 ParsedStringTable Result(StringRef(Buf.data(), StrTabSize));
107 Buf = Buf.drop_front(StrTabSize);
108 return Expected<ParsedStringTable>(std::move(Result));
109 }
110
createYAMLParserFromMeta(StringRef Buf,std::optional<ParsedStringTable> StrTab,std::optional<StringRef> ExternalFilePrependPath)111 Expected<std::unique_ptr<YAMLRemarkParser>> remarks::createYAMLParserFromMeta(
112 StringRef Buf, std::optional<ParsedStringTable> StrTab,
113 std::optional<StringRef> ExternalFilePrependPath) {
114 // We now have a magic number. The metadata has to be correct.
115 Expected<bool> isMeta = parseMagic(Buf);
116 if (!isMeta)
117 return isMeta.takeError();
118 // If it's not recognized as metadata, roll back.
119 std::unique_ptr<MemoryBuffer> SeparateBuf;
120 if (*isMeta) {
121 Expected<uint64_t> Version = parseVersion(Buf);
122 if (!Version)
123 return Version.takeError();
124
125 Expected<uint64_t> StrTabSize = parseStrTabSize(Buf);
126 if (!StrTabSize)
127 return StrTabSize.takeError();
128
129 // If the size of string table is not 0, try to build one.
130 if (*StrTabSize != 0) {
131 if (StrTab)
132 return createStringError(std::errc::illegal_byte_sequence,
133 "String table already provided.");
134 Expected<ParsedStringTable> MaybeStrTab = parseStrTab(Buf, *StrTabSize);
135 if (!MaybeStrTab)
136 return MaybeStrTab.takeError();
137 StrTab = std::move(*MaybeStrTab);
138 }
139 // If it starts with "---", there is no external file.
140 if (!Buf.startswith("---")) {
141 // At this point, we expect Buf to contain the external file path.
142 StringRef ExternalFilePath = Buf;
143 SmallString<80> FullPath;
144 if (ExternalFilePrependPath)
145 FullPath = *ExternalFilePrependPath;
146 sys::path::append(FullPath, ExternalFilePath);
147
148 // Try to open the file and start parsing from there.
149 ErrorOr<std::unique_ptr<MemoryBuffer>> BufferOrErr =
150 MemoryBuffer::getFile(FullPath);
151 if (std::error_code EC = BufferOrErr.getError())
152 return createFileError(FullPath, EC);
153
154 // Keep the buffer alive.
155 SeparateBuf = std::move(*BufferOrErr);
156 Buf = SeparateBuf->getBuffer();
157 }
158 }
159
160 std::unique_ptr<YAMLRemarkParser> Result =
161 StrTab
162 ? std::make_unique<YAMLStrTabRemarkParser>(Buf, std::move(*StrTab))
163 : std::make_unique<YAMLRemarkParser>(Buf);
164 if (SeparateBuf)
165 Result->SeparateBuf = std::move(SeparateBuf);
166 return std::move(Result);
167 }
168
YAMLRemarkParser(StringRef Buf)169 YAMLRemarkParser::YAMLRemarkParser(StringRef Buf)
170 : YAMLRemarkParser(Buf, std::nullopt) {}
171
YAMLRemarkParser(StringRef Buf,std::optional<ParsedStringTable> StrTab)172 YAMLRemarkParser::YAMLRemarkParser(StringRef Buf,
173 std::optional<ParsedStringTable> StrTab)
174 : RemarkParser{Format::YAML}, StrTab(std::move(StrTab)),
175 SM(setupSM(LastErrorMessage)), Stream(Buf, SM), YAMLIt(Stream.begin()) {}
176
error(StringRef Message,yaml::Node & Node)177 Error YAMLRemarkParser::error(StringRef Message, yaml::Node &Node) {
178 return make_error<YAMLParseError>(Message, SM, Stream, Node);
179 }
180
error()181 Error YAMLRemarkParser::error() {
182 if (LastErrorMessage.empty())
183 return Error::success();
184 Error E = make_error<YAMLParseError>(LastErrorMessage);
185 LastErrorMessage.clear();
186 return E;
187 }
188
189 Expected<std::unique_ptr<Remark>>
parseRemark(yaml::Document & RemarkEntry)190 YAMLRemarkParser::parseRemark(yaml::Document &RemarkEntry) {
191 if (Error E = error())
192 return std::move(E);
193
194 yaml::Node *YAMLRoot = RemarkEntry.getRoot();
195 if (!YAMLRoot) {
196 return createStringError(std::make_error_code(std::errc::invalid_argument),
197 "not a valid YAML file.");
198 }
199
200 auto *Root = dyn_cast<yaml::MappingNode>(YAMLRoot);
201 if (!Root)
202 return error("document root is not of mapping type.", *YAMLRoot);
203
204 std::unique_ptr<Remark> Result = std::make_unique<Remark>();
205 Remark &TheRemark = *Result;
206
207 // First, the type. It needs special handling since is not part of the
208 // key-value stream.
209 Expected<Type> T = parseType(*Root);
210 if (!T)
211 return T.takeError();
212 else
213 TheRemark.RemarkType = *T;
214
215 // Then, parse the fields, one by one.
216 for (yaml::KeyValueNode &RemarkField : *Root) {
217 Expected<StringRef> MaybeKey = parseKey(RemarkField);
218 if (!MaybeKey)
219 return MaybeKey.takeError();
220 StringRef KeyName = *MaybeKey;
221
222 if (KeyName == "Pass") {
223 if (Expected<StringRef> MaybeStr = parseStr(RemarkField))
224 TheRemark.PassName = *MaybeStr;
225 else
226 return MaybeStr.takeError();
227 } else if (KeyName == "Name") {
228 if (Expected<StringRef> MaybeStr = parseStr(RemarkField))
229 TheRemark.RemarkName = *MaybeStr;
230 else
231 return MaybeStr.takeError();
232 } else if (KeyName == "Function") {
233 if (Expected<StringRef> MaybeStr = parseStr(RemarkField))
234 TheRemark.FunctionName = *MaybeStr;
235 else
236 return MaybeStr.takeError();
237 } else if (KeyName == "Hotness") {
238 if (Expected<unsigned> MaybeU = parseUnsigned(RemarkField))
239 TheRemark.Hotness = *MaybeU;
240 else
241 return MaybeU.takeError();
242 } else if (KeyName == "DebugLoc") {
243 if (Expected<RemarkLocation> MaybeLoc = parseDebugLoc(RemarkField))
244 TheRemark.Loc = *MaybeLoc;
245 else
246 return MaybeLoc.takeError();
247 } else if (KeyName == "Args") {
248 auto *Args = dyn_cast<yaml::SequenceNode>(RemarkField.getValue());
249 if (!Args)
250 return error("wrong value type for key.", RemarkField);
251
252 for (yaml::Node &Arg : *Args) {
253 if (Expected<Argument> MaybeArg = parseArg(Arg))
254 TheRemark.Args.push_back(*MaybeArg);
255 else
256 return MaybeArg.takeError();
257 }
258 } else {
259 return error("unknown key.", RemarkField);
260 }
261 }
262
263 // Check if any of the mandatory fields are missing.
264 if (TheRemark.RemarkType == Type::Unknown || TheRemark.PassName.empty() ||
265 TheRemark.RemarkName.empty() || TheRemark.FunctionName.empty())
266 return error("Type, Pass, Name or Function missing.",
267 *RemarkEntry.getRoot());
268
269 return std::move(Result);
270 }
271
parseType(yaml::MappingNode & Node)272 Expected<Type> YAMLRemarkParser::parseType(yaml::MappingNode &Node) {
273 auto Type = StringSwitch<remarks::Type>(Node.getRawTag())
274 .Case("!Passed", remarks::Type::Passed)
275 .Case("!Missed", remarks::Type::Missed)
276 .Case("!Analysis", remarks::Type::Analysis)
277 .Case("!AnalysisFPCommute", remarks::Type::AnalysisFPCommute)
278 .Case("!AnalysisAliasing", remarks::Type::AnalysisAliasing)
279 .Case("!Failure", remarks::Type::Failure)
280 .Default(remarks::Type::Unknown);
281 if (Type == remarks::Type::Unknown)
282 return error("expected a remark tag.", Node);
283 return Type;
284 }
285
parseKey(yaml::KeyValueNode & Node)286 Expected<StringRef> YAMLRemarkParser::parseKey(yaml::KeyValueNode &Node) {
287 if (auto *Key = dyn_cast<yaml::ScalarNode>(Node.getKey()))
288 return Key->getRawValue();
289
290 return error("key is not a string.", Node);
291 }
292
parseStr(yaml::KeyValueNode & Node)293 Expected<StringRef> YAMLRemarkParser::parseStr(yaml::KeyValueNode &Node) {
294 auto *Value = dyn_cast<yaml::ScalarNode>(Node.getValue());
295 if (!Value)
296 return error("expected a value of scalar type.", Node);
297 StringRef Result = Value->getRawValue();
298
299 if (Result.front() == '\'')
300 Result = Result.drop_front();
301
302 if (Result.back() == '\'')
303 Result = Result.drop_back();
304
305 return Result;
306 }
307
parseUnsigned(yaml::KeyValueNode & Node)308 Expected<unsigned> YAMLRemarkParser::parseUnsigned(yaml::KeyValueNode &Node) {
309 SmallVector<char, 4> Tmp;
310 auto *Value = dyn_cast<yaml::ScalarNode>(Node.getValue());
311 if (!Value)
312 return error("expected a value of scalar type.", Node);
313 unsigned UnsignedValue = 0;
314 if (Value->getValue(Tmp).getAsInteger(10, UnsignedValue))
315 return error("expected a value of integer type.", *Value);
316 return UnsignedValue;
317 }
318
319 Expected<RemarkLocation>
parseDebugLoc(yaml::KeyValueNode & Node)320 YAMLRemarkParser::parseDebugLoc(yaml::KeyValueNode &Node) {
321 auto *DebugLoc = dyn_cast<yaml::MappingNode>(Node.getValue());
322 if (!DebugLoc)
323 return error("expected a value of mapping type.", Node);
324
325 std::optional<StringRef> File;
326 std::optional<unsigned> Line;
327 std::optional<unsigned> Column;
328
329 for (yaml::KeyValueNode &DLNode : *DebugLoc) {
330 Expected<StringRef> MaybeKey = parseKey(DLNode);
331 if (!MaybeKey)
332 return MaybeKey.takeError();
333 StringRef KeyName = *MaybeKey;
334
335 if (KeyName == "File") {
336 if (Expected<StringRef> MaybeStr = parseStr(DLNode))
337 File = *MaybeStr;
338 else
339 return MaybeStr.takeError();
340 } else if (KeyName == "Column") {
341 if (Expected<unsigned> MaybeU = parseUnsigned(DLNode))
342 Column = *MaybeU;
343 else
344 return MaybeU.takeError();
345 } else if (KeyName == "Line") {
346 if (Expected<unsigned> MaybeU = parseUnsigned(DLNode))
347 Line = *MaybeU;
348 else
349 return MaybeU.takeError();
350 } else {
351 return error("unknown entry in DebugLoc map.", DLNode);
352 }
353 }
354
355 // If any of the debug loc fields is missing, return an error.
356 if (!File || !Line || !Column)
357 return error("DebugLoc node incomplete.", Node);
358
359 return RemarkLocation{*File, *Line, *Column};
360 }
361
parseArg(yaml::Node & Node)362 Expected<Argument> YAMLRemarkParser::parseArg(yaml::Node &Node) {
363 auto *ArgMap = dyn_cast<yaml::MappingNode>(&Node);
364 if (!ArgMap)
365 return error("expected a value of mapping type.", Node);
366
367 std::optional<StringRef> KeyStr;
368 std::optional<StringRef> ValueStr;
369 std::optional<RemarkLocation> Loc;
370
371 for (yaml::KeyValueNode &ArgEntry : *ArgMap) {
372 Expected<StringRef> MaybeKey = parseKey(ArgEntry);
373 if (!MaybeKey)
374 return MaybeKey.takeError();
375 StringRef KeyName = *MaybeKey;
376
377 // Try to parse debug locs.
378 if (KeyName == "DebugLoc") {
379 // Can't have multiple DebugLoc entries per argument.
380 if (Loc)
381 return error("only one DebugLoc entry is allowed per argument.",
382 ArgEntry);
383
384 if (Expected<RemarkLocation> MaybeLoc = parseDebugLoc(ArgEntry)) {
385 Loc = *MaybeLoc;
386 continue;
387 } else
388 return MaybeLoc.takeError();
389 }
390
391 // If we already have a string, error out.
392 if (ValueStr)
393 return error("only one string entry is allowed per argument.", ArgEntry);
394
395 // Try to parse the value.
396 if (Expected<StringRef> MaybeStr = parseStr(ArgEntry))
397 ValueStr = *MaybeStr;
398 else
399 return MaybeStr.takeError();
400
401 // Keep the key from the string.
402 KeyStr = KeyName;
403 }
404
405 if (!KeyStr)
406 return error("argument key is missing.", *ArgMap);
407 if (!ValueStr)
408 return error("argument value is missing.", *ArgMap);
409
410 return Argument{*KeyStr, *ValueStr, Loc};
411 }
412
next()413 Expected<std::unique_ptr<Remark>> YAMLRemarkParser::next() {
414 if (YAMLIt == Stream.end())
415 return make_error<EndOfFileError>();
416
417 Expected<std::unique_ptr<Remark>> MaybeResult = parseRemark(*YAMLIt);
418 if (!MaybeResult) {
419 // Avoid garbage input, set the iterator to the end.
420 YAMLIt = Stream.end();
421 return MaybeResult.takeError();
422 }
423
424 ++YAMLIt;
425
426 return std::move(*MaybeResult);
427 }
428
parseStr(yaml::KeyValueNode & Node)429 Expected<StringRef> YAMLStrTabRemarkParser::parseStr(yaml::KeyValueNode &Node) {
430 auto *Value = dyn_cast<yaml::ScalarNode>(Node.getValue());
431 if (!Value)
432 return error("expected a value of scalar type.", Node);
433 StringRef Result;
434 // If we have a string table, parse it as an unsigned.
435 unsigned StrID = 0;
436 if (Expected<unsigned> MaybeStrID = parseUnsigned(Node))
437 StrID = *MaybeStrID;
438 else
439 return MaybeStrID.takeError();
440
441 if (Expected<StringRef> Str = (*StrTab)[StrID])
442 Result = *Str;
443 else
444 return Str.takeError();
445
446 if (Result.front() == '\'')
447 Result = Result.drop_front();
448
449 if (Result.back() == '\'')
450 Result = Result.drop_back();
451
452 return Result;
453 }
454