454 lines
		
	
	
		
			15 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			454 lines
		
	
	
		
			15 KiB
		
	
	
	
		
			C++
		
	
	
	
| //===- YAMLRemarkParser.cpp -----------------------------------------------===//
 | |
| //
 | |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 | |
| // See https://llvm.org/LICENSE.txt for license information.
 | |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 | |
| //
 | |
| //===----------------------------------------------------------------------===//
 | |
| //
 | |
| // This file provides utility methods used by clients that want to use the
 | |
| // parser for remark diagnostics in LLVM.
 | |
| //
 | |
| //===----------------------------------------------------------------------===//
 | |
| 
 | |
| #include "YAMLRemarkParser.h"
 | |
| #include "llvm/ADT/StringSwitch.h"
 | |
| #include "llvm/Support/Endian.h"
 | |
| #include "llvm/Support/Path.h"
 | |
| 
 | |
| using namespace llvm;
 | |
| using namespace llvm::remarks;
 | |
| 
 | |
| char YAMLParseError::ID = 0;
 | |
| 
 | |
| static void handleDiagnostic(const SMDiagnostic &Diag, void *Ctx) {
 | |
|   assert(Ctx && "Expected non-null Ctx in diagnostic handler.");
 | |
|   std::string &Message = *static_cast<std::string *>(Ctx);
 | |
|   assert(Message.empty() && "Expected an empty string.");
 | |
|   raw_string_ostream OS(Message);
 | |
|   Diag.print(/*ProgName=*/nullptr, OS, /*ShowColors*/ false,
 | |
|              /*ShowKindLabels*/ true);
 | |
|   OS << '\n';
 | |
|   OS.flush();
 | |
| }
 | |
| 
 | |
| YAMLParseError::YAMLParseError(StringRef Msg, SourceMgr &SM,
 | |
|                                yaml::Stream &Stream, yaml::Node &Node) {
 | |
|   // 1) Set up a diagnostic handler to avoid errors being printed out to
 | |
|   // stderr.
 | |
|   // 2) Use the stream to print the error with the associated node.
 | |
|   // 3) The stream will use the source manager to print the error, which will
 | |
|   // call the diagnostic handler.
 | |
|   // 4) The diagnostic handler will stream the error directly into this object's
 | |
|   // Message member, which is used when logging is asked for.
 | |
|   auto OldDiagHandler = SM.getDiagHandler();
 | |
|   auto OldDiagCtx = SM.getDiagContext();
 | |
|   SM.setDiagHandler(handleDiagnostic, &Message);
 | |
|   Stream.printError(&Node, Twine(Msg) + Twine('\n'));
 | |
|   // Restore the old handlers.
 | |
|   SM.setDiagHandler(OldDiagHandler, OldDiagCtx);
 | |
| }
 | |
| 
 | |
| static SourceMgr setupSM(std::string &LastErrorMessage) {
 | |
|   SourceMgr SM;
 | |
|   SM.setDiagHandler(handleDiagnostic, &LastErrorMessage);
 | |
|   return SM;
 | |
| }
 | |
| 
 | |
| // Parse the magic number. This function returns true if this represents remark
 | |
| // metadata, false otherwise.
 | |
| static Expected<bool> parseMagic(StringRef &Buf) {
 | |
|   if (!Buf.consume_front(remarks::Magic))
 | |
|     return false;
 | |
| 
 | |
|   if (Buf.size() < 1 || !Buf.consume_front(StringRef("\0", 1)))
 | |
|     return createStringError(std::errc::illegal_byte_sequence,
 | |
|                              "Expecting \\0 after magic number.");
 | |
|   return true;
 | |
| }
 | |
| 
 | |
| static Expected<uint64_t> parseVersion(StringRef &Buf) {
 | |
|   if (Buf.size() < sizeof(uint64_t))
 | |
|     return createStringError(std::errc::illegal_byte_sequence,
 | |
|                              "Expecting version number.");
 | |
| 
 | |
|   uint64_t Version =
 | |
|       support::endian::read<uint64_t, support::little, support::unaligned>(
 | |
|           Buf.data());
 | |
|   if (Version != remarks::CurrentRemarkVersion)
 | |
|     return createStringError(std::errc::illegal_byte_sequence,
 | |
|                              "Mismatching remark version. Got %" PRId64
 | |
|                              ", expected %" PRId64 ".",
 | |
|                              Version, remarks::CurrentRemarkVersion);
 | |
|   Buf = Buf.drop_front(sizeof(uint64_t));
 | |
|   return Version;
 | |
| }
 | |
| 
 | |
| static Expected<uint64_t> parseStrTabSize(StringRef &Buf) {
 | |
|   if (Buf.size() < sizeof(uint64_t))
 | |
|     return createStringError(std::errc::illegal_byte_sequence,
 | |
|                              "Expecting string table size.");
 | |
|   uint64_t StrTabSize =
 | |
|       support::endian::read<uint64_t, support::little, support::unaligned>(
 | |
|           Buf.data());
 | |
|   Buf = Buf.drop_front(sizeof(uint64_t));
 | |
|   return StrTabSize;
 | |
| }
 | |
| 
 | |
| static Expected<ParsedStringTable> parseStrTab(StringRef &Buf,
 | |
|                                                uint64_t StrTabSize) {
 | |
|   if (Buf.size() < StrTabSize)
 | |
|     return createStringError(std::errc::illegal_byte_sequence,
 | |
|                              "Expecting string table.");
 | |
| 
 | |
|   // Attach the string table to the parser.
 | |
|   ParsedStringTable Result(StringRef(Buf.data(), StrTabSize));
 | |
|   Buf = Buf.drop_front(StrTabSize);
 | |
|   return Expected<ParsedStringTable>(std::move(Result));
 | |
| }
 | |
| 
 | |
| Expected<std::unique_ptr<YAMLRemarkParser>>
 | |
| remarks::createYAMLParserFromMeta(StringRef Buf,
 | |
|                                   Optional<ParsedStringTable> StrTab,
 | |
|                                   Optional<StringRef> ExternalFilePrependPath) {
 | |
|   // We now have a magic number. The metadata has to be correct.
 | |
|   Expected<bool> isMeta = parseMagic(Buf);
 | |
|   if (!isMeta)
 | |
|     return isMeta.takeError();
 | |
|   // If it's not recognized as metadata, roll back.
 | |
|   std::unique_ptr<MemoryBuffer> SeparateBuf;
 | |
|   if (*isMeta) {
 | |
|     Expected<uint64_t> Version = parseVersion(Buf);
 | |
|     if (!Version)
 | |
|       return Version.takeError();
 | |
| 
 | |
|     Expected<uint64_t> StrTabSize = parseStrTabSize(Buf);
 | |
|     if (!StrTabSize)
 | |
|       return StrTabSize.takeError();
 | |
| 
 | |
|     // If the size of string table is not 0, try to build one.
 | |
|     if (*StrTabSize != 0) {
 | |
|       if (StrTab)
 | |
|         return createStringError(std::errc::illegal_byte_sequence,
 | |
|                                  "String table already provided.");
 | |
|       Expected<ParsedStringTable> MaybeStrTab = parseStrTab(Buf, *StrTabSize);
 | |
|       if (!MaybeStrTab)
 | |
|         return MaybeStrTab.takeError();
 | |
|       StrTab = std::move(*MaybeStrTab);
 | |
|     }
 | |
|     // If it starts with "---", there is no external file.
 | |
|     if (!Buf.startswith("---")) {
 | |
|       // At this point, we expect Buf to contain the external file path.
 | |
|       StringRef ExternalFilePath = Buf;
 | |
|       SmallString<80> FullPath;
 | |
|       if (ExternalFilePrependPath)
 | |
|         FullPath = *ExternalFilePrependPath;
 | |
|       sys::path::append(FullPath, ExternalFilePath);
 | |
| 
 | |
|       // Try to open the file and start parsing from there.
 | |
|       ErrorOr<std::unique_ptr<MemoryBuffer>> BufferOrErr =
 | |
|           MemoryBuffer::getFile(FullPath);
 | |
|       if (std::error_code EC = BufferOrErr.getError())
 | |
|         return createFileError(FullPath, EC);
 | |
| 
 | |
|       // Keep the buffer alive.
 | |
|       SeparateBuf = std::move(*BufferOrErr);
 | |
|       Buf = SeparateBuf->getBuffer();
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   std::unique_ptr<YAMLRemarkParser> Result =
 | |
|       StrTab
 | |
|           ? std::make_unique<YAMLStrTabRemarkParser>(Buf, std::move(*StrTab))
 | |
|           : std::make_unique<YAMLRemarkParser>(Buf);
 | |
|   if (SeparateBuf)
 | |
|     Result->SeparateBuf = std::move(SeparateBuf);
 | |
|   return std::move(Result);
 | |
| }
 | |
| 
 | |
| YAMLRemarkParser::YAMLRemarkParser(StringRef Buf)
 | |
|     : YAMLRemarkParser(Buf, None) {}
 | |
| 
 | |
| YAMLRemarkParser::YAMLRemarkParser(StringRef Buf,
 | |
|                                    Optional<ParsedStringTable> StrTab)
 | |
|     : RemarkParser{Format::YAML}, StrTab(std::move(StrTab)), LastErrorMessage(),
 | |
|       SM(setupSM(LastErrorMessage)), Stream(Buf, SM), YAMLIt(Stream.begin()) {}
 | |
| 
 | |
| Error YAMLRemarkParser::error(StringRef Message, yaml::Node &Node) {
 | |
|   return make_error<YAMLParseError>(Message, SM, Stream, Node);
 | |
| }
 | |
| 
 | |
| Error YAMLRemarkParser::error() {
 | |
|   if (LastErrorMessage.empty())
 | |
|     return Error::success();
 | |
|   Error E = make_error<YAMLParseError>(LastErrorMessage);
 | |
|   LastErrorMessage.clear();
 | |
|   return E;
 | |
| }
 | |
| 
 | |
| Expected<std::unique_ptr<Remark>>
 | |
| YAMLRemarkParser::parseRemark(yaml::Document &RemarkEntry) {
 | |
|   if (Error E = error())
 | |
|     return std::move(E);
 | |
| 
 | |
|   yaml::Node *YAMLRoot = RemarkEntry.getRoot();
 | |
|   if (!YAMLRoot) {
 | |
|     return createStringError(std::make_error_code(std::errc::invalid_argument),
 | |
|                              "not a valid YAML file.");
 | |
|   }
 | |
| 
 | |
|   auto *Root = dyn_cast<yaml::MappingNode>(YAMLRoot);
 | |
|   if (!Root)
 | |
|     return error("document root is not of mapping type.", *YAMLRoot);
 | |
| 
 | |
|   std::unique_ptr<Remark> Result = std::make_unique<Remark>();
 | |
|   Remark &TheRemark = *Result;
 | |
| 
 | |
|   // First, the type. It needs special handling since is not part of the
 | |
|   // key-value stream.
 | |
|   Expected<Type> T = parseType(*Root);
 | |
|   if (!T)
 | |
|     return T.takeError();
 | |
|   else
 | |
|     TheRemark.RemarkType = *T;
 | |
| 
 | |
|   // Then, parse the fields, one by one.
 | |
|   for (yaml::KeyValueNode &RemarkField : *Root) {
 | |
|     Expected<StringRef> MaybeKey = parseKey(RemarkField);
 | |
|     if (!MaybeKey)
 | |
|       return MaybeKey.takeError();
 | |
|     StringRef KeyName = *MaybeKey;
 | |
| 
 | |
|     if (KeyName == "Pass") {
 | |
|       if (Expected<StringRef> MaybeStr = parseStr(RemarkField))
 | |
|         TheRemark.PassName = *MaybeStr;
 | |
|       else
 | |
|         return MaybeStr.takeError();
 | |
|     } else if (KeyName == "Name") {
 | |
|       if (Expected<StringRef> MaybeStr = parseStr(RemarkField))
 | |
|         TheRemark.RemarkName = *MaybeStr;
 | |
|       else
 | |
|         return MaybeStr.takeError();
 | |
|     } else if (KeyName == "Function") {
 | |
|       if (Expected<StringRef> MaybeStr = parseStr(RemarkField))
 | |
|         TheRemark.FunctionName = *MaybeStr;
 | |
|       else
 | |
|         return MaybeStr.takeError();
 | |
|     } else if (KeyName == "Hotness") {
 | |
|       if (Expected<unsigned> MaybeU = parseUnsigned(RemarkField))
 | |
|         TheRemark.Hotness = *MaybeU;
 | |
|       else
 | |
|         return MaybeU.takeError();
 | |
|     } else if (KeyName == "DebugLoc") {
 | |
|       if (Expected<RemarkLocation> MaybeLoc = parseDebugLoc(RemarkField))
 | |
|         TheRemark.Loc = *MaybeLoc;
 | |
|       else
 | |
|         return MaybeLoc.takeError();
 | |
|     } else if (KeyName == "Args") {
 | |
|       auto *Args = dyn_cast<yaml::SequenceNode>(RemarkField.getValue());
 | |
|       if (!Args)
 | |
|         return error("wrong value type for key.", RemarkField);
 | |
| 
 | |
|       for (yaml::Node &Arg : *Args) {
 | |
|         if (Expected<Argument> MaybeArg = parseArg(Arg))
 | |
|           TheRemark.Args.push_back(*MaybeArg);
 | |
|         else
 | |
|           return MaybeArg.takeError();
 | |
|       }
 | |
|     } else {
 | |
|       return error("unknown key.", RemarkField);
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   // Check if any of the mandatory fields are missing.
 | |
|   if (TheRemark.RemarkType == Type::Unknown || TheRemark.PassName.empty() ||
 | |
|       TheRemark.RemarkName.empty() || TheRemark.FunctionName.empty())
 | |
|     return error("Type, Pass, Name or Function missing.",
 | |
|                  *RemarkEntry.getRoot());
 | |
| 
 | |
|   return std::move(Result);
 | |
| }
 | |
| 
 | |
| Expected<Type> YAMLRemarkParser::parseType(yaml::MappingNode &Node) {
 | |
|   auto Type = StringSwitch<remarks::Type>(Node.getRawTag())
 | |
|                   .Case("!Passed", remarks::Type::Passed)
 | |
|                   .Case("!Missed", remarks::Type::Missed)
 | |
|                   .Case("!Analysis", remarks::Type::Analysis)
 | |
|                   .Case("!AnalysisFPCommute", remarks::Type::AnalysisFPCommute)
 | |
|                   .Case("!AnalysisAliasing", remarks::Type::AnalysisAliasing)
 | |
|                   .Case("!Failure", remarks::Type::Failure)
 | |
|                   .Default(remarks::Type::Unknown);
 | |
|   if (Type == remarks::Type::Unknown)
 | |
|     return error("expected a remark tag.", Node);
 | |
|   return Type;
 | |
| }
 | |
| 
 | |
| Expected<StringRef> YAMLRemarkParser::parseKey(yaml::KeyValueNode &Node) {
 | |
|   if (auto *Key = dyn_cast<yaml::ScalarNode>(Node.getKey()))
 | |
|     return Key->getRawValue();
 | |
| 
 | |
|   return error("key is not a string.", Node);
 | |
| }
 | |
| 
 | |
| Expected<StringRef> YAMLRemarkParser::parseStr(yaml::KeyValueNode &Node) {
 | |
|   auto *Value = dyn_cast<yaml::ScalarNode>(Node.getValue());
 | |
|   if (!Value)
 | |
|     return error("expected a value of scalar type.", Node);
 | |
|   StringRef Result = Value->getRawValue();
 | |
| 
 | |
|   if (Result.front() == '\'')
 | |
|     Result = Result.drop_front();
 | |
| 
 | |
|   if (Result.back() == '\'')
 | |
|     Result = Result.drop_back();
 | |
| 
 | |
|   return Result;
 | |
| }
 | |
| 
 | |
| Expected<unsigned> YAMLRemarkParser::parseUnsigned(yaml::KeyValueNode &Node) {
 | |
|   SmallVector<char, 4> Tmp;
 | |
|   auto *Value = dyn_cast<yaml::ScalarNode>(Node.getValue());
 | |
|   if (!Value)
 | |
|     return error("expected a value of scalar type.", Node);
 | |
|   unsigned UnsignedValue = 0;
 | |
|   if (Value->getValue(Tmp).getAsInteger(10, UnsignedValue))
 | |
|     return error("expected a value of integer type.", *Value);
 | |
|   return UnsignedValue;
 | |
| }
 | |
| 
 | |
| Expected<RemarkLocation>
 | |
| YAMLRemarkParser::parseDebugLoc(yaml::KeyValueNode &Node) {
 | |
|   auto *DebugLoc = dyn_cast<yaml::MappingNode>(Node.getValue());
 | |
|   if (!DebugLoc)
 | |
|     return error("expected a value of mapping type.", Node);
 | |
| 
 | |
|   Optional<StringRef> File;
 | |
|   Optional<unsigned> Line;
 | |
|   Optional<unsigned> Column;
 | |
| 
 | |
|   for (yaml::KeyValueNode &DLNode : *DebugLoc) {
 | |
|     Expected<StringRef> MaybeKey = parseKey(DLNode);
 | |
|     if (!MaybeKey)
 | |
|       return MaybeKey.takeError();
 | |
|     StringRef KeyName = *MaybeKey;
 | |
| 
 | |
|     if (KeyName == "File") {
 | |
|       if (Expected<StringRef> MaybeStr = parseStr(DLNode))
 | |
|         File = *MaybeStr;
 | |
|       else
 | |
|         return MaybeStr.takeError();
 | |
|     } else if (KeyName == "Column") {
 | |
|       if (Expected<unsigned> MaybeU = parseUnsigned(DLNode))
 | |
|         Column = *MaybeU;
 | |
|       else
 | |
|         return MaybeU.takeError();
 | |
|     } else if (KeyName == "Line") {
 | |
|       if (Expected<unsigned> MaybeU = parseUnsigned(DLNode))
 | |
|         Line = *MaybeU;
 | |
|       else
 | |
|         return MaybeU.takeError();
 | |
|     } else {
 | |
|       return error("unknown entry in DebugLoc map.", DLNode);
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   // If any of the debug loc fields is missing, return an error.
 | |
|   if (!File || !Line || !Column)
 | |
|     return error("DebugLoc node incomplete.", Node);
 | |
| 
 | |
|   return RemarkLocation{*File, *Line, *Column};
 | |
| }
 | |
| 
 | |
| Expected<Argument> YAMLRemarkParser::parseArg(yaml::Node &Node) {
 | |
|   auto *ArgMap = dyn_cast<yaml::MappingNode>(&Node);
 | |
|   if (!ArgMap)
 | |
|     return error("expected a value of mapping type.", Node);
 | |
| 
 | |
|   Optional<StringRef> KeyStr;
 | |
|   Optional<StringRef> ValueStr;
 | |
|   Optional<RemarkLocation> Loc;
 | |
| 
 | |
|   for (yaml::KeyValueNode &ArgEntry : *ArgMap) {
 | |
|     Expected<StringRef> MaybeKey = parseKey(ArgEntry);
 | |
|     if (!MaybeKey)
 | |
|       return MaybeKey.takeError();
 | |
|     StringRef KeyName = *MaybeKey;
 | |
| 
 | |
|     // Try to parse debug locs.
 | |
|     if (KeyName == "DebugLoc") {
 | |
|       // Can't have multiple DebugLoc entries per argument.
 | |
|       if (Loc)
 | |
|         return error("only one DebugLoc entry is allowed per argument.",
 | |
|                      ArgEntry);
 | |
| 
 | |
|       if (Expected<RemarkLocation> MaybeLoc = parseDebugLoc(ArgEntry)) {
 | |
|         Loc = *MaybeLoc;
 | |
|         continue;
 | |
|       } else
 | |
|         return MaybeLoc.takeError();
 | |
|     }
 | |
| 
 | |
|     // If we already have a string, error out.
 | |
|     if (ValueStr)
 | |
|       return error("only one string entry is allowed per argument.", ArgEntry);
 | |
| 
 | |
|     // Try to parse the value.
 | |
|     if (Expected<StringRef> MaybeStr = parseStr(ArgEntry))
 | |
|       ValueStr = *MaybeStr;
 | |
|     else
 | |
|       return MaybeStr.takeError();
 | |
| 
 | |
|     // Keep the key from the string.
 | |
|     KeyStr = KeyName;
 | |
|   }
 | |
| 
 | |
|   if (!KeyStr)
 | |
|     return error("argument key is missing.", *ArgMap);
 | |
|   if (!ValueStr)
 | |
|     return error("argument value is missing.", *ArgMap);
 | |
| 
 | |
|   return Argument{*KeyStr, *ValueStr, Loc};
 | |
| }
 | |
| 
 | |
| Expected<std::unique_ptr<Remark>> YAMLRemarkParser::next() {
 | |
|   if (YAMLIt == Stream.end())
 | |
|     return make_error<EndOfFileError>();
 | |
| 
 | |
|   Expected<std::unique_ptr<Remark>> MaybeResult = parseRemark(*YAMLIt);
 | |
|   if (!MaybeResult) {
 | |
|     // Avoid garbage input, set the iterator to the end.
 | |
|     YAMLIt = Stream.end();
 | |
|     return MaybeResult.takeError();
 | |
|   }
 | |
| 
 | |
|   ++YAMLIt;
 | |
| 
 | |
|   return std::move(*MaybeResult);
 | |
| }
 | |
| 
 | |
| Expected<StringRef> YAMLStrTabRemarkParser::parseStr(yaml::KeyValueNode &Node) {
 | |
|   auto *Value = dyn_cast<yaml::ScalarNode>(Node.getValue());
 | |
|   if (!Value)
 | |
|     return error("expected a value of scalar type.", Node);
 | |
|   StringRef Result;
 | |
|   // If we have a string table, parse it as an unsigned.
 | |
|   unsigned StrID = 0;
 | |
|   if (Expected<unsigned> MaybeStrID = parseUnsigned(Node))
 | |
|     StrID = *MaybeStrID;
 | |
|   else
 | |
|     return MaybeStrID.takeError();
 | |
| 
 | |
|   if (Expected<StringRef> Str = (*StrTab)[StrID])
 | |
|     Result = *Str;
 | |
|   else
 | |
|     return Str.takeError();
 | |
| 
 | |
|   if (Result.front() == '\'')
 | |
|     Result = Result.drop_front();
 | |
| 
 | |
|   if (Result.back() == '\'')
 | |
|     Result = Result.drop_back();
 | |
| 
 | |
|   return Result;
 | |
| }
 |