//===- JSONCompilationDatabase.cpp ----------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
//  This file contains the implementation of the JSONCompilationDatabase.
//
//===----------------------------------------------------------------------===//
120b57cec5SDimitry Andric
130b57cec5SDimitry Andric #include "clang/Tooling/JSONCompilationDatabase.h"
140b57cec5SDimitry Andric #include "clang/Basic/LLVM.h"
150b57cec5SDimitry Andric #include "clang/Tooling/CompilationDatabase.h"
160b57cec5SDimitry Andric #include "clang/Tooling/CompilationDatabasePluginRegistry.h"
170b57cec5SDimitry Andric #include "clang/Tooling/Tooling.h"
180b57cec5SDimitry Andric #include "llvm/ADT/STLExtras.h"
190b57cec5SDimitry Andric #include "llvm/ADT/SmallString.h"
200b57cec5SDimitry Andric #include "llvm/ADT/SmallVector.h"
210b57cec5SDimitry Andric #include "llvm/ADT/StringRef.h"
220b57cec5SDimitry Andric #include "llvm/Support/Allocator.h"
230b57cec5SDimitry Andric #include "llvm/Support/Casting.h"
240b57cec5SDimitry Andric #include "llvm/Support/CommandLine.h"
250b57cec5SDimitry Andric #include "llvm/Support/ErrorOr.h"
260b57cec5SDimitry Andric #include "llvm/Support/MemoryBuffer.h"
270b57cec5SDimitry Andric #include "llvm/Support/Path.h"
280b57cec5SDimitry Andric #include "llvm/Support/StringSaver.h"
29480093f4SDimitry Andric #include "llvm/Support/VirtualFileSystem.h"
300b57cec5SDimitry Andric #include "llvm/Support/YAMLParser.h"
310b57cec5SDimitry Andric #include "llvm/Support/raw_ostream.h"
32*fe013be4SDimitry Andric #include "llvm/TargetParser/Host.h"
33*fe013be4SDimitry Andric #include "llvm/TargetParser/Triple.h"
340b57cec5SDimitry Andric #include <cassert>
350b57cec5SDimitry Andric #include <memory>
36bdd1243dSDimitry Andric #include <optional>
370b57cec5SDimitry Andric #include <string>
380b57cec5SDimitry Andric #include <system_error>
390b57cec5SDimitry Andric #include <tuple>
400b57cec5SDimitry Andric #include <utility>
410b57cec5SDimitry Andric #include <vector>
420b57cec5SDimitry Andric
430b57cec5SDimitry Andric using namespace clang;
440b57cec5SDimitry Andric using namespace tooling;
450b57cec5SDimitry Andric
460b57cec5SDimitry Andric namespace {
470b57cec5SDimitry Andric
480b57cec5SDimitry Andric /// A parser for escaped strings of command line arguments.
490b57cec5SDimitry Andric ///
500b57cec5SDimitry Andric /// Assumes \-escaping for quoted arguments (see the documentation of
510b57cec5SDimitry Andric /// unescapeCommandLine(...)).
520b57cec5SDimitry Andric class CommandLineArgumentParser {
530b57cec5SDimitry Andric public:
CommandLineArgumentParser(StringRef CommandLine)540b57cec5SDimitry Andric CommandLineArgumentParser(StringRef CommandLine)
550b57cec5SDimitry Andric : Input(CommandLine), Position(Input.begin()-1) {}
560b57cec5SDimitry Andric
parse()570b57cec5SDimitry Andric std::vector<std::string> parse() {
580b57cec5SDimitry Andric bool HasMoreInput = true;
590b57cec5SDimitry Andric while (HasMoreInput && nextNonWhitespace()) {
600b57cec5SDimitry Andric std::string Argument;
610b57cec5SDimitry Andric HasMoreInput = parseStringInto(Argument);
620b57cec5SDimitry Andric CommandLine.push_back(Argument);
630b57cec5SDimitry Andric }
640b57cec5SDimitry Andric return CommandLine;
650b57cec5SDimitry Andric }
660b57cec5SDimitry Andric
670b57cec5SDimitry Andric private:
680b57cec5SDimitry Andric // All private methods return true if there is more input available.
690b57cec5SDimitry Andric
parseStringInto(std::string & String)700b57cec5SDimitry Andric bool parseStringInto(std::string &String) {
710b57cec5SDimitry Andric do {
720b57cec5SDimitry Andric if (*Position == '"') {
730b57cec5SDimitry Andric if (!parseDoubleQuotedStringInto(String)) return false;
740b57cec5SDimitry Andric } else if (*Position == '\'') {
750b57cec5SDimitry Andric if (!parseSingleQuotedStringInto(String)) return false;
760b57cec5SDimitry Andric } else {
770b57cec5SDimitry Andric if (!parseFreeStringInto(String)) return false;
780b57cec5SDimitry Andric }
790b57cec5SDimitry Andric } while (*Position != ' ');
800b57cec5SDimitry Andric return true;
810b57cec5SDimitry Andric }
820b57cec5SDimitry Andric
parseDoubleQuotedStringInto(std::string & String)830b57cec5SDimitry Andric bool parseDoubleQuotedStringInto(std::string &String) {
840b57cec5SDimitry Andric if (!next()) return false;
850b57cec5SDimitry Andric while (*Position != '"') {
860b57cec5SDimitry Andric if (!skipEscapeCharacter()) return false;
870b57cec5SDimitry Andric String.push_back(*Position);
880b57cec5SDimitry Andric if (!next()) return false;
890b57cec5SDimitry Andric }
900b57cec5SDimitry Andric return next();
910b57cec5SDimitry Andric }
920b57cec5SDimitry Andric
parseSingleQuotedStringInto(std::string & String)930b57cec5SDimitry Andric bool parseSingleQuotedStringInto(std::string &String) {
940b57cec5SDimitry Andric if (!next()) return false;
950b57cec5SDimitry Andric while (*Position != '\'') {
960b57cec5SDimitry Andric String.push_back(*Position);
970b57cec5SDimitry Andric if (!next()) return false;
980b57cec5SDimitry Andric }
990b57cec5SDimitry Andric return next();
1000b57cec5SDimitry Andric }
1010b57cec5SDimitry Andric
parseFreeStringInto(std::string & String)1020b57cec5SDimitry Andric bool parseFreeStringInto(std::string &String) {
1030b57cec5SDimitry Andric do {
1040b57cec5SDimitry Andric if (!skipEscapeCharacter()) return false;
1050b57cec5SDimitry Andric String.push_back(*Position);
1060b57cec5SDimitry Andric if (!next()) return false;
1070b57cec5SDimitry Andric } while (*Position != ' ' && *Position != '"' && *Position != '\'');
1080b57cec5SDimitry Andric return true;
1090b57cec5SDimitry Andric }
1100b57cec5SDimitry Andric
skipEscapeCharacter()1110b57cec5SDimitry Andric bool skipEscapeCharacter() {
1120b57cec5SDimitry Andric if (*Position == '\\') {
1130b57cec5SDimitry Andric return next();
1140b57cec5SDimitry Andric }
1150b57cec5SDimitry Andric return true;
1160b57cec5SDimitry Andric }
1170b57cec5SDimitry Andric
nextNonWhitespace()1180b57cec5SDimitry Andric bool nextNonWhitespace() {
1190b57cec5SDimitry Andric do {
1200b57cec5SDimitry Andric if (!next()) return false;
1210b57cec5SDimitry Andric } while (*Position == ' ');
1220b57cec5SDimitry Andric return true;
1230b57cec5SDimitry Andric }
1240b57cec5SDimitry Andric
next()1250b57cec5SDimitry Andric bool next() {
1260b57cec5SDimitry Andric ++Position;
1270b57cec5SDimitry Andric return Position != Input.end();
1280b57cec5SDimitry Andric }
1290b57cec5SDimitry Andric
1300b57cec5SDimitry Andric const StringRef Input;
1310b57cec5SDimitry Andric StringRef::iterator Position;
1320b57cec5SDimitry Andric std::vector<std::string> CommandLine;
1330b57cec5SDimitry Andric };
1340b57cec5SDimitry Andric
unescapeCommandLine(JSONCommandLineSyntax Syntax,StringRef EscapedCommandLine)1350b57cec5SDimitry Andric std::vector<std::string> unescapeCommandLine(JSONCommandLineSyntax Syntax,
1360b57cec5SDimitry Andric StringRef EscapedCommandLine) {
1370b57cec5SDimitry Andric if (Syntax == JSONCommandLineSyntax::AutoDetect) {
138349cc55cSDimitry Andric #ifdef _WIN32
139349cc55cSDimitry Andric // Assume Windows command line parsing on Win32
1400b57cec5SDimitry Andric Syntax = JSONCommandLineSyntax::Windows;
141349cc55cSDimitry Andric #else
142349cc55cSDimitry Andric Syntax = JSONCommandLineSyntax::Gnu;
143349cc55cSDimitry Andric #endif
1440b57cec5SDimitry Andric }
1450b57cec5SDimitry Andric
1460b57cec5SDimitry Andric if (Syntax == JSONCommandLineSyntax::Windows) {
1470b57cec5SDimitry Andric llvm::BumpPtrAllocator Alloc;
1480b57cec5SDimitry Andric llvm::StringSaver Saver(Alloc);
1490b57cec5SDimitry Andric llvm::SmallVector<const char *, 64> T;
1500b57cec5SDimitry Andric llvm::cl::TokenizeWindowsCommandLine(EscapedCommandLine, Saver, T);
1510b57cec5SDimitry Andric std::vector<std::string> Result(T.begin(), T.end());
1520b57cec5SDimitry Andric return Result;
1530b57cec5SDimitry Andric }
1540b57cec5SDimitry Andric assert(Syntax == JSONCommandLineSyntax::Gnu);
1550b57cec5SDimitry Andric CommandLineArgumentParser parser(EscapedCommandLine);
1560b57cec5SDimitry Andric return parser.parse();
1570b57cec5SDimitry Andric }
1580b57cec5SDimitry Andric
1590b57cec5SDimitry Andric // This plugin locates a nearby compile_command.json file, and also infers
1600b57cec5SDimitry Andric // compile commands for files not present in the database.
1610b57cec5SDimitry Andric class JSONCompilationDatabasePlugin : public CompilationDatabasePlugin {
1620b57cec5SDimitry Andric std::unique_ptr<CompilationDatabase>
loadFromDirectory(StringRef Directory,std::string & ErrorMessage)1630b57cec5SDimitry Andric loadFromDirectory(StringRef Directory, std::string &ErrorMessage) override {
1640b57cec5SDimitry Andric SmallString<1024> JSONDatabasePath(Directory);
1650b57cec5SDimitry Andric llvm::sys::path::append(JSONDatabasePath, "compile_commands.json");
1660b57cec5SDimitry Andric auto Base = JSONCompilationDatabase::loadFromFile(
1670b57cec5SDimitry Andric JSONDatabasePath, ErrorMessage, JSONCommandLineSyntax::AutoDetect);
1680b57cec5SDimitry Andric return Base ? inferTargetAndDriverMode(
169480093f4SDimitry Andric inferMissingCompileCommands(expandResponseFiles(
170480093f4SDimitry Andric std::move(Base), llvm::vfs::getRealFileSystem())))
1710b57cec5SDimitry Andric : nullptr;
1720b57cec5SDimitry Andric }
1730b57cec5SDimitry Andric };
1740b57cec5SDimitry Andric
1750b57cec5SDimitry Andric } // namespace
1760b57cec5SDimitry Andric
1770b57cec5SDimitry Andric // Register the JSONCompilationDatabasePlugin with the
1780b57cec5SDimitry Andric // CompilationDatabasePluginRegistry using this statically initialized variable.
1790b57cec5SDimitry Andric static CompilationDatabasePluginRegistry::Add<JSONCompilationDatabasePlugin>
1800b57cec5SDimitry Andric X("json-compilation-database", "Reads JSON formatted compilation databases");
1810b57cec5SDimitry Andric
namespace clang::tooling {

// This anchor is used to force the linker to link in the generated object file
// and thus register the JSONCompilationDatabasePlugin.
volatile int JSONAnchorSource = 0;

} // namespace clang::tooling
1910b57cec5SDimitry Andric
1920b57cec5SDimitry Andric std::unique_ptr<JSONCompilationDatabase>
loadFromFile(StringRef FilePath,std::string & ErrorMessage,JSONCommandLineSyntax Syntax)1930b57cec5SDimitry Andric JSONCompilationDatabase::loadFromFile(StringRef FilePath,
1940b57cec5SDimitry Andric std::string &ErrorMessage,
1950b57cec5SDimitry Andric JSONCommandLineSyntax Syntax) {
1960b57cec5SDimitry Andric // Don't mmap: if we're a long-lived process, the build system may overwrite.
1970b57cec5SDimitry Andric llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> DatabaseBuffer =
198fe6060f1SDimitry Andric llvm::MemoryBuffer::getFile(FilePath, /*IsText=*/false,
1990b57cec5SDimitry Andric /*RequiresNullTerminator=*/true,
2000b57cec5SDimitry Andric /*IsVolatile=*/true);
2010b57cec5SDimitry Andric if (std::error_code Result = DatabaseBuffer.getError()) {
2020b57cec5SDimitry Andric ErrorMessage = "Error while opening JSON database: " + Result.message();
2030b57cec5SDimitry Andric return nullptr;
2040b57cec5SDimitry Andric }
2050b57cec5SDimitry Andric std::unique_ptr<JSONCompilationDatabase> Database(
2060b57cec5SDimitry Andric new JSONCompilationDatabase(std::move(*DatabaseBuffer), Syntax));
2070b57cec5SDimitry Andric if (!Database->parse(ErrorMessage))
2080b57cec5SDimitry Andric return nullptr;
2090b57cec5SDimitry Andric return Database;
2100b57cec5SDimitry Andric }
2110b57cec5SDimitry Andric
2120b57cec5SDimitry Andric std::unique_ptr<JSONCompilationDatabase>
loadFromBuffer(StringRef DatabaseString,std::string & ErrorMessage,JSONCommandLineSyntax Syntax)2130b57cec5SDimitry Andric JSONCompilationDatabase::loadFromBuffer(StringRef DatabaseString,
2140b57cec5SDimitry Andric std::string &ErrorMessage,
2150b57cec5SDimitry Andric JSONCommandLineSyntax Syntax) {
2160b57cec5SDimitry Andric std::unique_ptr<llvm::MemoryBuffer> DatabaseBuffer(
217e8d8bef9SDimitry Andric llvm::MemoryBuffer::getMemBufferCopy(DatabaseString));
2180b57cec5SDimitry Andric std::unique_ptr<JSONCompilationDatabase> Database(
2190b57cec5SDimitry Andric new JSONCompilationDatabase(std::move(DatabaseBuffer), Syntax));
2200b57cec5SDimitry Andric if (!Database->parse(ErrorMessage))
2210b57cec5SDimitry Andric return nullptr;
2220b57cec5SDimitry Andric return Database;
2230b57cec5SDimitry Andric }
2240b57cec5SDimitry Andric
2250b57cec5SDimitry Andric std::vector<CompileCommand>
getCompileCommands(StringRef FilePath) const2260b57cec5SDimitry Andric JSONCompilationDatabase::getCompileCommands(StringRef FilePath) const {
2270b57cec5SDimitry Andric SmallString<128> NativeFilePath;
2280b57cec5SDimitry Andric llvm::sys::path::native(FilePath, NativeFilePath);
2290b57cec5SDimitry Andric
2300b57cec5SDimitry Andric std::string Error;
2310b57cec5SDimitry Andric llvm::raw_string_ostream ES(Error);
2320b57cec5SDimitry Andric StringRef Match = MatchTrie.findEquivalent(NativeFilePath, ES);
2330b57cec5SDimitry Andric if (Match.empty())
2340b57cec5SDimitry Andric return {};
2350b57cec5SDimitry Andric const auto CommandsRefI = IndexByFile.find(Match);
2360b57cec5SDimitry Andric if (CommandsRefI == IndexByFile.end())
2370b57cec5SDimitry Andric return {};
2380b57cec5SDimitry Andric std::vector<CompileCommand> Commands;
2390b57cec5SDimitry Andric getCommands(CommandsRefI->getValue(), Commands);
2400b57cec5SDimitry Andric return Commands;
2410b57cec5SDimitry Andric }
2420b57cec5SDimitry Andric
2430b57cec5SDimitry Andric std::vector<std::string>
getAllFiles() const2440b57cec5SDimitry Andric JSONCompilationDatabase::getAllFiles() const {
2450b57cec5SDimitry Andric std::vector<std::string> Result;
2460b57cec5SDimitry Andric for (const auto &CommandRef : IndexByFile)
2470b57cec5SDimitry Andric Result.push_back(CommandRef.first().str());
2480b57cec5SDimitry Andric return Result;
2490b57cec5SDimitry Andric }
2500b57cec5SDimitry Andric
2510b57cec5SDimitry Andric std::vector<CompileCommand>
getAllCompileCommands() const2520b57cec5SDimitry Andric JSONCompilationDatabase::getAllCompileCommands() const {
2530b57cec5SDimitry Andric std::vector<CompileCommand> Commands;
2540b57cec5SDimitry Andric getCommands(AllCommands, Commands);
2550b57cec5SDimitry Andric return Commands;
2560b57cec5SDimitry Andric }
2570b57cec5SDimitry Andric
stripExecutableExtension(llvm::StringRef Name)2580b57cec5SDimitry Andric static llvm::StringRef stripExecutableExtension(llvm::StringRef Name) {
2590b57cec5SDimitry Andric Name.consume_back(".exe");
2600b57cec5SDimitry Andric return Name;
2610b57cec5SDimitry Andric }
2620b57cec5SDimitry Andric
2630b57cec5SDimitry Andric // There are compiler-wrappers (ccache, distcc, gomacc) that take the "real"
2640b57cec5SDimitry Andric // compiler as an argument, e.g. distcc gcc -O3 foo.c.
2650b57cec5SDimitry Andric // These end up in compile_commands.json when people set CC="distcc gcc".
2660b57cec5SDimitry Andric // Clang's driver doesn't understand this, so we need to unwrap.
unwrapCommand(std::vector<std::string> & Args)2670b57cec5SDimitry Andric static bool unwrapCommand(std::vector<std::string> &Args) {
2680b57cec5SDimitry Andric if (Args.size() < 2)
2690b57cec5SDimitry Andric return false;
2700b57cec5SDimitry Andric StringRef Wrapper =
2710b57cec5SDimitry Andric stripExecutableExtension(llvm::sys::path::filename(Args.front()));
272e8d8bef9SDimitry Andric if (Wrapper == "distcc" || Wrapper == "gomacc" || Wrapper == "ccache" ||
273e8d8bef9SDimitry Andric Wrapper == "sccache") {
2740b57cec5SDimitry Andric // Most of these wrappers support being invoked 3 ways:
2750b57cec5SDimitry Andric // `distcc g++ file.c` This is the mode we're trying to match.
2760b57cec5SDimitry Andric // We need to drop `distcc`.
2770b57cec5SDimitry Andric // `distcc file.c` This acts like compiler is cc or similar.
2780b57cec5SDimitry Andric // Clang's driver can handle this, no change needed.
2790b57cec5SDimitry Andric // `g++ file.c` g++ is a symlink to distcc.
2800b57cec5SDimitry Andric // We don't even notice this case, and all is well.
2810b57cec5SDimitry Andric //
2820b57cec5SDimitry Andric // We need to distinguish between the first and second case.
2830b57cec5SDimitry Andric // The wrappers themselves don't take flags, so Args[1] is a compiler flag,
2840b57cec5SDimitry Andric // an input file, or a compiler. Inputs have extensions, compilers don't.
2850b57cec5SDimitry Andric bool HasCompiler =
2860b57cec5SDimitry Andric (Args[1][0] != '-') &&
2870b57cec5SDimitry Andric !llvm::sys::path::has_extension(stripExecutableExtension(Args[1]));
2880b57cec5SDimitry Andric if (HasCompiler) {
2890b57cec5SDimitry Andric Args.erase(Args.begin());
2900b57cec5SDimitry Andric return true;
2910b57cec5SDimitry Andric }
2920b57cec5SDimitry Andric // If !HasCompiler, wrappers act like GCC. Fine: so do we.
2930b57cec5SDimitry Andric }
2940b57cec5SDimitry Andric return false;
2950b57cec5SDimitry Andric }
2960b57cec5SDimitry Andric
2970b57cec5SDimitry Andric static std::vector<std::string>
nodeToCommandLine(JSONCommandLineSyntax Syntax,const std::vector<llvm::yaml::ScalarNode * > & Nodes)2980b57cec5SDimitry Andric nodeToCommandLine(JSONCommandLineSyntax Syntax,
2990b57cec5SDimitry Andric const std::vector<llvm::yaml::ScalarNode *> &Nodes) {
3000b57cec5SDimitry Andric SmallString<1024> Storage;
3010b57cec5SDimitry Andric std::vector<std::string> Arguments;
3020b57cec5SDimitry Andric if (Nodes.size() == 1)
3030b57cec5SDimitry Andric Arguments = unescapeCommandLine(Syntax, Nodes[0]->getValue(Storage));
3040b57cec5SDimitry Andric else
3050b57cec5SDimitry Andric for (const auto *Node : Nodes)
3065ffd83dbSDimitry Andric Arguments.push_back(std::string(Node->getValue(Storage)));
3070b57cec5SDimitry Andric // There may be multiple wrappers: using distcc and ccache together is common.
3080b57cec5SDimitry Andric while (unwrapCommand(Arguments))
3090b57cec5SDimitry Andric ;
3100b57cec5SDimitry Andric return Arguments;
3110b57cec5SDimitry Andric }
3120b57cec5SDimitry Andric
getCommands(ArrayRef<CompileCommandRef> CommandsRef,std::vector<CompileCommand> & Commands) const3130b57cec5SDimitry Andric void JSONCompilationDatabase::getCommands(
3140b57cec5SDimitry Andric ArrayRef<CompileCommandRef> CommandsRef,
3150b57cec5SDimitry Andric std::vector<CompileCommand> &Commands) const {
3160b57cec5SDimitry Andric for (const auto &CommandRef : CommandsRef) {
3170b57cec5SDimitry Andric SmallString<8> DirectoryStorage;
3180b57cec5SDimitry Andric SmallString<32> FilenameStorage;
3190b57cec5SDimitry Andric SmallString<32> OutputStorage;
3200b57cec5SDimitry Andric auto Output = std::get<3>(CommandRef);
3210b57cec5SDimitry Andric Commands.emplace_back(
3220b57cec5SDimitry Andric std::get<0>(CommandRef)->getValue(DirectoryStorage),
3230b57cec5SDimitry Andric std::get<1>(CommandRef)->getValue(FilenameStorage),
3240b57cec5SDimitry Andric nodeToCommandLine(Syntax, std::get<2>(CommandRef)),
3250b57cec5SDimitry Andric Output ? Output->getValue(OutputStorage) : "");
3260b57cec5SDimitry Andric }
3270b57cec5SDimitry Andric }
3280b57cec5SDimitry Andric
parse(std::string & ErrorMessage)3290b57cec5SDimitry Andric bool JSONCompilationDatabase::parse(std::string &ErrorMessage) {
3300b57cec5SDimitry Andric llvm::yaml::document_iterator I = YAMLStream.begin();
3310b57cec5SDimitry Andric if (I == YAMLStream.end()) {
3320b57cec5SDimitry Andric ErrorMessage = "Error while parsing YAML.";
3330b57cec5SDimitry Andric return false;
3340b57cec5SDimitry Andric }
3350b57cec5SDimitry Andric llvm::yaml::Node *Root = I->getRoot();
3360b57cec5SDimitry Andric if (!Root) {
3370b57cec5SDimitry Andric ErrorMessage = "Error while parsing YAML.";
3380b57cec5SDimitry Andric return false;
3390b57cec5SDimitry Andric }
3400b57cec5SDimitry Andric auto *Array = dyn_cast<llvm::yaml::SequenceNode>(Root);
3410b57cec5SDimitry Andric if (!Array) {
3420b57cec5SDimitry Andric ErrorMessage = "Expected array.";
3430b57cec5SDimitry Andric return false;
3440b57cec5SDimitry Andric }
3450b57cec5SDimitry Andric for (auto &NextObject : *Array) {
3460b57cec5SDimitry Andric auto *Object = dyn_cast<llvm::yaml::MappingNode>(&NextObject);
3470b57cec5SDimitry Andric if (!Object) {
3480b57cec5SDimitry Andric ErrorMessage = "Expected object.";
3490b57cec5SDimitry Andric return false;
3500b57cec5SDimitry Andric }
3510b57cec5SDimitry Andric llvm::yaml::ScalarNode *Directory = nullptr;
352bdd1243dSDimitry Andric std::optional<std::vector<llvm::yaml::ScalarNode *>> Command;
3530b57cec5SDimitry Andric llvm::yaml::ScalarNode *File = nullptr;
3540b57cec5SDimitry Andric llvm::yaml::ScalarNode *Output = nullptr;
3550b57cec5SDimitry Andric for (auto& NextKeyValue : *Object) {
3560b57cec5SDimitry Andric auto *KeyString = dyn_cast<llvm::yaml::ScalarNode>(NextKeyValue.getKey());
3570b57cec5SDimitry Andric if (!KeyString) {
3580b57cec5SDimitry Andric ErrorMessage = "Expected strings as key.";
3590b57cec5SDimitry Andric return false;
3600b57cec5SDimitry Andric }
3610b57cec5SDimitry Andric SmallString<10> KeyStorage;
3620b57cec5SDimitry Andric StringRef KeyValue = KeyString->getValue(KeyStorage);
3630b57cec5SDimitry Andric llvm::yaml::Node *Value = NextKeyValue.getValue();
3640b57cec5SDimitry Andric if (!Value) {
3650b57cec5SDimitry Andric ErrorMessage = "Expected value.";
3660b57cec5SDimitry Andric return false;
3670b57cec5SDimitry Andric }
3680b57cec5SDimitry Andric auto *ValueString = dyn_cast<llvm::yaml::ScalarNode>(Value);
3690b57cec5SDimitry Andric auto *SequenceString = dyn_cast<llvm::yaml::SequenceNode>(Value);
370e8d8bef9SDimitry Andric if (KeyValue == "arguments") {
371e8d8bef9SDimitry Andric if (!SequenceString) {
3720b57cec5SDimitry Andric ErrorMessage = "Expected sequence as value.";
3730b57cec5SDimitry Andric return false;
3740b57cec5SDimitry Andric }
3750b57cec5SDimitry Andric Command = std::vector<llvm::yaml::ScalarNode *>();
3760b57cec5SDimitry Andric for (auto &Argument : *SequenceString) {
3770b57cec5SDimitry Andric auto *Scalar = dyn_cast<llvm::yaml::ScalarNode>(&Argument);
3780b57cec5SDimitry Andric if (!Scalar) {
3790b57cec5SDimitry Andric ErrorMessage = "Only strings are allowed in 'arguments'.";
3800b57cec5SDimitry Andric return false;
3810b57cec5SDimitry Andric }
3820b57cec5SDimitry Andric Command->push_back(Scalar);
3830b57cec5SDimitry Andric }
384e8d8bef9SDimitry Andric } else {
385e8d8bef9SDimitry Andric if (!ValueString) {
386e8d8bef9SDimitry Andric ErrorMessage = "Expected string as value.";
387e8d8bef9SDimitry Andric return false;
388e8d8bef9SDimitry Andric }
389e8d8bef9SDimitry Andric if (KeyValue == "directory") {
390e8d8bef9SDimitry Andric Directory = ValueString;
3910b57cec5SDimitry Andric } else if (KeyValue == "command") {
3920b57cec5SDimitry Andric if (!Command)
3930b57cec5SDimitry Andric Command = std::vector<llvm::yaml::ScalarNode *>(1, ValueString);
3940b57cec5SDimitry Andric } else if (KeyValue == "file") {
3950b57cec5SDimitry Andric File = ValueString;
3960b57cec5SDimitry Andric } else if (KeyValue == "output") {
3970b57cec5SDimitry Andric Output = ValueString;
3980b57cec5SDimitry Andric } else {
399e8d8bef9SDimitry Andric ErrorMessage =
400e8d8bef9SDimitry Andric ("Unknown key: \"" + KeyString->getRawValue() + "\"").str();
4010b57cec5SDimitry Andric return false;
4020b57cec5SDimitry Andric }
4030b57cec5SDimitry Andric }
404e8d8bef9SDimitry Andric }
4050b57cec5SDimitry Andric if (!File) {
4060b57cec5SDimitry Andric ErrorMessage = "Missing key: \"file\".";
4070b57cec5SDimitry Andric return false;
4080b57cec5SDimitry Andric }
4090b57cec5SDimitry Andric if (!Command) {
4100b57cec5SDimitry Andric ErrorMessage = "Missing key: \"command\" or \"arguments\".";
4110b57cec5SDimitry Andric return false;
4120b57cec5SDimitry Andric }
4130b57cec5SDimitry Andric if (!Directory) {
4140b57cec5SDimitry Andric ErrorMessage = "Missing key: \"directory\".";
4150b57cec5SDimitry Andric return false;
4160b57cec5SDimitry Andric }
4170b57cec5SDimitry Andric SmallString<8> FileStorage;
4180b57cec5SDimitry Andric StringRef FileName = File->getValue(FileStorage);
4190b57cec5SDimitry Andric SmallString<128> NativeFilePath;
4200b57cec5SDimitry Andric if (llvm::sys::path::is_relative(FileName)) {
4210b57cec5SDimitry Andric SmallString<8> DirectoryStorage;
422bdd1243dSDimitry Andric SmallString<128> AbsolutePath(Directory->getValue(DirectoryStorage));
4230b57cec5SDimitry Andric llvm::sys::path::append(AbsolutePath, FileName);
4240b57cec5SDimitry Andric llvm::sys::path::native(AbsolutePath, NativeFilePath);
4250b57cec5SDimitry Andric } else {
4260b57cec5SDimitry Andric llvm::sys::path::native(FileName, NativeFilePath);
4270b57cec5SDimitry Andric }
428bdd1243dSDimitry Andric llvm::sys::path::remove_dots(NativeFilePath, /*remove_dot_dot=*/true);
4290b57cec5SDimitry Andric auto Cmd = CompileCommandRef(Directory, File, *Command, Output);
4300b57cec5SDimitry Andric IndexByFile[NativeFilePath].push_back(Cmd);
4310b57cec5SDimitry Andric AllCommands.push_back(Cmd);
4320b57cec5SDimitry Andric MatchTrie.insert(NativeFilePath);
4330b57cec5SDimitry Andric }
4340b57cec5SDimitry Andric return true;
4350b57cec5SDimitry Andric }
436