1 //===--- CompilationDatabase.cpp - ----------------------------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 //  This file contains implementations of the CompilationDatabase base class
11 //  and the FixedCompilationDatabase.
12 //
13 //===----------------------------------------------------------------------===//
14 
15 #include "clang/Tooling/CompilationDatabase.h"
16 #include "clang/Basic/Diagnostic.h"
17 #include "clang/Basic/DiagnosticOptions.h"
18 #include "clang/Driver/Action.h"
19 #include "clang/Driver/Compilation.h"
20 #include "clang/Driver/Driver.h"
21 #include "clang/Driver/DriverDiagnostic.h"
22 #include "clang/Driver/Job.h"
23 #include "clang/Frontend/TextDiagnosticPrinter.h"
24 #include "clang/Tooling/CompilationDatabasePluginRegistry.h"
25 #include "clang/Tooling/Tooling.h"
26 #include "llvm/ADT/SmallString.h"
27 #include "llvm/Option/Arg.h"
28 #include "llvm/Support/Host.h"
29 #include "llvm/Support/Path.h"
30 #include <sstream>
31 #include <system_error>
32 using namespace clang;
33 using namespace tooling;
34 
35 LLVM_INSTANTIATE_REGISTRY(CompilationDatabasePluginRegistry)
36 
37 CompilationDatabase::~CompilationDatabase() {}
38 
39 std::unique_ptr<CompilationDatabase>
40 CompilationDatabase::loadFromDirectory(StringRef BuildDirectory,
41                                        std::string &ErrorMessage) {
42   std::stringstream ErrorStream;
43   for (CompilationDatabasePluginRegistry::iterator
44        It = CompilationDatabasePluginRegistry::begin(),
45        Ie = CompilationDatabasePluginRegistry::end();
46        It != Ie; ++It) {
47     std::string DatabaseErrorMessage;
48     std::unique_ptr<CompilationDatabasePlugin> Plugin(It->instantiate());
49     if (std::unique_ptr<CompilationDatabase> DB =
50             Plugin->loadFromDirectory(BuildDirectory, DatabaseErrorMessage))
51       return DB;
52     ErrorStream << It->getName() << ": " << DatabaseErrorMessage << "\n";
53   }
54   ErrorMessage = ErrorStream.str();
55   return nullptr;
56 }
57 
58 static std::unique_ptr<CompilationDatabase>
59 findCompilationDatabaseFromDirectory(StringRef Directory,
60                                      std::string &ErrorMessage) {
61   std::stringstream ErrorStream;
62   bool HasErrorMessage = false;
63   while (!Directory.empty()) {
64     std::string LoadErrorMessage;
65 
66     if (std::unique_ptr<CompilationDatabase> DB =
67             CompilationDatabase::loadFromDirectory(Directory, LoadErrorMessage))
68       return DB;
69 
70     if (!HasErrorMessage) {
71       ErrorStream << "No compilation database found in " << Directory.str()
72                   << " or any parent directory\n" << LoadErrorMessage;
73       HasErrorMessage = true;
74     }
75 
76     Directory = llvm::sys::path::parent_path(Directory);
77   }
78   ErrorMessage = ErrorStream.str();
79   return nullptr;
80 }
81 
82 std::unique_ptr<CompilationDatabase>
83 CompilationDatabase::autoDetectFromSource(StringRef SourceFile,
84                                           std::string &ErrorMessage) {
85   SmallString<1024> AbsolutePath(getAbsolutePath(SourceFile));
86   StringRef Directory = llvm::sys::path::parent_path(AbsolutePath);
87 
88   std::unique_ptr<CompilationDatabase> DB =
89       findCompilationDatabaseFromDirectory(Directory, ErrorMessage);
90 
91   if (!DB)
92     ErrorMessage = ("Could not auto-detect compilation database for file \"" +
93                    SourceFile + "\"\n" + ErrorMessage).str();
94   return DB;
95 }
96 
97 std::unique_ptr<CompilationDatabase>
98 CompilationDatabase::autoDetectFromDirectory(StringRef SourceDir,
99                                              std::string &ErrorMessage) {
100   SmallString<1024> AbsolutePath(getAbsolutePath(SourceDir));
101 
102   std::unique_ptr<CompilationDatabase> DB =
103       findCompilationDatabaseFromDirectory(AbsolutePath, ErrorMessage);
104 
105   if (!DB)
106     ErrorMessage = ("Could not auto-detect compilation database from directory \"" +
107                    SourceDir + "\"\n" + ErrorMessage).str();
108   return DB;
109 }
110 
111 CompilationDatabasePlugin::~CompilationDatabasePlugin() {}
112 
113 namespace {
114 // Helper for recursively searching through a chain of actions and collecting
115 // all inputs, direct and indirect, of compile jobs.
116 struct CompileJobAnalyzer {
117   void run(const driver::Action *A) {
118     runImpl(A, false);
119   }
120 
121   SmallVector<std::string, 2> Inputs;
122 
123 private:
124 
125   void runImpl(const driver::Action *A, bool Collect) {
126     bool CollectChildren = Collect;
127     switch (A->getKind()) {
128     case driver::Action::CompileJobClass:
129       CollectChildren = true;
130       break;
131 
132     case driver::Action::InputClass: {
133       if (Collect) {
134         const driver::InputAction *IA = cast<driver::InputAction>(A);
135         Inputs.push_back(IA->getInputArg().getSpelling());
136       }
137     } break;
138 
139     default:
140       // Don't care about others
141       ;
142     }
143 
144     for (const driver::Action *AI : A->inputs())
145       runImpl(AI, CollectChildren);
146   }
147 };
148 
149 // Special DiagnosticConsumer that looks for warn_drv_input_file_unused
150 // diagnostics from the driver and collects the option strings for those unused
151 // options.
152 class UnusedInputDiagConsumer : public DiagnosticConsumer {
153 public:
154   UnusedInputDiagConsumer() : Other(nullptr) {}
155 
156   // Useful for debugging, chain diagnostics to another consumer after
157   // recording for our own purposes.
158   UnusedInputDiagConsumer(DiagnosticConsumer *Other) : Other(Other) {}
159 
160   void HandleDiagnostic(DiagnosticsEngine::Level DiagLevel,
161                         const Diagnostic &Info) override {
162     if (Info.getID() == clang::diag::warn_drv_input_file_unused) {
163       // Arg 1 for this diagnostic is the option that didn't get used.
164       UnusedInputs.push_back(Info.getArgStdStr(0));
165     }
166     if (Other)
167       Other->HandleDiagnostic(DiagLevel, Info);
168   }
169 
170   DiagnosticConsumer *Other;
171   SmallVector<std::string, 2> UnusedInputs;
172 };
173 
174 // Unary functor for asking "Given a StringRef S1, does there exist a string
175 // S2 in Arr where S1 == S2?"
176 struct MatchesAny {
177   MatchesAny(ArrayRef<std::string> Arr) : Arr(Arr) {}
178   bool operator() (StringRef S) {
179     for (const std::string *I = Arr.begin(), *E = Arr.end(); I != E; ++I)
180       if (*I == S)
181         return true;
182     return false;
183   }
184 private:
185   ArrayRef<std::string> Arr;
186 };
187 } // namespace
188 
189 /// \brief Strips any positional args and possible argv[0] from a command-line
190 /// provided by the user to construct a FixedCompilationDatabase.
191 ///
192 /// FixedCompilationDatabase requires a command line to be in this format as it
193 /// constructs the command line for each file by appending the name of the file
194 /// to be compiled. FixedCompilationDatabase also adds its own argv[0] to the
195 /// start of the command line although its value is not important as it's just
196 /// ignored by the Driver invoked by the ClangTool using the
197 /// FixedCompilationDatabase.
198 ///
199 /// FIXME: This functionality should probably be made available by
200 /// clang::driver::Driver although what the interface should look like is not
201 /// clear.
202 ///
203 /// \param[in] Args Args as provided by the user.
204 /// \return Resulting stripped command line.
205 ///          \li true if successful.
206 ///          \li false if \c Args cannot be used for compilation jobs (e.g.
207 ///          contains an option like -E or -version).
208 static bool stripPositionalArgs(std::vector<const char *> Args,
209                                 std::vector<std::string> &Result) {
210   IntrusiveRefCntPtr<DiagnosticOptions> DiagOpts = new DiagnosticOptions();
211   UnusedInputDiagConsumer DiagClient;
212   DiagnosticsEngine Diagnostics(
213       IntrusiveRefCntPtr<clang::DiagnosticIDs>(new DiagnosticIDs()),
214       &*DiagOpts, &DiagClient, false);
215 
216   // The clang executable path isn't required since the jobs the driver builds
217   // will not be executed.
218   std::unique_ptr<driver::Driver> NewDriver(new driver::Driver(
219       /* ClangExecutable= */ "", llvm::sys::getDefaultTargetTriple(),
220       Diagnostics));
221   NewDriver->setCheckInputsExist(false);
222 
223   // This becomes the new argv[0]. The value is actually not important as it
224   // isn't used for invoking Tools.
225   Args.insert(Args.begin(), "clang-tool");
226 
227   // By adding -c, we force the driver to treat compilation as the last phase.
228   // It will then issue warnings via Diagnostics about un-used options that
229   // would have been used for linking. If the user provided a compiler name as
230   // the original argv[0], this will be treated as a linker input thanks to
231   // insertng a new argv[0] above. All un-used options get collected by
232   // UnusedInputdiagConsumer and get stripped out later.
233   Args.push_back("-c");
234 
235   // Put a dummy C++ file on to ensure there's at least one compile job for the
236   // driver to construct. If the user specified some other argument that
237   // prevents compilation, e.g. -E or something like -version, we may still end
238   // up with no jobs but then this is the user's fault.
239   Args.push_back("placeholder.cpp");
240 
241   // Remove -no-integrated-as; it's not used for syntax checking,
242   // and it confuses targets which don't support this option.
243   Args.erase(std::remove_if(Args.begin(), Args.end(),
244                             MatchesAny(std::string("-no-integrated-as"))),
245              Args.end());
246 
247   const std::unique_ptr<driver::Compilation> Compilation(
248       NewDriver->BuildCompilation(Args));
249 
250   const driver::JobList &Jobs = Compilation->getJobs();
251 
252   CompileJobAnalyzer CompileAnalyzer;
253 
254   for (const auto &Cmd : Jobs) {
255     // Collect only for Assemble jobs. If we do all jobs we get duplicates
256     // since Link jobs point to Assemble jobs as inputs.
257     if (Cmd.getSource().getKind() == driver::Action::AssembleJobClass)
258       CompileAnalyzer.run(&Cmd.getSource());
259   }
260 
261   if (CompileAnalyzer.Inputs.empty()) {
262     // No compile jobs found.
263     // FIXME: Emit a warning of some kind?
264     return false;
265   }
266 
267   // Remove all compilation input files from the command line. This is
268   // necessary so that getCompileCommands() can construct a command line for
269   // each file.
270   std::vector<const char *>::iterator End = std::remove_if(
271       Args.begin(), Args.end(), MatchesAny(CompileAnalyzer.Inputs));
272 
273   // Remove all inputs deemed unused for compilation.
274   End = std::remove_if(Args.begin(), End, MatchesAny(DiagClient.UnusedInputs));
275 
276   // Remove the -c add above as well. It will be at the end right now.
277   assert(strcmp(*(End - 1), "-c") == 0);
278   --End;
279 
280   Result = std::vector<std::string>(Args.begin() + 1, End);
281   return true;
282 }
283 
284 FixedCompilationDatabase *FixedCompilationDatabase::loadFromCommandLine(
285     int &Argc, const char *const *Argv, Twine Directory) {
286   const char *const *DoubleDash = std::find(Argv, Argv + Argc, StringRef("--"));
287   if (DoubleDash == Argv + Argc)
288     return nullptr;
289   std::vector<const char *> CommandLine(DoubleDash + 1, Argv + Argc);
290   Argc = DoubleDash - Argv;
291 
292   std::vector<std::string> StrippedArgs;
293   if (!stripPositionalArgs(CommandLine, StrippedArgs))
294     return nullptr;
295   return new FixedCompilationDatabase(Directory, StrippedArgs);
296 }
297 
298 FixedCompilationDatabase::
299 FixedCompilationDatabase(Twine Directory, ArrayRef<std::string> CommandLine) {
300   std::vector<std::string> ToolCommandLine(1, "clang-tool");
301   ToolCommandLine.insert(ToolCommandLine.end(),
302                          CommandLine.begin(), CommandLine.end());
303   CompileCommands.emplace_back(Directory, StringRef(),
304                                std::move(ToolCommandLine));
305 }
306 
307 std::vector<CompileCommand>
308 FixedCompilationDatabase::getCompileCommands(StringRef FilePath) const {
309   std::vector<CompileCommand> Result(CompileCommands);
310   Result[0].CommandLine.push_back(FilePath);
311   Result[0].Filename = FilePath;
312   return Result;
313 }
314 
315 std::vector<std::string>
316 FixedCompilationDatabase::getAllFiles() const {
317   return std::vector<std::string>();
318 }
319 
320 std::vector<CompileCommand>
321 FixedCompilationDatabase::getAllCompileCommands() const {
322   return std::vector<CompileCommand>();
323 }
324 
namespace clang {
namespace tooling {

// This anchor is used to force the linker to link in the generated object file
// and thus register the JSONCompilationDatabasePlugin.
//
// JSONAnchorSource is only declared here; its definition is not in this file
// (presumably it lives with the JSON compilation database implementation --
// TODO confirm).
extern volatile int JSONAnchorSource;
// Reading JSONAnchorSource in this initializer is what creates the reference
// to that symbol. JSONAnchorDest itself is never read, hence
// LLVM_ATTRIBUTE_UNUSED.
static int LLVM_ATTRIBUTE_UNUSED JSONAnchorDest = JSONAnchorSource;

} // end namespace tooling
} // end namespace clang
335