1 //===-- driver.cpp - Clang GCC-Compatible Driver --------------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This is the entry point to the clang driver; it is a thin wrapper
11 // for functionality in the Driver clang library.
12 //
13 //===----------------------------------------------------------------------===//
14 
15 #include "clang/Basic/DiagnosticOptions.h"
16 #include "clang/Driver/Compilation.h"
17 #include "clang/Driver/Driver.h"
18 #include "clang/Driver/DriverDiagnostic.h"
19 #include "clang/Driver/Options.h"
20 #include "clang/Driver/ToolChain.h"
21 #include "clang/Frontend/ChainedDiagnosticConsumer.h"
22 #include "clang/Frontend/CompilerInvocation.h"
23 #include "clang/Frontend/SerializedDiagnosticPrinter.h"
24 #include "clang/Frontend/TextDiagnosticPrinter.h"
25 #include "clang/Frontend/Utils.h"
26 #include "llvm/ADT/ArrayRef.h"
27 #include "llvm/ADT/SmallString.h"
28 #include "llvm/ADT/SmallVector.h"
29 #include "llvm/Config/llvm-config.h"
30 #include "llvm/Option/ArgList.h"
31 #include "llvm/Option/OptTable.h"
32 #include "llvm/Option/Option.h"
33 #include "llvm/Support/CommandLine.h"
34 #include "llvm/Support/ErrorHandling.h"
35 #include "llvm/Support/FileSystem.h"
36 #include "llvm/Support/Host.h"
37 #include "llvm/Support/ManagedStatic.h"
38 #include "llvm/Support/Path.h"
39 #include "llvm/Support/PrettyStackTrace.h"
40 #include "llvm/Support/Process.h"
41 #include "llvm/Support/Program.h"
42 #include "llvm/Support/Regex.h"
43 #include "llvm/Support/Signals.h"
44 #include "llvm/Support/StringSaver.h"
45 #include "llvm/Support/TargetSelect.h"
46 #include "llvm/Support/Timer.h"
47 #include "llvm/Support/raw_ostream.h"
48 #include <memory>
49 #include <set>
50 #include <system_error>
51 using namespace clang;
52 using namespace clang::driver;
53 using namespace llvm::opt;
54 
55 std::string GetExecutablePath(const char *Argv0, bool CanonicalPrefixes) {
56   if (!CanonicalPrefixes) {
57     SmallString<128> ExecutablePath(Argv0);
58     // Do a PATH lookup if Argv0 isn't a valid path.
59     if (!llvm::sys::fs::exists(ExecutablePath))
60       if (llvm::ErrorOr<std::string> P =
61               llvm::sys::findProgramByName(ExecutablePath))
62         ExecutablePath = *P;
63     return ExecutablePath.str();
64   }
65 
66   // This just needs to be some symbol in the binary; C++ doesn't
67   // allow taking the address of ::main however.
68   void *P = (void*) (intptr_t) GetExecutablePath;
69   return llvm::sys::fs::getMainExecutable(Argv0, P);
70 }
71 
72 static const char *GetStableCStr(std::set<std::string> &SavedStrings,
73                                  StringRef S) {
74   return SavedStrings.insert(S).first->c_str();
75 }
76 
77 /// ApplyQAOverride - Apply a list of edits to the input argument lists.
78 ///
79 /// The input string is a space separate list of edits to perform,
80 /// they are applied in order to the input argument lists. Edits
81 /// should be one of the following forms:
82 ///
83 ///  '#': Silence information about the changes to the command line arguments.
84 ///
85 ///  '^': Add FOO as a new argument at the beginning of the command line.
86 ///
87 ///  '+': Add FOO as a new argument at the end of the command line.
88 ///
89 ///  's/XXX/YYY/': Substitute the regular expression XXX with YYY in the command
90 ///  line.
91 ///
92 ///  'xOPTION': Removes all instances of the literal argument OPTION.
93 ///
94 ///  'XOPTION': Removes all instances of the literal argument OPTION,
95 ///  and the following argument.
96 ///
97 ///  'Ox': Removes all flags matching 'O' or 'O[sz0-9]' and adds 'Ox'
98 ///  at the end of the command line.
99 ///
100 /// \param OS - The stream to write edit information to.
101 /// \param Args - The vector of command line arguments.
102 /// \param Edit - The override command to perform.
103 /// \param SavedStrings - Set to use for storing string representations.
104 static void ApplyOneQAOverride(raw_ostream &OS,
105                                SmallVectorImpl<const char*> &Args,
106                                StringRef Edit,
107                                std::set<std::string> &SavedStrings) {
108   // This does not need to be efficient.
109 
110   if (Edit[0] == '^') {
111     const char *Str =
112       GetStableCStr(SavedStrings, Edit.substr(1));
113     OS << "### Adding argument " << Str << " at beginning\n";
114     Args.insert(Args.begin() + 1, Str);
115   } else if (Edit[0] == '+') {
116     const char *Str =
117       GetStableCStr(SavedStrings, Edit.substr(1));
118     OS << "### Adding argument " << Str << " at end\n";
119     Args.push_back(Str);
120   } else if (Edit[0] == 's' && Edit[1] == '/' && Edit.endswith("/") &&
121              Edit.slice(2, Edit.size()-1).find('/') != StringRef::npos) {
122     StringRef MatchPattern = Edit.substr(2).split('/').first;
123     StringRef ReplPattern = Edit.substr(2).split('/').second;
124     ReplPattern = ReplPattern.slice(0, ReplPattern.size()-1);
125 
126     for (unsigned i = 1, e = Args.size(); i != e; ++i) {
127       // Ignore end-of-line response file markers
128       if (Args[i] == nullptr)
129         continue;
130       std::string Repl = llvm::Regex(MatchPattern).sub(ReplPattern, Args[i]);
131 
132       if (Repl != Args[i]) {
133         OS << "### Replacing '" << Args[i] << "' with '" << Repl << "'\n";
134         Args[i] = GetStableCStr(SavedStrings, Repl);
135       }
136     }
137   } else if (Edit[0] == 'x' || Edit[0] == 'X') {
138     auto Option = Edit.substr(1);
139     for (unsigned i = 1; i < Args.size();) {
140       if (Option == Args[i]) {
141         OS << "### Deleting argument " << Args[i] << '\n';
142         Args.erase(Args.begin() + i);
143         if (Edit[0] == 'X') {
144           if (i < Args.size()) {
145             OS << "### Deleting argument " << Args[i] << '\n';
146             Args.erase(Args.begin() + i);
147           } else
148             OS << "### Invalid X edit, end of command line!\n";
149         }
150       } else
151         ++i;
152     }
153   } else if (Edit[0] == 'O') {
154     for (unsigned i = 1; i < Args.size();) {
155       const char *A = Args[i];
156       // Ignore end-of-line response file markers
157       if (A == nullptr)
158         continue;
159       if (A[0] == '-' && A[1] == 'O' &&
160           (A[2] == '\0' ||
161            (A[3] == '\0' && (A[2] == 's' || A[2] == 'z' ||
162                              ('0' <= A[2] && A[2] <= '9'))))) {
163         OS << "### Deleting argument " << Args[i] << '\n';
164         Args.erase(Args.begin() + i);
165       } else
166         ++i;
167     }
168     OS << "### Adding argument " << Edit << " at end\n";
169     Args.push_back(GetStableCStr(SavedStrings, '-' + Edit.str()));
170   } else {
171     OS << "### Unrecognized edit: " << Edit << "\n";
172   }
173 }
174 
175 /// ApplyQAOverride - Apply a comma separate list of edits to the
176 /// input argument lists. See ApplyOneQAOverride.
177 static void ApplyQAOverride(SmallVectorImpl<const char*> &Args,
178                             const char *OverrideStr,
179                             std::set<std::string> &SavedStrings) {
180   raw_ostream *OS = &llvm::errs();
181 
182   if (OverrideStr[0] == '#') {
183     ++OverrideStr;
184     OS = &llvm::nulls();
185   }
186 
187   *OS << "### CCC_OVERRIDE_OPTIONS: " << OverrideStr << "\n";
188 
189   // This does not need to be efficient.
190 
191   const char *S = OverrideStr;
192   while (*S) {
193     const char *End = ::strchr(S, ' ');
194     if (!End)
195       End = S + strlen(S);
196     if (End != S)
197       ApplyOneQAOverride(*OS, Args, std::string(S, End), SavedStrings);
198     S = End;
199     if (*S != '\0')
200       ++S;
201   }
202 }
203 
204 extern int cc1_main(ArrayRef<const char *> Argv, const char *Argv0,
205                     void *MainAddr);
206 extern int cc1as_main(ArrayRef<const char *> Argv, const char *Argv0,
207                       void *MainAddr);
208 
209 static void insertTargetAndModeArgs(StringRef Target, StringRef Mode,
210                                     SmallVectorImpl<const char *> &ArgVector,
211                                     std::set<std::string> &SavedStrings) {
212   if (!Mode.empty()) {
213     // Add the mode flag to the arguments.
214     auto it = ArgVector.begin();
215     if (it != ArgVector.end())
216       ++it;
217     ArgVector.insert(it, GetStableCStr(SavedStrings, Mode));
218   }
219 
220   if (!Target.empty()) {
221     auto it = ArgVector.begin();
222     if (it != ArgVector.end())
223       ++it;
224     const char *arr[] = {"-target", GetStableCStr(SavedStrings, Target)};
225     ArgVector.insert(it, std::begin(arr), std::end(arr));
226   }
227 }
228 
229 static void getCLEnvVarOptions(std::string &EnvValue, llvm::StringSaver &Saver,
230                                SmallVectorImpl<const char *> &Opts) {
231   llvm::cl::TokenizeWindowsCommandLine(EnvValue, Saver, Opts);
232   // The first instance of '#' should be replaced with '=' in each option.
233   for (const char *Opt : Opts)
234     if (char *NumberSignPtr = const_cast<char *>(::strchr(Opt, '#')))
235       *NumberSignPtr = '=';
236 }
237 
238 static void SetBackdoorDriverOutputsFromEnvVars(Driver &TheDriver) {
239   // Handle CC_PRINT_OPTIONS and CC_PRINT_OPTIONS_FILE.
240   TheDriver.CCPrintOptions = !!::getenv("CC_PRINT_OPTIONS");
241   if (TheDriver.CCPrintOptions)
242     TheDriver.CCPrintOptionsFilename = ::getenv("CC_PRINT_OPTIONS_FILE");
243 
244   // Handle CC_PRINT_HEADERS and CC_PRINT_HEADERS_FILE.
245   TheDriver.CCPrintHeaders = !!::getenv("CC_PRINT_HEADERS");
246   if (TheDriver.CCPrintHeaders)
247     TheDriver.CCPrintHeadersFilename = ::getenv("CC_PRINT_HEADERS_FILE");
248 
249   // Handle CC_LOG_DIAGNOSTICS and CC_LOG_DIAGNOSTICS_FILE.
250   TheDriver.CCLogDiagnostics = !!::getenv("CC_LOG_DIAGNOSTICS");
251   if (TheDriver.CCLogDiagnostics)
252     TheDriver.CCLogDiagnosticsFilename = ::getenv("CC_LOG_DIAGNOSTICS_FILE");
253 }
254 
255 static void FixupDiagPrefixExeName(TextDiagnosticPrinter *DiagClient,
256                                    const std::string &Path) {
257   // If the clang binary happens to be named cl.exe for compatibility reasons,
258   // use clang-cl.exe as the prefix to avoid confusion between clang and MSVC.
259   StringRef ExeBasename(llvm::sys::path::filename(Path));
260   if (ExeBasename.equals_lower("cl.exe"))
261     ExeBasename = "clang-cl.exe";
262   DiagClient->setPrefix(ExeBasename);
263 }
264 
265 // This lets us create the DiagnosticsEngine with a properly-filled-out
266 // DiagnosticOptions instance.
267 static DiagnosticOptions *
268 CreateAndPopulateDiagOpts(ArrayRef<const char *> argv) {
269   auto *DiagOpts = new DiagnosticOptions;
270   std::unique_ptr<OptTable> Opts(createDriverOptTable());
271   unsigned MissingArgIndex, MissingArgCount;
272   InputArgList Args =
273       Opts->ParseArgs(argv.slice(1), MissingArgIndex, MissingArgCount);
274   // We ignore MissingArgCount and the return value of ParseDiagnosticArgs.
275   // Any errors that would be diagnosed here will also be diagnosed later,
276   // when the DiagnosticsEngine actually exists.
277   (void)ParseDiagnosticArgs(*DiagOpts, Args);
278   return DiagOpts;
279 }
280 
281 static void SetInstallDir(SmallVectorImpl<const char *> &argv,
282                           Driver &TheDriver, bool CanonicalPrefixes) {
283   // Attempt to find the original path used to invoke the driver, to determine
284   // the installed path. We do this manually, because we want to support that
285   // path being a symlink.
286   SmallString<128> InstalledPath(argv[0]);
287 
288   // Do a PATH lookup, if there are no directory components.
289   if (llvm::sys::path::filename(InstalledPath) == InstalledPath)
290     if (llvm::ErrorOr<std::string> Tmp = llvm::sys::findProgramByName(
291             llvm::sys::path::filename(InstalledPath.str())))
292       InstalledPath = *Tmp;
293 
294   // FIXME: We don't actually canonicalize this, we just make it absolute.
295   if (CanonicalPrefixes)
296     llvm::sys::fs::make_absolute(InstalledPath);
297 
298   StringRef InstalledPathParent(llvm::sys::path::parent_path(InstalledPath));
299   if (llvm::sys::fs::exists(InstalledPathParent))
300     TheDriver.setInstalledDir(InstalledPathParent);
301 }
302 
303 static int ExecuteCC1Tool(ArrayRef<const char *> argv, StringRef Tool) {
304   void *GetExecutablePathVP = (void *)(intptr_t) GetExecutablePath;
305   if (Tool == "")
306     return cc1_main(argv.slice(2), argv[0], GetExecutablePathVP);
307   if (Tool == "as")
308     return cc1as_main(argv.slice(2), argv[0], GetExecutablePathVP);
309 
310   // Reject unknown tools.
311   llvm::errs() << "error: unknown integrated tool '" << Tool << "'\n";
312   return 1;
313 }
314 
315 int main(int argc_, const char **argv_) {
316   llvm::sys::PrintStackTraceOnErrorSignal(argv_[0]);
317   llvm::PrettyStackTraceProgram X(argc_, argv_);
318   llvm::llvm_shutdown_obj Y; // Call llvm_shutdown() on exit.
319 
320   if (llvm::sys::Process::FixupStandardFileDescriptors())
321     return 1;
322 
323   SmallVector<const char *, 256> argv;
324   llvm::SpecificBumpPtrAllocator<char> ArgAllocator;
325   std::error_code EC = llvm::sys::Process::GetArgumentVector(
326       argv, llvm::makeArrayRef(argv_, argc_), ArgAllocator);
327   if (EC) {
328     llvm::errs() << "error: couldn't get arguments: " << EC.message() << '\n';
329     return 1;
330   }
331 
332   llvm::InitializeAllTargets();
333   std::string ProgName = argv[0];
334   std::pair<std::string, std::string> TargetAndMode =
335       ToolChain::getTargetAndModeFromProgramName(ProgName);
336 
337   llvm::BumpPtrAllocator A;
338   llvm::StringSaver Saver(A);
339 
340   // Parse response files using the GNU syntax, unless we're in CL mode. There
341   // are two ways to put clang in CL compatibility mode: argv[0] is either
342   // clang-cl or cl, or --driver-mode=cl is on the command line. The normal
343   // command line parsing can't happen until after response file parsing, so we
344   // have to manually search for a --driver-mode=cl argument the hard way.
345   // Finally, our -cc1 tools don't care which tokenization mode we use because
346   // response files written by clang will tokenize the same way in either mode.
347   bool ClangCLMode = false;
348   if (TargetAndMode.second == "--driver-mode=cl" ||
349       std::find_if(argv.begin(), argv.end(), [](const char *F) {
350         return F && strcmp(F, "--driver-mode=cl") == 0;
351       }) != argv.end()) {
352     ClangCLMode = true;
353   }
354   enum { Default, POSIX, Windows } RSPQuoting = Default;
355   for (const char *F : argv) {
356     if (strcmp(F, "--rsp-quoting=posix") == 0)
357       RSPQuoting = POSIX;
358     else if (strcmp(F, "--rsp-quoting=windows") == 0)
359       RSPQuoting = Windows;
360   }
361 
362   // Determines whether we want nullptr markers in argv to indicate response
363   // files end-of-lines. We only use this for the /LINK driver argument with
364   // clang-cl.exe on Windows.
365   bool MarkEOLs = ClangCLMode;
366 
367   llvm::cl::TokenizerCallback Tokenizer;
368   if (RSPQuoting == Windows || (RSPQuoting == Default && ClangCLMode))
369     Tokenizer = &llvm::cl::TokenizeWindowsCommandLine;
370   else
371     Tokenizer = &llvm::cl::TokenizeGNUCommandLine;
372 
373   if (MarkEOLs && argv.size() > 1 && StringRef(argv[1]).startswith("-cc1"))
374     MarkEOLs = false;
375   llvm::cl::ExpandResponseFiles(Saver, Tokenizer, argv, MarkEOLs);
376 
377   // Handle -cc1 integrated tools, even if -cc1 was expanded from a response
378   // file.
379   auto FirstArg = std::find_if(argv.begin() + 1, argv.end(),
380                                [](const char *A) { return A != nullptr; });
381   if (FirstArg != argv.end() && StringRef(*FirstArg).startswith("-cc1")) {
382     // If -cc1 came from a response file, remove the EOL sentinels.
383     if (MarkEOLs) {
384       auto newEnd = std::remove(argv.begin(), argv.end(), nullptr);
385       argv.resize(newEnd - argv.begin());
386     }
387     return ExecuteCC1Tool(argv, argv[1] + 4);
388   }
389 
390   bool CanonicalPrefixes = true;
391   for (int i = 1, size = argv.size(); i < size; ++i) {
392     // Skip end-of-line response file markers
393     if (argv[i] == nullptr)
394       continue;
395     if (StringRef(argv[i]) == "-no-canonical-prefixes") {
396       CanonicalPrefixes = false;
397       break;
398     }
399   }
400 
401   // Handle CL and _CL_ which permits additional command line options to be
402   // prepended or appended.
403   if (ClangCLMode) {
404     // Arguments in "CL" are prepended.
405     llvm::Optional<std::string> OptCL = llvm::sys::Process::GetEnv("CL");
406     if (OptCL.hasValue()) {
407       SmallVector<const char *, 8> PrependedOpts;
408       getCLEnvVarOptions(OptCL.getValue(), Saver, PrependedOpts);
409 
410       // Insert right after the program name to prepend to the argument list.
411       argv.insert(argv.begin() + 1, PrependedOpts.begin(), PrependedOpts.end());
412     }
413     // Arguments in "_CL_" are appended.
414     llvm::Optional<std::string> Opt_CL_ = llvm::sys::Process::GetEnv("_CL_");
415     if (Opt_CL_.hasValue()) {
416       SmallVector<const char *, 8> AppendedOpts;
417       getCLEnvVarOptions(Opt_CL_.getValue(), Saver, AppendedOpts);
418 
419       // Insert at the end of the argument list to append.
420       argv.append(AppendedOpts.begin(), AppendedOpts.end());
421     }
422   }
423 
424   std::set<std::string> SavedStrings;
425   // Handle CCC_OVERRIDE_OPTIONS, used for editing a command line behind the
426   // scenes.
427   if (const char *OverrideStr = ::getenv("CCC_OVERRIDE_OPTIONS")) {
428     // FIXME: Driver shouldn't take extra initial argument.
429     ApplyQAOverride(argv, OverrideStr, SavedStrings);
430   }
431 
432   std::string Path = GetExecutablePath(argv[0], CanonicalPrefixes);
433 
434   IntrusiveRefCntPtr<DiagnosticOptions> DiagOpts =
435       CreateAndPopulateDiagOpts(argv);
436 
437   TextDiagnosticPrinter *DiagClient
438     = new TextDiagnosticPrinter(llvm::errs(), &*DiagOpts);
439   FixupDiagPrefixExeName(DiagClient, Path);
440 
441   IntrusiveRefCntPtr<DiagnosticIDs> DiagID(new DiagnosticIDs());
442 
443   DiagnosticsEngine Diags(DiagID, &*DiagOpts, DiagClient);
444 
445   if (!DiagOpts->DiagnosticSerializationFile.empty()) {
446     auto SerializedConsumer =
447         clang::serialized_diags::create(DiagOpts->DiagnosticSerializationFile,
448                                         &*DiagOpts, /*MergeChildRecords=*/true);
449     Diags.setClient(new ChainedDiagnosticConsumer(
450         Diags.takeClient(), std::move(SerializedConsumer)));
451   }
452 
453   ProcessWarningOptions(Diags, *DiagOpts, /*ReportDiags=*/false);
454 
455   Driver TheDriver(Path, llvm::sys::getDefaultTargetTriple(), Diags);
456   SetInstallDir(argv, TheDriver, CanonicalPrefixes);
457 
458   insertTargetAndModeArgs(TargetAndMode.first, TargetAndMode.second, argv,
459                           SavedStrings);
460 
461   SetBackdoorDriverOutputsFromEnvVars(TheDriver);
462 
463   std::unique_ptr<Compilation> C(TheDriver.BuildCompilation(argv));
464   int Res = 1;
465   if (C.get()) {
466     SmallVector<std::pair<int, const Command *>, 4> FailingCommands;
467     Res = TheDriver.ExecuteCompilation(*C, FailingCommands);
468 
469     // Force a crash to test the diagnostics.
470     if (TheDriver.GenReproducer) {
471       Diags.Report(diag::err_drv_force_crash)
472         << !::getenv("FORCE_CLANG_DIAGNOSTICS_CRASH");
473 
474       // Pretend that every command failed.
475       FailingCommands.clear();
476       for (const auto &J : C->getJobs())
477         if (const Command *C = dyn_cast<Command>(&J))
478           FailingCommands.push_back(std::make_pair(-1, C));
479     }
480 
481     for (const auto &P : FailingCommands) {
482       int CommandRes = P.first;
483       const Command *FailingCommand = P.second;
484       if (!Res)
485         Res = CommandRes;
486 
487       // If result status is < 0, then the driver command signalled an error.
488       // If result status is 70, then the driver command reported a fatal error.
489       // On Windows, abort will return an exit code of 3.  In these cases,
490       // generate additional diagnostic information if possible.
491       bool DiagnoseCrash = CommandRes < 0 || CommandRes == 70;
492 #ifdef LLVM_ON_WIN32
493       DiagnoseCrash |= CommandRes == 3;
494 #endif
495       if (DiagnoseCrash) {
496         TheDriver.generateCompilationDiagnostics(*C, *FailingCommand);
497         break;
498       }
499     }
500   }
501 
502   Diags.getClient()->finish();
503 
504   // If any timers were active but haven't been destroyed yet, print their
505   // results now.  This happens in -disable-free mode.
506   llvm::TimerGroup::printAll(llvm::errs());
507 
508 #ifdef LLVM_ON_WIN32
509   // Exit status should not be negative on Win32, unless abnormal termination.
510   // Once abnormal termiation was caught, negative status should not be
511   // propagated.
512   if (Res < 0)
513     Res = 1;
514 #endif
515 
516   // If we have multiple failing commands, we return the result of the first
517   // failing command.
518   return Res;
519 }
520