1 //===--- PrecompiledPreamble.cpp - Build precompiled preambles --*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // Helper class to build precompiled preamble.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "clang/Frontend/PrecompiledPreamble.h"
15 #include "clang/AST/DeclObjC.h"
16 #include "clang/Basic/TargetInfo.h"
17 #include "clang/Basic/VirtualFileSystem.h"
18 #include "clang/Frontend/CompilerInstance.h"
19 #include "clang/Frontend/CompilerInvocation.h"
20 #include "clang/Frontend/FrontendActions.h"
21 #include "clang/Frontend/FrontendOptions.h"
22 #include "clang/Lex/Lexer.h"
23 #include "clang/Lex/PreprocessorOptions.h"
24 #include "clang/Serialization/ASTWriter.h"
25 #include "llvm/ADT/StringExtras.h"
26 #include "llvm/ADT/StringSet.h"
27 #include "llvm/Support/CrashRecoveryContext.h"
28 #include "llvm/Support/FileSystem.h"
29 #include "llvm/Support/Mutex.h"
30 #include "llvm/Support/MutexGuard.h"
31 #include "llvm/Support/Process.h"
32 
33 using namespace clang;
34 
35 namespace {
36 
37 /// Keeps a track of files to be deleted in destructor.
38 class TemporaryFiles {
39 public:
40   // A static instance to be used by all clients.
41   static TemporaryFiles &getInstance();
42 
43 private:
44   // Disallow constructing the class directly.
45   TemporaryFiles() = default;
46   // Disallow copy.
47   TemporaryFiles(const TemporaryFiles &) = delete;
48 
49 public:
50   ~TemporaryFiles();
51 
52   /// Adds \p File to a set of tracked files.
53   void addFile(StringRef File);
54 
55   /// Remove \p File from disk and from the set of tracked files.
56   void removeFile(StringRef File);
57 
58 private:
59   llvm::sys::SmartMutex<false> Mutex;
60   llvm::StringSet<> Files;
61 };
62 
63 TemporaryFiles &TemporaryFiles::getInstance() {
64   static TemporaryFiles Instance;
65   return Instance;
66 }
67 
68 TemporaryFiles::~TemporaryFiles() {
69   llvm::MutexGuard Guard(Mutex);
70   for (const auto &File : Files)
71     llvm::sys::fs::remove(File.getKey());
72 }
73 
74 void TemporaryFiles::addFile(StringRef File) {
75   llvm::MutexGuard Guard(Mutex);
76   auto IsInserted = Files.insert(File).second;
77   (void)IsInserted;
78   assert(IsInserted && "File has already been added");
79 }
80 
81 void TemporaryFiles::removeFile(StringRef File) {
82   llvm::MutexGuard Guard(Mutex);
83   auto WasPresent = Files.erase(File);
84   (void)WasPresent;
85   assert(WasPresent && "File was not tracked");
86   llvm::sys::fs::remove(File);
87 }
88 
89 class PreambleMacroCallbacks : public PPCallbacks {
90 public:
91   PreambleMacroCallbacks(PreambleCallbacks &Callbacks) : Callbacks(Callbacks) {}
92 
93   void MacroDefined(const Token &MacroNameTok,
94                     const MacroDirective *MD) override {
95     Callbacks.HandleMacroDefined(MacroNameTok, MD);
96   }
97 
98 private:
99   PreambleCallbacks &Callbacks;
100 };
101 
102 class PrecompilePreambleAction : public ASTFrontendAction {
103 public:
104   PrecompilePreambleAction(PreambleCallbacks &Callbacks)
105       : Callbacks(Callbacks) {}
106 
107   std::unique_ptr<ASTConsumer> CreateASTConsumer(CompilerInstance &CI,
108                                                  StringRef InFile) override;
109 
110   bool hasEmittedPreamblePCH() const { return HasEmittedPreamblePCH; }
111 
112   void setEmittedPreamblePCH(ASTWriter &Writer) {
113     this->HasEmittedPreamblePCH = true;
114     Callbacks.AfterPCHEmitted(Writer);
115   }
116 
117   bool shouldEraseOutputFiles() override { return !hasEmittedPreamblePCH(); }
118   bool hasCodeCompletionSupport() const override { return false; }
119   bool hasASTFileSupport() const override { return false; }
120   TranslationUnitKind getTranslationUnitKind() override { return TU_Prefix; }
121 
122 private:
123   friend class PrecompilePreambleConsumer;
124 
125   bool HasEmittedPreamblePCH = false;
126   PreambleCallbacks &Callbacks;
127 };
128 
129 class PrecompilePreambleConsumer : public PCHGenerator {
130 public:
131   PrecompilePreambleConsumer(PrecompilePreambleAction &Action,
132                              const Preprocessor &PP, StringRef isysroot,
133                              std::unique_ptr<raw_ostream> Out)
134       : PCHGenerator(PP, "", isysroot, std::make_shared<PCHBuffer>(),
135                      ArrayRef<std::shared_ptr<ModuleFileExtension>>(),
136                      /*AllowASTWithErrors=*/true),
137         Action(Action), Out(std::move(Out)) {}
138 
139   bool HandleTopLevelDecl(DeclGroupRef DG) override {
140     Action.Callbacks.HandleTopLevelDecl(DG);
141     return true;
142   }
143 
144   void HandleTranslationUnit(ASTContext &Ctx) override {
145     PCHGenerator::HandleTranslationUnit(Ctx);
146     if (!hasEmittedPCH())
147       return;
148 
149     // Write the generated bitstream to "Out".
150     *Out << getPCH();
151     // Make sure it hits disk now.
152     Out->flush();
153     // Free the buffer.
154     llvm::SmallVector<char, 0> Empty;
155     getPCH() = std::move(Empty);
156 
157     Action.setEmittedPreamblePCH(getWriter());
158   }
159 
160 private:
161   PrecompilePreambleAction &Action;
162   std::unique_ptr<raw_ostream> Out;
163 };
164 
165 std::unique_ptr<ASTConsumer>
166 PrecompilePreambleAction::CreateASTConsumer(CompilerInstance &CI,
167 
168                                             StringRef InFile) {
169   std::string Sysroot;
170   std::string OutputFile;
171   std::unique_ptr<raw_ostream> OS =
172       GeneratePCHAction::ComputeASTConsumerArguments(CI, InFile, Sysroot,
173                                                      OutputFile);
174   if (!OS)
175     return nullptr;
176 
177   if (!CI.getFrontendOpts().RelocatablePCH)
178     Sysroot.clear();
179 
180   CI.getPreprocessor().addPPCallbacks(
181       llvm::make_unique<PreambleMacroCallbacks>(Callbacks));
182   return llvm::make_unique<PrecompilePreambleConsumer>(
183       *this, CI.getPreprocessor(), Sysroot, std::move(OS));
184 }
185 
186 template <class T> bool moveOnNoError(llvm::ErrorOr<T> Val, T &Output) {
187   if (!Val)
188     return false;
189   Output = std::move(*Val);
190   return true;
191 }
192 
193 } // namespace
194 
195 PreambleBounds clang::ComputePreambleBounds(const LangOptions &LangOpts,
196                                             llvm::MemoryBuffer *Buffer,
197                                             unsigned MaxLines) {
198   return Lexer::ComputePreamble(Buffer->getBuffer(), LangOpts, MaxLines);
199 }
200 
201 llvm::ErrorOr<PrecompiledPreamble> PrecompiledPreamble::Build(
202     const CompilerInvocation &Invocation,
203     const llvm::MemoryBuffer *MainFileBuffer, PreambleBounds Bounds,
204     DiagnosticsEngine &Diagnostics, IntrusiveRefCntPtr<vfs::FileSystem> VFS,
205     std::shared_ptr<PCHContainerOperations> PCHContainerOps,
206     PreambleCallbacks &Callbacks) {
207   assert(VFS && "VFS is null");
208 
209   if (!Bounds.Size)
210     return BuildPreambleError::PreambleIsEmpty;
211 
212   auto PreambleInvocation = std::make_shared<CompilerInvocation>(Invocation);
213   FrontendOptions &FrontendOpts = PreambleInvocation->getFrontendOpts();
214   PreprocessorOptions &PreprocessorOpts =
215       PreambleInvocation->getPreprocessorOpts();
216 
217   // Create a temporary file for the precompiled preamble. In rare
218   // circumstances, this can fail.
219   llvm::ErrorOr<PrecompiledPreamble::TempPCHFile> PreamblePCHFile =
220       PrecompiledPreamble::TempPCHFile::CreateNewPreamblePCHFile();
221   if (!PreamblePCHFile)
222     return BuildPreambleError::CouldntCreateTempFile;
223 
224   // Save the preamble text for later; we'll need to compare against it for
225   // subsequent reparses.
226   std::vector<char> PreambleBytes(MainFileBuffer->getBufferStart(),
227                                   MainFileBuffer->getBufferStart() +
228                                       Bounds.Size);
229   bool PreambleEndsAtStartOfLine = Bounds.PreambleEndsAtStartOfLine;
230 
231   // Tell the compiler invocation to generate a temporary precompiled header.
232   FrontendOpts.ProgramAction = frontend::GeneratePCH;
233   // FIXME: Generate the precompiled header into memory?
234   FrontendOpts.OutputFile = PreamblePCHFile->getFilePath();
235   PreprocessorOpts.PrecompiledPreambleBytes.first = 0;
236   PreprocessorOpts.PrecompiledPreambleBytes.second = false;
237 
238   // Create the compiler instance to use for building the precompiled preamble.
239   std::unique_ptr<CompilerInstance> Clang(
240       new CompilerInstance(std::move(PCHContainerOps)));
241 
242   // Recover resources if we crash before exiting this method.
243   llvm::CrashRecoveryContextCleanupRegistrar<CompilerInstance> CICleanup(
244       Clang.get());
245 
246   Clang->setInvocation(std::move(PreambleInvocation));
247   Clang->setDiagnostics(&Diagnostics);
248 
249   // Create the target instance.
250   Clang->setTarget(TargetInfo::CreateTargetInfo(
251       Clang->getDiagnostics(), Clang->getInvocation().TargetOpts));
252   if (!Clang->hasTarget())
253     return BuildPreambleError::CouldntCreateTargetInfo;
254 
255   // Inform the target of the language options.
256   //
257   // FIXME: We shouldn't need to do this, the target should be immutable once
258   // created. This complexity should be lifted elsewhere.
259   Clang->getTarget().adjust(Clang->getLangOpts());
260 
261   assert(Clang->getFrontendOpts().Inputs.size() == 1 &&
262          "Invocation must have exactly one source file!");
263   assert(Clang->getFrontendOpts().Inputs[0].getKind().getFormat() ==
264              InputKind::Source &&
265          "FIXME: AST inputs not yet supported here!");
266   assert(Clang->getFrontendOpts().Inputs[0].getKind().getLanguage() !=
267              InputKind::LLVM_IR &&
268          "IR inputs not support here!");
269 
270   // Clear out old caches and data.
271   Diagnostics.Reset();
272   ProcessWarningOptions(Diagnostics, Clang->getDiagnosticOpts());
273 
274   VFS =
275       createVFSFromCompilerInvocation(Clang->getInvocation(), Diagnostics, VFS);
276   if (!VFS)
277     return BuildPreambleError::CouldntCreateVFSOverlay;
278 
279   // Create a file manager object to provide access to and cache the filesystem.
280   Clang->setFileManager(new FileManager(Clang->getFileSystemOpts(), VFS));
281 
282   // Create the source manager.
283   Clang->setSourceManager(
284       new SourceManager(Diagnostics, Clang->getFileManager()));
285 
286   auto PreambleDepCollector = std::make_shared<DependencyCollector>();
287   Clang->addDependencyCollector(PreambleDepCollector);
288 
289   // Remap the main source file to the preamble buffer.
290   StringRef MainFilePath = FrontendOpts.Inputs[0].getFile();
291   auto PreambleInputBuffer = llvm::MemoryBuffer::getMemBufferCopy(
292       MainFileBuffer->getBuffer().slice(0, Bounds.Size), MainFilePath);
293   if (PreprocessorOpts.RetainRemappedFileBuffers) {
294     // MainFileBuffer will be deleted by unique_ptr after leaving the method.
295     PreprocessorOpts.addRemappedFile(MainFilePath, PreambleInputBuffer.get());
296   } else {
297     // In that case, remapped buffer will be deleted by CompilerInstance on
298     // BeginSourceFile, so we call release() to avoid double deletion.
299     PreprocessorOpts.addRemappedFile(MainFilePath,
300                                      PreambleInputBuffer.release());
301   }
302 
303   std::unique_ptr<PrecompilePreambleAction> Act;
304   Act.reset(new PrecompilePreambleAction(Callbacks));
305   if (!Act->BeginSourceFile(*Clang.get(), Clang->getFrontendOpts().Inputs[0]))
306     return BuildPreambleError::BeginSourceFileFailed;
307 
308   Act->Execute();
309 
310   // Run the callbacks.
311   Callbacks.AfterExecute(*Clang);
312 
313   Act->EndSourceFile();
314 
315   if (!Act->hasEmittedPreamblePCH())
316     return BuildPreambleError::CouldntEmitPCH;
317 
318   // Keep track of all of the files that the source manager knows about,
319   // so we can verify whether they have changed or not.
320   llvm::StringMap<PrecompiledPreamble::PreambleFileHash> FilesInPreamble;
321 
322   SourceManager &SourceMgr = Clang->getSourceManager();
323   for (auto &Filename : PreambleDepCollector->getDependencies()) {
324     const FileEntry *File = Clang->getFileManager().getFile(Filename);
325     if (!File || File == SourceMgr.getFileEntryForID(SourceMgr.getMainFileID()))
326       continue;
327     if (time_t ModTime = File->getModificationTime()) {
328       FilesInPreamble[File->getName()] =
329           PrecompiledPreamble::PreambleFileHash::createForFile(File->getSize(),
330                                                                ModTime);
331     } else {
332       llvm::MemoryBuffer *Buffer = SourceMgr.getMemoryBufferForFile(File);
333       FilesInPreamble[File->getName()] =
334           PrecompiledPreamble::PreambleFileHash::createForMemoryBuffer(Buffer);
335     }
336   }
337 
338   return PrecompiledPreamble(
339       std::move(*PreamblePCHFile), std::move(PreambleBytes),
340       PreambleEndsAtStartOfLine, std::move(FilesInPreamble));
341 }
342 
343 PreambleBounds PrecompiledPreamble::getBounds() const {
344   return PreambleBounds(PreambleBytes.size(), PreambleEndsAtStartOfLine);
345 }
346 
347 bool PrecompiledPreamble::CanReuse(const CompilerInvocation &Invocation,
348                                    const llvm::MemoryBuffer *MainFileBuffer,
349                                    PreambleBounds Bounds,
350                                    vfs::FileSystem *VFS) const {
351 
352   assert(
353       Bounds.Size <= MainFileBuffer->getBufferSize() &&
354       "Buffer is too large. Bounds were calculated from a different buffer?");
355 
356   auto PreambleInvocation = std::make_shared<CompilerInvocation>(Invocation);
357   PreprocessorOptions &PreprocessorOpts =
358       PreambleInvocation->getPreprocessorOpts();
359 
360   if (!Bounds.Size)
361     return false;
362 
363   // We've previously computed a preamble. Check whether we have the same
364   // preamble now that we did before, and that there's enough space in
365   // the main-file buffer within the precompiled preamble to fit the
366   // new main file.
367   if (PreambleBytes.size() != Bounds.Size ||
368       PreambleEndsAtStartOfLine != Bounds.PreambleEndsAtStartOfLine ||
369       memcmp(PreambleBytes.data(), MainFileBuffer->getBufferStart(),
370              Bounds.Size) != 0)
371     return false;
372   // The preamble has not changed. We may be able to re-use the precompiled
373   // preamble.
374 
375   // Check that none of the files used by the preamble have changed.
376   // First, make a record of those files that have been overridden via
377   // remapping or unsaved_files.
378   std::map<llvm::sys::fs::UniqueID, PreambleFileHash> OverriddenFiles;
379   for (const auto &R : PreprocessorOpts.RemappedFiles) {
380     vfs::Status Status;
381     if (!moveOnNoError(VFS->status(R.second), Status)) {
382       // If we can't stat the file we're remapping to, assume that something
383       // horrible happened.
384       return false;
385     }
386 
387     OverriddenFiles[Status.getUniqueID()] = PreambleFileHash::createForFile(
388         Status.getSize(), llvm::sys::toTimeT(Status.getLastModificationTime()));
389   }
390 
391   for (const auto &RB : PreprocessorOpts.RemappedFileBuffers) {
392     vfs::Status Status;
393     if (!moveOnNoError(VFS->status(RB.first), Status))
394       return false;
395 
396     OverriddenFiles[Status.getUniqueID()] =
397         PreambleFileHash::createForMemoryBuffer(RB.second);
398   }
399 
400   // Check whether anything has changed.
401   for (const auto &F : FilesInPreamble) {
402     vfs::Status Status;
403     if (!moveOnNoError(VFS->status(F.first()), Status)) {
404       // If we can't stat the file, assume that something horrible happened.
405       return false;
406     }
407 
408     std::map<llvm::sys::fs::UniqueID, PreambleFileHash>::iterator Overridden =
409         OverriddenFiles.find(Status.getUniqueID());
410     if (Overridden != OverriddenFiles.end()) {
411       // This file was remapped; check whether the newly-mapped file
412       // matches up with the previous mapping.
413       if (Overridden->second != F.second)
414         return false;
415       continue;
416     }
417 
418     // The file was not remapped; check whether it has changed on disk.
419     if (Status.getSize() != uint64_t(F.second.Size) ||
420         llvm::sys::toTimeT(Status.getLastModificationTime()) !=
421             F.second.ModTime)
422       return false;
423   }
424   return true;
425 }
426 
427 void PrecompiledPreamble::AddImplicitPreamble(
428     CompilerInvocation &CI, llvm::MemoryBuffer *MainFileBuffer) const {
429   auto &PreprocessorOpts = CI.getPreprocessorOpts();
430 
431   // Configure ImpicitPCHInclude.
432   PreprocessorOpts.PrecompiledPreambleBytes.first = PreambleBytes.size();
433   PreprocessorOpts.PrecompiledPreambleBytes.second = PreambleEndsAtStartOfLine;
434   PreprocessorOpts.ImplicitPCHInclude = PCHFile.getFilePath();
435   PreprocessorOpts.DisablePCHValidation = true;
436 
437   // Remap main file to point to MainFileBuffer.
438   auto MainFilePath = CI.getFrontendOpts().Inputs[0].getFile();
439   PreprocessorOpts.addRemappedFile(MainFilePath, MainFileBuffer);
440 }
441 
442 PrecompiledPreamble::PrecompiledPreamble(
443     TempPCHFile PCHFile, std::vector<char> PreambleBytes,
444     bool PreambleEndsAtStartOfLine,
445     llvm::StringMap<PreambleFileHash> FilesInPreamble)
446     : PCHFile(std::move(PCHFile)), FilesInPreamble(FilesInPreamble),
447       PreambleBytes(std::move(PreambleBytes)),
448       PreambleEndsAtStartOfLine(PreambleEndsAtStartOfLine) {}
449 
450 llvm::ErrorOr<PrecompiledPreamble::TempPCHFile>
451 PrecompiledPreamble::TempPCHFile::CreateNewPreamblePCHFile() {
452   // FIXME: This is a hack so that we can override the preamble file during
453   // crash-recovery testing, which is the only case where the preamble files
454   // are not necessarily cleaned up.
455   const char *TmpFile = ::getenv("CINDEXTEST_PREAMBLE_FILE");
456   if (TmpFile)
457     return TempPCHFile::createFromCustomPath(TmpFile);
458   return TempPCHFile::createInSystemTempDir("preamble", "pch");
459 }
460 
461 llvm::ErrorOr<PrecompiledPreamble::TempPCHFile>
462 PrecompiledPreamble::TempPCHFile::createInSystemTempDir(const Twine &Prefix,
463                                                         StringRef Suffix) {
464   llvm::SmallString<64> File;
465   // Using a version of createTemporaryFile with a file descriptor guarantees
466   // that we would never get a race condition in a multi-threaded setting (i.e.,
467   // multiple threads getting the same temporary path).
468   int FD;
469   auto EC = llvm::sys::fs::createTemporaryFile(Prefix, Suffix, /*ref*/ FD,
470                                                /*ref*/ File);
471   if (EC)
472     return EC;
473   // We only needed to make sure the file exists, close the file right away.
474   llvm::sys::Process::SafelyCloseFileDescriptor(FD);
475   return TempPCHFile(std::move(File).str());
476 }
477 
478 llvm::ErrorOr<PrecompiledPreamble::TempPCHFile>
479 PrecompiledPreamble::TempPCHFile::createFromCustomPath(const Twine &Path) {
480   return TempPCHFile(Path.str());
481 }
482 
483 PrecompiledPreamble::TempPCHFile::TempPCHFile(std::string FilePath)
484     : FilePath(std::move(FilePath)) {
485   TemporaryFiles::getInstance().addFile(*this->FilePath);
486 }
487 
488 PrecompiledPreamble::TempPCHFile::TempPCHFile(TempPCHFile &&Other) {
489   FilePath = std::move(Other.FilePath);
490   Other.FilePath = None;
491 }
492 
493 PrecompiledPreamble::TempPCHFile &PrecompiledPreamble::TempPCHFile::
494 operator=(TempPCHFile &&Other) {
495   RemoveFileIfPresent();
496 
497   FilePath = std::move(Other.FilePath);
498   Other.FilePath = None;
499   return *this;
500 }
501 
502 PrecompiledPreamble::TempPCHFile::~TempPCHFile() { RemoveFileIfPresent(); }
503 
504 void PrecompiledPreamble::TempPCHFile::RemoveFileIfPresent() {
505   if (FilePath) {
506     TemporaryFiles::getInstance().removeFile(*FilePath);
507     FilePath = None;
508   }
509 }
510 
511 llvm::StringRef PrecompiledPreamble::TempPCHFile::getFilePath() const {
512   assert(FilePath && "TempPCHFile doesn't have a FilePath. Had it been moved?");
513   return *FilePath;
514 }
515 
516 PrecompiledPreamble::PreambleFileHash
517 PrecompiledPreamble::PreambleFileHash::createForFile(off_t Size,
518                                                      time_t ModTime) {
519   PreambleFileHash Result;
520   Result.Size = Size;
521   Result.ModTime = ModTime;
522   Result.MD5 = {};
523   return Result;
524 }
525 
526 PrecompiledPreamble::PreambleFileHash
527 PrecompiledPreamble::PreambleFileHash::createForMemoryBuffer(
528     const llvm::MemoryBuffer *Buffer) {
529   PreambleFileHash Result;
530   Result.Size = Buffer->getBufferSize();
531   Result.ModTime = 0;
532 
533   llvm::MD5 MD5Ctx;
534   MD5Ctx.update(Buffer->getBuffer().data());
535   MD5Ctx.final(Result.MD5);
536 
537   return Result;
538 }
539 
540 void PreambleCallbacks::AfterExecute(CompilerInstance &CI) {}
541 void PreambleCallbacks::AfterPCHEmitted(ASTWriter &Writer) {}
542 void PreambleCallbacks::HandleTopLevelDecl(DeclGroupRef DG) {}
543 void PreambleCallbacks::HandleMacroDefined(const Token &MacroNameTok,
544                                            const MacroDirective *MD) {}
545 
546 std::error_code clang::make_error_code(BuildPreambleError Error) {
547   return std::error_code(static_cast<int>(Error), BuildPreambleErrorCategory());
548 }
549 
550 const char *BuildPreambleErrorCategory::name() const noexcept {
551   return "build-preamble.error";
552 }
553 
554 std::string BuildPreambleErrorCategory::message(int condition) const {
555   switch (static_cast<BuildPreambleError>(condition)) {
556   case BuildPreambleError::PreambleIsEmpty:
557     return "Preamble is empty";
558   case BuildPreambleError::CouldntCreateTempFile:
559     return "Could not create temporary file for PCH";
560   case BuildPreambleError::CouldntCreateTargetInfo:
561     return "CreateTargetInfo() return null";
562   case BuildPreambleError::CouldntCreateVFSOverlay:
563     return "Could not create VFS Overlay";
564   case BuildPreambleError::BeginSourceFileFailed:
565     return "BeginSourceFile() return an error";
566   case BuildPreambleError::CouldntEmitPCH:
567     return "Could not emit PCH";
568   }
569   llvm_unreachable("unexpected BuildPreambleError");
570 }
571