1 //===--- ModuleManager.cpp - Module Manager ---------------------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 //  This file defines the ModuleManager class, which manages a set of loaded
11 //  modules for the ASTReader.
12 //
13 //===----------------------------------------------------------------------===//
14 #include "clang/Serialization/ModuleManager.h"
15 #include "clang/Frontend/PCHContainerOperations.h"
16 #include "clang/Lex/HeaderSearch.h"
17 #include "clang/Lex/ModuleMap.h"
18 #include "clang/Serialization/GlobalModuleIndex.h"
19 #include "llvm/Support/MemoryBuffer.h"
20 #include "llvm/Support/Path.h"
21 #include <system_error>
22 
23 #ifndef NDEBUG
24 #include "llvm/Support/GraphWriter.h"
25 #endif
26 
27 using namespace clang;
28 using namespace serialization;
29 
30 ModuleFile *ModuleManager::lookup(StringRef Name) {
31   const FileEntry *Entry = FileMgr.getFile(Name, /*openFile=*/false,
32                                            /*cacheFailure=*/false);
33   if (Entry)
34     return lookup(Entry);
35 
36   return nullptr;
37 }
38 
39 ModuleFile *ModuleManager::lookup(const FileEntry *File) {
40   llvm::DenseMap<const FileEntry *, ModuleFile *>::iterator Known
41     = Modules.find(File);
42   if (Known == Modules.end())
43     return nullptr;
44 
45   return Known->second;
46 }
47 
48 std::unique_ptr<llvm::MemoryBuffer>
49 ModuleManager::lookupBuffer(StringRef Name) {
50   const FileEntry *Entry = FileMgr.getFile(Name, /*openFile=*/false,
51                                            /*cacheFailure=*/false);
52   return std::move(InMemoryBuffers[Entry]);
53 }
54 
55 static bool checkSignature(ASTFileSignature Signature,
56                            ASTFileSignature ExpectedSignature,
57                            std::string &ErrorStr) {
58   if (!ExpectedSignature || Signature == ExpectedSignature)
59     return false;
60 
61   ErrorStr =
62       Signature ? "signature mismatch" : "could not read module signature";
63   return true;
64 }
65 
66 static void updateModuleImports(ModuleFile &MF, ModuleFile *ImportedBy,
67                                 SourceLocation ImportLoc) {
68   if (ImportedBy) {
69     MF.ImportedBy.insert(ImportedBy);
70     ImportedBy->Imports.insert(&MF);
71   } else {
72     if (!MF.DirectlyImported)
73       MF.ImportLoc = ImportLoc;
74 
75     MF.DirectlyImported = true;
76   }
77 }
78 
79 ModuleManager::AddModuleResult
80 ModuleManager::addModule(StringRef FileName, ModuleKind Type,
81                          SourceLocation ImportLoc, ModuleFile *ImportedBy,
82                          unsigned Generation,
83                          off_t ExpectedSize, time_t ExpectedModTime,
84                          ASTFileSignature ExpectedSignature,
85                          ASTFileSignatureReader ReadSignature,
86                          ModuleFile *&Module,
87                          std::string &ErrorStr) {
88   Module = nullptr;
89 
90   // Look for the file entry. This only fails if the expected size or
91   // modification time differ.
92   const FileEntry *Entry;
93   if (Type == MK_ExplicitModule || Type == MK_PrebuiltModule) {
94     // If we're not expecting to pull this file out of the module cache, it
95     // might have a different mtime due to being moved across filesystems in
96     // a distributed build. The size must still match, though. (As must the
97     // contents, but we can't check that.)
98     ExpectedModTime = 0;
99   }
100   if (lookupModuleFile(FileName, ExpectedSize, ExpectedModTime, Entry)) {
101     ErrorStr = "module file out of date";
102     return OutOfDate;
103   }
104 
105   if (!Entry && FileName != "-") {
106     ErrorStr = "module file not found";
107     return Missing;
108   }
109 
110   // Check whether we already loaded this module, before
111   if (ModuleFile *ModuleEntry = Modules.lookup(Entry)) {
112     // Check the stored signature.
113     if (checkSignature(ModuleEntry->Signature, ExpectedSignature, ErrorStr))
114       return OutOfDate;
115 
116     Module = ModuleEntry;
117     updateModuleImports(*ModuleEntry, ImportedBy, ImportLoc);
118     return AlreadyLoaded;
119   }
120 
121   // Allocate a new module.
122   auto NewModule = llvm::make_unique<ModuleFile>(Type, Generation);
123   NewModule->Index = Chain.size();
124   NewModule->FileName = FileName.str();
125   NewModule->File = Entry;
126   NewModule->ImportLoc = ImportLoc;
127   NewModule->InputFilesValidationTimestamp = 0;
128 
129   if (NewModule->Kind == MK_ImplicitModule) {
130     std::string TimestampFilename = NewModule->getTimestampFilename();
131     vfs::Status Status;
132     // A cached stat value would be fine as well.
133     if (!FileMgr.getNoncachedStatValue(TimestampFilename, Status))
134       NewModule->InputFilesValidationTimestamp =
135           llvm::sys::toTimeT(Status.getLastModificationTime());
136   }
137 
138   // Load the contents of the module
139   if (std::unique_ptr<llvm::MemoryBuffer> Buffer = lookupBuffer(FileName)) {
140     // The buffer was already provided for us.
141     NewModule->Buffer = std::move(Buffer);
142   } else {
143     // Open the AST file.
144     llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> Buf((std::error_code()));
145     if (FileName == "-") {
146       Buf = llvm::MemoryBuffer::getSTDIN();
147     } else {
148       // Leave the FileEntry open so if it gets read again by another
149       // ModuleManager it must be the same underlying file.
150       // FIXME: Because FileManager::getFile() doesn't guarantee that it will
151       // give us an open file, this may not be 100% reliable.
152       Buf = FileMgr.getBufferForFile(NewModule->File,
153                                      /*IsVolatile=*/false,
154                                      /*ShouldClose=*/false);
155     }
156 
157     if (!Buf) {
158       ErrorStr = Buf.getError().message();
159       return Missing;
160     }
161 
162     NewModule->Buffer = std::move(*Buf);
163   }
164 
165   // Initialize the stream.
166   NewModule->Data = PCHContainerRdr.ExtractPCH(*NewModule->Buffer);
167 
168   // Read the signature eagerly now so that we can check it.  Avoid calling
169   // ReadSignature unless there's something to check though.
170   if (ExpectedSignature && checkSignature(ReadSignature(NewModule->Data),
171                                           ExpectedSignature, ErrorStr))
172     return OutOfDate;
173 
174   // We're keeping this module.  Store it everywhere.
175   Module = Modules[Entry] = NewModule.get();
176 
177   updateModuleImports(*NewModule, ImportedBy, ImportLoc);
178 
179   if (!NewModule->isModule())
180     PCHChain.push_back(NewModule.get());
181   if (!ImportedBy)
182     Roots.push_back(NewModule.get());
183 
184   Chain.push_back(std::move(NewModule));
185   return NewlyLoaded;
186 }
187 
188 void ModuleManager::removeModules(
189     ModuleIterator First,
190     llvm::SmallPtrSetImpl<ModuleFile *> &LoadedSuccessfully,
191     ModuleMap *modMap) {
192   auto Last = end();
193   if (First == Last)
194     return;
195 
196 
197   // Explicitly clear VisitOrder since we might not notice it is stale.
198   VisitOrder.clear();
199 
200   // Collect the set of module file pointers that we'll be removing.
201   llvm::SmallPtrSet<ModuleFile *, 4> victimSet(
202       (llvm::pointer_iterator<ModuleIterator>(First)),
203       (llvm::pointer_iterator<ModuleIterator>(Last)));
204 
205   auto IsVictim = [&](ModuleFile *MF) {
206     return victimSet.count(MF);
207   };
208   // Remove any references to the now-destroyed modules.
209   for (auto I = begin(); I != First; ++I) {
210     I->Imports.remove_if(IsVictim);
211     I->ImportedBy.remove_if(IsVictim);
212   }
213   Roots.erase(std::remove_if(Roots.begin(), Roots.end(), IsVictim),
214               Roots.end());
215 
216   // Remove the modules from the PCH chain.
217   for (auto I = First; I != Last; ++I) {
218     if (!I->isModule()) {
219       PCHChain.erase(std::find(PCHChain.begin(), PCHChain.end(), &*I),
220                      PCHChain.end());
221       break;
222     }
223   }
224 
225   // Delete the modules and erase them from the various structures.
226   for (ModuleIterator victim = First; victim != Last; ++victim) {
227     Modules.erase(victim->File);
228 
229     if (modMap) {
230       StringRef ModuleName = victim->ModuleName;
231       if (Module *mod = modMap->findModule(ModuleName)) {
232         mod->setASTFile(nullptr);
233       }
234     }
235 
236     // Files that didn't make it through ReadASTCore successfully will be
237     // rebuilt (or there was an error). Invalidate them so that we can load the
238     // new files that will be renamed over the old ones.
239     if (LoadedSuccessfully.count(&*victim) == 0)
240       FileMgr.invalidateCache(victim->File);
241   }
242 
243   // Delete the modules.
244   Chain.erase(Chain.begin() + (First - begin()), Chain.end());
245 }
246 
247 void
248 ModuleManager::addInMemoryBuffer(StringRef FileName,
249                                  std::unique_ptr<llvm::MemoryBuffer> Buffer) {
250 
251   const FileEntry *Entry =
252       FileMgr.getVirtualFile(FileName, Buffer->getBufferSize(), 0);
253   InMemoryBuffers[Entry] = std::move(Buffer);
254 }
255 
256 ModuleManager::VisitState *ModuleManager::allocateVisitState() {
257   // Fast path: if we have a cached state, use it.
258   if (FirstVisitState) {
259     VisitState *Result = FirstVisitState;
260     FirstVisitState = FirstVisitState->NextState;
261     Result->NextState = nullptr;
262     return Result;
263   }
264 
265   // Allocate and return a new state.
266   return new VisitState(size());
267 }
268 
269 void ModuleManager::returnVisitState(VisitState *State) {
270   assert(State->NextState == nullptr && "Visited state is in list?");
271   State->NextState = FirstVisitState;
272   FirstVisitState = State;
273 }
274 
275 void ModuleManager::setGlobalIndex(GlobalModuleIndex *Index) {
276   GlobalIndex = Index;
277   if (!GlobalIndex) {
278     ModulesInCommonWithGlobalIndex.clear();
279     return;
280   }
281 
282   // Notify the global module index about all of the modules we've already
283   // loaded.
284   for (ModuleFile &M : *this)
285     if (!GlobalIndex->loadedModuleFile(&M))
286       ModulesInCommonWithGlobalIndex.push_back(&M);
287 }
288 
289 void ModuleManager::moduleFileAccepted(ModuleFile *MF) {
290   if (!GlobalIndex || GlobalIndex->loadedModuleFile(MF))
291     return;
292 
293   ModulesInCommonWithGlobalIndex.push_back(MF);
294 }
295 
296 ModuleManager::ModuleManager(FileManager &FileMgr,
297                              const PCHContainerReader &PCHContainerRdr)
298     : FileMgr(FileMgr), PCHContainerRdr(PCHContainerRdr), GlobalIndex(),
299       FirstVisitState(nullptr) {}
300 
301 ModuleManager::~ModuleManager() { delete FirstVisitState; }
302 
303 void ModuleManager::visit(llvm::function_ref<bool(ModuleFile &M)> Visitor,
304                           llvm::SmallPtrSetImpl<ModuleFile *> *ModuleFilesHit) {
305   // If the visitation order vector is the wrong size, recompute the order.
306   if (VisitOrder.size() != Chain.size()) {
307     unsigned N = size();
308     VisitOrder.clear();
309     VisitOrder.reserve(N);
310 
311     // Record the number of incoming edges for each module. When we
312     // encounter a module with no incoming edges, push it into the queue
313     // to seed the queue.
314     SmallVector<ModuleFile *, 4> Queue;
315     Queue.reserve(N);
316     llvm::SmallVector<unsigned, 4> UnusedIncomingEdges;
317     UnusedIncomingEdges.resize(size());
318     for (ModuleFile &M : llvm::reverse(*this)) {
319       unsigned Size = M.ImportedBy.size();
320       UnusedIncomingEdges[M.Index] = Size;
321       if (!Size)
322         Queue.push_back(&M);
323     }
324 
325     // Traverse the graph, making sure to visit a module before visiting any
326     // of its dependencies.
327     while (!Queue.empty()) {
328       ModuleFile *CurrentModule = Queue.pop_back_val();
329       VisitOrder.push_back(CurrentModule);
330 
331       // For any module that this module depends on, push it on the
332       // stack (if it hasn't already been marked as visited).
333       for (auto M = CurrentModule->Imports.rbegin(),
334                 MEnd = CurrentModule->Imports.rend();
335            M != MEnd; ++M) {
336         // Remove our current module as an impediment to visiting the
337         // module we depend on. If we were the last unvisited module
338         // that depends on this particular module, push it into the
339         // queue to be visited.
340         unsigned &NumUnusedEdges = UnusedIncomingEdges[(*M)->Index];
341         if (NumUnusedEdges && (--NumUnusedEdges == 0))
342           Queue.push_back(*M);
343       }
344     }
345 
346     assert(VisitOrder.size() == N && "Visitation order is wrong?");
347 
348     delete FirstVisitState;
349     FirstVisitState = nullptr;
350   }
351 
352   VisitState *State = allocateVisitState();
353   unsigned VisitNumber = State->NextVisitNumber++;
354 
355   // If the caller has provided us with a hit-set that came from the global
356   // module index, mark every module file in common with the global module
357   // index that is *not* in that set as 'visited'.
358   if (ModuleFilesHit && !ModulesInCommonWithGlobalIndex.empty()) {
359     for (unsigned I = 0, N = ModulesInCommonWithGlobalIndex.size(); I != N; ++I)
360     {
361       ModuleFile *M = ModulesInCommonWithGlobalIndex[I];
362       if (!ModuleFilesHit->count(M))
363         State->VisitNumber[M->Index] = VisitNumber;
364     }
365   }
366 
367   for (unsigned I = 0, N = VisitOrder.size(); I != N; ++I) {
368     ModuleFile *CurrentModule = VisitOrder[I];
369     // Should we skip this module file?
370     if (State->VisitNumber[CurrentModule->Index] == VisitNumber)
371       continue;
372 
373     // Visit the module.
374     assert(State->VisitNumber[CurrentModule->Index] == VisitNumber - 1);
375     State->VisitNumber[CurrentModule->Index] = VisitNumber;
376     if (!Visitor(*CurrentModule))
377       continue;
378 
379     // The visitor has requested that cut off visitation of any
380     // module that the current module depends on. To indicate this
381     // behavior, we mark all of the reachable modules as having been visited.
382     ModuleFile *NextModule = CurrentModule;
383     do {
384       // For any module that this module depends on, push it on the
385       // stack (if it hasn't already been marked as visited).
386       for (llvm::SetVector<ModuleFile *>::iterator
387              M = NextModule->Imports.begin(),
388              MEnd = NextModule->Imports.end();
389            M != MEnd; ++M) {
390         if (State->VisitNumber[(*M)->Index] != VisitNumber) {
391           State->Stack.push_back(*M);
392           State->VisitNumber[(*M)->Index] = VisitNumber;
393         }
394       }
395 
396       if (State->Stack.empty())
397         break;
398 
399       // Pop the next module off the stack.
400       NextModule = State->Stack.pop_back_val();
401     } while (true);
402   }
403 
404   returnVisitState(State);
405 }
406 
407 bool ModuleManager::lookupModuleFile(StringRef FileName,
408                                      off_t ExpectedSize,
409                                      time_t ExpectedModTime,
410                                      const FileEntry *&File) {
411   if (FileName == "-") {
412     File = nullptr;
413     return false;
414   }
415 
416   // Open the file immediately to ensure there is no race between stat'ing and
417   // opening the file.
418   File = FileMgr.getFile(FileName, /*openFile=*/true, /*cacheFailure=*/false);
419   if (!File)
420     return false;
421 
422   if ((ExpectedSize && ExpectedSize != File->getSize()) ||
423       (ExpectedModTime && ExpectedModTime != File->getModificationTime()))
424     // Do not destroy File, as it may be referenced. If we need to rebuild it,
425     // it will be destroyed by removeModules.
426     return true;
427 
428   return false;
429 }
430 
431 #ifndef NDEBUG
432 namespace llvm {
433   template<>
434   struct GraphTraits<ModuleManager> {
435     typedef ModuleFile *NodeRef;
436     typedef llvm::SetVector<ModuleFile *>::const_iterator ChildIteratorType;
437     typedef pointer_iterator<ModuleManager::ModuleConstIterator> nodes_iterator;
438 
439     static ChildIteratorType child_begin(NodeRef Node) {
440       return Node->Imports.begin();
441     }
442 
443     static ChildIteratorType child_end(NodeRef Node) {
444       return Node->Imports.end();
445     }
446 
447     static nodes_iterator nodes_begin(const ModuleManager &Manager) {
448       return nodes_iterator(Manager.begin());
449     }
450 
451     static nodes_iterator nodes_end(const ModuleManager &Manager) {
452       return nodes_iterator(Manager.end());
453     }
454   };
455 
456   template<>
457   struct DOTGraphTraits<ModuleManager> : public DefaultDOTGraphTraits {
458     explicit DOTGraphTraits(bool IsSimple = false)
459       : DefaultDOTGraphTraits(IsSimple) { }
460 
461     static bool renderGraphFromBottomUp() {
462       return true;
463     }
464 
465     std::string getNodeLabel(ModuleFile *M, const ModuleManager&) {
466       return M->ModuleName;
467     }
468   };
469 }
470 
471 void ModuleManager::viewGraph() {
472   llvm::ViewGraph(*this, "Modules");
473 }
474 #endif
475