1 //===--- ModuleManager.cpp - Module Manager ---------------------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 //  This file defines the ModuleManager class, which manages a set of loaded
11 //  modules for the ASTReader.
12 //
13 //===----------------------------------------------------------------------===//
14 #include "clang/Frontend/PCHContainerOperations.h"
15 #include "clang/Lex/HeaderSearch.h"
16 #include "clang/Lex/ModuleMap.h"
17 #include "clang/Serialization/GlobalModuleIndex.h"
18 #include "clang/Serialization/ModuleManager.h"
19 #include "llvm/Support/MemoryBuffer.h"
20 #include "llvm/Support/Path.h"
21 #include "llvm/Support/raw_ostream.h"
22 #include <system_error>
23 
24 #ifndef NDEBUG
25 #include "llvm/Support/GraphWriter.h"
26 #endif
27 
28 using namespace clang;
29 using namespace serialization;
30 
31 ModuleFile *ModuleManager::lookup(StringRef Name) {
32   const FileEntry *Entry = FileMgr.getFile(Name, /*openFile=*/false,
33                                            /*cacheFailure=*/false);
34   if (Entry)
35     return lookup(Entry);
36 
37   return nullptr;
38 }
39 
40 ModuleFile *ModuleManager::lookup(const FileEntry *File) {
41   llvm::DenseMap<const FileEntry *, ModuleFile *>::iterator Known
42     = Modules.find(File);
43   if (Known == Modules.end())
44     return nullptr;
45 
46   return Known->second;
47 }
48 
49 std::unique_ptr<llvm::MemoryBuffer>
50 ModuleManager::lookupBuffer(StringRef Name) {
51   const FileEntry *Entry = FileMgr.getFile(Name, /*openFile=*/false,
52                                            /*cacheFailure=*/false);
53   return std::move(InMemoryBuffers[Entry]);
54 }
55 
56 ModuleManager::AddModuleResult
57 ModuleManager::addModule(StringRef FileName, ModuleKind Type,
58                          SourceLocation ImportLoc, ModuleFile *ImportedBy,
59                          unsigned Generation,
60                          off_t ExpectedSize, time_t ExpectedModTime,
61                          ASTFileSignature ExpectedSignature,
62                          ASTFileSignatureReader ReadSignature,
63                          ModuleFile *&Module,
64                          std::string &ErrorStr) {
65   Module = nullptr;
66 
67   // Look for the file entry. This only fails if the expected size or
68   // modification time differ.
69   const FileEntry *Entry;
70   if (Type == MK_ExplicitModule) {
71     // If we're not expecting to pull this file out of the module cache, it
72     // might have a different mtime due to being moved across filesystems in
73     // a distributed build. The size must still match, though. (As must the
74     // contents, but we can't check that.)
75     ExpectedModTime = 0;
76   }
77   if (lookupModuleFile(FileName, ExpectedSize, ExpectedModTime, Entry)) {
78     ErrorStr = "module file out of date";
79     return OutOfDate;
80   }
81 
82   if (!Entry && FileName != "-") {
83     ErrorStr = "module file not found";
84     return Missing;
85   }
86 
87   // Check whether we already loaded this module, before
88   ModuleFile *&ModuleEntry = Modules[Entry];
89   bool NewModule = false;
90   if (!ModuleEntry) {
91     // Allocate a new module.
92     ModuleFile *New = new ModuleFile(Type, Generation);
93     New->Index = Chain.size();
94     New->FileName = FileName.str();
95     New->File = Entry;
96     New->ImportLoc = ImportLoc;
97     Chain.push_back(New);
98     if (!New->isModule())
99       PCHChain.push_back(New);
100     if (!ImportedBy)
101       Roots.push_back(New);
102     NewModule = true;
103     ModuleEntry = New;
104 
105     New->InputFilesValidationTimestamp = 0;
106     if (New->Kind == MK_ImplicitModule) {
107       std::string TimestampFilename = New->getTimestampFilename();
108       vfs::Status Status;
109       // A cached stat value would be fine as well.
110       if (!FileMgr.getNoncachedStatValue(TimestampFilename, Status))
111         New->InputFilesValidationTimestamp =
112             Status.getLastModificationTime().toEpochTime();
113     }
114 
115     // Load the contents of the module
116     if (std::unique_ptr<llvm::MemoryBuffer> Buffer = lookupBuffer(FileName)) {
117       // The buffer was already provided for us.
118       New->Buffer = std::move(Buffer);
119     } else {
120       // Open the AST file.
121       llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> Buf(
122           (std::error_code()));
123       if (FileName == "-") {
124         Buf = llvm::MemoryBuffer::getSTDIN();
125       } else {
126         // Leave the FileEntry open so if it gets read again by another
127         // ModuleManager it must be the same underlying file.
128         // FIXME: Because FileManager::getFile() doesn't guarantee that it will
129         // give us an open file, this may not be 100% reliable.
130         Buf = FileMgr.getBufferForFile(New->File,
131                                        /*IsVolatile=*/false,
132                                        /*ShouldClose=*/false);
133       }
134 
135       if (!Buf) {
136         ErrorStr = Buf.getError().message();
137         return Missing;
138       }
139 
140       New->Buffer = std::move(*Buf);
141     }
142 
143     // Initialize the stream.
144     PCHContainerRdr.ExtractPCH(New->Buffer->getMemBufferRef(), New->StreamFile);
145   }
146 
147   if (ExpectedSignature) {
148     if (NewModule)
149       ModuleEntry->Signature = ReadSignature(ModuleEntry->StreamFile);
150     else
151       assert(ModuleEntry->Signature == ReadSignature(ModuleEntry->StreamFile));
152 
153     if (ModuleEntry->Signature != ExpectedSignature) {
154       ErrorStr = ModuleEntry->Signature ? "signature mismatch"
155                                         : "could not read module signature";
156 
157       if (NewModule) {
158         // Remove the module file immediately, since removeModules might try to
159         // invalidate the file cache for Entry, and that is not safe if this
160         // module is *itself* up to date, but has an out-of-date importer.
161         Modules.erase(Entry);
162         assert(Chain.back() == ModuleEntry);
163         Chain.pop_back();
164         if (!ModuleEntry->isModule())
165           PCHChain.pop_back();
166         if (Roots.back() == ModuleEntry)
167           Roots.pop_back();
168         else
169           assert(ImportedBy);
170         delete ModuleEntry;
171       }
172       return OutOfDate;
173     }
174   }
175 
176   if (ImportedBy) {
177     ModuleEntry->ImportedBy.insert(ImportedBy);
178     ImportedBy->Imports.insert(ModuleEntry);
179   } else {
180     if (!ModuleEntry->DirectlyImported)
181       ModuleEntry->ImportLoc = ImportLoc;
182 
183     ModuleEntry->DirectlyImported = true;
184   }
185 
186   Module = ModuleEntry;
187   return NewModule? NewlyLoaded : AlreadyLoaded;
188 }
189 
190 void ModuleManager::removeModules(
191     ModuleIterator first, ModuleIterator last,
192     llvm::SmallPtrSetImpl<ModuleFile *> &LoadedSuccessfully,
193     ModuleMap *modMap) {
194   if (first == last)
195     return;
196 
197   // Collect the set of module file pointers that we'll be removing.
198   llvm::SmallPtrSet<ModuleFile *, 4> victimSet(first, last);
199 
200   auto IsVictim = [&](ModuleFile *MF) {
201     return victimSet.count(MF);
202   };
203   // Remove any references to the now-destroyed modules.
204   for (unsigned i = 0, n = Chain.size(); i != n; ++i) {
205     Chain[i]->ImportedBy.remove_if(IsVictim);
206   }
207   Roots.erase(std::remove_if(Roots.begin(), Roots.end(), IsVictim),
208               Roots.end());
209 
210   // Remove the modules from the PCH chain.
211   for (auto I = first; I != last; ++I) {
212     if (!(*I)->isModule()) {
213       PCHChain.erase(std::find(PCHChain.begin(), PCHChain.end(), *I),
214                      PCHChain.end());
215       break;
216     }
217   }
218 
219   // Delete the modules and erase them from the various structures.
220   for (ModuleIterator victim = first; victim != last; ++victim) {
221     Modules.erase((*victim)->File);
222 
223     if (modMap) {
224       StringRef ModuleName = (*victim)->ModuleName;
225       if (Module *mod = modMap->findModule(ModuleName)) {
226         mod->setASTFile(nullptr);
227       }
228     }
229 
230     // Files that didn't make it through ReadASTCore successfully will be
231     // rebuilt (or there was an error). Invalidate them so that we can load the
232     // new files that will be renamed over the old ones.
233     if (LoadedSuccessfully.count(*victim) == 0)
234       FileMgr.invalidateCache((*victim)->File);
235 
236     delete *victim;
237   }
238 
239   // Remove the modules from the chain.
240   Chain.erase(first, last);
241 }
242 
243 void
244 ModuleManager::addInMemoryBuffer(StringRef FileName,
245                                  std::unique_ptr<llvm::MemoryBuffer> Buffer) {
246 
247   const FileEntry *Entry =
248       FileMgr.getVirtualFile(FileName, Buffer->getBufferSize(), 0);
249   InMemoryBuffers[Entry] = std::move(Buffer);
250 }
251 
252 ModuleManager::VisitState *ModuleManager::allocateVisitState() {
253   // Fast path: if we have a cached state, use it.
254   if (FirstVisitState) {
255     VisitState *Result = FirstVisitState;
256     FirstVisitState = FirstVisitState->NextState;
257     Result->NextState = nullptr;
258     return Result;
259   }
260 
261   // Allocate and return a new state.
262   return new VisitState(size());
263 }
264 
265 void ModuleManager::returnVisitState(VisitState *State) {
266   assert(State->NextState == nullptr && "Visited state is in list?");
267   State->NextState = FirstVisitState;
268   FirstVisitState = State;
269 }
270 
271 void ModuleManager::setGlobalIndex(GlobalModuleIndex *Index) {
272   GlobalIndex = Index;
273   if (!GlobalIndex) {
274     ModulesInCommonWithGlobalIndex.clear();
275     return;
276   }
277 
278   // Notify the global module index about all of the modules we've already
279   // loaded.
280   for (unsigned I = 0, N = Chain.size(); I != N; ++I) {
281     if (!GlobalIndex->loadedModuleFile(Chain[I])) {
282       ModulesInCommonWithGlobalIndex.push_back(Chain[I]);
283     }
284   }
285 }
286 
287 void ModuleManager::moduleFileAccepted(ModuleFile *MF) {
288   if (!GlobalIndex || GlobalIndex->loadedModuleFile(MF))
289     return;
290 
291   ModulesInCommonWithGlobalIndex.push_back(MF);
292 }
293 
294 ModuleManager::ModuleManager(FileManager &FileMgr,
295                              const PCHContainerReader &PCHContainerRdr)
296     : FileMgr(FileMgr), PCHContainerRdr(PCHContainerRdr), GlobalIndex(),
297       FirstVisitState(nullptr) {}
298 
299 ModuleManager::~ModuleManager() {
300   for (unsigned i = 0, e = Chain.size(); i != e; ++i)
301     delete Chain[e - i - 1];
302   delete FirstVisitState;
303 }
304 
305 void ModuleManager::visit(llvm::function_ref<bool(ModuleFile &M)> Visitor,
306                           llvm::SmallPtrSetImpl<ModuleFile *> *ModuleFilesHit) {
307   // If the visitation order vector is the wrong size, recompute the order.
308   if (VisitOrder.size() != Chain.size()) {
309     unsigned N = size();
310     VisitOrder.clear();
311     VisitOrder.reserve(N);
312 
313     // Record the number of incoming edges for each module. When we
314     // encounter a module with no incoming edges, push it into the queue
315     // to seed the queue.
316     SmallVector<ModuleFile *, 4> Queue;
317     Queue.reserve(N);
318     llvm::SmallVector<unsigned, 4> UnusedIncomingEdges;
319     UnusedIncomingEdges.resize(size());
320     for (auto M = rbegin(), MEnd = rend(); M != MEnd; ++M) {
321       unsigned Size = (*M)->ImportedBy.size();
322       UnusedIncomingEdges[(*M)->Index] = Size;
323       if (!Size)
324         Queue.push_back(*M);
325     }
326 
327     // Traverse the graph, making sure to visit a module before visiting any
328     // of its dependencies.
329     while (!Queue.empty()) {
330       ModuleFile *CurrentModule = Queue.pop_back_val();
331       VisitOrder.push_back(CurrentModule);
332 
333       // For any module that this module depends on, push it on the
334       // stack (if it hasn't already been marked as visited).
335       for (auto M = CurrentModule->Imports.rbegin(),
336                 MEnd = CurrentModule->Imports.rend();
337            M != MEnd; ++M) {
338         // Remove our current module as an impediment to visiting the
339         // module we depend on. If we were the last unvisited module
340         // that depends on this particular module, push it into the
341         // queue to be visited.
342         unsigned &NumUnusedEdges = UnusedIncomingEdges[(*M)->Index];
343         if (NumUnusedEdges && (--NumUnusedEdges == 0))
344           Queue.push_back(*M);
345       }
346     }
347 
348     assert(VisitOrder.size() == N && "Visitation order is wrong?");
349 
350     delete FirstVisitState;
351     FirstVisitState = nullptr;
352   }
353 
354   VisitState *State = allocateVisitState();
355   unsigned VisitNumber = State->NextVisitNumber++;
356 
357   // If the caller has provided us with a hit-set that came from the global
358   // module index, mark every module file in common with the global module
359   // index that is *not* in that set as 'visited'.
360   if (ModuleFilesHit && !ModulesInCommonWithGlobalIndex.empty()) {
361     for (unsigned I = 0, N = ModulesInCommonWithGlobalIndex.size(); I != N; ++I)
362     {
363       ModuleFile *M = ModulesInCommonWithGlobalIndex[I];
364       if (!ModuleFilesHit->count(M))
365         State->VisitNumber[M->Index] = VisitNumber;
366     }
367   }
368 
369   for (unsigned I = 0, N = VisitOrder.size(); I != N; ++I) {
370     ModuleFile *CurrentModule = VisitOrder[I];
371     // Should we skip this module file?
372     if (State->VisitNumber[CurrentModule->Index] == VisitNumber)
373       continue;
374 
375     // Visit the module.
376     assert(State->VisitNumber[CurrentModule->Index] == VisitNumber - 1);
377     State->VisitNumber[CurrentModule->Index] = VisitNumber;
378     if (!Visitor(*CurrentModule))
379       continue;
380 
381     // The visitor has requested that cut off visitation of any
382     // module that the current module depends on. To indicate this
383     // behavior, we mark all of the reachable modules as having been visited.
384     ModuleFile *NextModule = CurrentModule;
385     do {
386       // For any module that this module depends on, push it on the
387       // stack (if it hasn't already been marked as visited).
388       for (llvm::SetVector<ModuleFile *>::iterator
389              M = NextModule->Imports.begin(),
390              MEnd = NextModule->Imports.end();
391            M != MEnd; ++M) {
392         if (State->VisitNumber[(*M)->Index] != VisitNumber) {
393           State->Stack.push_back(*M);
394           State->VisitNumber[(*M)->Index] = VisitNumber;
395         }
396       }
397 
398       if (State->Stack.empty())
399         break;
400 
401       // Pop the next module off the stack.
402       NextModule = State->Stack.pop_back_val();
403     } while (true);
404   }
405 
406   returnVisitState(State);
407 }
408 
409 bool ModuleManager::lookupModuleFile(StringRef FileName,
410                                      off_t ExpectedSize,
411                                      time_t ExpectedModTime,
412                                      const FileEntry *&File) {
413   // Open the file immediately to ensure there is no race between stat'ing and
414   // opening the file.
415   File = FileMgr.getFile(FileName, /*openFile=*/true, /*cacheFailure=*/false);
416 
417   if (!File && FileName != "-") {
418     return false;
419   }
420 
421   if ((ExpectedSize && ExpectedSize != File->getSize()) ||
422       (ExpectedModTime && ExpectedModTime != File->getModificationTime()))
423     // Do not destroy File, as it may be referenced. If we need to rebuild it,
424     // it will be destroyed by removeModules.
425     return true;
426 
427   return false;
428 }
429 
430 #ifndef NDEBUG
431 namespace llvm {
432   template<>
433   struct GraphTraits<ModuleManager> {
434     typedef ModuleFile NodeType;
435     typedef llvm::SetVector<ModuleFile *>::const_iterator ChildIteratorType;
436     typedef ModuleManager::ModuleConstIterator nodes_iterator;
437 
438     static ChildIteratorType child_begin(NodeType *Node) {
439       return Node->Imports.begin();
440     }
441 
442     static ChildIteratorType child_end(NodeType *Node) {
443       return Node->Imports.end();
444     }
445 
446     static nodes_iterator nodes_begin(const ModuleManager &Manager) {
447       return Manager.begin();
448     }
449 
450     static nodes_iterator nodes_end(const ModuleManager &Manager) {
451       return Manager.end();
452     }
453   };
454 
455   template<>
456   struct DOTGraphTraits<ModuleManager> : public DefaultDOTGraphTraits {
457     explicit DOTGraphTraits(bool IsSimple = false)
458       : DefaultDOTGraphTraits(IsSimple) { }
459 
460     static bool renderGraphFromBottomUp() {
461       return true;
462     }
463 
464     std::string getNodeLabel(ModuleFile *M, const ModuleManager&) {
465       return M->ModuleName;
466     }
467   };
468 }
469 
470 void ModuleManager::viewGraph() {
471   llvm::ViewGraph(*this, "Modules");
472 }
473 #endif
474