15e306b12SDouglas Gregor //===--- GlobalModuleIndex.cpp - Global Module Index ------------*- C++ -*-===//
25e306b12SDouglas Gregor //
35e306b12SDouglas Gregor //                     The LLVM Compiler Infrastructure
45e306b12SDouglas Gregor //
55e306b12SDouglas Gregor // This file is distributed under the University of Illinois Open Source
65e306b12SDouglas Gregor // License. See LICENSE.TXT for details.
75e306b12SDouglas Gregor //
85e306b12SDouglas Gregor //===----------------------------------------------------------------------===//
95e306b12SDouglas Gregor //
105e306b12SDouglas Gregor // This file implements the GlobalModuleIndex class.
115e306b12SDouglas Gregor //
125e306b12SDouglas Gregor //===----------------------------------------------------------------------===//
135e306b12SDouglas Gregor 
145e306b12SDouglas Gregor #include "ASTReaderInternals.h"
15*bb165fb0SAdrian Prantl #include "clang/Frontend/PCHContainerOperations.h"
165e306b12SDouglas Gregor #include "clang/Basic/FileManager.h"
17beee15e7SBen Langmuir #include "clang/Lex/HeaderSearch.h"
185e306b12SDouglas Gregor #include "clang/Serialization/ASTBitCodes.h"
195e306b12SDouglas Gregor #include "clang/Serialization/GlobalModuleIndex.h"
20603cd869SDouglas Gregor #include "clang/Serialization/Module.h"
215e306b12SDouglas Gregor #include "llvm/ADT/DenseMap.h"
225e306b12SDouglas Gregor #include "llvm/ADT/MapVector.h"
235e306b12SDouglas Gregor #include "llvm/ADT/SmallString.h"
245e306b12SDouglas Gregor #include "llvm/ADT/StringExtras.h"
255e306b12SDouglas Gregor #include "llvm/Bitcode/BitstreamReader.h"
265e306b12SDouglas Gregor #include "llvm/Bitcode/BitstreamWriter.h"
278ec343ccSDouglas Gregor #include "llvm/Support/FileSystem.h"
285e306b12SDouglas Gregor #include "llvm/Support/LockFileManager.h"
295e306b12SDouglas Gregor #include "llvm/Support/MemoryBuffer.h"
30bb094f06SJustin Bogner #include "llvm/Support/OnDiskHashTable.h"
31552c169eSRafael Espindola #include "llvm/Support/Path.h"
32f0add23aSNAKAMURA Takumi #include <cstdio>
335e306b12SDouglas Gregor using namespace clang;
345e306b12SDouglas Gregor using namespace serialization;
355e306b12SDouglas Gregor 
365e306b12SDouglas Gregor //----------------------------------------------------------------------------//
375e306b12SDouglas Gregor // Shared constants
385e306b12SDouglas Gregor //----------------------------------------------------------------------------//
395e306b12SDouglas Gregor namespace {
405e306b12SDouglas Gregor   enum {
415e306b12SDouglas Gregor     /// \brief The block containing the index.
425e306b12SDouglas Gregor     GLOBAL_INDEX_BLOCK_ID = llvm::bitc::FIRST_APPLICATION_BLOCKID
435e306b12SDouglas Gregor   };
445e306b12SDouglas Gregor 
455e306b12SDouglas Gregor   /// \brief Describes the record types in the index.
465e306b12SDouglas Gregor   enum IndexRecordTypes {
475e306b12SDouglas Gregor     /// \brief Contains version information and potentially other metadata,
485e306b12SDouglas Gregor     /// used to determine if we can read this global index file.
49e060e57bSDouglas Gregor     INDEX_METADATA,
505e306b12SDouglas Gregor     /// \brief Describes a module, including its file name and dependencies.
515e306b12SDouglas Gregor     MODULE,
525e306b12SDouglas Gregor     /// \brief The index for identifiers.
535e306b12SDouglas Gregor     IDENTIFIER_INDEX
545e306b12SDouglas Gregor   };
555e306b12SDouglas Gregor }
565e306b12SDouglas Gregor 
575e306b12SDouglas Gregor /// \brief The name of the global index file.
585e306b12SDouglas Gregor static const char * const IndexFileName = "modules.idx";
595e306b12SDouglas Gregor 
605e306b12SDouglas Gregor /// \brief The global index file version.
615e306b12SDouglas Gregor static const unsigned CurrentVersion = 1;
625e306b12SDouglas Gregor 
635e306b12SDouglas Gregor //----------------------------------------------------------------------------//
64e060e57bSDouglas Gregor // Global module index reader.
65e060e57bSDouglas Gregor //----------------------------------------------------------------------------//
66e060e57bSDouglas Gregor 
67e060e57bSDouglas Gregor namespace {
68e060e57bSDouglas Gregor 
69e060e57bSDouglas Gregor /// \brief Trait used to read the identifier index from the on-disk hash
70e060e57bSDouglas Gregor /// table.
71e060e57bSDouglas Gregor class IdentifierIndexReaderTrait {
72e060e57bSDouglas Gregor public:
73e060e57bSDouglas Gregor   typedef StringRef external_key_type;
74e060e57bSDouglas Gregor   typedef StringRef internal_key_type;
75e060e57bSDouglas Gregor   typedef SmallVector<unsigned, 2> data_type;
7625463f15SJustin Bogner   typedef unsigned hash_value_type;
7725463f15SJustin Bogner   typedef unsigned offset_type;
78e060e57bSDouglas Gregor 
79e060e57bSDouglas Gregor   static bool EqualKey(const internal_key_type& a, const internal_key_type& b) {
80e060e57bSDouglas Gregor     return a == b;
81e060e57bSDouglas Gregor   }
82e060e57bSDouglas Gregor 
8325463f15SJustin Bogner   static hash_value_type ComputeHash(const internal_key_type& a) {
84e060e57bSDouglas Gregor     return llvm::HashString(a);
85e060e57bSDouglas Gregor   }
86e060e57bSDouglas Gregor 
87e060e57bSDouglas Gregor   static std::pair<unsigned, unsigned>
88e060e57bSDouglas Gregor   ReadKeyDataLength(const unsigned char*& d) {
8957ba0b22SJustin Bogner     using namespace llvm::support;
9057ba0b22SJustin Bogner     unsigned KeyLen = endian::readNext<uint16_t, little, unaligned>(d);
9157ba0b22SJustin Bogner     unsigned DataLen = endian::readNext<uint16_t, little, unaligned>(d);
92e060e57bSDouglas Gregor     return std::make_pair(KeyLen, DataLen);
93e060e57bSDouglas Gregor   }
94e060e57bSDouglas Gregor 
95e060e57bSDouglas Gregor   static const internal_key_type&
96e060e57bSDouglas Gregor   GetInternalKey(const external_key_type& x) { return x; }
97e060e57bSDouglas Gregor 
98e060e57bSDouglas Gregor   static const external_key_type&
99e060e57bSDouglas Gregor   GetExternalKey(const internal_key_type& x) { return x; }
100e060e57bSDouglas Gregor 
101e060e57bSDouglas Gregor   static internal_key_type ReadKey(const unsigned char* d, unsigned n) {
102e060e57bSDouglas Gregor     return StringRef((const char *)d, n);
103e060e57bSDouglas Gregor   }
104e060e57bSDouglas Gregor 
105e060e57bSDouglas Gregor   static data_type ReadData(const internal_key_type& k,
106e060e57bSDouglas Gregor                             const unsigned char* d,
107e060e57bSDouglas Gregor                             unsigned DataLen) {
10857ba0b22SJustin Bogner     using namespace llvm::support;
109e060e57bSDouglas Gregor 
110e060e57bSDouglas Gregor     data_type Result;
111e060e57bSDouglas Gregor     while (DataLen > 0) {
11257ba0b22SJustin Bogner       unsigned ID = endian::readNext<uint32_t, little, unaligned>(d);
113e060e57bSDouglas Gregor       Result.push_back(ID);
114e060e57bSDouglas Gregor       DataLen -= 4;
115e060e57bSDouglas Gregor     }
116e060e57bSDouglas Gregor 
117e060e57bSDouglas Gregor     return Result;
118e060e57bSDouglas Gregor   }
119e060e57bSDouglas Gregor };
120e060e57bSDouglas Gregor 
121bb094f06SJustin Bogner typedef llvm::OnDiskIterableChainedHashTable<IdentifierIndexReaderTrait>
122da4e650eSJustin Bogner     IdentifierIndexTable;
123e060e57bSDouglas Gregor 
124e060e57bSDouglas Gregor }
125e060e57bSDouglas Gregor 
126afa10d3eSDavid Blaikie GlobalModuleIndex::GlobalModuleIndex(std::unique_ptr<llvm::MemoryBuffer> Buffer,
127e060e57bSDouglas Gregor                                      llvm::BitstreamCursor Cursor)
128afa10d3eSDavid Blaikie     : Buffer(std::move(Buffer)), IdentifierIndex(), NumIdentifierLookups(),
129afa10d3eSDavid Blaikie       NumIdentifierLookupHits() {
130e060e57bSDouglas Gregor   // Read the global index.
131e060e57bSDouglas Gregor   bool InGlobalIndexBlock = false;
132e060e57bSDouglas Gregor   bool Done = false;
133e060e57bSDouglas Gregor   while (!Done) {
134e060e57bSDouglas Gregor     llvm::BitstreamEntry Entry = Cursor.advance();
135e060e57bSDouglas Gregor 
136e060e57bSDouglas Gregor     switch (Entry.Kind) {
137e060e57bSDouglas Gregor     case llvm::BitstreamEntry::Error:
138e060e57bSDouglas Gregor       return;
139e060e57bSDouglas Gregor 
140e060e57bSDouglas Gregor     case llvm::BitstreamEntry::EndBlock:
141e060e57bSDouglas Gregor       if (InGlobalIndexBlock) {
142e060e57bSDouglas Gregor         InGlobalIndexBlock = false;
143e060e57bSDouglas Gregor         Done = true;
144e060e57bSDouglas Gregor         continue;
145e060e57bSDouglas Gregor       }
146e060e57bSDouglas Gregor       return;
147e060e57bSDouglas Gregor 
148e060e57bSDouglas Gregor 
149e060e57bSDouglas Gregor     case llvm::BitstreamEntry::Record:
150e060e57bSDouglas Gregor       // Entries in the global index block are handled below.
151e060e57bSDouglas Gregor       if (InGlobalIndexBlock)
152e060e57bSDouglas Gregor         break;
153e060e57bSDouglas Gregor 
154e060e57bSDouglas Gregor       return;
155e060e57bSDouglas Gregor 
156e060e57bSDouglas Gregor     case llvm::BitstreamEntry::SubBlock:
157e060e57bSDouglas Gregor       if (!InGlobalIndexBlock && Entry.ID == GLOBAL_INDEX_BLOCK_ID) {
158e060e57bSDouglas Gregor         if (Cursor.EnterSubBlock(GLOBAL_INDEX_BLOCK_ID))
159e060e57bSDouglas Gregor           return;
160e060e57bSDouglas Gregor 
161e060e57bSDouglas Gregor         InGlobalIndexBlock = true;
162e060e57bSDouglas Gregor       } else if (Cursor.SkipBlock()) {
163e060e57bSDouglas Gregor         return;
164e060e57bSDouglas Gregor       }
165e060e57bSDouglas Gregor       continue;
166e060e57bSDouglas Gregor     }
167e060e57bSDouglas Gregor 
168e060e57bSDouglas Gregor     SmallVector<uint64_t, 64> Record;
169e060e57bSDouglas Gregor     StringRef Blob;
170e060e57bSDouglas Gregor     switch ((IndexRecordTypes)Cursor.readRecord(Entry.ID, Record, &Blob)) {
171e060e57bSDouglas Gregor     case INDEX_METADATA:
172e060e57bSDouglas Gregor       // Make sure that the version matches.
173e060e57bSDouglas Gregor       if (Record.size() < 1 || Record[0] != CurrentVersion)
174e060e57bSDouglas Gregor         return;
175e060e57bSDouglas Gregor       break;
176e060e57bSDouglas Gregor 
177e060e57bSDouglas Gregor     case MODULE: {
178e060e57bSDouglas Gregor       unsigned Idx = 0;
179e060e57bSDouglas Gregor       unsigned ID = Record[Idx++];
180e060e57bSDouglas Gregor 
1817029ce1aSDouglas Gregor       // Make room for this module's information.
1827029ce1aSDouglas Gregor       if (ID == Modules.size())
1837029ce1aSDouglas Gregor         Modules.push_back(ModuleInfo());
1847029ce1aSDouglas Gregor       else
1857029ce1aSDouglas Gregor         Modules.resize(ID + 1);
1867029ce1aSDouglas Gregor 
1877029ce1aSDouglas Gregor       // Size/modification time for this module file at the time the
1887029ce1aSDouglas Gregor       // global index was built.
1897029ce1aSDouglas Gregor       Modules[ID].Size = Record[Idx++];
1907029ce1aSDouglas Gregor       Modules[ID].ModTime = Record[Idx++];
191e060e57bSDouglas Gregor 
192e060e57bSDouglas Gregor       // File name.
193e060e57bSDouglas Gregor       unsigned NameLen = Record[Idx++];
1947029ce1aSDouglas Gregor       Modules[ID].FileName.assign(Record.begin() + Idx,
195e060e57bSDouglas Gregor                                   Record.begin() + Idx + NameLen);
196e060e57bSDouglas Gregor       Idx += NameLen;
197e060e57bSDouglas Gregor 
198e060e57bSDouglas Gregor       // Dependencies
199e060e57bSDouglas Gregor       unsigned NumDeps = Record[Idx++];
2007029ce1aSDouglas Gregor       Modules[ID].Dependencies.insert(Modules[ID].Dependencies.end(),
2017029ce1aSDouglas Gregor                                       Record.begin() + Idx,
2027029ce1aSDouglas Gregor                                       Record.begin() + Idx + NumDeps);
2037029ce1aSDouglas Gregor       Idx += NumDeps;
204e060e57bSDouglas Gregor 
2057029ce1aSDouglas Gregor       // Make sure we're at the end of the record.
2067029ce1aSDouglas Gregor       assert(Idx == Record.size() && "More module info?");
207603cd869SDouglas Gregor 
208603cd869SDouglas Gregor       // Record this module as an unresolved module.
209beee15e7SBen Langmuir       // FIXME: this doesn't work correctly for module names containing path
210beee15e7SBen Langmuir       // separators.
211beee15e7SBen Langmuir       StringRef ModuleName = llvm::sys::path::stem(Modules[ID].FileName);
212beee15e7SBen Langmuir       // Remove the -<hash of ModuleMapPath>
213beee15e7SBen Langmuir       ModuleName = ModuleName.rsplit('-').first;
214beee15e7SBen Langmuir       UnresolvedModules[ModuleName] = ID;
215e060e57bSDouglas Gregor       break;
216e060e57bSDouglas Gregor     }
217e060e57bSDouglas Gregor 
218e060e57bSDouglas Gregor     case IDENTIFIER_INDEX:
219e060e57bSDouglas Gregor       // Wire up the identifier index.
220e060e57bSDouglas Gregor       if (Record[0]) {
221e060e57bSDouglas Gregor         IdentifierIndex = IdentifierIndexTable::Create(
222e060e57bSDouglas Gregor             (const unsigned char *)Blob.data() + Record[0],
223da4e650eSJustin Bogner             (const unsigned char *)Blob.data() + sizeof(uint32_t),
224da4e650eSJustin Bogner             (const unsigned char *)Blob.data(), IdentifierIndexReaderTrait());
225e060e57bSDouglas Gregor       }
226e060e57bSDouglas Gregor       break;
227e060e57bSDouglas Gregor     }
228e060e57bSDouglas Gregor   }
229e060e57bSDouglas Gregor }
230e060e57bSDouglas Gregor 
231e68b847fSNico Weber GlobalModuleIndex::~GlobalModuleIndex() {
232e68b847fSNico Weber   delete static_cast<IdentifierIndexTable *>(IdentifierIndex);
233e68b847fSNico Weber }
234e060e57bSDouglas Gregor 
235e060e57bSDouglas Gregor std::pair<GlobalModuleIndex *, GlobalModuleIndex::ErrorCode>
2367029ce1aSDouglas Gregor GlobalModuleIndex::readIndex(StringRef Path) {
237e060e57bSDouglas Gregor   // Load the index file, if it's there.
238e060e57bSDouglas Gregor   llvm::SmallString<128> IndexPath;
239e060e57bSDouglas Gregor   IndexPath += Path;
240e060e57bSDouglas Gregor   llvm::sys::path::append(IndexPath, IndexFileName);
241e060e57bSDouglas Gregor 
2422d2b420aSRafael Espindola   llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> BufferOrErr =
2432d2b420aSRafael Espindola       llvm::MemoryBuffer::getFile(IndexPath.c_str());
2442d2b420aSRafael Espindola   if (!BufferOrErr)
245a13603a2SCraig Topper     return std::make_pair(nullptr, EC_NotFound);
2462d2b420aSRafael Espindola   std::unique_ptr<llvm::MemoryBuffer> Buffer = std::move(BufferOrErr.get());
247e060e57bSDouglas Gregor 
248e060e57bSDouglas Gregor   /// \brief The bitstream reader from which we'll read the AST file.
249e060e57bSDouglas Gregor   llvm::BitstreamReader Reader((const unsigned char *)Buffer->getBufferStart(),
250e060e57bSDouglas Gregor                                (const unsigned char *)Buffer->getBufferEnd());
251e060e57bSDouglas Gregor 
252e060e57bSDouglas Gregor   /// \brief The main bitstream cursor for the main block.
253e060e57bSDouglas Gregor   llvm::BitstreamCursor Cursor(Reader);
254e060e57bSDouglas Gregor 
255e060e57bSDouglas Gregor   // Sniff for the signature.
256e060e57bSDouglas Gregor   if (Cursor.Read(8) != 'B' ||
257e060e57bSDouglas Gregor       Cursor.Read(8) != 'C' ||
258e060e57bSDouglas Gregor       Cursor.Read(8) != 'G' ||
259e060e57bSDouglas Gregor       Cursor.Read(8) != 'I') {
260a13603a2SCraig Topper     return std::make_pair(nullptr, EC_IOError);
261e060e57bSDouglas Gregor   }
262e060e57bSDouglas Gregor 
263afa10d3eSDavid Blaikie   return std::make_pair(new GlobalModuleIndex(std::move(Buffer), Cursor),
2649a16beb8SAhmed Charles                         EC_None);
265e060e57bSDouglas Gregor }
266e060e57bSDouglas Gregor 
2677029ce1aSDouglas Gregor void
2687029ce1aSDouglas Gregor GlobalModuleIndex::getKnownModules(SmallVectorImpl<ModuleFile *> &ModuleFiles) {
269e060e57bSDouglas Gregor   ModuleFiles.clear();
270e060e57bSDouglas Gregor   for (unsigned I = 0, N = Modules.size(); I != N; ++I) {
271603cd869SDouglas Gregor     if (ModuleFile *MF = Modules[I].File)
272603cd869SDouglas Gregor       ModuleFiles.push_back(MF);
273e060e57bSDouglas Gregor   }
274e060e57bSDouglas Gregor }
275e060e57bSDouglas Gregor 
276e060e57bSDouglas Gregor void GlobalModuleIndex::getModuleDependencies(
2777029ce1aSDouglas Gregor        ModuleFile *File,
2787029ce1aSDouglas Gregor        SmallVectorImpl<ModuleFile *> &Dependencies) {
279e060e57bSDouglas Gregor   // Look for information about this module file.
2807029ce1aSDouglas Gregor   llvm::DenseMap<ModuleFile *, unsigned>::iterator Known
2817029ce1aSDouglas Gregor     = ModulesByFile.find(File);
282e060e57bSDouglas Gregor   if (Known == ModulesByFile.end())
283e060e57bSDouglas Gregor     return;
284e060e57bSDouglas Gregor 
285e060e57bSDouglas Gregor   // Record dependencies.
2867029ce1aSDouglas Gregor   Dependencies.clear();
2877029ce1aSDouglas Gregor   ArrayRef<unsigned> StoredDependencies = Modules[Known->second].Dependencies;
2887029ce1aSDouglas Gregor   for (unsigned I = 0, N = StoredDependencies.size(); I != N; ++I) {
289603cd869SDouglas Gregor     if (ModuleFile *MF = Modules[I].File)
2907029ce1aSDouglas Gregor       Dependencies.push_back(MF);
2917029ce1aSDouglas Gregor   }
292e060e57bSDouglas Gregor }
293e060e57bSDouglas Gregor 
2947211ac15SDouglas Gregor bool GlobalModuleIndex::lookupIdentifier(StringRef Name, HitSet &Hits) {
2957211ac15SDouglas Gregor   Hits.clear();
296e060e57bSDouglas Gregor 
297e060e57bSDouglas Gregor   // If there's no identifier index, there is nothing we can do.
298e060e57bSDouglas Gregor   if (!IdentifierIndex)
299e060e57bSDouglas Gregor     return false;
300e060e57bSDouglas Gregor 
301e060e57bSDouglas Gregor   // Look into the identifier index.
302e060e57bSDouglas Gregor   ++NumIdentifierLookups;
303e060e57bSDouglas Gregor   IdentifierIndexTable &Table
304e060e57bSDouglas Gregor     = *static_cast<IdentifierIndexTable *>(IdentifierIndex);
305e060e57bSDouglas Gregor   IdentifierIndexTable::iterator Known = Table.find(Name);
306e060e57bSDouglas Gregor   if (Known == Table.end()) {
307e060e57bSDouglas Gregor     return true;
308e060e57bSDouglas Gregor   }
309e060e57bSDouglas Gregor 
310e060e57bSDouglas Gregor   SmallVector<unsigned, 2> ModuleIDs = *Known;
311e060e57bSDouglas Gregor   for (unsigned I = 0, N = ModuleIDs.size(); I != N; ++I) {
312603cd869SDouglas Gregor     if (ModuleFile *MF = Modules[ModuleIDs[I]].File)
313603cd869SDouglas Gregor       Hits.insert(MF);
314e060e57bSDouglas Gregor   }
315e060e57bSDouglas Gregor 
316e060e57bSDouglas Gregor   ++NumIdentifierLookupHits;
317e060e57bSDouglas Gregor   return true;
318e060e57bSDouglas Gregor }
319e060e57bSDouglas Gregor 
320603cd869SDouglas Gregor bool GlobalModuleIndex::loadedModuleFile(ModuleFile *File) {
321603cd869SDouglas Gregor   // Look for the module in the global module index based on the module name.
322beee15e7SBen Langmuir   StringRef Name = File->ModuleName;
323603cd869SDouglas Gregor   llvm::StringMap<unsigned>::iterator Known = UnresolvedModules.find(Name);
324603cd869SDouglas Gregor   if (Known == UnresolvedModules.end()) {
325603cd869SDouglas Gregor     return true;
3267029ce1aSDouglas Gregor   }
3277029ce1aSDouglas Gregor 
328603cd869SDouglas Gregor   // Rectify this module with the global module index.
329603cd869SDouglas Gregor   ModuleInfo &Info = Modules[Known->second];
330603cd869SDouglas Gregor 
331603cd869SDouglas Gregor   //  If the size and modification time match what we expected, record this
332603cd869SDouglas Gregor   // module file.
333603cd869SDouglas Gregor   bool Failed = true;
334603cd869SDouglas Gregor   if (File->File->getSize() == Info.Size &&
335603cd869SDouglas Gregor       File->File->getModificationTime() == Info.ModTime) {
336603cd869SDouglas Gregor     Info.File = File;
337603cd869SDouglas Gregor     ModulesByFile[File] = Known->second;
338603cd869SDouglas Gregor 
339603cd869SDouglas Gregor     Failed = false;
3407029ce1aSDouglas Gregor   }
3417029ce1aSDouglas Gregor 
342603cd869SDouglas Gregor   // One way or another, we have resolved this module file.
343603cd869SDouglas Gregor   UnresolvedModules.erase(Known);
344603cd869SDouglas Gregor   return Failed;
3457029ce1aSDouglas Gregor }
3467029ce1aSDouglas Gregor 
347e060e57bSDouglas Gregor void GlobalModuleIndex::printStats() {
348e060e57bSDouglas Gregor   std::fprintf(stderr, "*** Global Module Index Statistics:\n");
349e060e57bSDouglas Gregor   if (NumIdentifierLookups) {
350e060e57bSDouglas Gregor     fprintf(stderr, "  %u / %u identifier lookups succeeded (%f%%)\n",
351e060e57bSDouglas Gregor             NumIdentifierLookupHits, NumIdentifierLookups,
352e060e57bSDouglas Gregor             (double)NumIdentifierLookupHits*100.0/NumIdentifierLookups);
353e060e57bSDouglas Gregor   }
354e060e57bSDouglas Gregor   std::fprintf(stderr, "\n");
355e060e57bSDouglas Gregor }
356e060e57bSDouglas Gregor 
357bcdcc92eSJohn Thompson void GlobalModuleIndex::dump() {
358a39baf1aSJohn Thompson   llvm::errs() << "*** Global Module Index Dump:\n";
359a39baf1aSJohn Thompson   llvm::errs() << "Module files:\n";
3604f52d44dSJohn Thompson   for (auto &MI : Modules) {
361a39baf1aSJohn Thompson     llvm::errs() << "** " << MI.FileName << "\n";
362a39baf1aSJohn Thompson     if (MI.File)
363a39baf1aSJohn Thompson       MI.File->dump();
364bcdcc92eSJohn Thompson     else
365a39baf1aSJohn Thompson       llvm::errs() << "\n";
366bcdcc92eSJohn Thompson   }
367a39baf1aSJohn Thompson   llvm::errs() << "\n";
368bcdcc92eSJohn Thompson }
369bcdcc92eSJohn Thompson 
370e060e57bSDouglas Gregor //----------------------------------------------------------------------------//
3715e306b12SDouglas Gregor // Global module index writer.
3725e306b12SDouglas Gregor //----------------------------------------------------------------------------//
3735e306b12SDouglas Gregor 
3745e306b12SDouglas Gregor namespace {
3755e306b12SDouglas Gregor   /// \brief Provides information about a specific module file.
3765e306b12SDouglas Gregor   struct ModuleFileInfo {
3775e306b12SDouglas Gregor     /// \brief The numberic ID for this module file.
3785e306b12SDouglas Gregor     unsigned ID;
3795e306b12SDouglas Gregor 
3805e306b12SDouglas Gregor     /// \brief The set of modules on which this module depends. Each entry is
3815e306b12SDouglas Gregor     /// a module ID.
3825e306b12SDouglas Gregor     SmallVector<unsigned, 4> Dependencies;
3835e306b12SDouglas Gregor   };
3845e306b12SDouglas Gregor 
3855e306b12SDouglas Gregor   /// \brief Builder that generates the global module index file.
3865e306b12SDouglas Gregor   class GlobalModuleIndexBuilder {
3875e306b12SDouglas Gregor     FileManager &FileMgr;
388*bb165fb0SAdrian Prantl     const PCHContainerOperations &PCHContainerOps;
3895e306b12SDouglas Gregor 
3905e306b12SDouglas Gregor     /// \brief Mapping from files to module file information.
3915e306b12SDouglas Gregor     typedef llvm::MapVector<const FileEntry *, ModuleFileInfo> ModuleFilesMap;
3925e306b12SDouglas Gregor 
3935e306b12SDouglas Gregor     /// \brief Information about each of the known module files.
3945e306b12SDouglas Gregor     ModuleFilesMap ModuleFiles;
3955e306b12SDouglas Gregor 
3965e306b12SDouglas Gregor     /// \brief Mapping from identifiers to the list of module file IDs that
3975e306b12SDouglas Gregor     /// consider this identifier to be interesting.
3985e306b12SDouglas Gregor     typedef llvm::StringMap<SmallVector<unsigned, 2> > InterestingIdentifierMap;
3995e306b12SDouglas Gregor 
4005e306b12SDouglas Gregor     /// \brief A mapping from all interesting identifiers to the set of module
4015e306b12SDouglas Gregor     /// files in which those identifiers are considered interesting.
4025e306b12SDouglas Gregor     InterestingIdentifierMap InterestingIdentifiers;
4035e306b12SDouglas Gregor 
4045e306b12SDouglas Gregor     /// \brief Write the block-info block for the global module index file.
4055e306b12SDouglas Gregor     void emitBlockInfoBlock(llvm::BitstreamWriter &Stream);
4065e306b12SDouglas Gregor 
4075e306b12SDouglas Gregor     /// \brief Retrieve the module file information for the given file.
4085e306b12SDouglas Gregor     ModuleFileInfo &getModuleFileInfo(const FileEntry *File) {
4095e306b12SDouglas Gregor       llvm::MapVector<const FileEntry *, ModuleFileInfo>::iterator Known
4105e306b12SDouglas Gregor         = ModuleFiles.find(File);
4115e306b12SDouglas Gregor       if (Known != ModuleFiles.end())
4125e306b12SDouglas Gregor         return Known->second;
4135e306b12SDouglas Gregor 
4145e306b12SDouglas Gregor       unsigned NewID = ModuleFiles.size();
4155e306b12SDouglas Gregor       ModuleFileInfo &Info = ModuleFiles[File];
4165e306b12SDouglas Gregor       Info.ID = NewID;
4175e306b12SDouglas Gregor       return Info;
4185e306b12SDouglas Gregor     }
4195e306b12SDouglas Gregor 
4205e306b12SDouglas Gregor   public:
421*bb165fb0SAdrian Prantl     explicit GlobalModuleIndexBuilder(
422*bb165fb0SAdrian Prantl         FileManager &FileMgr, const PCHContainerOperations &PCHContainerOps)
423*bb165fb0SAdrian Prantl         : FileMgr(FileMgr), PCHContainerOps(PCHContainerOps) {}
4245e306b12SDouglas Gregor 
4255e306b12SDouglas Gregor     /// \brief Load the contents of the given module file into the builder.
4265e306b12SDouglas Gregor     ///
4275e306b12SDouglas Gregor     /// \returns true if an error occurred, false otherwise.
4285e306b12SDouglas Gregor     bool loadModuleFile(const FileEntry *File);
4295e306b12SDouglas Gregor 
4305e306b12SDouglas Gregor     /// \brief Write the index to the given bitstream.
4315e306b12SDouglas Gregor     void writeIndex(llvm::BitstreamWriter &Stream);
4325e306b12SDouglas Gregor   };
4335e306b12SDouglas Gregor }
4345e306b12SDouglas Gregor 
4355e306b12SDouglas Gregor static void emitBlockID(unsigned ID, const char *Name,
4365e306b12SDouglas Gregor                         llvm::BitstreamWriter &Stream,
4375e306b12SDouglas Gregor                         SmallVectorImpl<uint64_t> &Record) {
4385e306b12SDouglas Gregor   Record.clear();
4395e306b12SDouglas Gregor   Record.push_back(ID);
4405e306b12SDouglas Gregor   Stream.EmitRecord(llvm::bitc::BLOCKINFO_CODE_SETBID, Record);
4415e306b12SDouglas Gregor 
4425e306b12SDouglas Gregor   // Emit the block name if present.
443a13603a2SCraig Topper   if (!Name || Name[0] == 0) return;
4445e306b12SDouglas Gregor   Record.clear();
4455e306b12SDouglas Gregor   while (*Name)
4465e306b12SDouglas Gregor     Record.push_back(*Name++);
4475e306b12SDouglas Gregor   Stream.EmitRecord(llvm::bitc::BLOCKINFO_CODE_BLOCKNAME, Record);
4485e306b12SDouglas Gregor }
4495e306b12SDouglas Gregor 
4505e306b12SDouglas Gregor static void emitRecordID(unsigned ID, const char *Name,
4515e306b12SDouglas Gregor                          llvm::BitstreamWriter &Stream,
4525e306b12SDouglas Gregor                          SmallVectorImpl<uint64_t> &Record) {
4535e306b12SDouglas Gregor   Record.clear();
4545e306b12SDouglas Gregor   Record.push_back(ID);
4555e306b12SDouglas Gregor   while (*Name)
4565e306b12SDouglas Gregor     Record.push_back(*Name++);
4575e306b12SDouglas Gregor   Stream.EmitRecord(llvm::bitc::BLOCKINFO_CODE_SETRECORDNAME, Record);
4585e306b12SDouglas Gregor }
4595e306b12SDouglas Gregor 
4605e306b12SDouglas Gregor void
4615e306b12SDouglas Gregor GlobalModuleIndexBuilder::emitBlockInfoBlock(llvm::BitstreamWriter &Stream) {
4625e306b12SDouglas Gregor   SmallVector<uint64_t, 64> Record;
4635e306b12SDouglas Gregor   Stream.EnterSubblock(llvm::bitc::BLOCKINFO_BLOCK_ID, 3);
4645e306b12SDouglas Gregor 
4655e306b12SDouglas Gregor #define BLOCK(X) emitBlockID(X ## _ID, #X, Stream, Record)
4665e306b12SDouglas Gregor #define RECORD(X) emitRecordID(X, #X, Stream, Record)
4675e306b12SDouglas Gregor   BLOCK(GLOBAL_INDEX_BLOCK);
468e060e57bSDouglas Gregor   RECORD(INDEX_METADATA);
4695e306b12SDouglas Gregor   RECORD(MODULE);
4705e306b12SDouglas Gregor   RECORD(IDENTIFIER_INDEX);
4715e306b12SDouglas Gregor #undef RECORD
4725e306b12SDouglas Gregor #undef BLOCK
4735e306b12SDouglas Gregor 
4745e306b12SDouglas Gregor   Stream.ExitBlock();
4755e306b12SDouglas Gregor }
4765e306b12SDouglas Gregor 
477e060e57bSDouglas Gregor namespace {
4785e306b12SDouglas Gregor   class InterestingASTIdentifierLookupTrait
4795e306b12SDouglas Gregor     : public serialization::reader::ASTIdentifierLookupTraitBase {
4805e306b12SDouglas Gregor 
4815e306b12SDouglas Gregor   public:
4825e306b12SDouglas Gregor     /// \brief The identifier and whether it is "interesting".
4835e306b12SDouglas Gregor     typedef std::pair<StringRef, bool> data_type;
4845e306b12SDouglas Gregor 
4855e306b12SDouglas Gregor     data_type ReadData(const internal_key_type& k,
4865e306b12SDouglas Gregor                        const unsigned char* d,
4875e306b12SDouglas Gregor                        unsigned DataLen) {
4885e306b12SDouglas Gregor       // The first bit indicates whether this identifier is interesting.
4895e306b12SDouglas Gregor       // That's all we care about.
49057ba0b22SJustin Bogner       using namespace llvm::support;
49157ba0b22SJustin Bogner       unsigned RawID = endian::readNext<uint32_t, little, unaligned>(d);
4925e306b12SDouglas Gregor       bool IsInteresting = RawID & 0x01;
4935e306b12SDouglas Gregor       return std::make_pair(k, IsInteresting);
4945e306b12SDouglas Gregor     }
4955e306b12SDouglas Gregor   };
4965e306b12SDouglas Gregor }
4975e306b12SDouglas Gregor 
4985e306b12SDouglas Gregor bool GlobalModuleIndexBuilder::loadModuleFile(const FileEntry *File) {
4995e306b12SDouglas Gregor   // Open the module file.
5006406f7b8SRafael Espindola 
501a885796dSBenjamin Kramer   auto Buffer = FileMgr.getBufferForFile(File, /*isVolatile=*/true);
5025e306b12SDouglas Gregor   if (!Buffer) {
5035e306b12SDouglas Gregor     return true;
5045e306b12SDouglas Gregor   }
5055e306b12SDouglas Gregor 
5065e306b12SDouglas Gregor   // Initialize the input stream
5075e306b12SDouglas Gregor   llvm::BitstreamReader InStreamFile;
508*bb165fb0SAdrian Prantl   PCHContainerOps.ExtractPCH((*Buffer)->getMemBufferRef(), InStreamFile);
509af0e40acSRafael Espindola   llvm::BitstreamCursor InStream(InStreamFile);
5105e306b12SDouglas Gregor 
5115e306b12SDouglas Gregor   // Sniff for the signature.
5125e306b12SDouglas Gregor   if (InStream.Read(8) != 'C' ||
5135e306b12SDouglas Gregor       InStream.Read(8) != 'P' ||
5145e306b12SDouglas Gregor       InStream.Read(8) != 'C' ||
5155e306b12SDouglas Gregor       InStream.Read(8) != 'H') {
5165e306b12SDouglas Gregor     return true;
5175e306b12SDouglas Gregor   }
5185e306b12SDouglas Gregor 
5195e306b12SDouglas Gregor   // Record this module file and assign it a unique ID (if it doesn't have
5205e306b12SDouglas Gregor   // one already).
5215e306b12SDouglas Gregor   unsigned ID = getModuleFileInfo(File).ID;
5225e306b12SDouglas Gregor 
5235e306b12SDouglas Gregor   // Search for the blocks and records we care about.
524e060e57bSDouglas Gregor   enum { Other, ControlBlock, ASTBlock } State = Other;
5255e306b12SDouglas Gregor   bool Done = false;
5265e306b12SDouglas Gregor   while (!Done) {
527e060e57bSDouglas Gregor     llvm::BitstreamEntry Entry = InStream.advance();
5285e306b12SDouglas Gregor     switch (Entry.Kind) {
5295e306b12SDouglas Gregor     case llvm::BitstreamEntry::Error:
530e060e57bSDouglas Gregor       Done = true;
531e060e57bSDouglas Gregor       continue;
5325e306b12SDouglas Gregor 
5335e306b12SDouglas Gregor     case llvm::BitstreamEntry::Record:
534e060e57bSDouglas Gregor       // In the 'other' state, just skip the record. We don't care.
535e060e57bSDouglas Gregor       if (State == Other) {
5365e306b12SDouglas Gregor         InStream.skipRecord(Entry.ID);
5375e306b12SDouglas Gregor         continue;
5385e306b12SDouglas Gregor       }
5395e306b12SDouglas Gregor 
5405e306b12SDouglas Gregor       // Handle potentially-interesting records below.
5415e306b12SDouglas Gregor       break;
5425e306b12SDouglas Gregor 
5435e306b12SDouglas Gregor     case llvm::BitstreamEntry::SubBlock:
544e060e57bSDouglas Gregor       if (Entry.ID == CONTROL_BLOCK_ID) {
5455e306b12SDouglas Gregor         if (InStream.EnterSubBlock(CONTROL_BLOCK_ID))
5465e306b12SDouglas Gregor           return true;
5475e306b12SDouglas Gregor 
5485e306b12SDouglas Gregor         // Found the control block.
5495e306b12SDouglas Gregor         State = ControlBlock;
5505e306b12SDouglas Gregor         continue;
5515e306b12SDouglas Gregor       }
5525e306b12SDouglas Gregor 
553e060e57bSDouglas Gregor       if (Entry.ID == AST_BLOCK_ID) {
5545e306b12SDouglas Gregor         if (InStream.EnterSubBlock(AST_BLOCK_ID))
5555e306b12SDouglas Gregor           return true;
5565e306b12SDouglas Gregor 
5575e306b12SDouglas Gregor         // Found the AST block.
5585e306b12SDouglas Gregor         State = ASTBlock;
5595e306b12SDouglas Gregor         continue;
5605e306b12SDouglas Gregor       }
5615e306b12SDouglas Gregor 
5625e306b12SDouglas Gregor       if (InStream.SkipBlock())
5635e306b12SDouglas Gregor         return true;
5645e306b12SDouglas Gregor 
5655e306b12SDouglas Gregor       continue;
5665e306b12SDouglas Gregor 
5675e306b12SDouglas Gregor     case llvm::BitstreamEntry::EndBlock:
568e060e57bSDouglas Gregor       State = Other;
5695e306b12SDouglas Gregor       continue;
5705e306b12SDouglas Gregor     }
5715e306b12SDouglas Gregor 
5725e306b12SDouglas Gregor     // Read the given record.
5735e306b12SDouglas Gregor     SmallVector<uint64_t, 64> Record;
5745e306b12SDouglas Gregor     StringRef Blob;
5755e306b12SDouglas Gregor     unsigned Code = InStream.readRecord(Entry.ID, Record, &Blob);
5765e306b12SDouglas Gregor 
5775e306b12SDouglas Gregor     // Handle module dependencies.
5785e306b12SDouglas Gregor     if (State == ControlBlock && Code == IMPORTS) {
5795e306b12SDouglas Gregor       // Load each of the imported PCH files.
5805e306b12SDouglas Gregor       unsigned Idx = 0, N = Record.size();
5815e306b12SDouglas Gregor       while (Idx < N) {
5825e306b12SDouglas Gregor         // Read information about the AST file.
5835e306b12SDouglas Gregor 
5845e306b12SDouglas Gregor         // Skip the imported kind
5855e306b12SDouglas Gregor         ++Idx;
5865e306b12SDouglas Gregor 
5875e306b12SDouglas Gregor         // Skip the import location
5885e306b12SDouglas Gregor         ++Idx;
5895e306b12SDouglas Gregor 
5907029ce1aSDouglas Gregor         // Load stored size/modification time.
5917029ce1aSDouglas Gregor         off_t StoredSize = (off_t)Record[Idx++];
5927029ce1aSDouglas Gregor         time_t StoredModTime = (time_t)Record[Idx++];
5937029ce1aSDouglas Gregor 
594487ea14aSBen Langmuir         // Skip the stored signature.
595487ea14aSBen Langmuir         // FIXME: we could read the signature out of the import and validate it.
596487ea14aSBen Langmuir         Idx++;
597487ea14aSBen Langmuir 
5985e306b12SDouglas Gregor         // Retrieve the imported file name.
5995e306b12SDouglas Gregor         unsigned Length = Record[Idx++];
6005e306b12SDouglas Gregor         SmallString<128> ImportedFile(Record.begin() + Idx,
6015e306b12SDouglas Gregor                                       Record.begin() + Idx + Length);
6025e306b12SDouglas Gregor         Idx += Length;
6035e306b12SDouglas Gregor 
6045e306b12SDouglas Gregor         // Find the imported module file.
605dadd85dcSDouglas Gregor         const FileEntry *DependsOnFile
606dadd85dcSDouglas Gregor           = FileMgr.getFile(ImportedFile, /*openFile=*/false,
607dadd85dcSDouglas Gregor                             /*cacheFailure=*/false);
6087029ce1aSDouglas Gregor         if (!DependsOnFile ||
6097029ce1aSDouglas Gregor             (StoredSize != DependsOnFile->getSize()) ||
6107029ce1aSDouglas Gregor             (StoredModTime != DependsOnFile->getModificationTime()))
6115e306b12SDouglas Gregor           return true;
6125e306b12SDouglas Gregor 
6135e306b12SDouglas Gregor         // Record the dependency.
6145e306b12SDouglas Gregor         unsigned DependsOnID = getModuleFileInfo(DependsOnFile).ID;
6155e306b12SDouglas Gregor         getModuleFileInfo(File).Dependencies.push_back(DependsOnID);
6165e306b12SDouglas Gregor       }
6175e306b12SDouglas Gregor 
6185e306b12SDouglas Gregor       continue;
6195e306b12SDouglas Gregor     }
6205e306b12SDouglas Gregor 
6215e306b12SDouglas Gregor     // Handle the identifier table
6225e306b12SDouglas Gregor     if (State == ASTBlock && Code == IDENTIFIER_TABLE && Record[0] > 0) {
623bb094f06SJustin Bogner       typedef llvm::OnDiskIterableChainedHashTable<
624bb094f06SJustin Bogner           InterestingASTIdentifierLookupTrait> InterestingIdentifierTable;
625b8984329SAhmed Charles       std::unique_ptr<InterestingIdentifierTable> Table(
626b8984329SAhmed Charles           InterestingIdentifierTable::Create(
6275e306b12SDouglas Gregor               (const unsigned char *)Blob.data() + Record[0],
628da4e650eSJustin Bogner               (const unsigned char *)Blob.data() + sizeof(uint32_t),
6295e306b12SDouglas Gregor               (const unsigned char *)Blob.data()));
6305e306b12SDouglas Gregor       for (InterestingIdentifierTable::data_iterator D = Table->data_begin(),
6315e306b12SDouglas Gregor                                                      DEnd = Table->data_end();
6325e306b12SDouglas Gregor            D != DEnd; ++D) {
6335e306b12SDouglas Gregor         std::pair<StringRef, bool> Ident = *D;
6345e306b12SDouglas Gregor         if (Ident.second)
6355e306b12SDouglas Gregor           InterestingIdentifiers[Ident.first].push_back(ID);
636e060e57bSDouglas Gregor         else
637e060e57bSDouglas Gregor           (void)InterestingIdentifiers[Ident.first];
6385e306b12SDouglas Gregor       }
6395e306b12SDouglas Gregor     }
6405e306b12SDouglas Gregor 
6415e306b12SDouglas Gregor     // We don't care about this record.
6425e306b12SDouglas Gregor   }
6435e306b12SDouglas Gregor 
6445e306b12SDouglas Gregor   return false;
6455e306b12SDouglas Gregor }
6465e306b12SDouglas Gregor 
6475e306b12SDouglas Gregor namespace {
6485e306b12SDouglas Gregor 
6495e306b12SDouglas Gregor /// \brief Trait used to generate the identifier index as an on-disk hash
6505e306b12SDouglas Gregor /// table.
6515e306b12SDouglas Gregor class IdentifierIndexWriterTrait {
6525e306b12SDouglas Gregor public:
6535e306b12SDouglas Gregor   typedef StringRef key_type;
6545e306b12SDouglas Gregor   typedef StringRef key_type_ref;
6555e306b12SDouglas Gregor   typedef SmallVector<unsigned, 2> data_type;
6565e306b12SDouglas Gregor   typedef const SmallVector<unsigned, 2> &data_type_ref;
65725463f15SJustin Bogner   typedef unsigned hash_value_type;
65825463f15SJustin Bogner   typedef unsigned offset_type;
6595e306b12SDouglas Gregor 
66025463f15SJustin Bogner   static hash_value_type ComputeHash(key_type_ref Key) {
6615e306b12SDouglas Gregor     return llvm::HashString(Key);
6625e306b12SDouglas Gregor   }
6635e306b12SDouglas Gregor 
6645e306b12SDouglas Gregor   std::pair<unsigned,unsigned>
6655e306b12SDouglas Gregor   EmitKeyDataLength(raw_ostream& Out, key_type_ref Key, data_type_ref Data) {
666e1c147c3SJustin Bogner     using namespace llvm::support;
667e1c147c3SJustin Bogner     endian::Writer<little> LE(Out);
6685e306b12SDouglas Gregor     unsigned KeyLen = Key.size();
6695e306b12SDouglas Gregor     unsigned DataLen = Data.size() * 4;
670e1c147c3SJustin Bogner     LE.write<uint16_t>(KeyLen);
671e1c147c3SJustin Bogner     LE.write<uint16_t>(DataLen);
6725e306b12SDouglas Gregor     return std::make_pair(KeyLen, DataLen);
6735e306b12SDouglas Gregor   }
6745e306b12SDouglas Gregor 
6755e306b12SDouglas Gregor   void EmitKey(raw_ostream& Out, key_type_ref Key, unsigned KeyLen) {
6765e306b12SDouglas Gregor     Out.write(Key.data(), KeyLen);
6775e306b12SDouglas Gregor   }
6785e306b12SDouglas Gregor 
6795e306b12SDouglas Gregor   void EmitData(raw_ostream& Out, key_type_ref Key, data_type_ref Data,
6805e306b12SDouglas Gregor                 unsigned DataLen) {
681e1c147c3SJustin Bogner     using namespace llvm::support;
6825e306b12SDouglas Gregor     for (unsigned I = 0, N = Data.size(); I != N; ++I)
683e1c147c3SJustin Bogner       endian::Writer<little>(Out).write<uint32_t>(Data[I]);
6845e306b12SDouglas Gregor   }
6855e306b12SDouglas Gregor };
6865e306b12SDouglas Gregor 
6875e306b12SDouglas Gregor }
6885e306b12SDouglas Gregor 
6895e306b12SDouglas Gregor void GlobalModuleIndexBuilder::writeIndex(llvm::BitstreamWriter &Stream) {
6905e306b12SDouglas Gregor   using namespace llvm;
6915e306b12SDouglas Gregor 
6925e306b12SDouglas Gregor   // Emit the file header.
6935e306b12SDouglas Gregor   Stream.Emit((unsigned)'B', 8);
6945e306b12SDouglas Gregor   Stream.Emit((unsigned)'C', 8);
6955e306b12SDouglas Gregor   Stream.Emit((unsigned)'G', 8);
6965e306b12SDouglas Gregor   Stream.Emit((unsigned)'I', 8);
6975e306b12SDouglas Gregor 
6985e306b12SDouglas Gregor   // Write the block-info block, which describes the records in this bitcode
6995e306b12SDouglas Gregor   // file.
7005e306b12SDouglas Gregor   emitBlockInfoBlock(Stream);
7015e306b12SDouglas Gregor 
7025e306b12SDouglas Gregor   Stream.EnterSubblock(GLOBAL_INDEX_BLOCK_ID, 3);
7035e306b12SDouglas Gregor 
7045e306b12SDouglas Gregor   // Write the metadata.
7055e306b12SDouglas Gregor   SmallVector<uint64_t, 2> Record;
7065e306b12SDouglas Gregor   Record.push_back(CurrentVersion);
707e060e57bSDouglas Gregor   Stream.EmitRecord(INDEX_METADATA, Record);
7085e306b12SDouglas Gregor 
7095e306b12SDouglas Gregor   // Write the set of known module files.
7105e306b12SDouglas Gregor   for (ModuleFilesMap::iterator M = ModuleFiles.begin(),
7115e306b12SDouglas Gregor                                 MEnd = ModuleFiles.end();
7125e306b12SDouglas Gregor        M != MEnd; ++M) {
7135e306b12SDouglas Gregor     Record.clear();
7145e306b12SDouglas Gregor     Record.push_back(M->second.ID);
7155e306b12SDouglas Gregor     Record.push_back(M->first->getSize());
7165e306b12SDouglas Gregor     Record.push_back(M->first->getModificationTime());
7175e306b12SDouglas Gregor 
7185e306b12SDouglas Gregor     // File name
7195e306b12SDouglas Gregor     StringRef Name(M->first->getName());
7205e306b12SDouglas Gregor     Record.push_back(Name.size());
7215e306b12SDouglas Gregor     Record.append(Name.begin(), Name.end());
7225e306b12SDouglas Gregor 
7235e306b12SDouglas Gregor     // Dependencies
7245e306b12SDouglas Gregor     Record.push_back(M->second.Dependencies.size());
7255e306b12SDouglas Gregor     Record.append(M->second.Dependencies.begin(), M->second.Dependencies.end());
7265e306b12SDouglas Gregor     Stream.EmitRecord(MODULE, Record);
7275e306b12SDouglas Gregor   }
7285e306b12SDouglas Gregor 
7295e306b12SDouglas Gregor   // Write the identifier -> module file mapping.
7305e306b12SDouglas Gregor   {
731bb094f06SJustin Bogner     llvm::OnDiskChainedHashTableGenerator<IdentifierIndexWriterTrait> Generator;
7325e306b12SDouglas Gregor     IdentifierIndexWriterTrait Trait;
7335e306b12SDouglas Gregor 
7345e306b12SDouglas Gregor     // Populate the hash table.
7355e306b12SDouglas Gregor     for (InterestingIdentifierMap::iterator I = InterestingIdentifiers.begin(),
7365e306b12SDouglas Gregor                                             IEnd = InterestingIdentifiers.end();
7375e306b12SDouglas Gregor          I != IEnd; ++I) {
7385e306b12SDouglas Gregor       Generator.insert(I->first(), I->second, Trait);
7395e306b12SDouglas Gregor     }
7405e306b12SDouglas Gregor 
7415e306b12SDouglas Gregor     // Create the on-disk hash table in a buffer.
7425e306b12SDouglas Gregor     SmallString<4096> IdentifierTable;
7435e306b12SDouglas Gregor     uint32_t BucketOffset;
7445e306b12SDouglas Gregor     {
745e1c147c3SJustin Bogner       using namespace llvm::support;
7465e306b12SDouglas Gregor       llvm::raw_svector_ostream Out(IdentifierTable);
7475e306b12SDouglas Gregor       // Make sure that no bucket is at offset 0
748e1c147c3SJustin Bogner       endian::Writer<little>(Out).write<uint32_t>(0);
7495e306b12SDouglas Gregor       BucketOffset = Generator.Emit(Out, Trait);
7505e306b12SDouglas Gregor     }
7515e306b12SDouglas Gregor 
7525e306b12SDouglas Gregor     // Create a blob abbreviation
7535e306b12SDouglas Gregor     BitCodeAbbrev *Abbrev = new BitCodeAbbrev();
7545e306b12SDouglas Gregor     Abbrev->Add(BitCodeAbbrevOp(IDENTIFIER_INDEX));
7555e306b12SDouglas Gregor     Abbrev->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed, 32));
7565e306b12SDouglas Gregor     Abbrev->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Blob));
7575e306b12SDouglas Gregor     unsigned IDTableAbbrev = Stream.EmitAbbrev(Abbrev);
7585e306b12SDouglas Gregor 
7595e306b12SDouglas Gregor     // Write the identifier table
7605e306b12SDouglas Gregor     Record.clear();
7615e306b12SDouglas Gregor     Record.push_back(IDENTIFIER_INDEX);
7625e306b12SDouglas Gregor     Record.push_back(BucketOffset);
76392e1b62dSYaron Keren     Stream.EmitRecordWithBlob(IDTableAbbrev, Record, IdentifierTable);
7645e306b12SDouglas Gregor   }
7655e306b12SDouglas Gregor 
7665e306b12SDouglas Gregor   Stream.ExitBlock();
7675e306b12SDouglas Gregor }
7685e306b12SDouglas Gregor 
7695e306b12SDouglas Gregor GlobalModuleIndex::ErrorCode
770*bb165fb0SAdrian Prantl GlobalModuleIndex::writeIndex(FileManager &FileMgr,
771*bb165fb0SAdrian Prantl                               const PCHContainerOperations &PCHContainerOps,
772*bb165fb0SAdrian Prantl                               StringRef Path) {
7735e306b12SDouglas Gregor   llvm::SmallString<128> IndexPath;
7745e306b12SDouglas Gregor   IndexPath += Path;
7755e306b12SDouglas Gregor   llvm::sys::path::append(IndexPath, IndexFileName);
7765e306b12SDouglas Gregor 
7775e306b12SDouglas Gregor   // Coordinate building the global index file with other processes that might
7785e306b12SDouglas Gregor   // try to do the same.
7795e306b12SDouglas Gregor   llvm::LockFileManager Locked(IndexPath);
7805e306b12SDouglas Gregor   switch (Locked) {
7815e306b12SDouglas Gregor   case llvm::LockFileManager::LFS_Error:
7825e306b12SDouglas Gregor     return EC_IOError;
7835e306b12SDouglas Gregor 
7845e306b12SDouglas Gregor   case llvm::LockFileManager::LFS_Owned:
7855e306b12SDouglas Gregor     // We're responsible for building the index ourselves. Do so below.
7865e306b12SDouglas Gregor     break;
7875e306b12SDouglas Gregor 
7885e306b12SDouglas Gregor   case llvm::LockFileManager::LFS_Shared:
7895e306b12SDouglas Gregor     // Someone else is responsible for building the index. We don't care
7905e306b12SDouglas Gregor     // when they finish, so we're done.
7915e306b12SDouglas Gregor     return EC_Building;
7925e306b12SDouglas Gregor   }
7935e306b12SDouglas Gregor 
7945e306b12SDouglas Gregor   // The module index builder.
795*bb165fb0SAdrian Prantl   GlobalModuleIndexBuilder Builder(FileMgr, PCHContainerOps);
7965e306b12SDouglas Gregor 
7975e306b12SDouglas Gregor   // Load each of the module files.
798c080917eSRafael Espindola   std::error_code EC;
7995e306b12SDouglas Gregor   for (llvm::sys::fs::directory_iterator D(Path, EC), DEnd;
8005e306b12SDouglas Gregor        D != DEnd && !EC;
8015e306b12SDouglas Gregor        D.increment(EC)) {
8025e306b12SDouglas Gregor     // If this isn't a module file, we don't care.
8035e306b12SDouglas Gregor     if (llvm::sys::path::extension(D->path()) != ".pcm") {
8045e306b12SDouglas Gregor       // ... unless it's a .pcm.lock file, which indicates that someone is
8055e306b12SDouglas Gregor       // in the process of rebuilding a module. They'll rebuild the index
8065e306b12SDouglas Gregor       // at the end of that translation unit, so we don't have to.
8075e306b12SDouglas Gregor       if (llvm::sys::path::extension(D->path()) == ".pcm.lock")
8085e306b12SDouglas Gregor         return EC_Building;
8095e306b12SDouglas Gregor 
8105e306b12SDouglas Gregor       continue;
8115e306b12SDouglas Gregor     }
8125e306b12SDouglas Gregor 
8135e306b12SDouglas Gregor     // If we can't find the module file, skip it.
8145e306b12SDouglas Gregor     const FileEntry *ModuleFile = FileMgr.getFile(D->path());
8155e306b12SDouglas Gregor     if (!ModuleFile)
8165e306b12SDouglas Gregor       continue;
8175e306b12SDouglas Gregor 
8185e306b12SDouglas Gregor     // Load this module file.
8195e306b12SDouglas Gregor     if (Builder.loadModuleFile(ModuleFile))
8205e306b12SDouglas Gregor       return EC_IOError;
8215e306b12SDouglas Gregor   }
8225e306b12SDouglas Gregor 
8235e306b12SDouglas Gregor   // The output buffer, into which the global index will be written.
8245e306b12SDouglas Gregor   SmallVector<char, 16> OutputBuffer;
8255e306b12SDouglas Gregor   {
8265e306b12SDouglas Gregor     llvm::BitstreamWriter OutputStream(OutputBuffer);
8275e306b12SDouglas Gregor     Builder.writeIndex(OutputStream);
8285e306b12SDouglas Gregor   }
8295e306b12SDouglas Gregor 
8305e306b12SDouglas Gregor   // Write the global index file to a temporary file.
8315e306b12SDouglas Gregor   llvm::SmallString<128> IndexTmpPath;
8325e306b12SDouglas Gregor   int TmpFD;
83318627115SRafael Espindola   if (llvm::sys::fs::createUniqueFile(IndexPath + "-%%%%%%%%", TmpFD,
83418627115SRafael Espindola                                       IndexTmpPath))
8355e306b12SDouglas Gregor     return EC_IOError;
8365e306b12SDouglas Gregor 
8375e306b12SDouglas Gregor   // Open the temporary global index file for output.
838e00c9868SNAKAMURA Takumi   llvm::raw_fd_ostream Out(TmpFD, true);
8395e306b12SDouglas Gregor   if (Out.has_error())
8405e306b12SDouglas Gregor     return EC_IOError;
8415e306b12SDouglas Gregor 
8425e306b12SDouglas Gregor   // Write the index.
8435e306b12SDouglas Gregor   Out.write(OutputBuffer.data(), OutputBuffer.size());
8445e306b12SDouglas Gregor   Out.close();
8455e306b12SDouglas Gregor   if (Out.has_error())
8465e306b12SDouglas Gregor     return EC_IOError;
8475e306b12SDouglas Gregor 
8485e306b12SDouglas Gregor   // Remove the old index file. It isn't relevant any more.
84992e1b62dSYaron Keren   llvm::sys::fs::remove(IndexPath);
8505e306b12SDouglas Gregor 
8515e306b12SDouglas Gregor   // Rename the newly-written index file to the proper name.
85292e1b62dSYaron Keren   if (llvm::sys::fs::rename(IndexTmpPath, IndexPath)) {
8535e306b12SDouglas Gregor     // Rename failed; just remove the
85492e1b62dSYaron Keren     llvm::sys::fs::remove(IndexTmpPath);
8555e306b12SDouglas Gregor     return EC_IOError;
8565e306b12SDouglas Gregor   }
8575e306b12SDouglas Gregor 
8585e306b12SDouglas Gregor   // We're done.
8595e306b12SDouglas Gregor   return EC_None;
8605e306b12SDouglas Gregor }
8619aca3c61SArgyrios Kyrtzidis 
8629aca3c61SArgyrios Kyrtzidis namespace {
8639aca3c61SArgyrios Kyrtzidis   class GlobalIndexIdentifierIterator : public IdentifierIterator {
8649aca3c61SArgyrios Kyrtzidis     /// \brief The current position within the identifier lookup table.
8659aca3c61SArgyrios Kyrtzidis     IdentifierIndexTable::key_iterator Current;
8669aca3c61SArgyrios Kyrtzidis 
8679aca3c61SArgyrios Kyrtzidis     /// \brief The end position within the identifier lookup table.
8689aca3c61SArgyrios Kyrtzidis     IdentifierIndexTable::key_iterator End;
8699aca3c61SArgyrios Kyrtzidis 
8709aca3c61SArgyrios Kyrtzidis   public:
8719aca3c61SArgyrios Kyrtzidis     explicit GlobalIndexIdentifierIterator(IdentifierIndexTable &Idx) {
8729aca3c61SArgyrios Kyrtzidis       Current = Idx.key_begin();
8739aca3c61SArgyrios Kyrtzidis       End = Idx.key_end();
8749aca3c61SArgyrios Kyrtzidis     }
8759aca3c61SArgyrios Kyrtzidis 
8763e89dfeeSCraig Topper     StringRef Next() override {
8779aca3c61SArgyrios Kyrtzidis       if (Current == End)
8789aca3c61SArgyrios Kyrtzidis         return StringRef();
8799aca3c61SArgyrios Kyrtzidis 
8809aca3c61SArgyrios Kyrtzidis       StringRef Result = *Current;
8819aca3c61SArgyrios Kyrtzidis       ++Current;
8829aca3c61SArgyrios Kyrtzidis       return Result;
8839aca3c61SArgyrios Kyrtzidis     }
8849aca3c61SArgyrios Kyrtzidis   };
8859aca3c61SArgyrios Kyrtzidis }
8869aca3c61SArgyrios Kyrtzidis 
8879aca3c61SArgyrios Kyrtzidis IdentifierIterator *GlobalModuleIndex::createIdentifierIterator() const {
8889aca3c61SArgyrios Kyrtzidis   IdentifierIndexTable &Table =
8899aca3c61SArgyrios Kyrtzidis     *static_cast<IdentifierIndexTable *>(IdentifierIndex);
8909aca3c61SArgyrios Kyrtzidis   return new GlobalIndexIdentifierIterator(Table);
8919aca3c61SArgyrios Kyrtzidis }
892