15e306b12SDouglas Gregor //===--- GlobalModuleIndex.cpp - Global Module Index ------------*- C++ -*-===// 25e306b12SDouglas Gregor // 35e306b12SDouglas Gregor // The LLVM Compiler Infrastructure 45e306b12SDouglas Gregor // 55e306b12SDouglas Gregor // This file is distributed under the University of Illinois Open Source 65e306b12SDouglas Gregor // License. See LICENSE.TXT for details. 75e306b12SDouglas Gregor // 85e306b12SDouglas Gregor //===----------------------------------------------------------------------===// 95e306b12SDouglas Gregor // 105e306b12SDouglas Gregor // This file implements the GlobalModuleIndex class. 115e306b12SDouglas Gregor // 125e306b12SDouglas Gregor //===----------------------------------------------------------------------===// 135e306b12SDouglas Gregor 145e306b12SDouglas Gregor #include "ASTReaderInternals.h" 15*bb165fb0SAdrian Prantl #include "clang/Frontend/PCHContainerOperations.h" 165e306b12SDouglas Gregor #include "clang/Basic/FileManager.h" 17beee15e7SBen Langmuir #include "clang/Lex/HeaderSearch.h" 185e306b12SDouglas Gregor #include "clang/Serialization/ASTBitCodes.h" 195e306b12SDouglas Gregor #include "clang/Serialization/GlobalModuleIndex.h" 20603cd869SDouglas Gregor #include "clang/Serialization/Module.h" 215e306b12SDouglas Gregor #include "llvm/ADT/DenseMap.h" 225e306b12SDouglas Gregor #include "llvm/ADT/MapVector.h" 235e306b12SDouglas Gregor #include "llvm/ADT/SmallString.h" 245e306b12SDouglas Gregor #include "llvm/ADT/StringExtras.h" 255e306b12SDouglas Gregor #include "llvm/Bitcode/BitstreamReader.h" 265e306b12SDouglas Gregor #include "llvm/Bitcode/BitstreamWriter.h" 278ec343ccSDouglas Gregor #include "llvm/Support/FileSystem.h" 285e306b12SDouglas Gregor #include "llvm/Support/LockFileManager.h" 295e306b12SDouglas Gregor #include "llvm/Support/MemoryBuffer.h" 30bb094f06SJustin Bogner #include "llvm/Support/OnDiskHashTable.h" 31552c169eSRafael Espindola #include "llvm/Support/Path.h" 32f0add23aSNAKAMURA Takumi #include <cstdio> 335e306b12SDouglas Gregor using namespace clang; 345e306b12SDouglas Gregor using namespace serialization; 355e306b12SDouglas Gregor 365e306b12SDouglas Gregor //----------------------------------------------------------------------------// 375e306b12SDouglas Gregor // Shared constants 385e306b12SDouglas Gregor //----------------------------------------------------------------------------// 395e306b12SDouglas Gregor namespace { 405e306b12SDouglas Gregor enum { 415e306b12SDouglas Gregor /// \brief The block containing the index. 425e306b12SDouglas Gregor GLOBAL_INDEX_BLOCK_ID = llvm::bitc::FIRST_APPLICATION_BLOCKID 435e306b12SDouglas Gregor }; 445e306b12SDouglas Gregor 455e306b12SDouglas Gregor /// \brief Describes the record types in the index. 465e306b12SDouglas Gregor enum IndexRecordTypes { 475e306b12SDouglas Gregor /// \brief Contains version information and potentially other metadata, 485e306b12SDouglas Gregor /// used to determine if we can read this global index file. 49e060e57bSDouglas Gregor INDEX_METADATA, 505e306b12SDouglas Gregor /// \brief Describes a module, including its file name and dependencies. 515e306b12SDouglas Gregor MODULE, 525e306b12SDouglas Gregor /// \brief The index for identifiers. 535e306b12SDouglas Gregor IDENTIFIER_INDEX 545e306b12SDouglas Gregor }; 555e306b12SDouglas Gregor } 565e306b12SDouglas Gregor 575e306b12SDouglas Gregor /// \brief The name of the global index file. 585e306b12SDouglas Gregor static const char * const IndexFileName = "modules.idx"; 595e306b12SDouglas Gregor 605e306b12SDouglas Gregor /// \brief The global index file version. 615e306b12SDouglas Gregor static const unsigned CurrentVersion = 1; 625e306b12SDouglas Gregor 635e306b12SDouglas Gregor //----------------------------------------------------------------------------// 64e060e57bSDouglas Gregor // Global module index reader. 65e060e57bSDouglas Gregor //----------------------------------------------------------------------------// 66e060e57bSDouglas Gregor 67e060e57bSDouglas Gregor namespace { 68e060e57bSDouglas Gregor 69e060e57bSDouglas Gregor /// \brief Trait used to read the identifier index from the on-disk hash 70e060e57bSDouglas Gregor /// table. 71e060e57bSDouglas Gregor class IdentifierIndexReaderTrait { 72e060e57bSDouglas Gregor public: 73e060e57bSDouglas Gregor typedef StringRef external_key_type; 74e060e57bSDouglas Gregor typedef StringRef internal_key_type; 75e060e57bSDouglas Gregor typedef SmallVector<unsigned, 2> data_type; 7625463f15SJustin Bogner typedef unsigned hash_value_type; 7725463f15SJustin Bogner typedef unsigned offset_type; 78e060e57bSDouglas Gregor 79e060e57bSDouglas Gregor static bool EqualKey(const internal_key_type& a, const internal_key_type& b) { 80e060e57bSDouglas Gregor return a == b; 81e060e57bSDouglas Gregor } 82e060e57bSDouglas Gregor 8325463f15SJustin Bogner static hash_value_type ComputeHash(const internal_key_type& a) { 84e060e57bSDouglas Gregor return llvm::HashString(a); 85e060e57bSDouglas Gregor } 86e060e57bSDouglas Gregor 87e060e57bSDouglas Gregor static std::pair<unsigned, unsigned> 88e060e57bSDouglas Gregor ReadKeyDataLength(const unsigned char*& d) { 8957ba0b22SJustin Bogner using namespace llvm::support; 9057ba0b22SJustin Bogner unsigned KeyLen = endian::readNext<uint16_t, little, unaligned>(d); 9157ba0b22SJustin Bogner unsigned DataLen = endian::readNext<uint16_t, little, unaligned>(d); 92e060e57bSDouglas Gregor return std::make_pair(KeyLen, DataLen); 93e060e57bSDouglas Gregor } 94e060e57bSDouglas Gregor 95e060e57bSDouglas Gregor static const internal_key_type& 96e060e57bSDouglas Gregor GetInternalKey(const external_key_type& x) { return x; } 97e060e57bSDouglas Gregor 98e060e57bSDouglas Gregor static const external_key_type& 99e060e57bSDouglas Gregor GetExternalKey(const internal_key_type& x) { return x; } 100e060e57bSDouglas Gregor 101e060e57bSDouglas Gregor static internal_key_type ReadKey(const unsigned char* d, unsigned n) { 102e060e57bSDouglas Gregor return StringRef((const char *)d, n); 103e060e57bSDouglas Gregor } 104e060e57bSDouglas Gregor 105e060e57bSDouglas Gregor static data_type ReadData(const internal_key_type& k, 106e060e57bSDouglas Gregor const unsigned char* d, 107e060e57bSDouglas Gregor unsigned DataLen) { 10857ba0b22SJustin Bogner using namespace llvm::support; 109e060e57bSDouglas Gregor 110e060e57bSDouglas Gregor data_type Result; 111e060e57bSDouglas Gregor while (DataLen > 0) { 11257ba0b22SJustin Bogner unsigned ID = endian::readNext<uint32_t, little, unaligned>(d); 113e060e57bSDouglas Gregor Result.push_back(ID); 114e060e57bSDouglas Gregor DataLen -= 4; 115e060e57bSDouglas Gregor } 116e060e57bSDouglas Gregor 117e060e57bSDouglas Gregor return Result; 118e060e57bSDouglas Gregor } 119e060e57bSDouglas Gregor }; 120e060e57bSDouglas Gregor 121bb094f06SJustin Bogner typedef llvm::OnDiskIterableChainedHashTable<IdentifierIndexReaderTrait> 122da4e650eSJustin Bogner IdentifierIndexTable; 123e060e57bSDouglas Gregor 124e060e57bSDouglas Gregor } 125e060e57bSDouglas Gregor 126afa10d3eSDavid Blaikie GlobalModuleIndex::GlobalModuleIndex(std::unique_ptr<llvm::MemoryBuffer> Buffer, 127e060e57bSDouglas Gregor llvm::BitstreamCursor Cursor) 128afa10d3eSDavid Blaikie : Buffer(std::move(Buffer)), IdentifierIndex(), NumIdentifierLookups(), 129afa10d3eSDavid Blaikie NumIdentifierLookupHits() { 130e060e57bSDouglas Gregor // Read the global index. 131e060e57bSDouglas Gregor bool InGlobalIndexBlock = false; 132e060e57bSDouglas Gregor bool Done = false; 133e060e57bSDouglas Gregor while (!Done) { 134e060e57bSDouglas Gregor llvm::BitstreamEntry Entry = Cursor.advance(); 135e060e57bSDouglas Gregor 136e060e57bSDouglas Gregor switch (Entry.Kind) { 137e060e57bSDouglas Gregor case llvm::BitstreamEntry::Error: 138e060e57bSDouglas Gregor return; 139e060e57bSDouglas Gregor 140e060e57bSDouglas Gregor case llvm::BitstreamEntry::EndBlock: 141e060e57bSDouglas Gregor if (InGlobalIndexBlock) { 142e060e57bSDouglas Gregor InGlobalIndexBlock = false; 143e060e57bSDouglas Gregor Done = true; 144e060e57bSDouglas Gregor continue; 145e060e57bSDouglas Gregor } 146e060e57bSDouglas Gregor return; 147e060e57bSDouglas Gregor 148e060e57bSDouglas Gregor 149e060e57bSDouglas Gregor case llvm::BitstreamEntry::Record: 150e060e57bSDouglas Gregor // Entries in the global index block are handled below. 151e060e57bSDouglas Gregor if (InGlobalIndexBlock) 152e060e57bSDouglas Gregor break; 153e060e57bSDouglas Gregor 154e060e57bSDouglas Gregor return; 155e060e57bSDouglas Gregor 156e060e57bSDouglas Gregor case llvm::BitstreamEntry::SubBlock: 157e060e57bSDouglas Gregor if (!InGlobalIndexBlock && Entry.ID == GLOBAL_INDEX_BLOCK_ID) { 158e060e57bSDouglas Gregor if (Cursor.EnterSubBlock(GLOBAL_INDEX_BLOCK_ID)) 159e060e57bSDouglas Gregor return; 160e060e57bSDouglas Gregor 161e060e57bSDouglas Gregor InGlobalIndexBlock = true; 162e060e57bSDouglas Gregor } else if (Cursor.SkipBlock()) { 163e060e57bSDouglas Gregor return; 164e060e57bSDouglas Gregor } 165e060e57bSDouglas Gregor continue; 166e060e57bSDouglas Gregor } 167e060e57bSDouglas Gregor 168e060e57bSDouglas Gregor SmallVector<uint64_t, 64> Record; 169e060e57bSDouglas Gregor StringRef Blob; 170e060e57bSDouglas Gregor switch ((IndexRecordTypes)Cursor.readRecord(Entry.ID, Record, &Blob)) { 171e060e57bSDouglas Gregor case INDEX_METADATA: 172e060e57bSDouglas Gregor // Make sure that the version matches. 173e060e57bSDouglas Gregor if (Record.size() < 1 || Record[0] != CurrentVersion) 174e060e57bSDouglas Gregor return; 175e060e57bSDouglas Gregor break; 176e060e57bSDouglas Gregor 177e060e57bSDouglas Gregor case MODULE: { 178e060e57bSDouglas Gregor unsigned Idx = 0; 179e060e57bSDouglas Gregor unsigned ID = Record[Idx++]; 180e060e57bSDouglas Gregor 1817029ce1aSDouglas Gregor // Make room for this module's information. 1827029ce1aSDouglas Gregor if (ID == Modules.size()) 1837029ce1aSDouglas Gregor Modules.push_back(ModuleInfo()); 1847029ce1aSDouglas Gregor else 1857029ce1aSDouglas Gregor Modules.resize(ID + 1); 1867029ce1aSDouglas Gregor 1877029ce1aSDouglas Gregor // Size/modification time for this module file at the time the 1887029ce1aSDouglas Gregor // global index was built. 1897029ce1aSDouglas Gregor Modules[ID].Size = Record[Idx++]; 1907029ce1aSDouglas Gregor Modules[ID].ModTime = Record[Idx++]; 191e060e57bSDouglas Gregor 192e060e57bSDouglas Gregor // File name. 193e060e57bSDouglas Gregor unsigned NameLen = Record[Idx++]; 1947029ce1aSDouglas Gregor Modules[ID].FileName.assign(Record.begin() + Idx, 195e060e57bSDouglas Gregor Record.begin() + Idx + NameLen); 196e060e57bSDouglas Gregor Idx += NameLen; 197e060e57bSDouglas Gregor 198e060e57bSDouglas Gregor // Dependencies 199e060e57bSDouglas Gregor unsigned NumDeps = Record[Idx++]; 2007029ce1aSDouglas Gregor Modules[ID].Dependencies.insert(Modules[ID].Dependencies.end(), 2017029ce1aSDouglas Gregor Record.begin() + Idx, 2027029ce1aSDouglas Gregor Record.begin() + Idx + NumDeps); 2037029ce1aSDouglas Gregor Idx += NumDeps; 204e060e57bSDouglas Gregor 2057029ce1aSDouglas Gregor // Make sure we're at the end of the record. 2067029ce1aSDouglas Gregor assert(Idx == Record.size() && "More module info?"); 207603cd869SDouglas Gregor 208603cd869SDouglas Gregor // Record this module as an unresolved module. 209beee15e7SBen Langmuir // FIXME: this doesn't work correctly for module names containing path 210beee15e7SBen Langmuir // separators. 211beee15e7SBen Langmuir StringRef ModuleName = llvm::sys::path::stem(Modules[ID].FileName); 212beee15e7SBen Langmuir // Remove the -<hash of ModuleMapPath> 213beee15e7SBen Langmuir ModuleName = ModuleName.rsplit('-').first; 214beee15e7SBen Langmuir UnresolvedModules[ModuleName] = ID; 215e060e57bSDouglas Gregor break; 216e060e57bSDouglas Gregor } 217e060e57bSDouglas Gregor 218e060e57bSDouglas Gregor case IDENTIFIER_INDEX: 219e060e57bSDouglas Gregor // Wire up the identifier index. 220e060e57bSDouglas Gregor if (Record[0]) { 221e060e57bSDouglas Gregor IdentifierIndex = IdentifierIndexTable::Create( 222e060e57bSDouglas Gregor (const unsigned char *)Blob.data() + Record[0], 223da4e650eSJustin Bogner (const unsigned char *)Blob.data() + sizeof(uint32_t), 224da4e650eSJustin Bogner (const unsigned char *)Blob.data(), IdentifierIndexReaderTrait()); 225e060e57bSDouglas Gregor } 226e060e57bSDouglas Gregor break; 227e060e57bSDouglas Gregor } 228e060e57bSDouglas Gregor } 229e060e57bSDouglas Gregor } 230e060e57bSDouglas Gregor 231e68b847fSNico Weber GlobalModuleIndex::~GlobalModuleIndex() { 232e68b847fSNico Weber delete static_cast<IdentifierIndexTable *>(IdentifierIndex); 233e68b847fSNico Weber } 234e060e57bSDouglas Gregor 235e060e57bSDouglas Gregor std::pair<GlobalModuleIndex *, GlobalModuleIndex::ErrorCode> 2367029ce1aSDouglas Gregor GlobalModuleIndex::readIndex(StringRef Path) { 237e060e57bSDouglas Gregor // Load the index file, if it's there. 238e060e57bSDouglas Gregor llvm::SmallString<128> IndexPath; 239e060e57bSDouglas Gregor IndexPath += Path; 240e060e57bSDouglas Gregor llvm::sys::path::append(IndexPath, IndexFileName); 241e060e57bSDouglas Gregor 2422d2b420aSRafael Espindola llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> BufferOrErr = 2432d2b420aSRafael Espindola llvm::MemoryBuffer::getFile(IndexPath.c_str()); 2442d2b420aSRafael Espindola if (!BufferOrErr) 245a13603a2SCraig Topper return std::make_pair(nullptr, EC_NotFound); 2462d2b420aSRafael Espindola std::unique_ptr<llvm::MemoryBuffer> Buffer = std::move(BufferOrErr.get()); 247e060e57bSDouglas Gregor 248e060e57bSDouglas Gregor /// \brief The bitstream reader from which we'll read the AST file. 249e060e57bSDouglas Gregor llvm::BitstreamReader Reader((const unsigned char *)Buffer->getBufferStart(), 250e060e57bSDouglas Gregor (const unsigned char *)Buffer->getBufferEnd()); 251e060e57bSDouglas Gregor 252e060e57bSDouglas Gregor /// \brief The main bitstream cursor for the main block. 253e060e57bSDouglas Gregor llvm::BitstreamCursor Cursor(Reader); 254e060e57bSDouglas Gregor 255e060e57bSDouglas Gregor // Sniff for the signature. 256e060e57bSDouglas Gregor if (Cursor.Read(8) != 'B' || 257e060e57bSDouglas Gregor Cursor.Read(8) != 'C' || 258e060e57bSDouglas Gregor Cursor.Read(8) != 'G' || 259e060e57bSDouglas Gregor Cursor.Read(8) != 'I') { 260a13603a2SCraig Topper return std::make_pair(nullptr, EC_IOError); 261e060e57bSDouglas Gregor } 262e060e57bSDouglas Gregor 263afa10d3eSDavid Blaikie return std::make_pair(new GlobalModuleIndex(std::move(Buffer), Cursor), 2649a16beb8SAhmed Charles EC_None); 265e060e57bSDouglas Gregor } 266e060e57bSDouglas Gregor 2677029ce1aSDouglas Gregor void 2687029ce1aSDouglas Gregor GlobalModuleIndex::getKnownModules(SmallVectorImpl<ModuleFile *> &ModuleFiles) { 269e060e57bSDouglas Gregor ModuleFiles.clear(); 270e060e57bSDouglas Gregor for (unsigned I = 0, N = Modules.size(); I != N; ++I) { 271603cd869SDouglas Gregor if (ModuleFile *MF = Modules[I].File) 272603cd869SDouglas Gregor ModuleFiles.push_back(MF); 273e060e57bSDouglas Gregor } 274e060e57bSDouglas Gregor } 275e060e57bSDouglas Gregor 276e060e57bSDouglas Gregor void GlobalModuleIndex::getModuleDependencies( 2777029ce1aSDouglas Gregor ModuleFile *File, 2787029ce1aSDouglas Gregor SmallVectorImpl<ModuleFile *> &Dependencies) { 279e060e57bSDouglas Gregor // Look for information about this module file. 2807029ce1aSDouglas Gregor llvm::DenseMap<ModuleFile *, unsigned>::iterator Known 2817029ce1aSDouglas Gregor = ModulesByFile.find(File); 282e060e57bSDouglas Gregor if (Known == ModulesByFile.end()) 283e060e57bSDouglas Gregor return; 284e060e57bSDouglas Gregor 285e060e57bSDouglas Gregor // Record dependencies. 2867029ce1aSDouglas Gregor Dependencies.clear(); 2877029ce1aSDouglas Gregor ArrayRef<unsigned> StoredDependencies = Modules[Known->second].Dependencies; 2887029ce1aSDouglas Gregor for (unsigned I = 0, N = StoredDependencies.size(); I != N; ++I) { 289603cd869SDouglas Gregor if (ModuleFile *MF = Modules[I].File) 2907029ce1aSDouglas Gregor Dependencies.push_back(MF); 2917029ce1aSDouglas Gregor } 292e060e57bSDouglas Gregor } 293e060e57bSDouglas Gregor 2947211ac15SDouglas Gregor bool GlobalModuleIndex::lookupIdentifier(StringRef Name, HitSet &Hits) { 2957211ac15SDouglas Gregor Hits.clear(); 296e060e57bSDouglas Gregor 297e060e57bSDouglas Gregor // If there's no identifier index, there is nothing we can do. 298e060e57bSDouglas Gregor if (!IdentifierIndex) 299e060e57bSDouglas Gregor return false; 300e060e57bSDouglas Gregor 301e060e57bSDouglas Gregor // Look into the identifier index. 302e060e57bSDouglas Gregor ++NumIdentifierLookups; 303e060e57bSDouglas Gregor IdentifierIndexTable &Table 304e060e57bSDouglas Gregor = *static_cast<IdentifierIndexTable *>(IdentifierIndex); 305e060e57bSDouglas Gregor IdentifierIndexTable::iterator Known = Table.find(Name); 306e060e57bSDouglas Gregor if (Known == Table.end()) { 307e060e57bSDouglas Gregor return true; 308e060e57bSDouglas Gregor } 309e060e57bSDouglas Gregor 310e060e57bSDouglas Gregor SmallVector<unsigned, 2> ModuleIDs = *Known; 311e060e57bSDouglas Gregor for (unsigned I = 0, N = ModuleIDs.size(); I != N; ++I) { 312603cd869SDouglas Gregor if (ModuleFile *MF = Modules[ModuleIDs[I]].File) 313603cd869SDouglas Gregor Hits.insert(MF); 314e060e57bSDouglas Gregor } 315e060e57bSDouglas Gregor 316e060e57bSDouglas Gregor ++NumIdentifierLookupHits; 317e060e57bSDouglas Gregor return true; 318e060e57bSDouglas Gregor } 319e060e57bSDouglas Gregor 320603cd869SDouglas Gregor bool GlobalModuleIndex::loadedModuleFile(ModuleFile *File) { 321603cd869SDouglas Gregor // Look for the module in the global module index based on the module name. 322beee15e7SBen Langmuir StringRef Name = File->ModuleName; 323603cd869SDouglas Gregor llvm::StringMap<unsigned>::iterator Known = UnresolvedModules.find(Name); 324603cd869SDouglas Gregor if (Known == UnresolvedModules.end()) { 325603cd869SDouglas Gregor return true; 3267029ce1aSDouglas Gregor } 3277029ce1aSDouglas Gregor 328603cd869SDouglas Gregor // Rectify this module with the global module index. 329603cd869SDouglas Gregor ModuleInfo &Info = Modules[Known->second]; 330603cd869SDouglas Gregor 331603cd869SDouglas Gregor // If the size and modification time match what we expected, record this 332603cd869SDouglas Gregor // module file. 333603cd869SDouglas Gregor bool Failed = true; 334603cd869SDouglas Gregor if (File->File->getSize() == Info.Size && 335603cd869SDouglas Gregor File->File->getModificationTime() == Info.ModTime) { 336603cd869SDouglas Gregor Info.File = File; 337603cd869SDouglas Gregor ModulesByFile[File] = Known->second; 338603cd869SDouglas Gregor 339603cd869SDouglas Gregor Failed = false; 3407029ce1aSDouglas Gregor } 3417029ce1aSDouglas Gregor 342603cd869SDouglas Gregor // One way or another, we have resolved this module file. 343603cd869SDouglas Gregor UnresolvedModules.erase(Known); 344603cd869SDouglas Gregor return Failed; 3457029ce1aSDouglas Gregor } 3467029ce1aSDouglas Gregor 347e060e57bSDouglas Gregor void GlobalModuleIndex::printStats() { 348e060e57bSDouglas Gregor std::fprintf(stderr, "*** Global Module Index Statistics:\n"); 349e060e57bSDouglas Gregor if (NumIdentifierLookups) { 350e060e57bSDouglas Gregor fprintf(stderr, " %u / %u identifier lookups succeeded (%f%%)\n", 351e060e57bSDouglas Gregor NumIdentifierLookupHits, NumIdentifierLookups, 352e060e57bSDouglas Gregor (double)NumIdentifierLookupHits*100.0/NumIdentifierLookups); 353e060e57bSDouglas Gregor } 354e060e57bSDouglas Gregor std::fprintf(stderr, "\n"); 355e060e57bSDouglas Gregor } 356e060e57bSDouglas Gregor 357bcdcc92eSJohn Thompson void GlobalModuleIndex::dump() { 358a39baf1aSJohn Thompson llvm::errs() << "*** Global Module Index Dump:\n"; 359a39baf1aSJohn Thompson llvm::errs() << "Module files:\n"; 3604f52d44dSJohn Thompson for (auto &MI : Modules) { 361a39baf1aSJohn Thompson llvm::errs() << "** " << MI.FileName << "\n"; 362a39baf1aSJohn Thompson if (MI.File) 363a39baf1aSJohn Thompson MI.File->dump(); 364bcdcc92eSJohn Thompson else 365a39baf1aSJohn Thompson llvm::errs() << "\n"; 366bcdcc92eSJohn Thompson } 367a39baf1aSJohn Thompson llvm::errs() << "\n"; 368bcdcc92eSJohn Thompson } 369bcdcc92eSJohn Thompson 370e060e57bSDouglas Gregor //----------------------------------------------------------------------------// 3715e306b12SDouglas Gregor // Global module index writer. 3725e306b12SDouglas Gregor //----------------------------------------------------------------------------// 3735e306b12SDouglas Gregor 3745e306b12SDouglas Gregor namespace { 3755e306b12SDouglas Gregor /// \brief Provides information about a specific module file. 3765e306b12SDouglas Gregor struct ModuleFileInfo { 3775e306b12SDouglas Gregor /// \brief The numberic ID for this module file. 3785e306b12SDouglas Gregor unsigned ID; 3795e306b12SDouglas Gregor 3805e306b12SDouglas Gregor /// \brief The set of modules on which this module depends. Each entry is 3815e306b12SDouglas Gregor /// a module ID. 3825e306b12SDouglas Gregor SmallVector<unsigned, 4> Dependencies; 3835e306b12SDouglas Gregor }; 3845e306b12SDouglas Gregor 3855e306b12SDouglas Gregor /// \brief Builder that generates the global module index file. 3865e306b12SDouglas Gregor class GlobalModuleIndexBuilder { 3875e306b12SDouglas Gregor FileManager &FileMgr; 388*bb165fb0SAdrian Prantl const PCHContainerOperations &PCHContainerOps; 3895e306b12SDouglas Gregor 3905e306b12SDouglas Gregor /// \brief Mapping from files to module file information. 3915e306b12SDouglas Gregor typedef llvm::MapVector<const FileEntry *, ModuleFileInfo> ModuleFilesMap; 3925e306b12SDouglas Gregor 3935e306b12SDouglas Gregor /// \brief Information about each of the known module files. 3945e306b12SDouglas Gregor ModuleFilesMap ModuleFiles; 3955e306b12SDouglas Gregor 3965e306b12SDouglas Gregor /// \brief Mapping from identifiers to the list of module file IDs that 3975e306b12SDouglas Gregor /// consider this identifier to be interesting. 3985e306b12SDouglas Gregor typedef llvm::StringMap<SmallVector<unsigned, 2> > InterestingIdentifierMap; 3995e306b12SDouglas Gregor 4005e306b12SDouglas Gregor /// \brief A mapping from all interesting identifiers to the set of module 4015e306b12SDouglas Gregor /// files in which those identifiers are considered interesting. 4025e306b12SDouglas Gregor InterestingIdentifierMap InterestingIdentifiers; 4035e306b12SDouglas Gregor 4045e306b12SDouglas Gregor /// \brief Write the block-info block for the global module index file. 4055e306b12SDouglas Gregor void emitBlockInfoBlock(llvm::BitstreamWriter &Stream); 4065e306b12SDouglas Gregor 4075e306b12SDouglas Gregor /// \brief Retrieve the module file information for the given file. 4085e306b12SDouglas Gregor ModuleFileInfo &getModuleFileInfo(const FileEntry *File) { 4095e306b12SDouglas Gregor llvm::MapVector<const FileEntry *, ModuleFileInfo>::iterator Known 4105e306b12SDouglas Gregor = ModuleFiles.find(File); 4115e306b12SDouglas Gregor if (Known != ModuleFiles.end()) 4125e306b12SDouglas Gregor return Known->second; 4135e306b12SDouglas Gregor 4145e306b12SDouglas Gregor unsigned NewID = ModuleFiles.size(); 4155e306b12SDouglas Gregor ModuleFileInfo &Info = ModuleFiles[File]; 4165e306b12SDouglas Gregor Info.ID = NewID; 4175e306b12SDouglas Gregor return Info; 4185e306b12SDouglas Gregor } 4195e306b12SDouglas Gregor 4205e306b12SDouglas Gregor public: 421*bb165fb0SAdrian Prantl explicit GlobalModuleIndexBuilder( 422*bb165fb0SAdrian Prantl FileManager &FileMgr, const PCHContainerOperations &PCHContainerOps) 423*bb165fb0SAdrian Prantl : FileMgr(FileMgr), PCHContainerOps(PCHContainerOps) {} 4245e306b12SDouglas Gregor 4255e306b12SDouglas Gregor /// \brief Load the contents of the given module file into the builder. 4265e306b12SDouglas Gregor /// 4275e306b12SDouglas Gregor /// \returns true if an error occurred, false otherwise. 4285e306b12SDouglas Gregor bool loadModuleFile(const FileEntry *File); 4295e306b12SDouglas Gregor 4305e306b12SDouglas Gregor /// \brief Write the index to the given bitstream. 4315e306b12SDouglas Gregor void writeIndex(llvm::BitstreamWriter &Stream); 4325e306b12SDouglas Gregor }; 4335e306b12SDouglas Gregor } 4345e306b12SDouglas Gregor 4355e306b12SDouglas Gregor static void emitBlockID(unsigned ID, const char *Name, 4365e306b12SDouglas Gregor llvm::BitstreamWriter &Stream, 4375e306b12SDouglas Gregor SmallVectorImpl<uint64_t> &Record) { 4385e306b12SDouglas Gregor Record.clear(); 4395e306b12SDouglas Gregor Record.push_back(ID); 4405e306b12SDouglas Gregor Stream.EmitRecord(llvm::bitc::BLOCKINFO_CODE_SETBID, Record); 4415e306b12SDouglas Gregor 4425e306b12SDouglas Gregor // Emit the block name if present. 443a13603a2SCraig Topper if (!Name || Name[0] == 0) return; 4445e306b12SDouglas Gregor Record.clear(); 4455e306b12SDouglas Gregor while (*Name) 4465e306b12SDouglas Gregor Record.push_back(*Name++); 4475e306b12SDouglas Gregor Stream.EmitRecord(llvm::bitc::BLOCKINFO_CODE_BLOCKNAME, Record); 4485e306b12SDouglas Gregor } 4495e306b12SDouglas Gregor 4505e306b12SDouglas Gregor static void emitRecordID(unsigned ID, const char *Name, 4515e306b12SDouglas Gregor llvm::BitstreamWriter &Stream, 4525e306b12SDouglas Gregor SmallVectorImpl<uint64_t> &Record) { 4535e306b12SDouglas Gregor Record.clear(); 4545e306b12SDouglas Gregor Record.push_back(ID); 4555e306b12SDouglas Gregor while (*Name) 4565e306b12SDouglas Gregor Record.push_back(*Name++); 4575e306b12SDouglas Gregor Stream.EmitRecord(llvm::bitc::BLOCKINFO_CODE_SETRECORDNAME, Record); 4585e306b12SDouglas Gregor } 4595e306b12SDouglas Gregor 4605e306b12SDouglas Gregor void 4615e306b12SDouglas Gregor GlobalModuleIndexBuilder::emitBlockInfoBlock(llvm::BitstreamWriter &Stream) { 4625e306b12SDouglas Gregor SmallVector<uint64_t, 64> Record; 4635e306b12SDouglas Gregor Stream.EnterSubblock(llvm::bitc::BLOCKINFO_BLOCK_ID, 3); 4645e306b12SDouglas Gregor 4655e306b12SDouglas Gregor #define BLOCK(X) emitBlockID(X ## _ID, #X, Stream, Record) 4665e306b12SDouglas Gregor #define RECORD(X) emitRecordID(X, #X, Stream, Record) 4675e306b12SDouglas Gregor BLOCK(GLOBAL_INDEX_BLOCK); 468e060e57bSDouglas Gregor RECORD(INDEX_METADATA); 4695e306b12SDouglas Gregor RECORD(MODULE); 4705e306b12SDouglas Gregor RECORD(IDENTIFIER_INDEX); 4715e306b12SDouglas Gregor #undef RECORD 4725e306b12SDouglas Gregor #undef BLOCK 4735e306b12SDouglas Gregor 4745e306b12SDouglas Gregor Stream.ExitBlock(); 4755e306b12SDouglas Gregor } 4765e306b12SDouglas Gregor 477e060e57bSDouglas Gregor namespace { 4785e306b12SDouglas Gregor class InterestingASTIdentifierLookupTrait 4795e306b12SDouglas Gregor : public serialization::reader::ASTIdentifierLookupTraitBase { 4805e306b12SDouglas Gregor 4815e306b12SDouglas Gregor public: 4825e306b12SDouglas Gregor /// \brief The identifier and whether it is "interesting". 4835e306b12SDouglas Gregor typedef std::pair<StringRef, bool> data_type; 4845e306b12SDouglas Gregor 4855e306b12SDouglas Gregor data_type ReadData(const internal_key_type& k, 4865e306b12SDouglas Gregor const unsigned char* d, 4875e306b12SDouglas Gregor unsigned DataLen) { 4885e306b12SDouglas Gregor // The first bit indicates whether this identifier is interesting. 4895e306b12SDouglas Gregor // That's all we care about. 49057ba0b22SJustin Bogner using namespace llvm::support; 49157ba0b22SJustin Bogner unsigned RawID = endian::readNext<uint32_t, little, unaligned>(d); 4925e306b12SDouglas Gregor bool IsInteresting = RawID & 0x01; 4935e306b12SDouglas Gregor return std::make_pair(k, IsInteresting); 4945e306b12SDouglas Gregor } 4955e306b12SDouglas Gregor }; 4965e306b12SDouglas Gregor } 4975e306b12SDouglas Gregor 4985e306b12SDouglas Gregor bool GlobalModuleIndexBuilder::loadModuleFile(const FileEntry *File) { 4995e306b12SDouglas Gregor // Open the module file. 5006406f7b8SRafael Espindola 501a885796dSBenjamin Kramer auto Buffer = FileMgr.getBufferForFile(File, /*isVolatile=*/true); 5025e306b12SDouglas Gregor if (!Buffer) { 5035e306b12SDouglas Gregor return true; 5045e306b12SDouglas Gregor } 5055e306b12SDouglas Gregor 5065e306b12SDouglas Gregor // Initialize the input stream 5075e306b12SDouglas Gregor llvm::BitstreamReader InStreamFile; 508*bb165fb0SAdrian Prantl PCHContainerOps.ExtractPCH((*Buffer)->getMemBufferRef(), InStreamFile); 509af0e40acSRafael Espindola llvm::BitstreamCursor InStream(InStreamFile); 5105e306b12SDouglas Gregor 5115e306b12SDouglas Gregor // Sniff for the signature. 5125e306b12SDouglas Gregor if (InStream.Read(8) != 'C' || 5135e306b12SDouglas Gregor InStream.Read(8) != 'P' || 5145e306b12SDouglas Gregor InStream.Read(8) != 'C' || 5155e306b12SDouglas Gregor InStream.Read(8) != 'H') { 5165e306b12SDouglas Gregor return true; 5175e306b12SDouglas Gregor } 5185e306b12SDouglas Gregor 5195e306b12SDouglas Gregor // Record this module file and assign it a unique ID (if it doesn't have 5205e306b12SDouglas Gregor // one already). 5215e306b12SDouglas Gregor unsigned ID = getModuleFileInfo(File).ID; 5225e306b12SDouglas Gregor 5235e306b12SDouglas Gregor // Search for the blocks and records we care about. 524e060e57bSDouglas Gregor enum { Other, ControlBlock, ASTBlock } State = Other; 5255e306b12SDouglas Gregor bool Done = false; 5265e306b12SDouglas Gregor while (!Done) { 527e060e57bSDouglas Gregor llvm::BitstreamEntry Entry = InStream.advance(); 5285e306b12SDouglas Gregor switch (Entry.Kind) { 5295e306b12SDouglas Gregor case llvm::BitstreamEntry::Error: 530e060e57bSDouglas Gregor Done = true; 531e060e57bSDouglas Gregor continue; 5325e306b12SDouglas Gregor 5335e306b12SDouglas Gregor case llvm::BitstreamEntry::Record: 534e060e57bSDouglas Gregor // In the 'other' state, just skip the record. We don't care. 535e060e57bSDouglas Gregor if (State == Other) { 5365e306b12SDouglas Gregor InStream.skipRecord(Entry.ID); 5375e306b12SDouglas Gregor continue; 5385e306b12SDouglas Gregor } 5395e306b12SDouglas Gregor 5405e306b12SDouglas Gregor // Handle potentially-interesting records below. 5415e306b12SDouglas Gregor break; 5425e306b12SDouglas Gregor 5435e306b12SDouglas Gregor case llvm::BitstreamEntry::SubBlock: 544e060e57bSDouglas Gregor if (Entry.ID == CONTROL_BLOCK_ID) { 5455e306b12SDouglas Gregor if (InStream.EnterSubBlock(CONTROL_BLOCK_ID)) 5465e306b12SDouglas Gregor return true; 5475e306b12SDouglas Gregor 5485e306b12SDouglas Gregor // Found the control block. 5495e306b12SDouglas Gregor State = ControlBlock; 5505e306b12SDouglas Gregor continue; 5515e306b12SDouglas Gregor } 5525e306b12SDouglas Gregor 553e060e57bSDouglas Gregor if (Entry.ID == AST_BLOCK_ID) { 5545e306b12SDouglas Gregor if (InStream.EnterSubBlock(AST_BLOCK_ID)) 5555e306b12SDouglas Gregor return true; 5565e306b12SDouglas Gregor 5575e306b12SDouglas Gregor // Found the AST block. 5585e306b12SDouglas Gregor State = ASTBlock; 5595e306b12SDouglas Gregor continue; 5605e306b12SDouglas Gregor } 5615e306b12SDouglas Gregor 5625e306b12SDouglas Gregor if (InStream.SkipBlock()) 5635e306b12SDouglas Gregor return true; 5645e306b12SDouglas Gregor 5655e306b12SDouglas Gregor continue; 5665e306b12SDouglas Gregor 5675e306b12SDouglas Gregor case llvm::BitstreamEntry::EndBlock: 568e060e57bSDouglas Gregor State = Other; 5695e306b12SDouglas Gregor continue; 5705e306b12SDouglas Gregor } 5715e306b12SDouglas Gregor 5725e306b12SDouglas Gregor // Read the given record. 5735e306b12SDouglas Gregor SmallVector<uint64_t, 64> Record; 5745e306b12SDouglas Gregor StringRef Blob; 5755e306b12SDouglas Gregor unsigned Code = InStream.readRecord(Entry.ID, Record, &Blob); 5765e306b12SDouglas Gregor 5775e306b12SDouglas Gregor // Handle module dependencies. 5785e306b12SDouglas Gregor if (State == ControlBlock && Code == IMPORTS) { 5795e306b12SDouglas Gregor // Load each of the imported PCH files. 5805e306b12SDouglas Gregor unsigned Idx = 0, N = Record.size(); 5815e306b12SDouglas Gregor while (Idx < N) { 5825e306b12SDouglas Gregor // Read information about the AST file. 5835e306b12SDouglas Gregor 5845e306b12SDouglas Gregor // Skip the imported kind 5855e306b12SDouglas Gregor ++Idx; 5865e306b12SDouglas Gregor 5875e306b12SDouglas Gregor // Skip the import location 5885e306b12SDouglas Gregor ++Idx; 5895e306b12SDouglas Gregor 5907029ce1aSDouglas Gregor // Load stored size/modification time. 5917029ce1aSDouglas Gregor off_t StoredSize = (off_t)Record[Idx++]; 5927029ce1aSDouglas Gregor time_t StoredModTime = (time_t)Record[Idx++]; 5937029ce1aSDouglas Gregor 594487ea14aSBen Langmuir // Skip the stored signature. 595487ea14aSBen Langmuir // FIXME: we could read the signature out of the import and validate it. 596487ea14aSBen Langmuir Idx++; 597487ea14aSBen Langmuir 5985e306b12SDouglas Gregor // Retrieve the imported file name. 5995e306b12SDouglas Gregor unsigned Length = Record[Idx++]; 6005e306b12SDouglas Gregor SmallString<128> ImportedFile(Record.begin() + Idx, 6015e306b12SDouglas Gregor Record.begin() + Idx + Length); 6025e306b12SDouglas Gregor Idx += Length; 6035e306b12SDouglas Gregor 6045e306b12SDouglas Gregor // Find the imported module file. 605dadd85dcSDouglas Gregor const FileEntry *DependsOnFile 606dadd85dcSDouglas Gregor = FileMgr.getFile(ImportedFile, /*openFile=*/false, 607dadd85dcSDouglas Gregor /*cacheFailure=*/false); 6087029ce1aSDouglas Gregor if (!DependsOnFile || 6097029ce1aSDouglas Gregor (StoredSize != DependsOnFile->getSize()) || 6107029ce1aSDouglas Gregor (StoredModTime != DependsOnFile->getModificationTime())) 6115e306b12SDouglas Gregor return true; 6125e306b12SDouglas Gregor 6135e306b12SDouglas Gregor // Record the dependency. 6145e306b12SDouglas Gregor unsigned DependsOnID = getModuleFileInfo(DependsOnFile).ID; 6155e306b12SDouglas Gregor getModuleFileInfo(File).Dependencies.push_back(DependsOnID); 6165e306b12SDouglas Gregor } 6175e306b12SDouglas Gregor 6185e306b12SDouglas Gregor continue; 6195e306b12SDouglas Gregor } 6205e306b12SDouglas Gregor 6215e306b12SDouglas Gregor // Handle the identifier table 6225e306b12SDouglas Gregor if (State == ASTBlock && Code == IDENTIFIER_TABLE && Record[0] > 0) { 623bb094f06SJustin Bogner typedef llvm::OnDiskIterableChainedHashTable< 624bb094f06SJustin Bogner InterestingASTIdentifierLookupTrait> InterestingIdentifierTable; 625b8984329SAhmed Charles std::unique_ptr<InterestingIdentifierTable> Table( 626b8984329SAhmed Charles InterestingIdentifierTable::Create( 6275e306b12SDouglas Gregor (const unsigned char *)Blob.data() + Record[0], 628da4e650eSJustin Bogner (const unsigned char *)Blob.data() + sizeof(uint32_t), 6295e306b12SDouglas Gregor (const unsigned char *)Blob.data())); 6305e306b12SDouglas Gregor for (InterestingIdentifierTable::data_iterator D = Table->data_begin(), 6315e306b12SDouglas Gregor DEnd = Table->data_end(); 6325e306b12SDouglas Gregor D != DEnd; ++D) { 6335e306b12SDouglas Gregor std::pair<StringRef, bool> Ident = *D; 6345e306b12SDouglas Gregor if (Ident.second) 6355e306b12SDouglas Gregor InterestingIdentifiers[Ident.first].push_back(ID); 636e060e57bSDouglas Gregor else 637e060e57bSDouglas Gregor (void)InterestingIdentifiers[Ident.first]; 6385e306b12SDouglas Gregor } 6395e306b12SDouglas Gregor } 6405e306b12SDouglas Gregor 6415e306b12SDouglas Gregor // We don't care about this record. 6425e306b12SDouglas Gregor } 6435e306b12SDouglas Gregor 6445e306b12SDouglas Gregor return false; 6455e306b12SDouglas Gregor } 6465e306b12SDouglas Gregor 6475e306b12SDouglas Gregor namespace { 6485e306b12SDouglas Gregor 6495e306b12SDouglas Gregor /// \brief Trait used to generate the identifier index as an on-disk hash 6505e306b12SDouglas Gregor /// table. 6515e306b12SDouglas Gregor class IdentifierIndexWriterTrait { 6525e306b12SDouglas Gregor public: 6535e306b12SDouglas Gregor typedef StringRef key_type; 6545e306b12SDouglas Gregor typedef StringRef key_type_ref; 6555e306b12SDouglas Gregor typedef SmallVector<unsigned, 2> data_type; 6565e306b12SDouglas Gregor typedef const SmallVector<unsigned, 2> &data_type_ref; 65725463f15SJustin Bogner typedef unsigned hash_value_type; 65825463f15SJustin Bogner typedef unsigned offset_type; 6595e306b12SDouglas Gregor 66025463f15SJustin Bogner static hash_value_type ComputeHash(key_type_ref Key) { 6615e306b12SDouglas Gregor return llvm::HashString(Key); 6625e306b12SDouglas Gregor } 6635e306b12SDouglas Gregor 6645e306b12SDouglas Gregor std::pair<unsigned,unsigned> 6655e306b12SDouglas Gregor EmitKeyDataLength(raw_ostream& Out, key_type_ref Key, data_type_ref Data) { 666e1c147c3SJustin Bogner using namespace llvm::support; 667e1c147c3SJustin Bogner endian::Writer<little> LE(Out); 6685e306b12SDouglas Gregor unsigned KeyLen = Key.size(); 6695e306b12SDouglas Gregor unsigned DataLen = Data.size() * 4; 670e1c147c3SJustin Bogner LE.write<uint16_t>(KeyLen); 671e1c147c3SJustin Bogner LE.write<uint16_t>(DataLen); 6725e306b12SDouglas Gregor return std::make_pair(KeyLen, DataLen); 6735e306b12SDouglas Gregor } 6745e306b12SDouglas Gregor 6755e306b12SDouglas Gregor void EmitKey(raw_ostream& Out, key_type_ref Key, unsigned KeyLen) { 6765e306b12SDouglas Gregor Out.write(Key.data(), KeyLen); 6775e306b12SDouglas Gregor } 6785e306b12SDouglas Gregor 6795e306b12SDouglas Gregor void EmitData(raw_ostream& Out, key_type_ref Key, data_type_ref Data, 6805e306b12SDouglas Gregor unsigned DataLen) { 681e1c147c3SJustin Bogner using namespace llvm::support; 6825e306b12SDouglas Gregor for (unsigned I = 0, N = Data.size(); I != N; ++I) 683e1c147c3SJustin Bogner endian::Writer<little>(Out).write<uint32_t>(Data[I]); 6845e306b12SDouglas Gregor } 6855e306b12SDouglas Gregor }; 6865e306b12SDouglas Gregor 6875e306b12SDouglas Gregor } 6885e306b12SDouglas Gregor 6895e306b12SDouglas Gregor void GlobalModuleIndexBuilder::writeIndex(llvm::BitstreamWriter &Stream) { 6905e306b12SDouglas Gregor using namespace llvm; 6915e306b12SDouglas Gregor 6925e306b12SDouglas Gregor // Emit the file header. 6935e306b12SDouglas Gregor Stream.Emit((unsigned)'B', 8); 6945e306b12SDouglas Gregor Stream.Emit((unsigned)'C', 8); 6955e306b12SDouglas Gregor Stream.Emit((unsigned)'G', 8); 6965e306b12SDouglas Gregor Stream.Emit((unsigned)'I', 8); 6975e306b12SDouglas Gregor 6985e306b12SDouglas Gregor // Write the block-info block, which describes the records in this bitcode 6995e306b12SDouglas Gregor // file. 7005e306b12SDouglas Gregor emitBlockInfoBlock(Stream); 7015e306b12SDouglas Gregor 7025e306b12SDouglas Gregor Stream.EnterSubblock(GLOBAL_INDEX_BLOCK_ID, 3); 7035e306b12SDouglas Gregor 7045e306b12SDouglas Gregor // Write the metadata. 7055e306b12SDouglas Gregor SmallVector<uint64_t, 2> Record; 7065e306b12SDouglas Gregor Record.push_back(CurrentVersion); 707e060e57bSDouglas Gregor Stream.EmitRecord(INDEX_METADATA, Record); 7085e306b12SDouglas Gregor 7095e306b12SDouglas Gregor // Write the set of known module files. 7105e306b12SDouglas Gregor for (ModuleFilesMap::iterator M = ModuleFiles.begin(), 7115e306b12SDouglas Gregor MEnd = ModuleFiles.end(); 7125e306b12SDouglas Gregor M != MEnd; ++M) { 7135e306b12SDouglas Gregor Record.clear(); 7145e306b12SDouglas Gregor Record.push_back(M->second.ID); 7155e306b12SDouglas Gregor Record.push_back(M->first->getSize()); 7165e306b12SDouglas Gregor Record.push_back(M->first->getModificationTime()); 7175e306b12SDouglas Gregor 7185e306b12SDouglas Gregor // File name 7195e306b12SDouglas Gregor StringRef Name(M->first->getName()); 7205e306b12SDouglas Gregor Record.push_back(Name.size()); 7215e306b12SDouglas Gregor Record.append(Name.begin(), Name.end()); 7225e306b12SDouglas Gregor 7235e306b12SDouglas Gregor // Dependencies 7245e306b12SDouglas Gregor Record.push_back(M->second.Dependencies.size()); 7255e306b12SDouglas Gregor Record.append(M->second.Dependencies.begin(), M->second.Dependencies.end()); 7265e306b12SDouglas Gregor Stream.EmitRecord(MODULE, Record); 7275e306b12SDouglas Gregor } 7285e306b12SDouglas Gregor 7295e306b12SDouglas Gregor // Write the identifier -> module file mapping. 7305e306b12SDouglas Gregor { 731bb094f06SJustin Bogner llvm::OnDiskChainedHashTableGenerator<IdentifierIndexWriterTrait> Generator; 7325e306b12SDouglas Gregor IdentifierIndexWriterTrait Trait; 7335e306b12SDouglas Gregor 7345e306b12SDouglas Gregor // Populate the hash table. 7355e306b12SDouglas Gregor for (InterestingIdentifierMap::iterator I = InterestingIdentifiers.begin(), 7365e306b12SDouglas Gregor IEnd = InterestingIdentifiers.end(); 7375e306b12SDouglas Gregor I != IEnd; ++I) { 7385e306b12SDouglas Gregor Generator.insert(I->first(), I->second, Trait); 7395e306b12SDouglas Gregor } 7405e306b12SDouglas Gregor 7415e306b12SDouglas Gregor // Create the on-disk hash table in a buffer. 7425e306b12SDouglas Gregor SmallString<4096> IdentifierTable; 7435e306b12SDouglas Gregor uint32_t BucketOffset; 7445e306b12SDouglas Gregor { 745e1c147c3SJustin Bogner using namespace llvm::support; 7465e306b12SDouglas Gregor llvm::raw_svector_ostream Out(IdentifierTable); 7475e306b12SDouglas Gregor // Make sure that no bucket is at offset 0 748e1c147c3SJustin Bogner endian::Writer<little>(Out).write<uint32_t>(0); 7495e306b12SDouglas Gregor BucketOffset = Generator.Emit(Out, Trait); 7505e306b12SDouglas Gregor } 7515e306b12SDouglas Gregor 7525e306b12SDouglas Gregor // Create a blob abbreviation 7535e306b12SDouglas Gregor BitCodeAbbrev *Abbrev = new BitCodeAbbrev(); 7545e306b12SDouglas Gregor Abbrev->Add(BitCodeAbbrevOp(IDENTIFIER_INDEX)); 7555e306b12SDouglas Gregor Abbrev->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Fixed, 32)); 7565e306b12SDouglas Gregor Abbrev->Add(BitCodeAbbrevOp(BitCodeAbbrevOp::Blob)); 7575e306b12SDouglas Gregor unsigned IDTableAbbrev = Stream.EmitAbbrev(Abbrev); 7585e306b12SDouglas Gregor 7595e306b12SDouglas Gregor // Write the identifier table 7605e306b12SDouglas Gregor Record.clear(); 7615e306b12SDouglas Gregor Record.push_back(IDENTIFIER_INDEX); 7625e306b12SDouglas Gregor Record.push_back(BucketOffset); 76392e1b62dSYaron Keren Stream.EmitRecordWithBlob(IDTableAbbrev, Record, IdentifierTable); 7645e306b12SDouglas Gregor } 7655e306b12SDouglas Gregor 7665e306b12SDouglas Gregor Stream.ExitBlock(); 7675e306b12SDouglas Gregor } 7685e306b12SDouglas Gregor 7695e306b12SDouglas Gregor GlobalModuleIndex::ErrorCode 770*bb165fb0SAdrian Prantl GlobalModuleIndex::writeIndex(FileManager &FileMgr, 771*bb165fb0SAdrian Prantl const PCHContainerOperations &PCHContainerOps, 772*bb165fb0SAdrian Prantl StringRef Path) { 7735e306b12SDouglas Gregor llvm::SmallString<128> IndexPath; 7745e306b12SDouglas Gregor IndexPath += Path; 7755e306b12SDouglas Gregor llvm::sys::path::append(IndexPath, IndexFileName); 7765e306b12SDouglas Gregor 7775e306b12SDouglas Gregor // Coordinate building the global index file with other processes that might 7785e306b12SDouglas Gregor // try to do the same. 7795e306b12SDouglas Gregor llvm::LockFileManager Locked(IndexPath); 7805e306b12SDouglas Gregor switch (Locked) { 7815e306b12SDouglas Gregor case llvm::LockFileManager::LFS_Error: 7825e306b12SDouglas Gregor return EC_IOError; 7835e306b12SDouglas Gregor 7845e306b12SDouglas Gregor case llvm::LockFileManager::LFS_Owned: 7855e306b12SDouglas Gregor // We're responsible for building the index ourselves. Do so below. 7865e306b12SDouglas Gregor break; 7875e306b12SDouglas Gregor 7885e306b12SDouglas Gregor case llvm::LockFileManager::LFS_Shared: 7895e306b12SDouglas Gregor // Someone else is responsible for building the index. We don't care 7905e306b12SDouglas Gregor // when they finish, so we're done. 7915e306b12SDouglas Gregor return EC_Building; 7925e306b12SDouglas Gregor } 7935e306b12SDouglas Gregor 7945e306b12SDouglas Gregor // The module index builder. 795*bb165fb0SAdrian Prantl GlobalModuleIndexBuilder Builder(FileMgr, PCHContainerOps); 7965e306b12SDouglas Gregor 7975e306b12SDouglas Gregor // Load each of the module files. 798c080917eSRafael Espindola std::error_code EC; 7995e306b12SDouglas Gregor for (llvm::sys::fs::directory_iterator D(Path, EC), DEnd; 8005e306b12SDouglas Gregor D != DEnd && !EC; 8015e306b12SDouglas Gregor D.increment(EC)) { 8025e306b12SDouglas Gregor // If this isn't a module file, we don't care. 8035e306b12SDouglas Gregor if (llvm::sys::path::extension(D->path()) != ".pcm") { 8045e306b12SDouglas Gregor // ... unless it's a .pcm.lock file, which indicates that someone is 8055e306b12SDouglas Gregor // in the process of rebuilding a module. They'll rebuild the index 8065e306b12SDouglas Gregor // at the end of that translation unit, so we don't have to. 8075e306b12SDouglas Gregor if (llvm::sys::path::extension(D->path()) == ".pcm.lock") 8085e306b12SDouglas Gregor return EC_Building; 8095e306b12SDouglas Gregor 8105e306b12SDouglas Gregor continue; 8115e306b12SDouglas Gregor } 8125e306b12SDouglas Gregor 8135e306b12SDouglas Gregor // If we can't find the module file, skip it. 8145e306b12SDouglas Gregor const FileEntry *ModuleFile = FileMgr.getFile(D->path()); 8155e306b12SDouglas Gregor if (!ModuleFile) 8165e306b12SDouglas Gregor continue; 8175e306b12SDouglas Gregor 8185e306b12SDouglas Gregor // Load this module file. 8195e306b12SDouglas Gregor if (Builder.loadModuleFile(ModuleFile)) 8205e306b12SDouglas Gregor return EC_IOError; 8215e306b12SDouglas Gregor } 8225e306b12SDouglas Gregor 8235e306b12SDouglas Gregor // The output buffer, into which the global index will be written. 8245e306b12SDouglas Gregor SmallVector<char, 16> OutputBuffer; 8255e306b12SDouglas Gregor { 8265e306b12SDouglas Gregor llvm::BitstreamWriter OutputStream(OutputBuffer); 8275e306b12SDouglas Gregor Builder.writeIndex(OutputStream); 8285e306b12SDouglas Gregor } 8295e306b12SDouglas Gregor 8305e306b12SDouglas Gregor // Write the global index file to a temporary file. 8315e306b12SDouglas Gregor llvm::SmallString<128> IndexTmpPath; 8325e306b12SDouglas Gregor int TmpFD; 83318627115SRafael Espindola if (llvm::sys::fs::createUniqueFile(IndexPath + "-%%%%%%%%", TmpFD, 83418627115SRafael Espindola IndexTmpPath)) 8355e306b12SDouglas Gregor return EC_IOError; 8365e306b12SDouglas Gregor 8375e306b12SDouglas Gregor // Open the temporary global index file for output. 838e00c9868SNAKAMURA Takumi llvm::raw_fd_ostream Out(TmpFD, true); 8395e306b12SDouglas Gregor if (Out.has_error()) 8405e306b12SDouglas Gregor return EC_IOError; 8415e306b12SDouglas Gregor 8425e306b12SDouglas Gregor // Write the index. 8435e306b12SDouglas Gregor Out.write(OutputBuffer.data(), OutputBuffer.size()); 8445e306b12SDouglas Gregor Out.close(); 8455e306b12SDouglas Gregor if (Out.has_error()) 8465e306b12SDouglas Gregor return EC_IOError; 8475e306b12SDouglas Gregor 8485e306b12SDouglas Gregor // Remove the old index file. It isn't relevant any more. 84992e1b62dSYaron Keren llvm::sys::fs::remove(IndexPath); 8505e306b12SDouglas Gregor 8515e306b12SDouglas Gregor // Rename the newly-written index file to the proper name. 85292e1b62dSYaron Keren if (llvm::sys::fs::rename(IndexTmpPath, IndexPath)) { 8535e306b12SDouglas Gregor // Rename failed; just remove the 85492e1b62dSYaron Keren llvm::sys::fs::remove(IndexTmpPath); 8555e306b12SDouglas Gregor return EC_IOError; 8565e306b12SDouglas Gregor } 8575e306b12SDouglas Gregor 8585e306b12SDouglas Gregor // We're done. 8595e306b12SDouglas Gregor return EC_None; 8605e306b12SDouglas Gregor } 8619aca3c61SArgyrios Kyrtzidis 8629aca3c61SArgyrios Kyrtzidis namespace { 8639aca3c61SArgyrios Kyrtzidis class GlobalIndexIdentifierIterator : public IdentifierIterator { 8649aca3c61SArgyrios Kyrtzidis /// \brief The current position within the identifier lookup table. 8659aca3c61SArgyrios Kyrtzidis IdentifierIndexTable::key_iterator Current; 8669aca3c61SArgyrios Kyrtzidis 8679aca3c61SArgyrios Kyrtzidis /// \brief The end position within the identifier lookup table. 8689aca3c61SArgyrios Kyrtzidis IdentifierIndexTable::key_iterator End; 8699aca3c61SArgyrios Kyrtzidis 8709aca3c61SArgyrios Kyrtzidis public: 8719aca3c61SArgyrios Kyrtzidis explicit GlobalIndexIdentifierIterator(IdentifierIndexTable &Idx) { 8729aca3c61SArgyrios Kyrtzidis Current = Idx.key_begin(); 8739aca3c61SArgyrios Kyrtzidis End = Idx.key_end(); 8749aca3c61SArgyrios Kyrtzidis } 8759aca3c61SArgyrios Kyrtzidis 8763e89dfeeSCraig Topper StringRef Next() override { 8779aca3c61SArgyrios Kyrtzidis if (Current == End) 8789aca3c61SArgyrios Kyrtzidis return StringRef(); 8799aca3c61SArgyrios Kyrtzidis 8809aca3c61SArgyrios Kyrtzidis StringRef Result = *Current; 8819aca3c61SArgyrios Kyrtzidis ++Current; 8829aca3c61SArgyrios Kyrtzidis return Result; 8839aca3c61SArgyrios Kyrtzidis } 8849aca3c61SArgyrios Kyrtzidis }; 8859aca3c61SArgyrios Kyrtzidis } 8869aca3c61SArgyrios Kyrtzidis 8879aca3c61SArgyrios Kyrtzidis IdentifierIterator *GlobalModuleIndex::createIdentifierIterator() const { 8889aca3c61SArgyrios Kyrtzidis IdentifierIndexTable &Table = 8899aca3c61SArgyrios Kyrtzidis *static_cast<IdentifierIndexTable *>(IdentifierIndex); 8909aca3c61SArgyrios Kyrtzidis return new GlobalIndexIdentifierIterator(Table); 8919aca3c61SArgyrios Kyrtzidis } 892