1 //===- DebugTypes.cpp -----------------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #include "DebugTypes.h"
10 #include "Chunks.h"
11 #include "Driver.h"
12 #include "InputFiles.h"
13 #include "PDB.h"
14 #include "TypeMerger.h"
15 #include "lld/Common/ErrorHandler.h"
16 #include "lld/Common/Memory.h"
17 #include "lld/Common/Timer.h"
18 #include "llvm/DebugInfo/CodeView/TypeIndexDiscovery.h"
19 #include "llvm/DebugInfo/CodeView/TypeRecord.h"
20 #include "llvm/DebugInfo/CodeView/TypeRecordHelpers.h"
21 #include "llvm/DebugInfo/CodeView/TypeStreamMerger.h"
22 #include "llvm/DebugInfo/PDB/GenericError.h"
23 #include "llvm/DebugInfo/PDB/Native/InfoStream.h"
24 #include "llvm/DebugInfo/PDB/Native/NativeSession.h"
25 #include "llvm/DebugInfo/PDB/Native/PDBFile.h"
26 #include "llvm/DebugInfo/PDB/Native/TpiHashing.h"
27 #include "llvm/DebugInfo/PDB/Native/TpiStream.h"
28 #include "llvm/Support/FormatVariadic.h"
29 #include "llvm/Support/Parallel.h"
30 #include "llvm/Support/Path.h"
31 
32 using namespace llvm;
33 using namespace llvm::codeview;
34 using namespace lld;
35 using namespace lld::coff;
36 
37 namespace {
38 class TypeServerIpiSource;
39 
40 // The TypeServerSource class represents a PDB type server, a file referenced by
41 // OBJ files compiled with MSVC /Zi. A single PDB can be shared by several OBJ
42 // files, therefore there must be only once instance per OBJ lot. The file path
43 // is discovered from the dependent OBJ's debug type stream. The
44 // TypeServerSource object is then queued and loaded by the COFF Driver. The
45 // debug type stream for such PDB files will be merged first in the final PDB,
46 // before any dependent OBJ.
47 class TypeServerSource : public TpiSource {
48 public:
49   explicit TypeServerSource(PDBInputFile *f)
50       : TpiSource(PDB, nullptr), pdbInputFile(f) {
51     if (f->loadErr && *f->loadErr)
52       return;
53     pdb::PDBFile &file = f->session->getPDBFile();
54     auto expectedInfo = file.getPDBInfoStream();
55     if (!expectedInfo)
56       return;
57     auto it = mappings.emplace(expectedInfo->getGuid(), this);
58     assert(it.second);
59     (void)it;
60   }
61 
62   Error mergeDebugT(TypeMerger *m) override;
63 
64   void loadGHashes() override;
65   void remapTpiWithGHashes(GHashState *g) override;
66 
67   bool isDependency() const override { return true; }
68 
69   PDBInputFile *pdbInputFile = nullptr;
70 
71   // TpiSource for IPI stream.
72   TypeServerIpiSource *ipiSrc = nullptr;
73 
74   static std::map<codeview::GUID, TypeServerSource *> mappings;
75 };
76 
77 // Companion to TypeServerSource. Stores the index map for the IPI stream in the
78 // PDB. Modeling PDBs with two sources for TPI and IPI helps establish the
79 // invariant of one type index space per source.
80 class TypeServerIpiSource : public TpiSource {
81 public:
82   explicit TypeServerIpiSource() : TpiSource(PDBIpi, nullptr) {}
83 
84   friend class TypeServerSource;
85 
86   // All of the TpiSource methods are no-ops. The parent TypeServerSource
87   // handles both TPI and IPI.
88   Error mergeDebugT(TypeMerger *m) override { return Error::success(); }
89   void loadGHashes() override {}
90   void remapTpiWithGHashes(GHashState *g) override {}
91   bool isDependency() const override { return true; }
92 };
93 
94 // This class represents the debug type stream of an OBJ file that depends on a
95 // PDB type server (see TypeServerSource).
96 class UseTypeServerSource : public TpiSource {
97   Expected<TypeServerSource *> getTypeServerSource();
98 
99 public:
100   UseTypeServerSource(ObjFile *f, TypeServer2Record ts)
101       : TpiSource(UsingPDB, f), typeServerDependency(ts) {}
102 
103   Error mergeDebugT(TypeMerger *m) override;
104 
105   // No need to load ghashes from /Zi objects.
106   void loadGHashes() override {}
107   void remapTpiWithGHashes(GHashState *g) override;
108 
109   // Information about the PDB type server dependency, that needs to be loaded
110   // in before merging this OBJ.
111   TypeServer2Record typeServerDependency;
112 };
113 
114 // This class represents the debug type stream of a Microsoft precompiled
115 // headers OBJ (PCH OBJ). This OBJ kind needs to be merged first in the output
116 // PDB, before any other OBJs that depend on this. Note that only MSVC generate
117 // such files, clang does not.
118 class PrecompSource : public TpiSource {
119 public:
120   PrecompSource(ObjFile *f) : TpiSource(PCH, f) {
121     if (!f->pchSignature || !*f->pchSignature)
122       fatal(toString(f) +
123             " claims to be a PCH object, but does not have a valid signature");
124     auto it = mappings.emplace(*f->pchSignature, this);
125     if (!it.second)
126       fatal("a PCH object with the same signature has already been provided (" +
127             toString(it.first->second->file) + " and " + toString(file) + ")");
128   }
129 
130   void loadGHashes() override;
131 
132   bool isDependency() const override { return true; }
133 
134   static std::map<uint32_t, PrecompSource *> mappings;
135 };
136 
137 // This class represents the debug type stream of an OBJ file that depends on a
138 // Microsoft precompiled headers OBJ (see PrecompSource).
139 class UsePrecompSource : public TpiSource {
140 public:
141   UsePrecompSource(ObjFile *f, PrecompRecord precomp)
142       : TpiSource(UsingPCH, f), precompDependency(precomp) {}
143 
144   Error mergeDebugT(TypeMerger *m) override;
145 
146   void loadGHashes() override;
147   void remapTpiWithGHashes(GHashState *g) override;
148 
149 private:
150   Error mergeInPrecompHeaderObj();
151 
152 public:
153   // Information about the Precomp OBJ dependency, that needs to be loaded in
154   // before merging this OBJ.
155   PrecompRecord precompDependency;
156 };
157 } // namespace
158 
159 std::vector<TpiSource *> TpiSource::instances;
160 ArrayRef<TpiSource *> TpiSource::dependencySources;
161 ArrayRef<TpiSource *> TpiSource::objectSources;
162 
163 TpiSource::TpiSource(TpiKind k, ObjFile *f)
164     : kind(k), tpiSrcIdx(instances.size()), file(f) {
165   instances.push_back(this);
166 }
167 
168 // Vtable key method.
169 TpiSource::~TpiSource() {
170   // Silence any assertions about unchecked errors.
171   consumeError(std::move(typeMergingError));
172 }
173 
174 void TpiSource::sortDependencies() {
175   // Order dependencies first, but preserve the existing order.
176   std::vector<TpiSource *> deps;
177   std::vector<TpiSource *> objs;
178   for (TpiSource *s : instances)
179     (s->isDependency() ? deps : objs).push_back(s);
180   uint32_t numDeps = deps.size();
181   uint32_t numObjs = objs.size();
182   instances = std::move(deps);
183   instances.insert(instances.end(), objs.begin(), objs.end());
184   for (uint32_t i = 0, e = instances.size(); i < e; ++i)
185     instances[i]->tpiSrcIdx = i;
186   dependencySources = makeArrayRef(instances.data(), numDeps);
187   objectSources = makeArrayRef(instances.data() + numDeps, numObjs);
188 }
189 
190 TpiSource *lld::coff::makeTpiSource(ObjFile *file) {
191   return make<TpiSource>(TpiSource::Regular, file);
192 }
193 
194 TpiSource *lld::coff::makeTypeServerSource(PDBInputFile *pdbInputFile) {
195   // Type server sources come in pairs: the TPI stream, and the IPI stream.
196   auto *tpiSource = make<TypeServerSource>(pdbInputFile);
197   if (pdbInputFile->session->getPDBFile().hasPDBIpiStream())
198     tpiSource->ipiSrc = make<TypeServerIpiSource>();
199   return tpiSource;
200 }
201 
202 TpiSource *lld::coff::makeUseTypeServerSource(ObjFile *file,
203                                               TypeServer2Record ts) {
204   return make<UseTypeServerSource>(file, ts);
205 }
206 
207 TpiSource *lld::coff::makePrecompSource(ObjFile *file) {
208   return make<PrecompSource>(file);
209 }
210 
211 TpiSource *lld::coff::makeUsePrecompSource(ObjFile *file,
212                                            PrecompRecord precomp) {
213   return make<UsePrecompSource>(file, precomp);
214 }
215 
216 std::map<codeview::GUID, TypeServerSource *> TypeServerSource::mappings;
217 
218 std::map<uint32_t, PrecompSource *> PrecompSource::mappings;
219 
220 bool TpiSource::remapTypeIndex(TypeIndex &ti, TiRefKind refKind) const {
221   if (ti.isSimple())
222     return true;
223 
224   // This can be an item index or a type index. Choose the appropriate map.
225   ArrayRef<TypeIndex> tpiOrIpiMap =
226       (refKind == TiRefKind::IndexRef) ? ipiMap : tpiMap;
227   if (ti.toArrayIndex() >= tpiOrIpiMap.size())
228     return false;
229   ti = tpiOrIpiMap[ti.toArrayIndex()];
230   return true;
231 }
232 
233 void TpiSource::remapRecord(MutableArrayRef<uint8_t> rec,
234                             ArrayRef<TiReference> typeRefs) {
235   MutableArrayRef<uint8_t> contents = rec.drop_front(sizeof(RecordPrefix));
236   for (const TiReference &ref : typeRefs) {
237     unsigned byteSize = ref.Count * sizeof(TypeIndex);
238     if (contents.size() < ref.Offset + byteSize)
239       fatal("symbol record too short");
240 
241     MutableArrayRef<TypeIndex> indices(
242         reinterpret_cast<TypeIndex *>(contents.data() + ref.Offset), ref.Count);
243     for (TypeIndex &ti : indices) {
244       if (!remapTypeIndex(ti, ref.Kind)) {
245         if (config->verbose) {
246           uint16_t kind =
247               reinterpret_cast<const RecordPrefix *>(rec.data())->RecordKind;
248           StringRef fname = file ? file->getName() : "<unknown PDB>";
249           log("failed to remap type index in record of kind 0x" +
250               utohexstr(kind) + " in " + fname + " with bad " +
251               (ref.Kind == TiRefKind::IndexRef ? "item" : "type") +
252               " index 0x" + utohexstr(ti.getIndex()));
253         }
254         ti = TypeIndex(SimpleTypeKind::NotTranslated);
255         continue;
256       }
257     }
258   }
259 }
260 
261 void TpiSource::remapTypesInTypeRecord(MutableArrayRef<uint8_t> rec) {
262   // TODO: Handle errors similar to symbols.
263   SmallVector<TiReference, 32> typeRefs;
264   discoverTypeIndices(CVType(rec), typeRefs);
265   remapRecord(rec, typeRefs);
266 }
267 
268 bool TpiSource::remapTypesInSymbolRecord(MutableArrayRef<uint8_t> rec) {
269   // Discover type index references in the record. Skip it if we don't
270   // know where they are.
271   SmallVector<TiReference, 32> typeRefs;
272   if (!discoverTypeIndicesInSymbol(rec, typeRefs))
273     return false;
274   remapRecord(rec, typeRefs);
275   return true;
276 }
277 
278 // A COFF .debug$H section is currently a clang extension.  This function checks
279 // if a .debug$H section is in a format that we expect / understand, so that we
280 // can ignore any sections which are coincidentally also named .debug$H but do
281 // not contain a format we recognize.
282 static bool canUseDebugH(ArrayRef<uint8_t> debugH) {
283   if (debugH.size() < sizeof(object::debug_h_header))
284     return false;
285   auto *header =
286       reinterpret_cast<const object::debug_h_header *>(debugH.data());
287   debugH = debugH.drop_front(sizeof(object::debug_h_header));
288   return header->Magic == COFF::DEBUG_HASHES_SECTION_MAGIC &&
289          header->Version == 0 &&
290          header->HashAlgorithm == uint16_t(GlobalTypeHashAlg::SHA1_8) &&
291          (debugH.size() % 8 == 0);
292 }
293 
294 static Optional<ArrayRef<uint8_t>> getDebugH(ObjFile *file) {
295   SectionChunk *sec =
296       SectionChunk::findByName(file->getDebugChunks(), ".debug$H");
297   if (!sec)
298     return llvm::None;
299   ArrayRef<uint8_t> contents = sec->getContents();
300   if (!canUseDebugH(contents))
301     return None;
302   return contents;
303 }
304 
305 static ArrayRef<GloballyHashedType>
306 getHashesFromDebugH(ArrayRef<uint8_t> debugH) {
307   assert(canUseDebugH(debugH));
308   debugH = debugH.drop_front(sizeof(object::debug_h_header));
309   uint32_t count = debugH.size() / sizeof(GloballyHashedType);
310   return {reinterpret_cast<const GloballyHashedType *>(debugH.data()), count};
311 }
312 
313 // Merge .debug$T for a generic object file.
314 Error TpiSource::mergeDebugT(TypeMerger *m) {
315   assert(!config->debugGHashes &&
316          "use remapTpiWithGHashes when ghash is enabled");
317 
318   CVTypeArray types;
319   BinaryStreamReader reader(file->debugTypes, support::little);
320   cantFail(reader.readArray(types, reader.getLength()));
321 
322   // When dealing with PCH.OBJ, some indices were already merged.
323   unsigned nbHeadIndices = indexMapStorage.size();
324 
325   if (auto err = mergeTypeAndIdRecords(
326           m->idTable, m->typeTable, indexMapStorage, types, file->pchSignature))
327     fatal("codeview::mergeTypeAndIdRecords failed: " +
328           toString(std::move(err)));
329 
330   // In an object, there is only one mapping for both types and items.
331   tpiMap = indexMapStorage;
332   ipiMap = indexMapStorage;
333 
334   if (config->showSummary) {
335     // Count how many times we saw each type record in our input. This
336     // calculation requires a second pass over the type records to classify each
337     // record as a type or index. This is slow, but this code executes when
338     // collecting statistics.
339     m->tpiCounts.resize(m->getTypeTable().size());
340     m->ipiCounts.resize(m->getIDTable().size());
341     uint32_t srcIdx = nbHeadIndices;
342     for (CVType &ty : types) {
343       TypeIndex dstIdx = tpiMap[srcIdx++];
344       // Type merging may fail, so a complex source type may become the simple
345       // NotTranslated type, which cannot be used as an array index.
346       if (dstIdx.isSimple())
347         continue;
348       SmallVectorImpl<uint32_t> &counts =
349           isIdRecord(ty.kind()) ? m->ipiCounts : m->tpiCounts;
350       ++counts[dstIdx.toArrayIndex()];
351     }
352   }
353 
354   return Error::success();
355 }
356 
357 // Merge types from a type server PDB.
358 Error TypeServerSource::mergeDebugT(TypeMerger *m) {
359   assert(!config->debugGHashes &&
360          "use remapTpiWithGHashes when ghash is enabled");
361 
362   pdb::PDBFile &pdbFile = pdbInputFile->session->getPDBFile();
363   Expected<pdb::TpiStream &> expectedTpi = pdbFile.getPDBTpiStream();
364   if (auto e = expectedTpi.takeError())
365     fatal("Type server does not have TPI stream: " + toString(std::move(e)));
366   pdb::TpiStream *maybeIpi = nullptr;
367   if (pdbFile.hasPDBIpiStream()) {
368     Expected<pdb::TpiStream &> expectedIpi = pdbFile.getPDBIpiStream();
369     if (auto e = expectedIpi.takeError())
370       fatal("Error getting type server IPI stream: " + toString(std::move(e)));
371     maybeIpi = &*expectedIpi;
372   }
373 
374   // Merge TPI first, because the IPI stream will reference type indices.
375   if (auto err = mergeTypeRecords(m->typeTable, indexMapStorage,
376                                   expectedTpi->typeArray()))
377     fatal("codeview::mergeTypeRecords failed: " + toString(std::move(err)));
378   tpiMap = indexMapStorage;
379 
380   // Merge IPI.
381   if (maybeIpi) {
382     if (auto err = mergeIdRecords(m->idTable, tpiMap, ipiSrc->indexMapStorage,
383                                   maybeIpi->typeArray()))
384       fatal("codeview::mergeIdRecords failed: " + toString(std::move(err)));
385     ipiMap = ipiSrc->indexMapStorage;
386   }
387 
388   if (config->showSummary) {
389     // Count how many times we saw each type record in our input. If a
390     // destination type index is present in the source to destination type index
391     // map, that means we saw it once in the input. Add it to our histogram.
392     m->tpiCounts.resize(m->getTypeTable().size());
393     m->ipiCounts.resize(m->getIDTable().size());
394     for (TypeIndex ti : tpiMap)
395       if (!ti.isSimple())
396         ++m->tpiCounts[ti.toArrayIndex()];
397     for (TypeIndex ti : ipiMap)
398       if (!ti.isSimple())
399         ++m->ipiCounts[ti.toArrayIndex()];
400   }
401 
402   return Error::success();
403 }
404 
405 Expected<TypeServerSource *> UseTypeServerSource::getTypeServerSource() {
406   const codeview::GUID &tsId = typeServerDependency.getGuid();
407   StringRef tsPath = typeServerDependency.getName();
408 
409   TypeServerSource *tsSrc;
410   auto it = TypeServerSource::mappings.find(tsId);
411   if (it != TypeServerSource::mappings.end()) {
412     tsSrc = it->second;
413   } else {
414     // The file failed to load, lookup by name
415     PDBInputFile *pdb = PDBInputFile::findFromRecordPath(tsPath, file);
416     if (!pdb)
417       return createFileError(tsPath, errorCodeToError(std::error_code(
418                                          ENOENT, std::generic_category())));
419     // If an error occurred during loading, throw it now
420     if (pdb->loadErr && *pdb->loadErr)
421       return createFileError(tsPath, std::move(*pdb->loadErr));
422 
423     tsSrc = (TypeServerSource *)pdb->debugTypesObj;
424   }
425   return tsSrc;
426 }
427 
428 Error UseTypeServerSource::mergeDebugT(TypeMerger *m) {
429   Expected<TypeServerSource *> tsSrc = getTypeServerSource();
430   if (!tsSrc)
431     return tsSrc.takeError();
432 
433   pdb::PDBFile &pdbSession = (*tsSrc)->pdbInputFile->session->getPDBFile();
434   auto expectedInfo = pdbSession.getPDBInfoStream();
435   if (!expectedInfo)
436     return expectedInfo.takeError();
437 
438   // Just because a file with a matching name was found and it was an actual
439   // PDB file doesn't mean it matches.  For it to match the InfoStream's GUID
440   // must match the GUID specified in the TypeServer2 record.
441   if (expectedInfo->getGuid() != typeServerDependency.getGuid())
442     return createFileError(
443         typeServerDependency.getName(),
444         make_error<pdb::PDBError>(pdb::pdb_error_code::signature_out_of_date));
445 
446   // Reuse the type index map of the type server.
447   tpiMap = (*tsSrc)->tpiMap;
448   ipiMap = (*tsSrc)->ipiMap;
449   return Error::success();
450 }
451 
452 static bool equalsPath(StringRef path1, StringRef path2) {
453 #if defined(_WIN32)
454   return path1.equals_lower(path2);
455 #else
456   return path1.equals(path2);
457 #endif
458 }
459 
460 // Find by name an OBJ provided on the command line
461 static PrecompSource *findObjByName(StringRef fileNameOnly) {
462   SmallString<128> currentPath;
463   for (auto kv : PrecompSource::mappings) {
464     StringRef currentFileName = sys::path::filename(kv.second->file->getName(),
465                                                     sys::path::Style::windows);
466 
467     // Compare based solely on the file name (link.exe behavior)
468     if (equalsPath(currentFileName, fileNameOnly))
469       return kv.second;
470   }
471   return nullptr;
472 }
473 
474 static PrecompSource *findPrecompSource(ObjFile *file, PrecompRecord &pr) {
475   // Cross-compile warning: given that Clang doesn't generate LF_PRECOMP
476   // records, we assume the OBJ comes from a Windows build of cl.exe. Thusly,
477   // the paths embedded in the OBJs are in the Windows format.
478   SmallString<128> prFileName =
479       sys::path::filename(pr.getPrecompFilePath(), sys::path::Style::windows);
480 
481   auto it = PrecompSource::mappings.find(pr.getSignature());
482   if (it != PrecompSource::mappings.end()) {
483     return it->second;
484   }
485   // Lookup by name
486   return findObjByName(prFileName);
487 }
488 
489 static Expected<PrecompSource *> findPrecompMap(ObjFile *file,
490                                                 PrecompRecord &pr) {
491   PrecompSource *precomp = findPrecompSource(file, pr);
492 
493   if (!precomp)
494     return createFileError(
495         pr.getPrecompFilePath(),
496         make_error<pdb::PDBError>(pdb::pdb_error_code::no_matching_pch));
497 
498   if (pr.getSignature() != file->pchSignature)
499     return createFileError(
500         toString(file),
501         make_error<pdb::PDBError>(pdb::pdb_error_code::no_matching_pch));
502 
503   if (pr.getSignature() != *precomp->file->pchSignature)
504     return createFileError(
505         toString(precomp->file),
506         make_error<pdb::PDBError>(pdb::pdb_error_code::no_matching_pch));
507 
508   return precomp;
509 }
510 
511 /// Merges a precompiled headers TPI map into the current TPI map. The
512 /// precompiled headers object will also be loaded and remapped in the
513 /// process.
514 Error UsePrecompSource::mergeInPrecompHeaderObj() {
515   auto e = findPrecompMap(file, precompDependency);
516   if (!e)
517     return e.takeError();
518 
519   PrecompSource *precompSrc = *e;
520   if (precompSrc->tpiMap.empty())
521     return Error::success();
522 
523   assert(precompDependency.getStartTypeIndex() ==
524          TypeIndex::FirstNonSimpleIndex);
525   assert(precompDependency.getTypesCount() <= precompSrc->tpiMap.size());
526   // Use the previously remapped index map from the precompiled headers.
527   indexMapStorage.append(precompSrc->tpiMap.begin(),
528                          precompSrc->tpiMap.begin() +
529                              precompDependency.getTypesCount());
530 
531   return Error::success();
532 }
533 
534 Error UsePrecompSource::mergeDebugT(TypeMerger *m) {
535   // This object was compiled with /Yu, so process the corresponding
536   // precompiled headers object (/Yc) first. Some type indices in the current
537   // object are referencing data in the precompiled headers object, so we need
538   // both to be loaded.
539   if (Error e = mergeInPrecompHeaderObj())
540     return e;
541 
542   return TpiSource::mergeDebugT(m);
543 }
544 
545 uint32_t TpiSource::countTypeServerPDBs() {
546   return TypeServerSource::mappings.size();
547 }
548 
549 uint32_t TpiSource::countPrecompObjs() {
550   return PrecompSource::mappings.size();
551 }
552 
553 void TpiSource::clear() {
554   // Clean up any owned ghash allocations.
555   clearGHashes();
556   TpiSource::instances.clear();
557   TypeServerSource::mappings.clear();
558   PrecompSource::mappings.clear();
559 }
560 
561 //===----------------------------------------------------------------------===//
562 // Parellel GHash type merging implementation.
563 //===----------------------------------------------------------------------===//
564 
565 void TpiSource::loadGHashes() {
566   if (Optional<ArrayRef<uint8_t>> debugH = getDebugH(file)) {
567     ghashes = getHashesFromDebugH(*debugH);
568     ownedGHashes = false;
569   } else {
570     CVTypeArray types;
571     BinaryStreamReader reader(file->debugTypes, support::little);
572     cantFail(reader.readArray(types, reader.getLength()));
573     assignGHashesFromVector(GloballyHashedType::hashTypes(types));
574   }
575 
576   fillIsItemIndexFromDebugT();
577 }
578 
579 // Copies ghashes from a vector into an array. These are long lived, so it's
580 // worth the time to copy these into an appropriately sized vector to reduce
581 // memory usage.
582 void TpiSource::assignGHashesFromVector(
583     std::vector<GloballyHashedType> &&hashVec) {
584   GloballyHashedType *hashes = new GloballyHashedType[hashVec.size()];
585   memcpy(hashes, hashVec.data(), hashVec.size() * sizeof(GloballyHashedType));
586   ghashes = makeArrayRef(hashes, hashVec.size());
587   ownedGHashes = true;
588 }
589 
590 // Faster way to iterate type records. forEachTypeChecked is faster than
591 // iterating CVTypeArray. It avoids virtual readBytes calls in inner loops.
592 static void forEachTypeChecked(ArrayRef<uint8_t> types,
593                                function_ref<void(const CVType &)> fn) {
594   checkError(
595       forEachCodeViewRecord<CVType>(types, [fn](const CVType &ty) -> Error {
596         fn(ty);
597         return Error::success();
598       }));
599 }
600 
601 // Walk over file->debugTypes and fill in the isItemIndex bit vector.
602 // TODO: Store this information in .debug$H so that we don't have to recompute
603 // it. This is the main bottleneck slowing down parallel ghashing with one
604 // thread over single-threaded ghashing.
605 void TpiSource::fillIsItemIndexFromDebugT() {
606   uint32_t index = 0;
607   isItemIndex.resize(ghashes.size());
608   forEachTypeChecked(file->debugTypes, [&](const CVType &ty) {
609     if (isIdRecord(ty.kind()))
610       isItemIndex.set(index);
611     ++index;
612   });
613 }
614 
615 void TpiSource::mergeTypeRecord(TypeIndex curIndex, CVType ty) {
616   // Decide if the merged type goes into TPI or IPI.
617   bool isItem = isIdRecord(ty.kind());
618   MergedInfo &merged = isItem ? mergedIpi : mergedTpi;
619 
620   // Copy the type into our mutable buffer.
621   assert(ty.length() <= codeview::MaxRecordLength);
622   size_t offset = merged.recs.size();
623   size_t newSize = alignTo(ty.length(), 4);
624   merged.recs.resize(offset + newSize);
625   auto newRec = makeMutableArrayRef(&merged.recs[offset], newSize);
626   memcpy(newRec.data(), ty.data().data(), newSize);
627 
628   // Fix up the record prefix and padding bytes if it required resizing.
629   if (newSize != ty.length()) {
630     reinterpret_cast<RecordPrefix *>(newRec.data())->RecordLen = newSize - 2;
631     for (size_t i = ty.length(); i < newSize; ++i)
632       newRec[i] = LF_PAD0 + (newSize - i);
633   }
634 
635   // Remap the type indices in the new record.
636   remapTypesInTypeRecord(newRec);
637   uint32_t pdbHash = check(pdb::hashTypeRecord(CVType(newRec)));
638   merged.recSizes.push_back(static_cast<uint16_t>(newSize));
639   merged.recHashes.push_back(pdbHash);
640 
641   // Retain a mapping from PDB function id to PDB function type. This mapping is
642   // used during symbol procesing to rewrite S_GPROC32_ID symbols to S_GPROC32
643   // symbols.
644   if (ty.kind() == LF_FUNC_ID || ty.kind() == LF_MFUNC_ID) {
645     bool success = ty.length() >= 12;
646     TypeIndex funcId = curIndex;
647     if (success)
648       success &= remapTypeIndex(funcId, TiRefKind::IndexRef);
649     TypeIndex funcType =
650         *reinterpret_cast<const TypeIndex *>(&newRec.data()[8]);
651     if (success) {
652       funcIdToType.push_back({funcId, funcType});
653     } else {
654       StringRef fname = file ? file->getName() : "<unknown PDB>";
655       warn("corrupt LF_[M]FUNC_ID record 0x" + utohexstr(curIndex.getIndex()) +
656            " in " + fname);
657     }
658   }
659 }
660 
661 void TpiSource::mergeUniqueTypeRecords(ArrayRef<uint8_t> typeRecords,
662                                        TypeIndex beginIndex) {
663   // Re-sort the list of unique types by index.
664   if (kind == PDB)
665     assert(std::is_sorted(uniqueTypes.begin(), uniqueTypes.end()));
666   else
667     llvm::sort(uniqueTypes);
668 
669   // Accumulate all the unique types into one buffer in mergedTypes.
670   uint32_t ghashIndex = 0;
671   auto nextUniqueIndex = uniqueTypes.begin();
672   assert(mergedTpi.recs.empty());
673   assert(mergedIpi.recs.empty());
674   forEachTypeChecked(typeRecords, [&](const CVType &ty) {
675     if (nextUniqueIndex != uniqueTypes.end() &&
676         *nextUniqueIndex == ghashIndex) {
677       mergeTypeRecord(beginIndex + ghashIndex, ty);
678       ++nextUniqueIndex;
679     }
680     ++ghashIndex;
681   });
682   assert(nextUniqueIndex == uniqueTypes.end() &&
683          "failed to merge all desired records");
684   assert(uniqueTypes.size() ==
685              mergedTpi.recSizes.size() + mergedIpi.recSizes.size() &&
686          "missing desired record");
687 }
688 
689 void TpiSource::remapTpiWithGHashes(GHashState *g) {
690   assert(config->debugGHashes && "ghashes must be enabled");
691   fillMapFromGHashes(g, indexMapStorage);
692   tpiMap = indexMapStorage;
693   ipiMap = indexMapStorage;
694   mergeUniqueTypeRecords(file->debugTypes);
695   // TODO: Free all unneeded ghash resources now that we have a full index map.
696 }
697 
698 // PDBs do not actually store global hashes, so when merging a type server
699 // PDB we have to synthesize global hashes.  To do this, we first synthesize
700 // global hashes for the TPI stream, since it is independent, then we
701 // synthesize hashes for the IPI stream, using the hashes for the TPI stream
702 // as inputs.
703 void TypeServerSource::loadGHashes() {
704   // Don't hash twice.
705   if (!ghashes.empty())
706     return;
707   pdb::PDBFile &pdbFile = pdbInputFile->session->getPDBFile();
708 
709   // Hash TPI stream.
710   Expected<pdb::TpiStream &> expectedTpi = pdbFile.getPDBTpiStream();
711   if (auto e = expectedTpi.takeError())
712     fatal("Type server does not have TPI stream: " + toString(std::move(e)));
713   assignGHashesFromVector(
714       GloballyHashedType::hashTypes(expectedTpi->typeArray()));
715   isItemIndex.resize(ghashes.size());
716 
717   // Hash IPI stream, which depends on TPI ghashes.
718   if (!pdbFile.hasPDBIpiStream())
719     return;
720   Expected<pdb::TpiStream &> expectedIpi = pdbFile.getPDBIpiStream();
721   if (auto e = expectedIpi.takeError())
722     fatal("error retreiving IPI stream: " + toString(std::move(e)));
723   ipiSrc->assignGHashesFromVector(
724       GloballyHashedType::hashIds(expectedIpi->typeArray(), ghashes));
725 
726   // The IPI stream isItemIndex bitvector should be all ones.
727   ipiSrc->isItemIndex.resize(ipiSrc->ghashes.size());
728   ipiSrc->isItemIndex.set(0, ipiSrc->ghashes.size());
729 }
730 
731 // Flatten discontiguous PDB type arrays to bytes so that we can use
732 // forEachTypeChecked instead of CVTypeArray iteration. Copying all types from
733 // type servers is faster than iterating all object files compiled with /Z7 with
734 // CVTypeArray, which has high overheads due to the virtual interface of
735 // BinaryStream::readBytes.
736 static ArrayRef<uint8_t> typeArrayToBytes(const CVTypeArray &types) {
737   BinaryStreamRef stream = types.getUnderlyingStream();
738   ArrayRef<uint8_t> debugTypes;
739   checkError(stream.readBytes(0, stream.getLength(), debugTypes));
740   return debugTypes;
741 }
742 
743 // Merge types from a type server PDB.
744 void TypeServerSource::remapTpiWithGHashes(GHashState *g) {
745   assert(config->debugGHashes && "ghashes must be enabled");
746 
747   // IPI merging depends on TPI, so do TPI first, then do IPI.  No need to
748   // propagate errors, those should've been handled during ghash loading.
749   pdb::PDBFile &pdbFile = pdbInputFile->session->getPDBFile();
750   pdb::TpiStream &tpi = check(pdbFile.getPDBTpiStream());
751   fillMapFromGHashes(g, indexMapStorage);
752   tpiMap = indexMapStorage;
753   mergeUniqueTypeRecords(typeArrayToBytes(tpi.typeArray()));
754   if (pdbFile.hasPDBIpiStream()) {
755     pdb::TpiStream &ipi = check(pdbFile.getPDBIpiStream());
756     ipiSrc->indexMapStorage.resize(ipiSrc->ghashes.size());
757     ipiSrc->fillMapFromGHashes(g, ipiSrc->indexMapStorage);
758     ipiMap = ipiSrc->indexMapStorage;
759     ipiSrc->tpiMap = tpiMap;
760     ipiSrc->ipiMap = ipiMap;
761     ipiSrc->mergeUniqueTypeRecords(typeArrayToBytes(ipi.typeArray()));
762   }
763 }
764 
765 void UseTypeServerSource::remapTpiWithGHashes(GHashState *g) {
766   // No remapping to do with /Zi objects. Simply use the index map from the type
767   // server. Errors should have been reported earlier. Symbols from this object
768   // will be ignored.
769   Expected<TypeServerSource *> maybeTsSrc = getTypeServerSource();
770   if (!maybeTsSrc) {
771     typeMergingError =
772         joinErrors(std::move(typeMergingError), maybeTsSrc.takeError());
773     return;
774   }
775   TypeServerSource *tsSrc = *maybeTsSrc;
776   tpiMap = tsSrc->tpiMap;
777   ipiMap = tsSrc->ipiMap;
778 }
779 
780 void PrecompSource::loadGHashes() {
781   if (getDebugH(file)) {
782     warn("ignoring .debug$H section; pch with ghash is not implemented");
783   }
784 
785   uint32_t ghashIdx = 0;
786   std::vector<GloballyHashedType> hashVec;
787   forEachTypeChecked(file->debugTypes, [&](const CVType &ty) {
788     // Remember the index of the LF_ENDPRECOMP record so it can be excluded from
789     // the PDB. There must be an entry in the list of ghashes so that the type
790     // indexes of the following records in the /Yc PCH object line up.
791     if (ty.kind() == LF_ENDPRECOMP)
792       endPrecompGHashIdx = ghashIdx;
793 
794     hashVec.push_back(GloballyHashedType::hashType(ty, hashVec, hashVec));
795     isItemIndex.push_back(isIdRecord(ty.kind()));
796     ++ghashIdx;
797   });
798   assignGHashesFromVector(std::move(hashVec));
799 }
800 
801 void UsePrecompSource::loadGHashes() {
802   PrecompSource *pchSrc = findPrecompSource(file, precompDependency);
803   if (!pchSrc)
804     return;
805 
806   // To compute ghashes of a /Yu object file, we need to build on the the
807   // ghashes of the /Yc PCH object. After we are done hashing, discard the
808   // ghashes from the PCH source so we don't unnecessarily try to deduplicate
809   // them.
810   std::vector<GloballyHashedType> hashVec =
811       pchSrc->ghashes.take_front(precompDependency.getTypesCount());
812   forEachTypeChecked(file->debugTypes, [&](const CVType &ty) {
813     hashVec.push_back(GloballyHashedType::hashType(ty, hashVec, hashVec));
814     isItemIndex.push_back(isIdRecord(ty.kind()));
815   });
816   hashVec.erase(hashVec.begin(),
817                 hashVec.begin() + precompDependency.getTypesCount());
818   assignGHashesFromVector(std::move(hashVec));
819 }
820 
821 void UsePrecompSource::remapTpiWithGHashes(GHashState *g) {
822   // This object was compiled with /Yu, so process the corresponding
823   // precompiled headers object (/Yc) first. Some type indices in the current
824   // object are referencing data in the precompiled headers object, so we need
825   // both to be loaded.
826   if (Error e = mergeInPrecompHeaderObj()) {
827     typeMergingError = joinErrors(std::move(typeMergingError), std::move(e));
828     return;
829   }
830 
831   fillMapFromGHashes(g, indexMapStorage);
832   tpiMap = indexMapStorage;
833   ipiMap = indexMapStorage;
834   mergeUniqueTypeRecords(file->debugTypes,
835                          TypeIndex(precompDependency.getStartTypeIndex() +
836                                    precompDependency.getTypesCount()));
837 }
838 
839 namespace {
840 /// A concurrent hash table for global type hashing. It is based on this paper:
841 /// Concurrent Hash Tables: Fast and General(?)!
842 /// https://dl.acm.org/doi/10.1145/3309206
843 ///
844 /// This hash table is meant to be used in two phases:
845 /// 1. concurrent insertions
846 /// 2. concurrent reads
847 /// It does not support lookup, deletion, or rehashing. It uses linear probing.
848 ///
849 /// The paper describes storing a key-value pair in two machine words.
850 /// Generally, the values stored in this map are type indices, and we can use
851 /// those values to recover the ghash key from a side table. This allows us to
852 /// shrink the table entries further at the cost of some loads, and sidesteps
853 /// the need for a 128 bit atomic compare-and-swap operation.
854 ///
855 /// During insertion, a priority function is used to decide which insertion
856 /// should be preferred. This ensures that the output is deterministic. For
857 /// ghashing, lower tpiSrcIdx values (earlier inputs) are preferred.
858 ///
859 class GHashCell;
860 struct GHashTable {
861   GHashCell *table = nullptr;
862   uint32_t tableSize = 0;
863 
864   GHashTable() = default;
865   ~GHashTable();
866 
867   /// Initialize the table with the given size. Because the table cannot be
868   /// resized, the initial size of the table must be large enough to contain all
869   /// inputs, or insertion may not be able to find an empty cell.
870   void init(uint32_t newTableSize);
871 
872   /// Insert the cell with the given ghash into the table. Return the insertion
873   /// position in the table. It is safe for the caller to store the insertion
874   /// position because the table cannot be resized.
875   uint32_t insert(GloballyHashedType ghash, GHashCell newCell);
876 };
877 
878 /// A ghash table cell for deduplicating types from TpiSources.
879 class GHashCell {
880   uint64_t data = 0;
881 
882 public:
883   GHashCell() = default;
884 
885   // Construct data most to least significant so that sorting works well:
886   // - isItem
887   // - tpiSrcIdx
888   // - ghashIdx
889   // Add one to the tpiSrcIdx so that the 0th record from the 0th source has a
890   // non-zero representation.
891   GHashCell(bool isItem, uint32_t tpiSrcIdx, uint32_t ghashIdx)
892       : data((uint64_t(isItem) << 63U) | (uint64_t(tpiSrcIdx + 1) << 32ULL) |
893              ghashIdx) {
894     assert(tpiSrcIdx == getTpiSrcIdx() && "round trip failure");
895     assert(ghashIdx == getGHashIdx() && "round trip failure");
896   }
897 
898   explicit GHashCell(uint64_t data) : data(data) {}
899 
900   // The empty cell is all zeros.
901   bool isEmpty() const { return data == 0ULL; }
902 
903   /// Extract the tpiSrcIdx.
904   uint32_t getTpiSrcIdx() const {
905     return ((uint32_t)(data >> 32U) & 0x7FFFFFFF) - 1;
906   }
907 
908   /// Extract the index into the ghash array of the TpiSource.
909   uint32_t getGHashIdx() const { return (uint32_t)data; }
910 
911   bool isItem() const { return data & (1ULL << 63U); }
912 
913   /// Get the ghash key for this cell.
914   GloballyHashedType getGHash() const {
915     return TpiSource::instances[getTpiSrcIdx()]->ghashes[getGHashIdx()];
916   }
917 
918   /// The priority function for the cell. The data is stored such that lower
919   /// tpiSrcIdx and ghashIdx values are preferred, which means that type record
920   /// from earlier sources are more likely to prevail.
921   friend inline bool operator<(const GHashCell &l, const GHashCell &r) {
922     return l.data < r.data;
923   }
924 };
925 } // namespace
926 
927 namespace lld {
928 namespace coff {
929 /// This type is just a wrapper around GHashTable with external linkage so it
930 /// can be used from a header.
931 struct GHashState {
932   GHashTable table;
933 };
934 } // namespace coff
935 } // namespace lld
936 
937 GHashTable::~GHashTable() { delete[] table; }
938 
939 void GHashTable::init(uint32_t newTableSize) {
940   table = new GHashCell[newTableSize];
941   memset(table, 0, newTableSize * sizeof(GHashCell));
942   tableSize = newTableSize;
943 }
944 
945 uint32_t GHashTable::insert(GloballyHashedType ghash, GHashCell newCell) {
946   assert(!newCell.isEmpty() && "cannot insert empty cell value");
947 
948   // FIXME: The low bytes of SHA1 have low entropy for short records, which
949   // type records are. Swap the byte order for better entropy. A better ghash
950   // won't need this.
951   uint32_t startIdx =
952       ByteSwap_64(*reinterpret_cast<uint64_t *>(&ghash)) % tableSize;
953 
954   // Do a linear probe starting at startIdx.
955   uint32_t idx = startIdx;
956   while (true) {
957     // Run a compare and swap loop. There are four cases:
958     // - cell is empty: CAS into place and return
959     // - cell has matching key, earlier priority: do nothing, return
960     // - cell has matching key, later priority: CAS into place and return
961     // - cell has non-matching key: hash collision, probe next cell
962     auto *cellPtr = reinterpret_cast<std::atomic<GHashCell> *>(&table[idx]);
963     GHashCell oldCell(cellPtr->load());
964     while (oldCell.isEmpty() || oldCell.getGHash() == ghash) {
965       // Check if there is an existing ghash entry with a higher priority
966       // (earlier ordering). If so, this is a duplicate, we are done.
967       if (!oldCell.isEmpty() && oldCell < newCell)
968         return idx;
969       // Either the cell is empty, or our value is higher priority. Try to
970       // compare and swap. If it succeeds, we are done.
971       if (cellPtr->compare_exchange_weak(oldCell, newCell))
972         return idx;
973       // If the CAS failed, check this cell again.
974     }
975 
976     // Advance the probe. Wrap around to the beginning if we run off the end.
977     ++idx;
978     idx = idx == tableSize ? 0 : idx;
979     if (idx == startIdx) {
980       // If this becomes an issue, we could mark failure and rehash from the
981       // beginning with a bigger table. There is no difference between rehashing
982       // internally and starting over.
983       report_fatal_error("ghash table is full");
984     }
985   }
986   llvm_unreachable("left infloop");
987 }
988 
989 TypeMerger::TypeMerger(llvm::BumpPtrAllocator &alloc)
990     : typeTable(alloc), idTable(alloc) {}
991 
992 TypeMerger::~TypeMerger() = default;
993 
994 void TypeMerger::mergeTypesWithGHash() {
995   // Load ghashes. Do type servers and PCH objects first.
996   {
997     ScopedTimer t1(loadGHashTimer);
998     parallelForEach(TpiSource::dependencySources,
999                     [&](TpiSource *source) { source->loadGHashes(); });
1000     parallelForEach(TpiSource::objectSources,
1001                     [&](TpiSource *source) { source->loadGHashes(); });
1002   }
1003 
1004   ScopedTimer t2(mergeGHashTimer);
1005   GHashState ghashState;
1006 
1007   // Estimate the size of hash table needed to deduplicate ghashes. This *must*
1008   // be larger than the number of unique types, or hash table insertion may not
1009   // be able to find a vacant slot. Summing the input types guarantees this, but
1010   // it is a gross overestimate. The table size could be reduced to save memory,
1011   // but it would require implementing rehashing, and this table is generally
1012   // small compared to total memory usage, at eight bytes per input type record,
1013   // and most input type records are larger than eight bytes.
1014   size_t tableSize = 0;
1015   for (TpiSource *source : TpiSource::instances)
1016     tableSize += source->ghashes.size();
1017 
1018   // Cap the table size so that we can use 32-bit cell indices. Type indices are
1019   // also 32-bit, so this is an inherent PDB file format limit anyway.
1020   tableSize = std::min(size_t(INT32_MAX), tableSize);
1021   ghashState.table.init(static_cast<uint32_t>(tableSize));
1022 
1023   // Insert ghashes in parallel. During concurrent insertion, we cannot observe
1024   // the contents of the hash table cell, but we can remember the insertion
1025   // position. Because the table does not rehash, the position will not change
1026   // under insertion. After insertion is done, the value of the cell can be read
1027   // to retreive the final PDB type index.
1028   parallelForEachN(0, TpiSource::instances.size(), [&](size_t tpiSrcIdx) {
1029     TpiSource *source = TpiSource::instances[tpiSrcIdx];
1030     source->indexMapStorage.resize(source->ghashes.size());
1031     for (uint32_t i = 0, e = source->ghashes.size(); i < e; i++) {
1032       if (source->shouldOmitFromPdb(i)) {
1033         source->indexMapStorage[i] = TypeIndex(SimpleTypeKind::NotTranslated);
1034         continue;
1035       }
1036       GloballyHashedType ghash = source->ghashes[i];
1037       bool isItem = source->isItemIndex.test(i);
1038       uint32_t cellIdx =
1039           ghashState.table.insert(ghash, GHashCell(isItem, tpiSrcIdx, i));
1040 
1041       // Store the ghash cell index as a type index in indexMapStorage. Later
1042       // we will replace it with the PDB type index.
1043       source->indexMapStorage[i] = TypeIndex::fromArrayIndex(cellIdx);
1044     }
1045   });
1046 
1047   // Collect all non-empty cells and sort them. This will implicitly assign
1048   // destination type indices, and partition the entries into type records and
1049   // item records. It arranges types in this order:
1050   // - type records
1051   //   - source 0, type 0...
1052   //   - source 1, type 1...
1053   // - item records
1054   //   - source 0, type 1...
1055   //   - source 1, type 0...
1056   std::vector<GHashCell> entries;
1057   for (const GHashCell &cell :
1058        makeArrayRef(ghashState.table.table, tableSize)) {
1059     if (!cell.isEmpty())
1060       entries.push_back(cell);
1061   }
1062   parallelSort(entries, std::less<GHashCell>());
1063   log(formatv("ghash table load factor: {0:p} (size {1} / capacity {2})\n",
1064               double(entries.size()) / tableSize, entries.size(), tableSize));
1065 
1066   // Find out how many type and item indices there are.
1067   auto mid =
1068       std::lower_bound(entries.begin(), entries.end(), GHashCell(true, 0, 0));
1069   assert((mid == entries.end() || mid->isItem()) &&
1070          (mid == entries.begin() || !std::prev(mid)->isItem()) &&
1071          "midpoint is not midpoint");
1072   uint32_t numTypes = std::distance(entries.begin(), mid);
1073   uint32_t numItems = std::distance(mid, entries.end());
1074   log("Tpi record count: " + Twine(numTypes));
1075   log("Ipi record count: " + Twine(numItems));
1076 
1077   // Make a list of the "unique" type records to merge for each tpi source. Type
1078   // merging will skip indices not on this list. Store the destination PDB type
1079   // index for these unique types in the tpiMap for each source. The entries for
1080   // non-unique types will be filled in prior to type merging.
1081   for (uint32_t i = 0, e = entries.size(); i < e; ++i) {
1082     auto &cell = entries[i];
1083     uint32_t tpiSrcIdx = cell.getTpiSrcIdx();
1084     TpiSource *source = TpiSource::instances[tpiSrcIdx];
1085     source->uniqueTypes.push_back(cell.getGHashIdx());
1086 
1087     // Update the ghash table to store the destination PDB type index in the
1088     // table.
1089     uint32_t pdbTypeIndex = i < numTypes ? i : i - numTypes;
1090     uint32_t ghashCellIndex =
1091         source->indexMapStorage[cell.getGHashIdx()].toArrayIndex();
1092     ghashState.table.table[ghashCellIndex] =
1093         GHashCell(cell.isItem(), cell.getTpiSrcIdx(), pdbTypeIndex);
1094   }
1095 
1096   // In parallel, remap all types.
1097   for_each(TpiSource::dependencySources, [&](TpiSource *source) {
1098     source->remapTpiWithGHashes(&ghashState);
1099   });
1100   parallelForEach(TpiSource::objectSources, [&](TpiSource *source) {
1101     source->remapTpiWithGHashes(&ghashState);
1102   });
1103 
1104   // Build a global map of from function ID to function type.
1105   for (TpiSource *source : TpiSource::instances) {
1106     for (auto idToType : source->funcIdToType)
1107       funcIdToType.insert(idToType);
1108     source->funcIdToType.clear();
1109   }
1110 
1111   TpiSource::clearGHashes();
1112 }
1113 
1114 /// Given the index into the ghash table for a particular type, return the type
1115 /// index for that type in the output PDB.
1116 static TypeIndex loadPdbTypeIndexFromCell(GHashState *g,
1117                                           uint32_t ghashCellIdx) {
1118   GHashCell cell = g->table.table[ghashCellIdx];
1119   return TypeIndex::fromArrayIndex(cell.getGHashIdx());
1120 }
1121 
1122 // Fill in a TPI or IPI index map using ghashes. For each source type, use its
1123 // ghash to lookup its final type index in the PDB, and store that in the map.
1124 void TpiSource::fillMapFromGHashes(GHashState *g,
1125                                    SmallVectorImpl<TypeIndex> &mapToFill) {
1126   for (size_t i = 0, e = ghashes.size(); i < e; ++i) {
1127     TypeIndex fakeCellIndex = indexMapStorage[i];
1128     if (fakeCellIndex.isSimple())
1129       mapToFill[i] = fakeCellIndex;
1130     else
1131       mapToFill[i] = loadPdbTypeIndexFromCell(g, fakeCellIndex.toArrayIndex());
1132   }
1133 }
1134 
1135 void TpiSource::clearGHashes() {
1136   for (TpiSource *src : TpiSource::instances) {
1137     if (src->ownedGHashes)
1138       delete[] src->ghashes.data();
1139     src->ghashes = {};
1140     src->isItemIndex.clear();
1141     src->uniqueTypes.clear();
1142   }
1143 }
1144