1e204a6c9SZachary Turner //===- PDBStringTableBuilder.cpp - PDB String Table -------------*- C++ -*-===//
2e204a6c9SZachary Turner //
32946cd70SChandler Carruth // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
42946cd70SChandler Carruth // See https://llvm.org/LICENSE.txt for license information.
52946cd70SChandler Carruth // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6e204a6c9SZachary Turner //
7e204a6c9SZachary Turner //===----------------------------------------------------------------------===//
8e204a6c9SZachary Turner 
#include "llvm/DebugInfo/PDB/Native/PDBStringTableBuilder.h"

#include "llvm/ADT/ArrayRef.h"
#include "llvm/DebugInfo/PDB/Native/Hash.h"
#include "llvm/DebugInfo/PDB/Native/RawTypes.h"
#include "llvm/Support/BinaryStreamWriter.h"
#include "llvm/Support/Endian.h"

#include <algorithm>
#include <iterator>
#include <map>
#include <utility>
18a6fb536eSZachary Turner 
19e204a6c9SZachary Turner using namespace llvm;
20c504ae3cSZachary Turner using namespace llvm::msf;
21e204a6c9SZachary Turner using namespace llvm::support;
22e204a6c9SZachary Turner using namespace llvm::support::endian;
23e204a6c9SZachary Turner using namespace llvm::pdb;
24e204a6c9SZachary Turner 
25f2282762SZachary Turner StringTableHashTraits::StringTableHashTraits(PDBStringTableBuilder &Table)
26f2282762SZachary Turner     : Table(&Table) {}
27f2282762SZachary Turner 
28f2282762SZachary Turner uint32_t StringTableHashTraits::hashLookupKey(StringRef S) const {
29f2282762SZachary Turner   return Table->getIdForString(S);
30f2282762SZachary Turner }
31f2282762SZachary Turner 
32f2282762SZachary Turner StringRef StringTableHashTraits::storageKeyToLookupKey(uint32_t Offset) const {
33f2282762SZachary Turner   return Table->getStringForId(Offset);
34f2282762SZachary Turner }
35f2282762SZachary Turner 
36f2282762SZachary Turner uint32_t StringTableHashTraits::lookupKeyToStorageKey(StringRef S) {
37f2282762SZachary Turner   return Table->insert(S);
38f2282762SZachary Turner }
39f2282762SZachary Turner 
40e204a6c9SZachary Turner uint32_t PDBStringTableBuilder::insert(StringRef S) {
41c504ae3cSZachary Turner   return Strings.insert(S);
42e204a6c9SZachary Turner }
43e204a6c9SZachary Turner 
4471d36ad9SZachary Turner uint32_t PDBStringTableBuilder::getIdForString(StringRef S) const {
4571d36ad9SZachary Turner   return Strings.getIdForString(S);
4671d36ad9SZachary Turner }
4771d36ad9SZachary Turner 
4871d36ad9SZachary Turner StringRef PDBStringTableBuilder::getStringForId(uint32_t Id) const {
4971d36ad9SZachary Turner   return Strings.getStringForId(Id);
5071d36ad9SZachary Turner }
5171d36ad9SZachary Turner 
// Returns the number of hash buckets to emit for a table holding NumStrings
// strings.
//
// The answer comes from a precomputed list of (string count, bucket count)
// rows: the result is the bucket count of the first row whose string count is
// greater than or equal to NumStrings.  Matching the reference algorithm
// exactly is not strictly necessary for correctness, but it helps when
// comparing LLD's PDBs with Microsoft's PDBs so as to eliminate superfluous
// differences.
//
// NumStrings must not exceed the string count of the last row; this is
// asserted.  In builds without assertions the last row's bucket count is
// returned instead of reading past the end of the table.
static uint32_t computeBucketCount(uint32_t NumStrings) {
  // Sorted by string count so that a binary search can be used.  A plain
  // array keeps the table contiguous and avoids building a node-based map at
  // first use.
  static const std::pair<uint32_t, uint32_t> StringsToBuckets[] = {
      {1, 2},
      {2, 4},
      {4, 7},
      {6, 11},
      {9, 17},
      {13, 26},
      {20, 40},
      {31, 61},
      {46, 92},
      {70, 139},
      {105, 209},
      {157, 314},
      {236, 472},
      {355, 709},
      {532, 1064},
      {799, 1597},
      {1198, 2396},
      {1798, 3595},
      {2697, 5393},
      {4045, 8090},
      {6068, 12136},
      {9103, 18205},
      {13654, 27308},
      {20482, 40963},
      {30723, 61445},
      {46084, 92168},
      {69127, 138253},
      {103690, 207380},
      {155536, 311071},
      {233304, 466607},
      {349956, 699911},
      {524934, 1049867},
      {787401, 1574801},
      {1181101, 2362202},
      {1771652, 3543304},
      {2657479, 5314957},
      {3986218, 7972436},
      {5979328, 11958655},
      {8968992, 17937983},
      {13453488, 26906975},
      {20180232, 40360463},
      {30270348, 60540695},
      {45405522, 90811043},
      {68108283, 136216565},
      {102162424, 204324848},
      {153243637, 306487273},
      {229865455, 459730910},
      {344798183, 689596366},
      {517197275, 1034394550},
      {775795913, 1551591826}};

  const auto *TableEnd = std::end(StringsToBuckets);
  const auto *Entry = std::lower_bound(
      std::begin(StringsToBuckets), TableEnd, NumStrings,
      [](const std::pair<uint32_t, uint32_t> &Row, uint32_t Count) {
        return Row.first < Count;
      });

  assert(Entry != TableEnd && "string count exceeds the bucket table");
  // Never dereference the end of the table when assertions are compiled out.
  if (Entry == TableEnd)
    return std::prev(TableEnd)->second;
  return Entry->second;
}
112e204a6c9SZachary Turner 
113c504ae3cSZachary Turner uint32_t PDBStringTableBuilder::calculateHashTableSize() const {
114c504ae3cSZachary Turner   uint32_t Size = sizeof(uint32_t); // Hash table begins with 4-byte size field.
115c504ae3cSZachary Turner   Size += sizeof(uint32_t) * computeBucketCount(Strings.size());
116dff096f2SDaniel Jasper 
1177dba20bdSZachary Turner   return Size;
1187dba20bdSZachary Turner }
1197dba20bdSZachary Turner 
120c504ae3cSZachary Turner uint32_t PDBStringTableBuilder::calculateSerializedSize() const {
121c504ae3cSZachary Turner   uint32_t Size = 0;
122c504ae3cSZachary Turner   Size += sizeof(PDBStringTableHeader);
123c504ae3cSZachary Turner   Size += Strings.calculateSerializedSize();
124c504ae3cSZachary Turner   Size += calculateHashTableSize();
125c504ae3cSZachary Turner   Size += sizeof(uint32_t); // The /names stream ends with the string count.
126c504ae3cSZachary Turner   return Size;
127c504ae3cSZachary Turner }
128c504ae3cSZachary Turner 
129a8cfc29cSZachary Turner void PDBStringTableBuilder::setStrings(
130a8cfc29cSZachary Turner     const codeview::DebugStringTableSubsection &Strings) {
131a8cfc29cSZachary Turner   this->Strings = Strings;
132a8cfc29cSZachary Turner }
133a8cfc29cSZachary Turner 
134c504ae3cSZachary Turner Error PDBStringTableBuilder::writeHeader(BinaryStreamWriter &Writer) const {
135e204a6c9SZachary Turner   // Write a header
136e204a6c9SZachary Turner   PDBStringTableHeader H;
137e204a6c9SZachary Turner   H.Signature = PDBStringTableSignature;
138e204a6c9SZachary Turner   H.HashVersion = 1;
139c504ae3cSZachary Turner   H.ByteSize = Strings.calculateSerializedSize();
140e204a6c9SZachary Turner   if (auto EC = Writer.writeObject(H))
141e204a6c9SZachary Turner     return EC;
142c504ae3cSZachary Turner   assert(Writer.bytesRemaining() == 0);
143c504ae3cSZachary Turner   return Error::success();
1447dba20bdSZachary Turner }
1457dba20bdSZachary Turner 
146c504ae3cSZachary Turner Error PDBStringTableBuilder::writeStrings(BinaryStreamWriter &Writer) const {
147c504ae3cSZachary Turner   if (auto EC = Strings.commit(Writer))
148c504ae3cSZachary Turner     return EC;
149c504ae3cSZachary Turner 
150c504ae3cSZachary Turner   assert(Writer.bytesRemaining() == 0);
151c504ae3cSZachary Turner   return Error::success();
152c504ae3cSZachary Turner }
153c504ae3cSZachary Turner 
154c504ae3cSZachary Turner Error PDBStringTableBuilder::writeHashTable(BinaryStreamWriter &Writer) const {
155e204a6c9SZachary Turner   // Write a hash table.
156e204a6c9SZachary Turner   uint32_t BucketCount = computeBucketCount(Strings.size());
157e204a6c9SZachary Turner   if (auto EC = Writer.writeInteger(BucketCount))
158e204a6c9SZachary Turner     return EC;
159e204a6c9SZachary Turner   std::vector<ulittle32_t> Buckets(BucketCount);
160e204a6c9SZachary Turner 
161c504ae3cSZachary Turner   for (auto &Pair : Strings) {
162c504ae3cSZachary Turner     StringRef S = Pair.getKey();
163c504ae3cSZachary Turner     uint32_t Offset = Pair.getValue();
164e204a6c9SZachary Turner     uint32_t Hash = hashStringV1(S);
165e204a6c9SZachary Turner 
166e204a6c9SZachary Turner     for (uint32_t I = 0; I != BucketCount; ++I) {
167e204a6c9SZachary Turner       uint32_t Slot = (Hash + I) % BucketCount;
168e204a6c9SZachary Turner       if (Buckets[Slot] != 0)
169e204a6c9SZachary Turner         continue;
170e204a6c9SZachary Turner       Buckets[Slot] = Offset;
171e204a6c9SZachary Turner       break;
172e204a6c9SZachary Turner     }
173e204a6c9SZachary Turner   }
174e204a6c9SZachary Turner 
175e204a6c9SZachary Turner   if (auto EC = Writer.writeArray(ArrayRef<ulittle32_t>(Buckets)))
176e204a6c9SZachary Turner     return EC;
177c504ae3cSZachary Turner 
178c504ae3cSZachary Turner   assert(Writer.bytesRemaining() == 0);
179c504ae3cSZachary Turner   return Error::success();
180c504ae3cSZachary Turner }
181c504ae3cSZachary Turner 
182c504ae3cSZachary Turner Error PDBStringTableBuilder::writeEpilogue(BinaryStreamWriter &Writer) const {
183c504ae3cSZachary Turner   if (auto EC = Writer.writeInteger<uint32_t>(Strings.size()))
184e204a6c9SZachary Turner     return EC;
185c504ae3cSZachary Turner   assert(Writer.bytesRemaining() == 0);
186c504ae3cSZachary Turner   return Error::success();
187c504ae3cSZachary Turner }
188c504ae3cSZachary Turner 
189c504ae3cSZachary Turner Error PDBStringTableBuilder::commit(BinaryStreamWriter &Writer) const {
190c504ae3cSZachary Turner   BinaryStreamWriter SectionWriter;
191c504ae3cSZachary Turner 
192c504ae3cSZachary Turner   std::tie(SectionWriter, Writer) = Writer.split(sizeof(PDBStringTableHeader));
193c504ae3cSZachary Turner   if (auto EC = writeHeader(SectionWriter))
194c504ae3cSZachary Turner     return EC;
195c504ae3cSZachary Turner 
196c504ae3cSZachary Turner   std::tie(SectionWriter, Writer) =
197c504ae3cSZachary Turner       Writer.split(Strings.calculateSerializedSize());
198c504ae3cSZachary Turner   if (auto EC = writeStrings(SectionWriter))
199c504ae3cSZachary Turner     return EC;
200c504ae3cSZachary Turner 
201c504ae3cSZachary Turner   std::tie(SectionWriter, Writer) = Writer.split(calculateHashTableSize());
202c504ae3cSZachary Turner   if (auto EC = writeHashTable(SectionWriter))
203c504ae3cSZachary Turner     return EC;
204c504ae3cSZachary Turner 
205c504ae3cSZachary Turner   std::tie(SectionWriter, Writer) = Writer.split(sizeof(uint32_t));
206c504ae3cSZachary Turner   if (auto EC = writeEpilogue(SectionWriter))
207c504ae3cSZachary Turner     return EC;
208c504ae3cSZachary Turner 
209e204a6c9SZachary Turner   return Error::success();
210e204a6c9SZachary Turner }
211