1c504ae3cSZachary Turner //===- PDBStringTable.cpp - PDB String Table ---------------------*- C++-*-===//
2e204a6c9SZachary Turner //
3e204a6c9SZachary Turner //                     The LLVM Compiler Infrastructure
4e204a6c9SZachary Turner //
5e204a6c9SZachary Turner // This file is distributed under the University of Illinois Open Source
6e204a6c9SZachary Turner // License. See LICENSE.TXT for details.
7e204a6c9SZachary Turner //
8e204a6c9SZachary Turner //===----------------------------------------------------------------------===//
9e204a6c9SZachary Turner 
10e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/PDBStringTable.h"
11e204a6c9SZachary Turner 
12e204a6c9SZachary Turner #include "llvm/ADT/ArrayRef.h"
13e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/Hash.h"
14e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawError.h"
15e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawTypes.h"
16e204a6c9SZachary Turner #include "llvm/Support/BinaryStreamReader.h"
17e204a6c9SZachary Turner #include "llvm/Support/Endian.h"
18e204a6c9SZachary Turner 
19e204a6c9SZachary Turner using namespace llvm;
20e204a6c9SZachary Turner using namespace llvm::support;
21e204a6c9SZachary Turner using namespace llvm::pdb;
22e204a6c9SZachary Turner 
23f3b4b2d8SZachary Turner uint32_t PDBStringTable::getByteSize() const { return Header->ByteSize; }
24c504ae3cSZachary Turner uint32_t PDBStringTable::getNameCount() const { return NameCount; }
25c504ae3cSZachary Turner uint32_t PDBStringTable::getHashVersion() const { return Header->HashVersion; }
26c504ae3cSZachary Turner uint32_t PDBStringTable::getSignature() const { return Header->Signature; }
27e204a6c9SZachary Turner 
28c504ae3cSZachary Turner Error PDBStringTable::readHeader(BinaryStreamReader &Reader) {
29c504ae3cSZachary Turner   if (auto EC = Reader.readObject(Header))
30e204a6c9SZachary Turner     return EC;
31e204a6c9SZachary Turner 
32c504ae3cSZachary Turner   if (Header->Signature != PDBStringTableSignature)
33e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
34e204a6c9SZachary Turner                                 "Invalid hash table signature");
35c504ae3cSZachary Turner   if (Header->HashVersion != 1 && Header->HashVersion != 2)
36e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
37e204a6c9SZachary Turner                                 "Unsupported hash version");
38e204a6c9SZachary Turner 
39c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
40c504ae3cSZachary Turner   return Error::success();
41c504ae3cSZachary Turner }
42c504ae3cSZachary Turner 
43c504ae3cSZachary Turner Error PDBStringTable::readStrings(BinaryStreamReader &Reader) {
442d5c2cd3SZachary Turner   BinaryStreamRef Stream;
452d5c2cd3SZachary Turner   if (auto EC = Reader.readStreamRef(Stream))
462d5c2cd3SZachary Turner     return EC;
472d5c2cd3SZachary Turner 
482d5c2cd3SZachary Turner   if (auto EC = Strings.initialize(Stream)) {
49e204a6c9SZachary Turner     return joinErrors(std::move(EC),
50e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
51e204a6c9SZachary Turner                                            "Invalid hash table byte length"));
52c504ae3cSZachary Turner   }
53e204a6c9SZachary Turner 
54c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
55c504ae3cSZachary Turner   return Error::success();
56c504ae3cSZachary Turner }
57c504ae3cSZachary Turner 
58a8cfc29cSZachary Turner const codeview::DebugStringTableSubsectionRef &
59a8cfc29cSZachary Turner PDBStringTable::getStringTable() const {
6092dcdda6SZachary Turner   return Strings;
6192dcdda6SZachary Turner }
6292dcdda6SZachary Turner 
63c504ae3cSZachary Turner Error PDBStringTable::readHashTable(BinaryStreamReader &Reader) {
64e204a6c9SZachary Turner   const support::ulittle32_t *HashCount;
65c504ae3cSZachary Turner   if (auto EC = Reader.readObject(HashCount))
66e204a6c9SZachary Turner     return EC;
67e204a6c9SZachary Turner 
68c504ae3cSZachary Turner   if (auto EC = Reader.readArray(IDs, *HashCount)) {
69e204a6c9SZachary Turner     return joinErrors(std::move(EC),
70e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
71e204a6c9SZachary Turner                                            "Could not read bucket array"));
72c504ae3cSZachary Turner   }
73e204a6c9SZachary Turner 
74e204a6c9SZachary Turner   return Error::success();
75e204a6c9SZachary Turner }
76e204a6c9SZachary Turner 
77c504ae3cSZachary Turner Error PDBStringTable::readEpilogue(BinaryStreamReader &Reader) {
78c504ae3cSZachary Turner   if (auto EC = Reader.readInteger(NameCount))
79c504ae3cSZachary Turner     return EC;
80c504ae3cSZachary Turner 
81c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
82c504ae3cSZachary Turner   return Error::success();
83c504ae3cSZachary Turner }
84c504ae3cSZachary Turner 
85c504ae3cSZachary Turner Error PDBStringTable::reload(BinaryStreamReader &Reader) {
86c504ae3cSZachary Turner 
87c504ae3cSZachary Turner   BinaryStreamReader SectionReader;
88c504ae3cSZachary Turner 
89c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(PDBStringTableHeader));
90c504ae3cSZachary Turner   if (auto EC = readHeader(SectionReader))
91c504ae3cSZachary Turner     return EC;
92c504ae3cSZachary Turner 
93c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(Header->ByteSize);
94c504ae3cSZachary Turner   if (auto EC = readStrings(SectionReader))
95c504ae3cSZachary Turner     return EC;
96c504ae3cSZachary Turner 
97c504ae3cSZachary Turner   // We don't know how long the hash table is until we parse it, so let the
98c504ae3cSZachary Turner   // function responsible for doing that figure it out.
99c504ae3cSZachary Turner   if (auto EC = readHashTable(Reader))
100c504ae3cSZachary Turner     return EC;
101c504ae3cSZachary Turner 
102c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(uint32_t));
103c504ae3cSZachary Turner   if (auto EC = readEpilogue(SectionReader))
104c504ae3cSZachary Turner     return EC;
105c504ae3cSZachary Turner 
106c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
107c504ae3cSZachary Turner   return Error::success();
108c504ae3cSZachary Turner }
109e204a6c9SZachary Turner 
1102d5c2cd3SZachary Turner Expected<StringRef> PDBStringTable::getStringForID(uint32_t ID) const {
111c504ae3cSZachary Turner   return Strings.getString(ID);
112e204a6c9SZachary Turner }
113e204a6c9SZachary Turner 
1142d5c2cd3SZachary Turner Expected<uint32_t> PDBStringTable::getIDForString(StringRef Str) const {
115c504ae3cSZachary Turner   uint32_t Hash =
116c504ae3cSZachary Turner       (Header->HashVersion == 1) ? hashStringV1(Str) : hashStringV2(Str);
117e204a6c9SZachary Turner   size_t Count = IDs.size();
118e204a6c9SZachary Turner   uint32_t Start = Hash % Count;
119e204a6c9SZachary Turner   for (size_t I = 0; I < Count; ++I) {
120e204a6c9SZachary Turner     // The hash is just a starting point for the search, but if it
121e204a6c9SZachary Turner     // doesn't work we should find the string no matter what, because
122e204a6c9SZachary Turner     // we iterate the entire array.
123e204a6c9SZachary Turner     uint32_t Index = (Start + I) % Count;
124e204a6c9SZachary Turner 
125*eb629994SZachary Turner     // If we find 0, it means the item isn't in the hash table.
126e204a6c9SZachary Turner     uint32_t ID = IDs[Index];
127*eb629994SZachary Turner     if (ID == 0)
128*eb629994SZachary Turner       return make_error<RawError>(raw_error_code::no_entry);
1292d5c2cd3SZachary Turner     auto ExpectedStr = getStringForID(ID);
1302d5c2cd3SZachary Turner     if (!ExpectedStr)
1312d5c2cd3SZachary Turner       return ExpectedStr.takeError();
1322d5c2cd3SZachary Turner 
1332d5c2cd3SZachary Turner     if (*ExpectedStr == Str)
134e204a6c9SZachary Turner       return ID;
135e204a6c9SZachary Turner   }
1362d5c2cd3SZachary Turner   return make_error<RawError>(raw_error_code::no_entry);
137e204a6c9SZachary Turner }
138e204a6c9SZachary Turner 
139e204a6c9SZachary Turner FixedStreamArray<support::ulittle32_t> PDBStringTable::name_ids() const {
140e204a6c9SZachary Turner   return IDs;
141e204a6c9SZachary Turner }
142