1c504ae3cSZachary Turner //===- PDBStringTable.cpp - PDB String Table ---------------------*- C++-*-===//
2e204a6c9SZachary Turner //
3*2946cd70SChandler Carruth // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*2946cd70SChandler Carruth // See https://llvm.org/LICENSE.txt for license information.
5*2946cd70SChandler Carruth // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6e204a6c9SZachary Turner //
7e204a6c9SZachary Turner //===----------------------------------------------------------------------===//
8e204a6c9SZachary Turner 
9e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/PDBStringTable.h"
10e204a6c9SZachary Turner 
11e204a6c9SZachary Turner #include "llvm/ADT/ArrayRef.h"
12e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/Hash.h"
13e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawError.h"
14e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawTypes.h"
15e204a6c9SZachary Turner #include "llvm/Support/BinaryStreamReader.h"
16e204a6c9SZachary Turner #include "llvm/Support/Endian.h"
17e204a6c9SZachary Turner 
18e204a6c9SZachary Turner using namespace llvm;
19e204a6c9SZachary Turner using namespace llvm::support;
20e204a6c9SZachary Turner using namespace llvm::pdb;
21e204a6c9SZachary Turner 
22f3b4b2d8SZachary Turner uint32_t PDBStringTable::getByteSize() const { return Header->ByteSize; }
23c504ae3cSZachary Turner uint32_t PDBStringTable::getNameCount() const { return NameCount; }
24c504ae3cSZachary Turner uint32_t PDBStringTable::getHashVersion() const { return Header->HashVersion; }
25c504ae3cSZachary Turner uint32_t PDBStringTable::getSignature() const { return Header->Signature; }
26e204a6c9SZachary Turner 
27c504ae3cSZachary Turner Error PDBStringTable::readHeader(BinaryStreamReader &Reader) {
28c504ae3cSZachary Turner   if (auto EC = Reader.readObject(Header))
29e204a6c9SZachary Turner     return EC;
30e204a6c9SZachary Turner 
31c504ae3cSZachary Turner   if (Header->Signature != PDBStringTableSignature)
32e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
33e204a6c9SZachary Turner                                 "Invalid hash table signature");
34c504ae3cSZachary Turner   if (Header->HashVersion != 1 && Header->HashVersion != 2)
35e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
36e204a6c9SZachary Turner                                 "Unsupported hash version");
37e204a6c9SZachary Turner 
38c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
39c504ae3cSZachary Turner   return Error::success();
40c504ae3cSZachary Turner }
41c504ae3cSZachary Turner 
42c504ae3cSZachary Turner Error PDBStringTable::readStrings(BinaryStreamReader &Reader) {
432d5c2cd3SZachary Turner   BinaryStreamRef Stream;
442d5c2cd3SZachary Turner   if (auto EC = Reader.readStreamRef(Stream))
452d5c2cd3SZachary Turner     return EC;
462d5c2cd3SZachary Turner 
472d5c2cd3SZachary Turner   if (auto EC = Strings.initialize(Stream)) {
48e204a6c9SZachary Turner     return joinErrors(std::move(EC),
49e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
50e204a6c9SZachary Turner                                            "Invalid hash table byte length"));
51c504ae3cSZachary Turner   }
52e204a6c9SZachary Turner 
53c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
54c504ae3cSZachary Turner   return Error::success();
55c504ae3cSZachary Turner }
56c504ae3cSZachary Turner 
57a8cfc29cSZachary Turner const codeview::DebugStringTableSubsectionRef &
58a8cfc29cSZachary Turner PDBStringTable::getStringTable() const {
5992dcdda6SZachary Turner   return Strings;
6092dcdda6SZachary Turner }
6192dcdda6SZachary Turner 
62c504ae3cSZachary Turner Error PDBStringTable::readHashTable(BinaryStreamReader &Reader) {
63e204a6c9SZachary Turner   const support::ulittle32_t *HashCount;
64c504ae3cSZachary Turner   if (auto EC = Reader.readObject(HashCount))
65e204a6c9SZachary Turner     return EC;
66e204a6c9SZachary Turner 
67c504ae3cSZachary Turner   if (auto EC = Reader.readArray(IDs, *HashCount)) {
68e204a6c9SZachary Turner     return joinErrors(std::move(EC),
69e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
70e204a6c9SZachary Turner                                            "Could not read bucket array"));
71c504ae3cSZachary Turner   }
72e204a6c9SZachary Turner 
73e204a6c9SZachary Turner   return Error::success();
74e204a6c9SZachary Turner }
75e204a6c9SZachary Turner 
76c504ae3cSZachary Turner Error PDBStringTable::readEpilogue(BinaryStreamReader &Reader) {
77c504ae3cSZachary Turner   if (auto EC = Reader.readInteger(NameCount))
78c504ae3cSZachary Turner     return EC;
79c504ae3cSZachary Turner 
80c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
81c504ae3cSZachary Turner   return Error::success();
82c504ae3cSZachary Turner }
83c504ae3cSZachary Turner 
84c504ae3cSZachary Turner Error PDBStringTable::reload(BinaryStreamReader &Reader) {
85c504ae3cSZachary Turner 
86c504ae3cSZachary Turner   BinaryStreamReader SectionReader;
87c504ae3cSZachary Turner 
88c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(PDBStringTableHeader));
89c504ae3cSZachary Turner   if (auto EC = readHeader(SectionReader))
90c504ae3cSZachary Turner     return EC;
91c504ae3cSZachary Turner 
92c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(Header->ByteSize);
93c504ae3cSZachary Turner   if (auto EC = readStrings(SectionReader))
94c504ae3cSZachary Turner     return EC;
95c504ae3cSZachary Turner 
96c504ae3cSZachary Turner   // We don't know how long the hash table is until we parse it, so let the
97c504ae3cSZachary Turner   // function responsible for doing that figure it out.
98c504ae3cSZachary Turner   if (auto EC = readHashTable(Reader))
99c504ae3cSZachary Turner     return EC;
100c504ae3cSZachary Turner 
101c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(uint32_t));
102c504ae3cSZachary Turner   if (auto EC = readEpilogue(SectionReader))
103c504ae3cSZachary Turner     return EC;
104c504ae3cSZachary Turner 
105c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
106c504ae3cSZachary Turner   return Error::success();
107c504ae3cSZachary Turner }
108e204a6c9SZachary Turner 
1092d5c2cd3SZachary Turner Expected<StringRef> PDBStringTable::getStringForID(uint32_t ID) const {
110c504ae3cSZachary Turner   return Strings.getString(ID);
111e204a6c9SZachary Turner }
112e204a6c9SZachary Turner 
1132d5c2cd3SZachary Turner Expected<uint32_t> PDBStringTable::getIDForString(StringRef Str) const {
114c504ae3cSZachary Turner   uint32_t Hash =
115c504ae3cSZachary Turner       (Header->HashVersion == 1) ? hashStringV1(Str) : hashStringV2(Str);
116e204a6c9SZachary Turner   size_t Count = IDs.size();
117e204a6c9SZachary Turner   uint32_t Start = Hash % Count;
118e204a6c9SZachary Turner   for (size_t I = 0; I < Count; ++I) {
119e204a6c9SZachary Turner     // The hash is just a starting point for the search, but if it
120e204a6c9SZachary Turner     // doesn't work we should find the string no matter what, because
121e204a6c9SZachary Turner     // we iterate the entire array.
122e204a6c9SZachary Turner     uint32_t Index = (Start + I) % Count;
123e204a6c9SZachary Turner 
124eb629994SZachary Turner     // If we find 0, it means the item isn't in the hash table.
125e204a6c9SZachary Turner     uint32_t ID = IDs[Index];
126eb629994SZachary Turner     if (ID == 0)
127eb629994SZachary Turner       return make_error<RawError>(raw_error_code::no_entry);
1282d5c2cd3SZachary Turner     auto ExpectedStr = getStringForID(ID);
1292d5c2cd3SZachary Turner     if (!ExpectedStr)
1302d5c2cd3SZachary Turner       return ExpectedStr.takeError();
1312d5c2cd3SZachary Turner 
1322d5c2cd3SZachary Turner     if (*ExpectedStr == Str)
133e204a6c9SZachary Turner       return ID;
134e204a6c9SZachary Turner   }
1352d5c2cd3SZachary Turner   return make_error<RawError>(raw_error_code::no_entry);
136e204a6c9SZachary Turner }
137e204a6c9SZachary Turner 
138e204a6c9SZachary Turner FixedStreamArray<support::ulittle32_t> PDBStringTable::name_ids() const {
139e204a6c9SZachary Turner   return IDs;
140e204a6c9SZachary Turner }
141