1*0b57cec5SDimitry Andric //===- PDBStringTable.cpp - PDB String Table ---------------------*- C++-*-===//
2*0b57cec5SDimitry Andric //
3*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*0b57cec5SDimitry Andric //
7*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
8*0b57cec5SDimitry Andric
9*0b57cec5SDimitry Andric #include "llvm/DebugInfo/PDB/Native/PDBStringTable.h"
10*0b57cec5SDimitry Andric
11*0b57cec5SDimitry Andric #include "llvm/ADT/ArrayRef.h"
12*0b57cec5SDimitry Andric #include "llvm/DebugInfo/PDB/Native/Hash.h"
13*0b57cec5SDimitry Andric #include "llvm/DebugInfo/PDB/Native/RawError.h"
14*0b57cec5SDimitry Andric #include "llvm/DebugInfo/PDB/Native/RawTypes.h"
15*0b57cec5SDimitry Andric #include "llvm/Support/BinaryStreamReader.h"
16*0b57cec5SDimitry Andric #include "llvm/Support/Endian.h"
17*0b57cec5SDimitry Andric
18*0b57cec5SDimitry Andric using namespace llvm;
19*0b57cec5SDimitry Andric using namespace llvm::support;
20*0b57cec5SDimitry Andric using namespace llvm::pdb;
21*0b57cec5SDimitry Andric
getByteSize() const22*0b57cec5SDimitry Andric uint32_t PDBStringTable::getByteSize() const { return Header->ByteSize; }
getNameCount() const23*0b57cec5SDimitry Andric uint32_t PDBStringTable::getNameCount() const { return NameCount; }
getHashVersion() const24*0b57cec5SDimitry Andric uint32_t PDBStringTable::getHashVersion() const { return Header->HashVersion; }
getSignature() const25*0b57cec5SDimitry Andric uint32_t PDBStringTable::getSignature() const { return Header->Signature; }
26*0b57cec5SDimitry Andric
readHeader(BinaryStreamReader & Reader)27*0b57cec5SDimitry Andric Error PDBStringTable::readHeader(BinaryStreamReader &Reader) {
28*0b57cec5SDimitry Andric if (auto EC = Reader.readObject(Header))
29*0b57cec5SDimitry Andric return EC;
30*0b57cec5SDimitry Andric
31*0b57cec5SDimitry Andric if (Header->Signature != PDBStringTableSignature)
32*0b57cec5SDimitry Andric return make_error<RawError>(raw_error_code::corrupt_file,
33*0b57cec5SDimitry Andric "Invalid hash table signature");
34*0b57cec5SDimitry Andric if (Header->HashVersion != 1 && Header->HashVersion != 2)
35*0b57cec5SDimitry Andric return make_error<RawError>(raw_error_code::corrupt_file,
36*0b57cec5SDimitry Andric "Unsupported hash version");
37*0b57cec5SDimitry Andric
38*0b57cec5SDimitry Andric assert(Reader.bytesRemaining() == 0);
39*0b57cec5SDimitry Andric return Error::success();
40*0b57cec5SDimitry Andric }
41*0b57cec5SDimitry Andric
readStrings(BinaryStreamReader & Reader)42*0b57cec5SDimitry Andric Error PDBStringTable::readStrings(BinaryStreamReader &Reader) {
43*0b57cec5SDimitry Andric BinaryStreamRef Stream;
44*0b57cec5SDimitry Andric if (auto EC = Reader.readStreamRef(Stream))
45*0b57cec5SDimitry Andric return EC;
46*0b57cec5SDimitry Andric
47*0b57cec5SDimitry Andric if (auto EC = Strings.initialize(Stream)) {
48*0b57cec5SDimitry Andric return joinErrors(std::move(EC),
49*0b57cec5SDimitry Andric make_error<RawError>(raw_error_code::corrupt_file,
50*0b57cec5SDimitry Andric "Invalid hash table byte length"));
51*0b57cec5SDimitry Andric }
52*0b57cec5SDimitry Andric
53*0b57cec5SDimitry Andric assert(Reader.bytesRemaining() == 0);
54*0b57cec5SDimitry Andric return Error::success();
55*0b57cec5SDimitry Andric }
56*0b57cec5SDimitry Andric
57*0b57cec5SDimitry Andric const codeview::DebugStringTableSubsectionRef &
getStringTable() const58*0b57cec5SDimitry Andric PDBStringTable::getStringTable() const {
59*0b57cec5SDimitry Andric return Strings;
60*0b57cec5SDimitry Andric }
61*0b57cec5SDimitry Andric
readHashTable(BinaryStreamReader & Reader)62*0b57cec5SDimitry Andric Error PDBStringTable::readHashTable(BinaryStreamReader &Reader) {
63*0b57cec5SDimitry Andric const support::ulittle32_t *HashCount;
64*0b57cec5SDimitry Andric if (auto EC = Reader.readObject(HashCount))
65*0b57cec5SDimitry Andric return EC;
66*0b57cec5SDimitry Andric
67*0b57cec5SDimitry Andric if (auto EC = Reader.readArray(IDs, *HashCount)) {
68*0b57cec5SDimitry Andric return joinErrors(std::move(EC),
69*0b57cec5SDimitry Andric make_error<RawError>(raw_error_code::corrupt_file,
70*0b57cec5SDimitry Andric "Could not read bucket array"));
71*0b57cec5SDimitry Andric }
72*0b57cec5SDimitry Andric
73*0b57cec5SDimitry Andric return Error::success();
74*0b57cec5SDimitry Andric }
75*0b57cec5SDimitry Andric
readEpilogue(BinaryStreamReader & Reader)76*0b57cec5SDimitry Andric Error PDBStringTable::readEpilogue(BinaryStreamReader &Reader) {
77*0b57cec5SDimitry Andric if (auto EC = Reader.readInteger(NameCount))
78*0b57cec5SDimitry Andric return EC;
79*0b57cec5SDimitry Andric
80*0b57cec5SDimitry Andric assert(Reader.bytesRemaining() == 0);
81*0b57cec5SDimitry Andric return Error::success();
82*0b57cec5SDimitry Andric }
83*0b57cec5SDimitry Andric
reload(BinaryStreamReader & Reader)84*0b57cec5SDimitry Andric Error PDBStringTable::reload(BinaryStreamReader &Reader) {
85*0b57cec5SDimitry Andric
86*0b57cec5SDimitry Andric BinaryStreamReader SectionReader;
87*0b57cec5SDimitry Andric
88*0b57cec5SDimitry Andric std::tie(SectionReader, Reader) = Reader.split(sizeof(PDBStringTableHeader));
89*0b57cec5SDimitry Andric if (auto EC = readHeader(SectionReader))
90*0b57cec5SDimitry Andric return EC;
91*0b57cec5SDimitry Andric
92*0b57cec5SDimitry Andric std::tie(SectionReader, Reader) = Reader.split(Header->ByteSize);
93*0b57cec5SDimitry Andric if (auto EC = readStrings(SectionReader))
94*0b57cec5SDimitry Andric return EC;
95*0b57cec5SDimitry Andric
96*0b57cec5SDimitry Andric // We don't know how long the hash table is until we parse it, so let the
97*0b57cec5SDimitry Andric // function responsible for doing that figure it out.
98*0b57cec5SDimitry Andric if (auto EC = readHashTable(Reader))
99*0b57cec5SDimitry Andric return EC;
100*0b57cec5SDimitry Andric
101*0b57cec5SDimitry Andric std::tie(SectionReader, Reader) = Reader.split(sizeof(uint32_t));
102*0b57cec5SDimitry Andric if (auto EC = readEpilogue(SectionReader))
103*0b57cec5SDimitry Andric return EC;
104*0b57cec5SDimitry Andric
105*0b57cec5SDimitry Andric assert(Reader.bytesRemaining() == 0);
106*0b57cec5SDimitry Andric return Error::success();
107*0b57cec5SDimitry Andric }
108*0b57cec5SDimitry Andric
getStringForID(uint32_t ID) const109*0b57cec5SDimitry Andric Expected<StringRef> PDBStringTable::getStringForID(uint32_t ID) const {
110*0b57cec5SDimitry Andric return Strings.getString(ID);
111*0b57cec5SDimitry Andric }
112*0b57cec5SDimitry Andric
getIDForString(StringRef Str) const113*0b57cec5SDimitry Andric Expected<uint32_t> PDBStringTable::getIDForString(StringRef Str) const {
114*0b57cec5SDimitry Andric uint32_t Hash =
115*0b57cec5SDimitry Andric (Header->HashVersion == 1) ? hashStringV1(Str) : hashStringV2(Str);
116*0b57cec5SDimitry Andric size_t Count = IDs.size();
117*0b57cec5SDimitry Andric uint32_t Start = Hash % Count;
118*0b57cec5SDimitry Andric for (size_t I = 0; I < Count; ++I) {
119*0b57cec5SDimitry Andric // The hash is just a starting point for the search, but if it
120*0b57cec5SDimitry Andric // doesn't work we should find the string no matter what, because
121*0b57cec5SDimitry Andric // we iterate the entire array.
122*0b57cec5SDimitry Andric uint32_t Index = (Start + I) % Count;
123*0b57cec5SDimitry Andric
124*0b57cec5SDimitry Andric // If we find 0, it means the item isn't in the hash table.
125*0b57cec5SDimitry Andric uint32_t ID = IDs[Index];
126*0b57cec5SDimitry Andric if (ID == 0)
127*0b57cec5SDimitry Andric return make_error<RawError>(raw_error_code::no_entry);
128*0b57cec5SDimitry Andric auto ExpectedStr = getStringForID(ID);
129*0b57cec5SDimitry Andric if (!ExpectedStr)
130*0b57cec5SDimitry Andric return ExpectedStr.takeError();
131*0b57cec5SDimitry Andric
132*0b57cec5SDimitry Andric if (*ExpectedStr == Str)
133*0b57cec5SDimitry Andric return ID;
134*0b57cec5SDimitry Andric }
135*0b57cec5SDimitry Andric return make_error<RawError>(raw_error_code::no_entry);
136*0b57cec5SDimitry Andric }
137*0b57cec5SDimitry Andric
name_ids() const138*0b57cec5SDimitry Andric FixedStreamArray<support::ulittle32_t> PDBStringTable::name_ids() const {
139*0b57cec5SDimitry Andric return IDs;
140*0b57cec5SDimitry Andric }
141