1c504ae3cSZachary Turner //===- PDBStringTable.cpp - PDB String Table ---------------------*- C++-*-===//
2e204a6c9SZachary Turner //
3e204a6c9SZachary Turner //                     The LLVM Compiler Infrastructure
4e204a6c9SZachary Turner //
5e204a6c9SZachary Turner // This file is distributed under the University of Illinois Open Source
6e204a6c9SZachary Turner // License. See LICENSE.TXT for details.
7e204a6c9SZachary Turner //
8e204a6c9SZachary Turner //===----------------------------------------------------------------------===//
9e204a6c9SZachary Turner 
10e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/PDBStringTable.h"
11e204a6c9SZachary Turner 
12e204a6c9SZachary Turner #include "llvm/ADT/ArrayRef.h"
13c504ae3cSZachary Turner #include "llvm/DebugInfo/MSF/MappedBlockStream.h"
14e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/Hash.h"
15e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawError.h"
16e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawTypes.h"
17e204a6c9SZachary Turner #include "llvm/Support/BinaryStreamReader.h"
18e204a6c9SZachary Turner #include "llvm/Support/Endian.h"
19e204a6c9SZachary Turner 
20e204a6c9SZachary Turner using namespace llvm;
21e204a6c9SZachary Turner using namespace llvm::support;
22e204a6c9SZachary Turner using namespace llvm::pdb;
23e204a6c9SZachary Turner 
24c504ae3cSZachary Turner uint32_t PDBStringTable::getByteSize() const { return ByteSize; }
25c504ae3cSZachary Turner uint32_t PDBStringTable::getNameCount() const { return NameCount; }
26c504ae3cSZachary Turner uint32_t PDBStringTable::getHashVersion() const { return Header->HashVersion; }
27c504ae3cSZachary Turner uint32_t PDBStringTable::getSignature() const { return Header->Signature; }
28e204a6c9SZachary Turner 
29c504ae3cSZachary Turner Error PDBStringTable::readHeader(BinaryStreamReader &Reader) {
30c504ae3cSZachary Turner   if (auto EC = Reader.readObject(Header))
31e204a6c9SZachary Turner     return EC;
32e204a6c9SZachary Turner 
33c504ae3cSZachary Turner   if (Header->Signature != PDBStringTableSignature)
34e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
35e204a6c9SZachary Turner                                 "Invalid hash table signature");
36c504ae3cSZachary Turner   if (Header->HashVersion != 1 && Header->HashVersion != 2)
37e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
38e204a6c9SZachary Turner                                 "Unsupported hash version");
39e204a6c9SZachary Turner 
40c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
41c504ae3cSZachary Turner   return Error::success();
42c504ae3cSZachary Turner }
43c504ae3cSZachary Turner 
44c504ae3cSZachary Turner Error PDBStringTable::readStrings(BinaryStreamReader &Reader) {
452d5c2cd3SZachary Turner   BinaryStreamRef Stream;
462d5c2cd3SZachary Turner   if (auto EC = Reader.readStreamRef(Stream))
472d5c2cd3SZachary Turner     return EC;
482d5c2cd3SZachary Turner 
492d5c2cd3SZachary Turner   if (auto EC = Strings.initialize(Stream)) {
50e204a6c9SZachary Turner     return joinErrors(std::move(EC),
51e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
52e204a6c9SZachary Turner                                            "Invalid hash table byte length"));
53c504ae3cSZachary Turner   }
54e204a6c9SZachary Turner 
55c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
56c504ae3cSZachary Turner   return Error::success();
57c504ae3cSZachary Turner }
58c504ae3cSZachary Turner 
59*a8cfc29cSZachary Turner const codeview::DebugStringTableSubsectionRef &
60*a8cfc29cSZachary Turner PDBStringTable::getStringTable() const {
6192dcdda6SZachary Turner   return Strings;
6292dcdda6SZachary Turner }
6392dcdda6SZachary Turner 
64c504ae3cSZachary Turner Error PDBStringTable::readHashTable(BinaryStreamReader &Reader) {
65e204a6c9SZachary Turner   const support::ulittle32_t *HashCount;
66c504ae3cSZachary Turner   if (auto EC = Reader.readObject(HashCount))
67e204a6c9SZachary Turner     return EC;
68e204a6c9SZachary Turner 
69c504ae3cSZachary Turner   if (auto EC = Reader.readArray(IDs, *HashCount)) {
70e204a6c9SZachary Turner     return joinErrors(std::move(EC),
71e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
72e204a6c9SZachary Turner                                            "Could not read bucket array"));
73c504ae3cSZachary Turner   }
74e204a6c9SZachary Turner 
75e204a6c9SZachary Turner   return Error::success();
76e204a6c9SZachary Turner }
77e204a6c9SZachary Turner 
78c504ae3cSZachary Turner Error PDBStringTable::readEpilogue(BinaryStreamReader &Reader) {
79c504ae3cSZachary Turner   if (auto EC = Reader.readInteger(NameCount))
80c504ae3cSZachary Turner     return EC;
81c504ae3cSZachary Turner 
82c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
83c504ae3cSZachary Turner   return Error::success();
84c504ae3cSZachary Turner }
85c504ae3cSZachary Turner 
86c504ae3cSZachary Turner Error PDBStringTable::reload(BinaryStreamReader &Reader) {
87c504ae3cSZachary Turner 
88c504ae3cSZachary Turner   BinaryStreamReader SectionReader;
89c504ae3cSZachary Turner 
90c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(PDBStringTableHeader));
91c504ae3cSZachary Turner   if (auto EC = readHeader(SectionReader))
92c504ae3cSZachary Turner     return EC;
93c504ae3cSZachary Turner 
94c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(Header->ByteSize);
95c504ae3cSZachary Turner   if (auto EC = readStrings(SectionReader))
96c504ae3cSZachary Turner     return EC;
97c504ae3cSZachary Turner 
98c504ae3cSZachary Turner   // We don't know how long the hash table is until we parse it, so let the
99c504ae3cSZachary Turner   // function responsible for doing that figure it out.
100c504ae3cSZachary Turner   if (auto EC = readHashTable(Reader))
101c504ae3cSZachary Turner     return EC;
102c504ae3cSZachary Turner 
103c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(uint32_t));
104c504ae3cSZachary Turner   if (auto EC = readEpilogue(SectionReader))
105c504ae3cSZachary Turner     return EC;
106c504ae3cSZachary Turner 
107c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
108c504ae3cSZachary Turner   return Error::success();
109c504ae3cSZachary Turner }
110e204a6c9SZachary Turner 
1112d5c2cd3SZachary Turner Expected<StringRef> PDBStringTable::getStringForID(uint32_t ID) const {
112c504ae3cSZachary Turner   return Strings.getString(ID);
113e204a6c9SZachary Turner }
114e204a6c9SZachary Turner 
1152d5c2cd3SZachary Turner Expected<uint32_t> PDBStringTable::getIDForString(StringRef Str) const {
116c504ae3cSZachary Turner   uint32_t Hash =
117c504ae3cSZachary Turner       (Header->HashVersion == 1) ? hashStringV1(Str) : hashStringV2(Str);
118e204a6c9SZachary Turner   size_t Count = IDs.size();
119e204a6c9SZachary Turner   uint32_t Start = Hash % Count;
120e204a6c9SZachary Turner   for (size_t I = 0; I < Count; ++I) {
121e204a6c9SZachary Turner     // The hash is just a starting point for the search, but if it
122e204a6c9SZachary Turner     // doesn't work we should find the string no matter what, because
123e204a6c9SZachary Turner     // we iterate the entire array.
124e204a6c9SZachary Turner     uint32_t Index = (Start + I) % Count;
125e204a6c9SZachary Turner 
126e204a6c9SZachary Turner     uint32_t ID = IDs[Index];
1272d5c2cd3SZachary Turner     auto ExpectedStr = getStringForID(ID);
1282d5c2cd3SZachary Turner     if (!ExpectedStr)
1292d5c2cd3SZachary Turner       return ExpectedStr.takeError();
1302d5c2cd3SZachary Turner 
1312d5c2cd3SZachary Turner     if (*ExpectedStr == Str)
132e204a6c9SZachary Turner       return ID;
133e204a6c9SZachary Turner   }
1342d5c2cd3SZachary Turner   return make_error<RawError>(raw_error_code::no_entry);
135e204a6c9SZachary Turner }
136e204a6c9SZachary Turner 
137e204a6c9SZachary Turner FixedStreamArray<support::ulittle32_t> PDBStringTable::name_ids() const {
138e204a6c9SZachary Turner   return IDs;
139e204a6c9SZachary Turner }
140