1c504ae3cSZachary Turner //===- PDBStringTable.cpp - PDB String Table ---------------------*- C++-*-===//
2e204a6c9SZachary Turner //
3e204a6c9SZachary Turner //                     The LLVM Compiler Infrastructure
4e204a6c9SZachary Turner //
5e204a6c9SZachary Turner // This file is distributed under the University of Illinois Open Source
6e204a6c9SZachary Turner // License. See LICENSE.TXT for details.
7e204a6c9SZachary Turner //
8e204a6c9SZachary Turner //===----------------------------------------------------------------------===//
9e204a6c9SZachary Turner 
10e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/PDBStringTable.h"
11e204a6c9SZachary Turner 
12e204a6c9SZachary Turner #include "llvm/ADT/ArrayRef.h"
13c504ae3cSZachary Turner #include "llvm/DebugInfo/MSF/MappedBlockStream.h"
14e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/Hash.h"
15e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawError.h"
16e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawTypes.h"
17e204a6c9SZachary Turner #include "llvm/Support/BinaryStreamReader.h"
18e204a6c9SZachary Turner #include "llvm/Support/Endian.h"
19e204a6c9SZachary Turner 
20e204a6c9SZachary Turner using namespace llvm;
21e204a6c9SZachary Turner using namespace llvm::support;
22e204a6c9SZachary Turner using namespace llvm::pdb;
23e204a6c9SZachary Turner 
24c504ae3cSZachary Turner uint32_t PDBStringTable::getByteSize() const { return ByteSize; }
25c504ae3cSZachary Turner uint32_t PDBStringTable::getNameCount() const { return NameCount; }
26c504ae3cSZachary Turner uint32_t PDBStringTable::getHashVersion() const { return Header->HashVersion; }
27c504ae3cSZachary Turner uint32_t PDBStringTable::getSignature() const { return Header->Signature; }
28e204a6c9SZachary Turner 
29c504ae3cSZachary Turner Error PDBStringTable::readHeader(BinaryStreamReader &Reader) {
30c504ae3cSZachary Turner   if (auto EC = Reader.readObject(Header))
31e204a6c9SZachary Turner     return EC;
32e204a6c9SZachary Turner 
33c504ae3cSZachary Turner   if (Header->Signature != PDBStringTableSignature)
34e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
35e204a6c9SZachary Turner                                 "Invalid hash table signature");
36c504ae3cSZachary Turner   if (Header->HashVersion != 1 && Header->HashVersion != 2)
37e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
38e204a6c9SZachary Turner                                 "Unsupported hash version");
39e204a6c9SZachary Turner 
40c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
41c504ae3cSZachary Turner   return Error::success();
42c504ae3cSZachary Turner }
43c504ae3cSZachary Turner 
44c504ae3cSZachary Turner Error PDBStringTable::readStrings(BinaryStreamReader &Reader) {
45*2d5c2cd3SZachary Turner   BinaryStreamRef Stream;
46*2d5c2cd3SZachary Turner   if (auto EC = Reader.readStreamRef(Stream))
47*2d5c2cd3SZachary Turner     return EC;
48*2d5c2cd3SZachary Turner 
49*2d5c2cd3SZachary Turner   if (auto EC = Strings.initialize(Stream)) {
50e204a6c9SZachary Turner     return joinErrors(std::move(EC),
51e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
52e204a6c9SZachary Turner                                            "Invalid hash table byte length"));
53c504ae3cSZachary Turner   }
54e204a6c9SZachary Turner 
55c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
56c504ae3cSZachary Turner   return Error::success();
57c504ae3cSZachary Turner }
58c504ae3cSZachary Turner 
59c504ae3cSZachary Turner Error PDBStringTable::readHashTable(BinaryStreamReader &Reader) {
60e204a6c9SZachary Turner   const support::ulittle32_t *HashCount;
61c504ae3cSZachary Turner   if (auto EC = Reader.readObject(HashCount))
62e204a6c9SZachary Turner     return EC;
63e204a6c9SZachary Turner 
64c504ae3cSZachary Turner   if (auto EC = Reader.readArray(IDs, *HashCount)) {
65e204a6c9SZachary Turner     return joinErrors(std::move(EC),
66e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
67e204a6c9SZachary Turner                                            "Could not read bucket array"));
68c504ae3cSZachary Turner   }
69e204a6c9SZachary Turner 
70e204a6c9SZachary Turner   return Error::success();
71e204a6c9SZachary Turner }
72e204a6c9SZachary Turner 
73c504ae3cSZachary Turner Error PDBStringTable::readEpilogue(BinaryStreamReader &Reader) {
74c504ae3cSZachary Turner   if (auto EC = Reader.readInteger(NameCount))
75c504ae3cSZachary Turner     return EC;
76c504ae3cSZachary Turner 
77c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
78c504ae3cSZachary Turner   return Error::success();
79c504ae3cSZachary Turner }
80c504ae3cSZachary Turner 
81c504ae3cSZachary Turner Error PDBStringTable::reload(BinaryStreamReader &Reader) {
82c504ae3cSZachary Turner 
83c504ae3cSZachary Turner   BinaryStreamReader SectionReader;
84c504ae3cSZachary Turner 
85c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(PDBStringTableHeader));
86c504ae3cSZachary Turner   if (auto EC = readHeader(SectionReader))
87c504ae3cSZachary Turner     return EC;
88c504ae3cSZachary Turner 
89c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(Header->ByteSize);
90c504ae3cSZachary Turner   if (auto EC = readStrings(SectionReader))
91c504ae3cSZachary Turner     return EC;
92c504ae3cSZachary Turner 
93c504ae3cSZachary Turner   // We don't know how long the hash table is until we parse it, so let the
94c504ae3cSZachary Turner   // function responsible for doing that figure it out.
95c504ae3cSZachary Turner   if (auto EC = readHashTable(Reader))
96c504ae3cSZachary Turner     return EC;
97c504ae3cSZachary Turner 
98c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(uint32_t));
99c504ae3cSZachary Turner   if (auto EC = readEpilogue(SectionReader))
100c504ae3cSZachary Turner     return EC;
101c504ae3cSZachary Turner 
102c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
103c504ae3cSZachary Turner   return Error::success();
104c504ae3cSZachary Turner }
105e204a6c9SZachary Turner 
106*2d5c2cd3SZachary Turner Expected<StringRef> PDBStringTable::getStringForID(uint32_t ID) const {
107c504ae3cSZachary Turner   return Strings.getString(ID);
108e204a6c9SZachary Turner }
109e204a6c9SZachary Turner 
110*2d5c2cd3SZachary Turner Expected<uint32_t> PDBStringTable::getIDForString(StringRef Str) const {
111c504ae3cSZachary Turner   uint32_t Hash =
112c504ae3cSZachary Turner       (Header->HashVersion == 1) ? hashStringV1(Str) : hashStringV2(Str);
113e204a6c9SZachary Turner   size_t Count = IDs.size();
114e204a6c9SZachary Turner   uint32_t Start = Hash % Count;
115e204a6c9SZachary Turner   for (size_t I = 0; I < Count; ++I) {
116e204a6c9SZachary Turner     // The hash is just a starting point for the search, but if it
117e204a6c9SZachary Turner     // doesn't work we should find the string no matter what, because
118e204a6c9SZachary Turner     // we iterate the entire array.
119e204a6c9SZachary Turner     uint32_t Index = (Start + I) % Count;
120e204a6c9SZachary Turner 
121e204a6c9SZachary Turner     uint32_t ID = IDs[Index];
122*2d5c2cd3SZachary Turner     auto ExpectedStr = getStringForID(ID);
123*2d5c2cd3SZachary Turner     if (!ExpectedStr)
124*2d5c2cd3SZachary Turner       return ExpectedStr.takeError();
125*2d5c2cd3SZachary Turner 
126*2d5c2cd3SZachary Turner     if (*ExpectedStr == Str)
127e204a6c9SZachary Turner       return ID;
128e204a6c9SZachary Turner   }
129*2d5c2cd3SZachary Turner   return make_error<RawError>(raw_error_code::no_entry);
130e204a6c9SZachary Turner }
131e204a6c9SZachary Turner 
132e204a6c9SZachary Turner FixedStreamArray<support::ulittle32_t> PDBStringTable::name_ids() const {
133e204a6c9SZachary Turner   return IDs;
134e204a6c9SZachary Turner }
135