1*c504ae3cSZachary Turner //===- PDBStringTable.cpp - PDB String Table ---------------------*- C++-*-===//
2e204a6c9SZachary Turner //
3e204a6c9SZachary Turner //                     The LLVM Compiler Infrastructure
4e204a6c9SZachary Turner //
5e204a6c9SZachary Turner // This file is distributed under the University of Illinois Open Source
6e204a6c9SZachary Turner // License. See LICENSE.TXT for details.
7e204a6c9SZachary Turner //
8e204a6c9SZachary Turner //===----------------------------------------------------------------------===//
9e204a6c9SZachary Turner 
10e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/PDBStringTable.h"
11e204a6c9SZachary Turner 
12e204a6c9SZachary Turner #include "llvm/ADT/ArrayRef.h"
13*c504ae3cSZachary Turner #include "llvm/DebugInfo/MSF/MappedBlockStream.h"
14e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/Hash.h"
15e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawError.h"
16e204a6c9SZachary Turner #include "llvm/DebugInfo/PDB/Native/RawTypes.h"
17e204a6c9SZachary Turner #include "llvm/Support/BinaryStreamReader.h"
18e204a6c9SZachary Turner #include "llvm/Support/Endian.h"
19e204a6c9SZachary Turner 
20e204a6c9SZachary Turner using namespace llvm;
21e204a6c9SZachary Turner using namespace llvm::support;
22e204a6c9SZachary Turner using namespace llvm::pdb;
23e204a6c9SZachary Turner 
24*c504ae3cSZachary Turner uint32_t PDBStringTable::getByteSize() const { return ByteSize; }
25*c504ae3cSZachary Turner uint32_t PDBStringTable::getNameCount() const { return NameCount; }
26*c504ae3cSZachary Turner uint32_t PDBStringTable::getHashVersion() const { return Header->HashVersion; }
27*c504ae3cSZachary Turner uint32_t PDBStringTable::getSignature() const { return Header->Signature; }
28e204a6c9SZachary Turner 
29*c504ae3cSZachary Turner Error PDBStringTable::readHeader(BinaryStreamReader &Reader) {
30*c504ae3cSZachary Turner   if (auto EC = Reader.readObject(Header))
31e204a6c9SZachary Turner     return EC;
32e204a6c9SZachary Turner 
33*c504ae3cSZachary Turner   if (Header->Signature != PDBStringTableSignature)
34e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
35e204a6c9SZachary Turner                                 "Invalid hash table signature");
36*c504ae3cSZachary Turner   if (Header->HashVersion != 1 && Header->HashVersion != 2)
37e204a6c9SZachary Turner     return make_error<RawError>(raw_error_code::corrupt_file,
38e204a6c9SZachary Turner                                 "Unsupported hash version");
39e204a6c9SZachary Turner 
40*c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
41*c504ae3cSZachary Turner   return Error::success();
42*c504ae3cSZachary Turner }
43*c504ae3cSZachary Turner 
44*c504ae3cSZachary Turner Error PDBStringTable::readStrings(BinaryStreamReader &Reader) {
45*c504ae3cSZachary Turner   if (auto EC = Strings.initialize(Reader)) {
46e204a6c9SZachary Turner     return joinErrors(std::move(EC),
47e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
48e204a6c9SZachary Turner                                            "Invalid hash table byte length"));
49*c504ae3cSZachary Turner   }
50e204a6c9SZachary Turner 
51*c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
52*c504ae3cSZachary Turner   return Error::success();
53*c504ae3cSZachary Turner }
54*c504ae3cSZachary Turner 
55*c504ae3cSZachary Turner Error PDBStringTable::readHashTable(BinaryStreamReader &Reader) {
56e204a6c9SZachary Turner   const support::ulittle32_t *HashCount;
57*c504ae3cSZachary Turner   if (auto EC = Reader.readObject(HashCount))
58e204a6c9SZachary Turner     return EC;
59e204a6c9SZachary Turner 
60*c504ae3cSZachary Turner   if (auto EC = Reader.readArray(IDs, *HashCount)) {
61e204a6c9SZachary Turner     return joinErrors(std::move(EC),
62e204a6c9SZachary Turner                       make_error<RawError>(raw_error_code::corrupt_file,
63e204a6c9SZachary Turner                                            "Could not read bucket array"));
64*c504ae3cSZachary Turner   }
65e204a6c9SZachary Turner 
66e204a6c9SZachary Turner   return Error::success();
67e204a6c9SZachary Turner }
68e204a6c9SZachary Turner 
69*c504ae3cSZachary Turner Error PDBStringTable::readEpilogue(BinaryStreamReader &Reader) {
70*c504ae3cSZachary Turner   if (auto EC = Reader.readInteger(NameCount))
71*c504ae3cSZachary Turner     return EC;
72*c504ae3cSZachary Turner 
73*c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
74*c504ae3cSZachary Turner   return Error::success();
75*c504ae3cSZachary Turner }
76*c504ae3cSZachary Turner 
77*c504ae3cSZachary Turner Error PDBStringTable::reload(BinaryStreamReader &Reader) {
78*c504ae3cSZachary Turner 
79*c504ae3cSZachary Turner   BinaryStreamReader SectionReader;
80*c504ae3cSZachary Turner 
81*c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(PDBStringTableHeader));
82*c504ae3cSZachary Turner   if (auto EC = readHeader(SectionReader))
83*c504ae3cSZachary Turner     return EC;
84*c504ae3cSZachary Turner 
85*c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(Header->ByteSize);
86*c504ae3cSZachary Turner   if (auto EC = readStrings(SectionReader))
87*c504ae3cSZachary Turner     return EC;
88*c504ae3cSZachary Turner 
89*c504ae3cSZachary Turner   // We don't know how long the hash table is until we parse it, so let the
90*c504ae3cSZachary Turner   // function responsible for doing that figure it out.
91*c504ae3cSZachary Turner   if (auto EC = readHashTable(Reader))
92*c504ae3cSZachary Turner     return EC;
93*c504ae3cSZachary Turner 
94*c504ae3cSZachary Turner   std::tie(SectionReader, Reader) = Reader.split(sizeof(uint32_t));
95*c504ae3cSZachary Turner   if (auto EC = readEpilogue(SectionReader))
96*c504ae3cSZachary Turner     return EC;
97*c504ae3cSZachary Turner 
98*c504ae3cSZachary Turner   assert(Reader.bytesRemaining() == 0);
99*c504ae3cSZachary Turner   return Error::success();
100*c504ae3cSZachary Turner }
101e204a6c9SZachary Turner 
102e204a6c9SZachary Turner StringRef PDBStringTable::getStringForID(uint32_t ID) const {
103*c504ae3cSZachary Turner   return Strings.getString(ID);
104e204a6c9SZachary Turner }
105e204a6c9SZachary Turner 
106e204a6c9SZachary Turner uint32_t PDBStringTable::getIDForString(StringRef Str) const {
107*c504ae3cSZachary Turner   uint32_t Hash =
108*c504ae3cSZachary Turner       (Header->HashVersion == 1) ? hashStringV1(Str) : hashStringV2(Str);
109e204a6c9SZachary Turner   size_t Count = IDs.size();
110e204a6c9SZachary Turner   uint32_t Start = Hash % Count;
111e204a6c9SZachary Turner   for (size_t I = 0; I < Count; ++I) {
112e204a6c9SZachary Turner     // The hash is just a starting point for the search, but if it
113e204a6c9SZachary Turner     // doesn't work we should find the string no matter what, because
114e204a6c9SZachary Turner     // we iterate the entire array.
115e204a6c9SZachary Turner     uint32_t Index = (Start + I) % Count;
116e204a6c9SZachary Turner 
117e204a6c9SZachary Turner     uint32_t ID = IDs[Index];
118e204a6c9SZachary Turner     StringRef S = getStringForID(ID);
119e204a6c9SZachary Turner     if (S == Str)
120e204a6c9SZachary Turner       return ID;
121e204a6c9SZachary Turner   }
122e204a6c9SZachary Turner   // IDs[0] contains the ID of the "invalid" entry.
123e204a6c9SZachary Turner   return IDs[0];
124e204a6c9SZachary Turner }
125e204a6c9SZachary Turner 
126e204a6c9SZachary Turner FixedStreamArray<support::ulittle32_t> PDBStringTable::name_ids() const {
127e204a6c9SZachary Turner   return IDs;
128e204a6c9SZachary Turner }
129