//===-- PdbIndex.cpp ------------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
8307f5ae8SZachary Turner
9307f5ae8SZachary Turner #include "PdbIndex.h"
10307f5ae8SZachary Turner #include "PdbUtil.h"
11307f5ae8SZachary Turner
12307f5ae8SZachary Turner #include "llvm/DebugInfo/CodeView/SymbolDeserializer.h"
13307f5ae8SZachary Turner #include "llvm/DebugInfo/PDB/Native/DbiStream.h"
14307f5ae8SZachary Turner #include "llvm/DebugInfo/PDB/Native/GlobalsStream.h"
15307f5ae8SZachary Turner #include "llvm/DebugInfo/PDB/Native/ISectionContribVisitor.h"
16307f5ae8SZachary Turner #include "llvm/DebugInfo/PDB/Native/PDBFile.h"
17307f5ae8SZachary Turner #include "llvm/DebugInfo/PDB/Native/PublicsStream.h"
18307f5ae8SZachary Turner #include "llvm/DebugInfo/PDB/Native/SymbolStream.h"
192f7efbc9SZachary Turner #include "llvm/DebugInfo/PDB/Native/TpiStream.h"
20307f5ae8SZachary Turner #include "llvm/Object/COFF.h"
21307f5ae8SZachary Turner #include "llvm/Support/Error.h"
22307f5ae8SZachary Turner
23307f5ae8SZachary Turner #include "lldb/Utility/LLDBAssert.h"
24307f5ae8SZachary Turner #include "lldb/lldb-defines.h"
25307f5ae8SZachary Turner
26307f5ae8SZachary Turner using namespace lldb_private;
27307f5ae8SZachary Turner using namespace lldb_private::npdb;
28307f5ae8SZachary Turner using namespace llvm::codeview;
29307f5ae8SZachary Turner using namespace llvm::pdb;
30307f5ae8SZachary Turner
PdbIndex()31307f5ae8SZachary Turner PdbIndex::PdbIndex() : m_cus(*this), m_va_to_modi(m_allocator) {}
32307f5ae8SZachary Turner
// Evaluates `expr`, which must yield an llvm::Expected-like value. If it holds
// an error, that error is returned from the *enclosing* function; otherwise
// the address of the contained value is stored in `result_ptr`.
//
// The body is wrapped in do { ... } while (0) so that the macro followed by a
// semicolon forms exactly one statement and can be used safely as the branch
// of an unbraced if/else. Both arguments are parenthesized so arbitrary
// expressions can be passed.
#define ASSIGN_PTR_OR_RETURN(result_ptr, expr)                                 \
  do {                                                                         \
    auto expected_result = (expr);                                             \
    if (!expected_result)                                                      \
      return expected_result.takeError();                                      \
    (result_ptr) = &expected_result.get();                                     \
  } while (0)
40307f5ae8SZachary Turner
41307f5ae8SZachary Turner llvm::Expected<std::unique_ptr<PdbIndex>>
create(llvm::pdb::PDBFile * file)42242e1e99SZequan Wu PdbIndex::create(llvm::pdb::PDBFile *file) {
43307f5ae8SZachary Turner lldbassert(file);
44307f5ae8SZachary Turner
45307f5ae8SZachary Turner std::unique_ptr<PdbIndex> result(new PdbIndex());
46307f5ae8SZachary Turner ASSIGN_PTR_OR_RETURN(result->m_dbi, file->getPDBDbiStream());
47307f5ae8SZachary Turner ASSIGN_PTR_OR_RETURN(result->m_tpi, file->getPDBTpiStream());
48307f5ae8SZachary Turner ASSIGN_PTR_OR_RETURN(result->m_ipi, file->getPDBIpiStream());
49307f5ae8SZachary Turner ASSIGN_PTR_OR_RETURN(result->m_info, file->getPDBInfoStream());
50307f5ae8SZachary Turner ASSIGN_PTR_OR_RETURN(result->m_publics, file->getPDBPublicsStream());
51307f5ae8SZachary Turner ASSIGN_PTR_OR_RETURN(result->m_globals, file->getPDBGlobalsStream());
52307f5ae8SZachary Turner ASSIGN_PTR_OR_RETURN(result->m_symrecords, file->getPDBSymbolStream());
53307f5ae8SZachary Turner
542f7efbc9SZachary Turner result->m_tpi->buildHashMap();
552f7efbc9SZachary Turner
56242e1e99SZequan Wu result->m_file = file;
57307f5ae8SZachary Turner
58307f5ae8SZachary Turner return std::move(result);
59307f5ae8SZachary Turner }
60307f5ae8SZachary Turner
MakeVirtualAddress(uint16_t segment,uint32_t offset) const61307f5ae8SZachary Turner lldb::addr_t PdbIndex::MakeVirtualAddress(uint16_t segment,
62307f5ae8SZachary Turner uint32_t offset) const {
63307f5ae8SZachary Turner uint32_t max_section = dbi().getSectionHeaders().size();
64*8a790e65SZequan Wu // Segment indices are 1-based.
65307f5ae8SZachary Turner // If this is an absolute symbol, it's indicated by the magic section index
66307f5ae8SZachary Turner // |max_section+1|. In this case, the offset is meaningless, so just return.
67*8a790e65SZequan Wu if (segment == 0 || segment > max_section)
68307f5ae8SZachary Turner return LLDB_INVALID_ADDRESS;
69307f5ae8SZachary Turner
70307f5ae8SZachary Turner const llvm::object::coff_section &cs = dbi().getSectionHeaders()[segment - 1];
71307f5ae8SZachary Turner return m_load_address + static_cast<lldb::addr_t>(cs.VirtualAddress) +
72307f5ae8SZachary Turner static_cast<lldb::addr_t>(offset);
73307f5ae8SZachary Turner }
74307f5ae8SZachary Turner
75307f5ae8SZachary Turner llvm::Optional<uint16_t>
GetModuleIndexForAddr(uint16_t segment,uint32_t offset) const76307f5ae8SZachary Turner PdbIndex::GetModuleIndexForAddr(uint16_t segment, uint32_t offset) const {
77307f5ae8SZachary Turner return GetModuleIndexForVa(MakeVirtualAddress(segment, offset));
78307f5ae8SZachary Turner }
79307f5ae8SZachary Turner
GetModuleIndexForVa(lldb::addr_t va) const80307f5ae8SZachary Turner llvm::Optional<uint16_t> PdbIndex::GetModuleIndexForVa(lldb::addr_t va) const {
81307f5ae8SZachary Turner auto iter = m_va_to_modi.find(va);
82307f5ae8SZachary Turner if (iter == m_va_to_modi.end())
83307f5ae8SZachary Turner return llvm::None;
84307f5ae8SZachary Turner
85307f5ae8SZachary Turner return iter.value();
86307f5ae8SZachary Turner }
87307f5ae8SZachary Turner
ParseSectionContribs()88307f5ae8SZachary Turner void PdbIndex::ParseSectionContribs() {
89307f5ae8SZachary Turner class Visitor : public ISectionContribVisitor {
90307f5ae8SZachary Turner PdbIndex &m_ctx;
91307f5ae8SZachary Turner llvm::IntervalMap<uint64_t, uint16_t> &m_imap;
92307f5ae8SZachary Turner
93307f5ae8SZachary Turner public:
94307f5ae8SZachary Turner Visitor(PdbIndex &ctx, llvm::IntervalMap<uint64_t, uint16_t> &imap)
95307f5ae8SZachary Turner : m_ctx(ctx), m_imap(imap) {}
96307f5ae8SZachary Turner
97307f5ae8SZachary Turner void visit(const SectionContrib &C) override {
982f7efbc9SZachary Turner if (C.Size == 0)
992f7efbc9SZachary Turner return;
1002f7efbc9SZachary Turner
101307f5ae8SZachary Turner uint64_t va = m_ctx.MakeVirtualAddress(C.ISect, C.Off);
102*8a790e65SZequan Wu if (va == LLDB_INVALID_ADDRESS)
103*8a790e65SZequan Wu return;
104307f5ae8SZachary Turner uint64_t end = va + C.Size;
105307f5ae8SZachary Turner // IntervalMap's start and end represent a closed range, not a half-open
106307f5ae8SZachary Turner // range, so we have to subtract 1.
107307f5ae8SZachary Turner m_imap.insert(va, end - 1, C.Imod);
108307f5ae8SZachary Turner }
109307f5ae8SZachary Turner void visit(const SectionContrib2 &C) override { visit(C.Base); }
110307f5ae8SZachary Turner };
111307f5ae8SZachary Turner Visitor v(*this, m_va_to_modi);
112307f5ae8SZachary Turner dbi().visitSectionContributions(v);
113307f5ae8SZachary Turner }
114307f5ae8SZachary Turner
BuildAddrToSymbolMap(CompilandIndexItem & cci)115307f5ae8SZachary Turner void PdbIndex::BuildAddrToSymbolMap(CompilandIndexItem &cci) {
116307f5ae8SZachary Turner lldbassert(cci.m_symbols_by_va.empty() &&
117307f5ae8SZachary Turner "Addr to symbol map is already built!");
1186284aee9SZachary Turner uint16_t modi = cci.m_id.modi;
119307f5ae8SZachary Turner const CVSymbolArray &syms = cci.m_debug_stream.getSymbolArray();
120307f5ae8SZachary Turner for (auto iter = syms.begin(); iter != syms.end(); ++iter) {
121307f5ae8SZachary Turner if (!SymbolHasAddress(*iter))
122307f5ae8SZachary Turner continue;
123307f5ae8SZachary Turner
124307f5ae8SZachary Turner SegmentOffset so = GetSegmentAndOffset(*iter);
125*8a790e65SZequan Wu lldb::addr_t va = MakeVirtualAddress(so.segment, so.offset);
126*8a790e65SZequan Wu if (va == LLDB_INVALID_ADDRESS)
127*8a790e65SZequan Wu continue;
128307f5ae8SZachary Turner
129579264bdSZachary Turner PdbCompilandSymId cu_sym_id(modi, iter.offset());
130307f5ae8SZachary Turner
13138d4a6c4SAdrian McCarthy // It's rare, but we could have multiple symbols with the same address
13238d4a6c4SAdrian McCarthy // because of identical comdat folding. Right now, the first one will win.
13310ac299aSZachary Turner cci.m_symbols_by_va.insert(std::make_pair(va, PdbSymUid(cu_sym_id)));
134307f5ae8SZachary Turner }
135307f5ae8SZachary Turner }
136307f5ae8SZachary Turner
FindSymbolsByVa(lldb::addr_t va)137307f5ae8SZachary Turner std::vector<SymbolAndUid> PdbIndex::FindSymbolsByVa(lldb::addr_t va) {
138307f5ae8SZachary Turner std::vector<SymbolAndUid> result;
139307f5ae8SZachary Turner
140307f5ae8SZachary Turner llvm::Optional<uint16_t> modi = GetModuleIndexForVa(va);
141307f5ae8SZachary Turner if (!modi)
142307f5ae8SZachary Turner return result;
143307f5ae8SZachary Turner
144307f5ae8SZachary Turner CompilandIndexItem &cci = compilands().GetOrCreateCompiland(*modi);
145307f5ae8SZachary Turner if (cci.m_symbols_by_va.empty())
146307f5ae8SZachary Turner BuildAddrToSymbolMap(cci);
147307f5ae8SZachary Turner
148307f5ae8SZachary Turner // The map is sorted by starting address of the symbol. So for example
149307f5ae8SZachary Turner // we could (in theory) have this situation
150307f5ae8SZachary Turner //
151307f5ae8SZachary Turner // [------------------]
152307f5ae8SZachary Turner // [----------]
153307f5ae8SZachary Turner // [-----------]
154307f5ae8SZachary Turner // [-------------]
155307f5ae8SZachary Turner // [----]
156307f5ae8SZachary Turner // [-----]
157307f5ae8SZachary Turner // ^ Address we're searching for
158307f5ae8SZachary Turner // In order to find this, we use the upper_bound of the key value which would
159307f5ae8SZachary Turner // be the first symbol whose starting address is higher than the element we're
160307f5ae8SZachary Turner // searching for.
161307f5ae8SZachary Turner
162307f5ae8SZachary Turner auto ub = cci.m_symbols_by_va.upper_bound(va);
163307f5ae8SZachary Turner
164307f5ae8SZachary Turner for (auto iter = cci.m_symbols_by_va.begin(); iter != ub; ++iter) {
1656284aee9SZachary Turner PdbCompilandSymId cu_sym_id = iter->second.asCompilandSym();
166307f5ae8SZachary Turner CVSymbol sym = ReadSymbolRecord(cu_sym_id);
167307f5ae8SZachary Turner
168307f5ae8SZachary Turner SegmentOffsetLength sol;
169307f5ae8SZachary Turner if (SymbolIsCode(sym))
170307f5ae8SZachary Turner sol = GetSegmentOffsetAndLength(sym);
171307f5ae8SZachary Turner else
172307f5ae8SZachary Turner sol.so = GetSegmentAndOffset(sym);
173307f5ae8SZachary Turner
174*8a790e65SZequan Wu lldb::addr_t start = MakeVirtualAddress(sol.so.segment, sol.so.offset);
175*8a790e65SZequan Wu if (start == LLDB_INVALID_ADDRESS)
176*8a790e65SZequan Wu continue;
177*8a790e65SZequan Wu
178307f5ae8SZachary Turner lldb::addr_t end = start + sol.length;
179307f5ae8SZachary Turner if (va >= start && va < end)
180307f5ae8SZachary Turner result.push_back({std::move(sym), iter->second});
181307f5ae8SZachary Turner }
182307f5ae8SZachary Turner
183307f5ae8SZachary Turner return result;
184307f5ae8SZachary Turner }
185307f5ae8SZachary Turner
ReadSymbolRecord(PdbCompilandSymId cu_sym) const1866284aee9SZachary Turner CVSymbol PdbIndex::ReadSymbolRecord(PdbCompilandSymId cu_sym) const {
1876284aee9SZachary Turner const CompilandIndexItem *cci = compilands().GetCompiland(cu_sym.modi);
188579264bdSZachary Turner auto iter = cci->m_debug_stream.getSymbolArray().at(cu_sym.offset);
189307f5ae8SZachary Turner lldbassert(iter != cci->m_debug_stream.getSymbolArray().end());
190307f5ae8SZachary Turner return *iter;
191307f5ae8SZachary Turner }
1923790029dSZachary Turner
ReadSymbolRecord(PdbGlobalSymId global) const1933790029dSZachary Turner CVSymbol PdbIndex::ReadSymbolRecord(PdbGlobalSymId global) const {
1943790029dSZachary Turner return symrecords().readRecord(global.offset);
1953790029dSZachary Turner }
196