1 //===- DWARFContext.cpp ---------------------------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 9 #include "llvm/DebugInfo/DWARF/DWARFContext.h" 10 #include "llvm/ADT/MapVector.h" 11 #include "llvm/ADT/STLExtras.h" 12 #include "llvm/ADT/SmallString.h" 13 #include "llvm/ADT/SmallVector.h" 14 #include "llvm/ADT/StringRef.h" 15 #include "llvm/ADT/StringSwitch.h" 16 #include "llvm/BinaryFormat/Dwarf.h" 17 #include "llvm/DebugInfo/DWARF/DWARFAcceleratorTable.h" 18 #include "llvm/DebugInfo/DWARF/DWARFCompileUnit.h" 19 #include "llvm/DebugInfo/DWARF/DWARFDataExtractor.h" 20 #include "llvm/DebugInfo/DWARF/DWARFDebugAbbrev.h" 21 #include "llvm/DebugInfo/DWARF/DWARFDebugAddr.h" 22 #include "llvm/DebugInfo/DWARF/DWARFDebugArangeSet.h" 23 #include "llvm/DebugInfo/DWARF/DWARFDebugAranges.h" 24 #include "llvm/DebugInfo/DWARF/DWARFDebugFrame.h" 25 #include "llvm/DebugInfo/DWARF/DWARFDebugLine.h" 26 #include "llvm/DebugInfo/DWARF/DWARFDebugLoc.h" 27 #include "llvm/DebugInfo/DWARF/DWARFDebugMacro.h" 28 #include "llvm/DebugInfo/DWARF/DWARFDebugPubTable.h" 29 #include "llvm/DebugInfo/DWARF/DWARFDebugRangeList.h" 30 #include "llvm/DebugInfo/DWARF/DWARFDebugRnglists.h" 31 #include "llvm/DebugInfo/DWARF/DWARFDie.h" 32 #include "llvm/DebugInfo/DWARF/DWARFFormValue.h" 33 #include "llvm/DebugInfo/DWARF/DWARFGdbIndex.h" 34 #include "llvm/DebugInfo/DWARF/DWARFListTable.h" 35 #include "llvm/DebugInfo/DWARF/DWARFLocationExpression.h" 36 #include "llvm/DebugInfo/DWARF/DWARFRelocMap.h" 37 #include "llvm/DebugInfo/DWARF/DWARFSection.h" 38 #include "llvm/DebugInfo/DWARF/DWARFTypeUnit.h" 39 #include "llvm/DebugInfo/DWARF/DWARFUnitIndex.h" 40 #include "llvm/DebugInfo/DWARF/DWARFVerifier.h" 41 #include "llvm/MC/MCRegisterInfo.h" 42 #include "llvm/MC/TargetRegistry.h" 43 #include "llvm/Object/Decompressor.h" 44 #include "llvm/Object/MachO.h" 45 #include "llvm/Object/ObjectFile.h" 46 #include "llvm/Object/RelocationResolver.h" 47 #include "llvm/Support/Casting.h" 48 #include "llvm/Support/DataExtractor.h" 49 #include "llvm/Support/Error.h" 50 #include "llvm/Support/Format.h" 51 #include "llvm/Support/LEB128.h" 52 #include "llvm/Support/MemoryBuffer.h" 53 #include "llvm/Support/Path.h" 54 #include "llvm/Support/raw_ostream.h" 55 #include <algorithm> 56 #include <cstdint> 57 #include <deque> 58 #include <map> 59 #include <string> 60 #include <utility> 61 #include <vector> 62 63 using namespace llvm; 64 using namespace dwarf; 65 using namespace object; 66 67 #define DEBUG_TYPE "dwarf" 68 69 using DWARFLineTable = DWARFDebugLine::LineTable; 70 using FileLineInfoKind = DILineInfoSpecifier::FileLineInfoKind; 71 using FunctionNameKind = DILineInfoSpecifier::FunctionNameKind; 72 73 DWARFContext::DWARFContext(std::unique_ptr<const DWARFObject> DObj, 74 std::string DWPName, 75 std::function<void(Error)> RecoverableErrorHandler, 76 std::function<void(Error)> WarningHandler) 77 : DIContext(CK_DWARF), DWPName(std::move(DWPName)), 78 RecoverableErrorHandler(RecoverableErrorHandler), 79 WarningHandler(WarningHandler), DObj(std::move(DObj)) {} 80 81 DWARFContext::~DWARFContext() = default; 82 83 /// Dump the UUID load command. 84 static void dumpUUID(raw_ostream &OS, const ObjectFile &Obj) { 85 auto *MachO = dyn_cast<MachOObjectFile>(&Obj); 86 if (!MachO) 87 return; 88 for (auto LC : MachO->load_commands()) { 89 raw_ostream::uuid_t UUID; 90 if (LC.C.cmd == MachO::LC_UUID) { 91 if (LC.C.cmdsize < sizeof(UUID) + sizeof(LC.C)) { 92 OS << "error: UUID load command is too short.\n"; 93 return; 94 } 95 OS << "UUID: "; 96 memcpy(&UUID, LC.Ptr+sizeof(LC.C), sizeof(UUID)); 97 OS.write_uuid(UUID); 98 Triple T = MachO->getArchTriple(); 99 OS << " (" << T.getArchName() << ')'; 100 OS << ' ' << MachO->getFileName() << '\n'; 101 } 102 } 103 } 104 105 using ContributionCollection = 106 std::vector<Optional<StrOffsetsContributionDescriptor>>; 107 108 // Collect all the contributions to the string offsets table from all units, 109 // sort them by their starting offsets and remove duplicates. 110 static ContributionCollection 111 collectContributionData(DWARFContext::unit_iterator_range Units) { 112 ContributionCollection Contributions; 113 for (const auto &U : Units) 114 if (const auto &C = U->getStringOffsetsTableContribution()) 115 Contributions.push_back(C); 116 // Sort the contributions so that any invalid ones are placed at 117 // the start of the contributions vector. This way they are reported 118 // first. 119 llvm::sort(Contributions, 120 [](const Optional<StrOffsetsContributionDescriptor> &L, 121 const Optional<StrOffsetsContributionDescriptor> &R) { 122 if (L && R) 123 return L->Base < R->Base; 124 return R.hasValue(); 125 }); 126 127 // Uniquify contributions, as it is possible that units (specifically 128 // type units in dwo or dwp files) share contributions. We don't want 129 // to report them more than once. 130 Contributions.erase( 131 std::unique(Contributions.begin(), Contributions.end(), 132 [](const Optional<StrOffsetsContributionDescriptor> &L, 133 const Optional<StrOffsetsContributionDescriptor> &R) { 134 if (L && R) 135 return L->Base == R->Base && L->Size == R->Size; 136 return false; 137 }), 138 Contributions.end()); 139 return Contributions; 140 } 141 142 // Dump a DWARF string offsets section. This may be a DWARF v5 formatted 143 // string offsets section, where each compile or type unit contributes a 144 // number of entries (string offsets), with each contribution preceded by 145 // a header containing size and version number. Alternatively, it may be a 146 // monolithic series of string offsets, as generated by the pre-DWARF v5 147 // implementation of split DWARF; however, in that case we still need to 148 // collect contributions of units because the size of the offsets (4 or 8 149 // bytes) depends on the format of the referencing unit (DWARF32 or DWARF64). 150 static void dumpStringOffsetsSection(raw_ostream &OS, DIDumpOptions DumpOpts, 151 StringRef SectionName, 152 const DWARFObject &Obj, 153 const DWARFSection &StringOffsetsSection, 154 StringRef StringSection, 155 DWARFContext::unit_iterator_range Units, 156 bool LittleEndian) { 157 auto Contributions = collectContributionData(Units); 158 DWARFDataExtractor StrOffsetExt(Obj, StringOffsetsSection, LittleEndian, 0); 159 DataExtractor StrData(StringSection, LittleEndian, 0); 160 uint64_t SectionSize = StringOffsetsSection.Data.size(); 161 uint64_t Offset = 0; 162 for (auto &Contribution : Contributions) { 163 // Report an ill-formed contribution. 164 if (!Contribution) { 165 OS << "error: invalid contribution to string offsets table in section ." 166 << SectionName << ".\n"; 167 return; 168 } 169 170 dwarf::DwarfFormat Format = Contribution->getFormat(); 171 int OffsetDumpWidth = 2 * dwarf::getDwarfOffsetByteSize(Format); 172 uint16_t Version = Contribution->getVersion(); 173 uint64_t ContributionHeader = Contribution->Base; 174 // In DWARF v5 there is a contribution header that immediately precedes 175 // the string offsets base (the location we have previously retrieved from 176 // the CU DIE's DW_AT_str_offsets attribute). The header is located either 177 // 8 or 16 bytes before the base, depending on the contribution's format. 178 if (Version >= 5) 179 ContributionHeader -= Format == DWARF32 ? 8 : 16; 180 181 // Detect overlapping contributions. 182 if (Offset > ContributionHeader) { 183 DumpOpts.RecoverableErrorHandler(createStringError( 184 errc::invalid_argument, 185 "overlapping contributions to string offsets table in section .%s.", 186 SectionName.data())); 187 } 188 // Report a gap in the table. 189 if (Offset < ContributionHeader) { 190 OS << format("0x%8.8" PRIx64 ": Gap, length = ", Offset); 191 OS << (ContributionHeader - Offset) << "\n"; 192 } 193 OS << format("0x%8.8" PRIx64 ": ", ContributionHeader); 194 // In DWARF v5 the contribution size in the descriptor does not equal 195 // the originally encoded length (it does not contain the length of the 196 // version field and the padding, a total of 4 bytes). Add them back in 197 // for reporting. 198 OS << "Contribution size = " << (Contribution->Size + (Version < 5 ? 0 : 4)) 199 << ", Format = " << dwarf::FormatString(Format) 200 << ", Version = " << Version << "\n"; 201 202 Offset = Contribution->Base; 203 unsigned EntrySize = Contribution->getDwarfOffsetByteSize(); 204 while (Offset - Contribution->Base < Contribution->Size) { 205 OS << format("0x%8.8" PRIx64 ": ", Offset); 206 uint64_t StringOffset = 207 StrOffsetExt.getRelocatedValue(EntrySize, &Offset); 208 OS << format("%0*" PRIx64 " ", OffsetDumpWidth, StringOffset); 209 const char *S = StrData.getCStr(&StringOffset); 210 if (S) 211 OS << format("\"%s\"", S); 212 OS << "\n"; 213 } 214 } 215 // Report a gap at the end of the table. 216 if (Offset < SectionSize) { 217 OS << format("0x%8.8" PRIx64 ": Gap, length = ", Offset); 218 OS << (SectionSize - Offset) << "\n"; 219 } 220 } 221 222 // Dump the .debug_addr section. 223 static void dumpAddrSection(raw_ostream &OS, DWARFDataExtractor &AddrData, 224 DIDumpOptions DumpOpts, uint16_t Version, 225 uint8_t AddrSize) { 226 uint64_t Offset = 0; 227 while (AddrData.isValidOffset(Offset)) { 228 DWARFDebugAddrTable AddrTable; 229 uint64_t TableOffset = Offset; 230 if (Error Err = AddrTable.extract(AddrData, &Offset, Version, AddrSize, 231 DumpOpts.WarningHandler)) { 232 DumpOpts.RecoverableErrorHandler(std::move(Err)); 233 // Keep going after an error, if we can, assuming that the length field 234 // could be read. If it couldn't, stop reading the section. 235 if (auto TableLength = AddrTable.getFullLength()) { 236 Offset = TableOffset + *TableLength; 237 continue; 238 } 239 break; 240 } 241 AddrTable.dump(OS, DumpOpts); 242 } 243 } 244 245 // Dump the .debug_rnglists or .debug_rnglists.dwo section (DWARF v5). 246 static void dumpRnglistsSection( 247 raw_ostream &OS, DWARFDataExtractor &rnglistData, 248 llvm::function_ref<Optional<object::SectionedAddress>(uint32_t)> 249 LookupPooledAddress, 250 DIDumpOptions DumpOpts) { 251 uint64_t Offset = 0; 252 while (rnglistData.isValidOffset(Offset)) { 253 llvm::DWARFDebugRnglistTable Rnglists; 254 uint64_t TableOffset = Offset; 255 if (Error Err = Rnglists.extract(rnglistData, &Offset)) { 256 DumpOpts.RecoverableErrorHandler(std::move(Err)); 257 uint64_t Length = Rnglists.length(); 258 // Keep going after an error, if we can, assuming that the length field 259 // could be read. If it couldn't, stop reading the section. 260 if (Length == 0) 261 break; 262 Offset = TableOffset + Length; 263 } else { 264 Rnglists.dump(rnglistData, OS, LookupPooledAddress, DumpOpts); 265 } 266 } 267 } 268 269 std::unique_ptr<DWARFDebugMacro> 270 DWARFContext::parseMacroOrMacinfo(MacroSecType SectionType) { 271 auto Macro = std::make_unique<DWARFDebugMacro>(); 272 auto ParseAndDump = [&](DWARFDataExtractor &Data, bool IsMacro) { 273 if (Error Err = IsMacro ? Macro->parseMacro(SectionType == MacroSection 274 ? compile_units() 275 : dwo_compile_units(), 276 SectionType == MacroSection 277 ? getStringExtractor() 278 : getStringDWOExtractor(), 279 Data) 280 : Macro->parseMacinfo(Data)) { 281 RecoverableErrorHandler(std::move(Err)); 282 Macro = nullptr; 283 } 284 }; 285 switch (SectionType) { 286 case MacinfoSection: { 287 DWARFDataExtractor Data(DObj->getMacinfoSection(), isLittleEndian(), 0); 288 ParseAndDump(Data, /*IsMacro=*/false); 289 break; 290 } 291 case MacinfoDwoSection: { 292 DWARFDataExtractor Data(DObj->getMacinfoDWOSection(), isLittleEndian(), 0); 293 ParseAndDump(Data, /*IsMacro=*/false); 294 break; 295 } 296 case MacroSection: { 297 DWARFDataExtractor Data(*DObj, DObj->getMacroSection(), isLittleEndian(), 298 0); 299 ParseAndDump(Data, /*IsMacro=*/true); 300 break; 301 } 302 case MacroDwoSection: { 303 DWARFDataExtractor Data(DObj->getMacroDWOSection(), isLittleEndian(), 0); 304 ParseAndDump(Data, /*IsMacro=*/true); 305 break; 306 } 307 } 308 return Macro; 309 } 310 311 static void dumpLoclistsSection(raw_ostream &OS, DIDumpOptions DumpOpts, 312 DWARFDataExtractor Data, 313 const MCRegisterInfo *MRI, 314 const DWARFObject &Obj, 315 Optional<uint64_t> DumpOffset) { 316 uint64_t Offset = 0; 317 318 while (Data.isValidOffset(Offset)) { 319 DWARFListTableHeader Header(".debug_loclists", "locations"); 320 if (Error E = Header.extract(Data, &Offset)) { 321 DumpOpts.RecoverableErrorHandler(std::move(E)); 322 return; 323 } 324 325 Header.dump(Data, OS, DumpOpts); 326 327 uint64_t EndOffset = Header.length() + Header.getHeaderOffset(); 328 Data.setAddressSize(Header.getAddrSize()); 329 DWARFDebugLoclists Loc(Data, Header.getVersion()); 330 if (DumpOffset) { 331 if (DumpOffset >= Offset && DumpOffset < EndOffset) { 332 Offset = *DumpOffset; 333 Loc.dumpLocationList(&Offset, OS, /*BaseAddr=*/None, MRI, Obj, nullptr, 334 DumpOpts, /*Indent=*/0); 335 OS << "\n"; 336 return; 337 } 338 } else { 339 Loc.dumpRange(Offset, EndOffset - Offset, OS, MRI, Obj, DumpOpts); 340 } 341 Offset = EndOffset; 342 } 343 } 344 345 static void dumpPubTableSection(raw_ostream &OS, DIDumpOptions DumpOpts, 346 DWARFDataExtractor Data, bool GnuStyle) { 347 DWARFDebugPubTable Table; 348 Table.extract(Data, GnuStyle, DumpOpts.RecoverableErrorHandler); 349 Table.dump(OS); 350 } 351 352 void DWARFContext::dump( 353 raw_ostream &OS, DIDumpOptions DumpOpts, 354 std::array<Optional<uint64_t>, DIDT_ID_Count> DumpOffsets) { 355 uint64_t DumpType = DumpOpts.DumpType; 356 357 StringRef Extension = sys::path::extension(DObj->getFileName()); 358 bool IsDWO = (Extension == ".dwo") || (Extension == ".dwp"); 359 360 // Print UUID header. 361 const auto *ObjFile = DObj->getFile(); 362 if (DumpType & DIDT_UUID) 363 dumpUUID(OS, *ObjFile); 364 365 // Print a header for each explicitly-requested section. 366 // Otherwise just print one for non-empty sections. 367 // Only print empty .dwo section headers when dumping a .dwo file. 368 bool Explicit = DumpType != DIDT_All && !IsDWO; 369 bool ExplicitDWO = Explicit && IsDWO; 370 auto shouldDump = [&](bool Explicit, const char *Name, unsigned ID, 371 StringRef Section) -> Optional<uint64_t> * { 372 unsigned Mask = 1U << ID; 373 bool Should = (DumpType & Mask) && (Explicit || !Section.empty()); 374 if (!Should) 375 return nullptr; 376 OS << "\n" << Name << " contents:\n"; 377 return &DumpOffsets[ID]; 378 }; 379 380 // Dump individual sections. 381 if (shouldDump(Explicit, ".debug_abbrev", DIDT_ID_DebugAbbrev, 382 DObj->getAbbrevSection())) 383 getDebugAbbrev()->dump(OS); 384 if (shouldDump(ExplicitDWO, ".debug_abbrev.dwo", DIDT_ID_DebugAbbrev, 385 DObj->getAbbrevDWOSection())) 386 getDebugAbbrevDWO()->dump(OS); 387 388 auto dumpDebugInfo = [&](const char *Name, unit_iterator_range Units) { 389 OS << '\n' << Name << " contents:\n"; 390 if (auto DumpOffset = DumpOffsets[DIDT_ID_DebugInfo]) 391 for (const auto &U : Units) 392 U->getDIEForOffset(DumpOffset.getValue()) 393 .dump(OS, 0, DumpOpts.noImplicitRecursion()); 394 else 395 for (const auto &U : Units) 396 U->dump(OS, DumpOpts); 397 }; 398 if ((DumpType & DIDT_DebugInfo)) { 399 if (Explicit || getNumCompileUnits()) 400 dumpDebugInfo(".debug_info", info_section_units()); 401 if (ExplicitDWO || getNumDWOCompileUnits()) 402 dumpDebugInfo(".debug_info.dwo", dwo_info_section_units()); 403 } 404 405 auto dumpDebugType = [&](const char *Name, unit_iterator_range Units) { 406 OS << '\n' << Name << " contents:\n"; 407 for (const auto &U : Units) 408 if (auto DumpOffset = DumpOffsets[DIDT_ID_DebugTypes]) 409 U->getDIEForOffset(*DumpOffset) 410 .dump(OS, 0, DumpOpts.noImplicitRecursion()); 411 else 412 U->dump(OS, DumpOpts); 413 }; 414 if ((DumpType & DIDT_DebugTypes)) { 415 if (Explicit || getNumTypeUnits()) 416 dumpDebugType(".debug_types", types_section_units()); 417 if (ExplicitDWO || getNumDWOTypeUnits()) 418 dumpDebugType(".debug_types.dwo", dwo_types_section_units()); 419 } 420 421 DIDumpOptions LLDumpOpts = DumpOpts; 422 if (LLDumpOpts.Verbose) 423 LLDumpOpts.DisplayRawContents = true; 424 425 if (const auto *Off = shouldDump(Explicit, ".debug_loc", DIDT_ID_DebugLoc, 426 DObj->getLocSection().Data)) { 427 getDebugLoc()->dump(OS, getRegisterInfo(), *DObj, LLDumpOpts, *Off); 428 } 429 if (const auto *Off = 430 shouldDump(Explicit, ".debug_loclists", DIDT_ID_DebugLoclists, 431 DObj->getLoclistsSection().Data)) { 432 DWARFDataExtractor Data(*DObj, DObj->getLoclistsSection(), isLittleEndian(), 433 0); 434 dumpLoclistsSection(OS, LLDumpOpts, Data, getRegisterInfo(), *DObj, *Off); 435 } 436 if (const auto *Off = 437 shouldDump(ExplicitDWO, ".debug_loclists.dwo", DIDT_ID_DebugLoclists, 438 DObj->getLoclistsDWOSection().Data)) { 439 DWARFDataExtractor Data(*DObj, DObj->getLoclistsDWOSection(), 440 isLittleEndian(), 0); 441 dumpLoclistsSection(OS, LLDumpOpts, Data, getRegisterInfo(), *DObj, *Off); 442 } 443 444 if (const auto *Off = 445 shouldDump(ExplicitDWO, ".debug_loc.dwo", DIDT_ID_DebugLoc, 446 DObj->getLocDWOSection().Data)) { 447 DWARFDataExtractor Data(*DObj, DObj->getLocDWOSection(), isLittleEndian(), 448 4); 449 DWARFDebugLoclists Loc(Data, /*Version=*/4); 450 if (*Off) { 451 uint64_t Offset = **Off; 452 Loc.dumpLocationList(&Offset, OS, 453 /*BaseAddr=*/None, getRegisterInfo(), *DObj, nullptr, 454 LLDumpOpts, /*Indent=*/0); 455 OS << "\n"; 456 } else { 457 Loc.dumpRange(0, Data.getData().size(), OS, getRegisterInfo(), *DObj, 458 LLDumpOpts); 459 } 460 } 461 462 if (const Optional<uint64_t> *Off = 463 shouldDump(Explicit, ".debug_frame", DIDT_ID_DebugFrame, 464 DObj->getFrameSection().Data)) { 465 if (Expected<const DWARFDebugFrame *> DF = getDebugFrame()) 466 (*DF)->dump(OS, DumpOpts, getRegisterInfo(), *Off); 467 else 468 RecoverableErrorHandler(DF.takeError()); 469 } 470 471 if (const Optional<uint64_t> *Off = 472 shouldDump(Explicit, ".eh_frame", DIDT_ID_DebugFrame, 473 DObj->getEHFrameSection().Data)) { 474 if (Expected<const DWARFDebugFrame *> DF = getEHFrame()) 475 (*DF)->dump(OS, DumpOpts, getRegisterInfo(), *Off); 476 else 477 RecoverableErrorHandler(DF.takeError()); 478 } 479 480 if (shouldDump(Explicit, ".debug_macro", DIDT_ID_DebugMacro, 481 DObj->getMacroSection().Data)) { 482 if (auto Macro = getDebugMacro()) 483 Macro->dump(OS); 484 } 485 486 if (shouldDump(Explicit, ".debug_macro.dwo", DIDT_ID_DebugMacro, 487 DObj->getMacroDWOSection())) { 488 if (auto MacroDWO = getDebugMacroDWO()) 489 MacroDWO->dump(OS); 490 } 491 492 if (shouldDump(Explicit, ".debug_macinfo", DIDT_ID_DebugMacro, 493 DObj->getMacinfoSection())) { 494 if (auto Macinfo = getDebugMacinfo()) 495 Macinfo->dump(OS); 496 } 497 498 if (shouldDump(Explicit, ".debug_macinfo.dwo", DIDT_ID_DebugMacro, 499 DObj->getMacinfoDWOSection())) { 500 if (auto MacinfoDWO = getDebugMacinfoDWO()) 501 MacinfoDWO->dump(OS); 502 } 503 504 if (shouldDump(Explicit, ".debug_aranges", DIDT_ID_DebugAranges, 505 DObj->getArangesSection())) { 506 uint64_t offset = 0; 507 DWARFDataExtractor arangesData(DObj->getArangesSection(), isLittleEndian(), 508 0); 509 DWARFDebugArangeSet set; 510 while (arangesData.isValidOffset(offset)) { 511 if (Error E = 512 set.extract(arangesData, &offset, DumpOpts.WarningHandler)) { 513 RecoverableErrorHandler(std::move(E)); 514 break; 515 } 516 set.dump(OS); 517 } 518 } 519 520 auto DumpLineSection = [&](DWARFDebugLine::SectionParser Parser, 521 DIDumpOptions DumpOpts, 522 Optional<uint64_t> DumpOffset) { 523 while (!Parser.done()) { 524 if (DumpOffset && Parser.getOffset() != *DumpOffset) { 525 Parser.skip(DumpOpts.WarningHandler, DumpOpts.WarningHandler); 526 continue; 527 } 528 OS << "debug_line[" << format("0x%8.8" PRIx64, Parser.getOffset()) 529 << "]\n"; 530 Parser.parseNext(DumpOpts.WarningHandler, DumpOpts.WarningHandler, &OS, 531 DumpOpts.Verbose); 532 } 533 }; 534 535 auto DumpStrSection = [&](StringRef Section) { 536 DataExtractor StrData(Section, isLittleEndian(), 0); 537 uint64_t Offset = 0; 538 uint64_t StrOffset = 0; 539 while (StrData.isValidOffset(Offset)) { 540 Error Err = Error::success(); 541 const char *CStr = StrData.getCStr(&Offset, &Err); 542 if (Err) { 543 DumpOpts.WarningHandler(std::move(Err)); 544 return; 545 } 546 OS << format("0x%8.8" PRIx64 ": \"", StrOffset); 547 OS.write_escaped(CStr); 548 OS << "\"\n"; 549 StrOffset = Offset; 550 } 551 }; 552 553 if (const auto *Off = shouldDump(Explicit, ".debug_line", DIDT_ID_DebugLine, 554 DObj->getLineSection().Data)) { 555 DWARFDataExtractor LineData(*DObj, DObj->getLineSection(), isLittleEndian(), 556 0); 557 DWARFDebugLine::SectionParser Parser(LineData, *this, normal_units()); 558 DumpLineSection(Parser, DumpOpts, *Off); 559 } 560 561 if (const auto *Off = 562 shouldDump(ExplicitDWO, ".debug_line.dwo", DIDT_ID_DebugLine, 563 DObj->getLineDWOSection().Data)) { 564 DWARFDataExtractor LineData(*DObj, DObj->getLineDWOSection(), 565 isLittleEndian(), 0); 566 DWARFDebugLine::SectionParser Parser(LineData, *this, dwo_units()); 567 DumpLineSection(Parser, DumpOpts, *Off); 568 } 569 570 if (shouldDump(Explicit, ".debug_cu_index", DIDT_ID_DebugCUIndex, 571 DObj->getCUIndexSection())) { 572 getCUIndex().dump(OS); 573 } 574 575 if (shouldDump(Explicit, ".debug_tu_index", DIDT_ID_DebugTUIndex, 576 DObj->getTUIndexSection())) { 577 getTUIndex().dump(OS); 578 } 579 580 if (shouldDump(Explicit, ".debug_str", DIDT_ID_DebugStr, 581 DObj->getStrSection())) 582 DumpStrSection(DObj->getStrSection()); 583 584 if (shouldDump(ExplicitDWO, ".debug_str.dwo", DIDT_ID_DebugStr, 585 DObj->getStrDWOSection())) 586 DumpStrSection(DObj->getStrDWOSection()); 587 588 if (shouldDump(Explicit, ".debug_line_str", DIDT_ID_DebugLineStr, 589 DObj->getLineStrSection())) 590 DumpStrSection(DObj->getLineStrSection()); 591 592 if (shouldDump(Explicit, ".debug_addr", DIDT_ID_DebugAddr, 593 DObj->getAddrSection().Data)) { 594 DWARFDataExtractor AddrData(*DObj, DObj->getAddrSection(), 595 isLittleEndian(), 0); 596 dumpAddrSection(OS, AddrData, DumpOpts, getMaxVersion(), getCUAddrSize()); 597 } 598 599 if (shouldDump(Explicit, ".debug_ranges", DIDT_ID_DebugRanges, 600 DObj->getRangesSection().Data)) { 601 uint8_t savedAddressByteSize = getCUAddrSize(); 602 DWARFDataExtractor rangesData(*DObj, DObj->getRangesSection(), 603 isLittleEndian(), savedAddressByteSize); 604 uint64_t offset = 0; 605 DWARFDebugRangeList rangeList; 606 while (rangesData.isValidOffset(offset)) { 607 if (Error E = rangeList.extract(rangesData, &offset)) { 608 DumpOpts.RecoverableErrorHandler(std::move(E)); 609 break; 610 } 611 rangeList.dump(OS); 612 } 613 } 614 615 auto LookupPooledAddress = [&](uint32_t Index) -> Optional<SectionedAddress> { 616 const auto &CUs = compile_units(); 617 auto I = CUs.begin(); 618 if (I == CUs.end()) 619 return None; 620 return (*I)->getAddrOffsetSectionItem(Index); 621 }; 622 623 if (shouldDump(Explicit, ".debug_rnglists", DIDT_ID_DebugRnglists, 624 DObj->getRnglistsSection().Data)) { 625 DWARFDataExtractor RnglistData(*DObj, DObj->getRnglistsSection(), 626 isLittleEndian(), 0); 627 dumpRnglistsSection(OS, RnglistData, LookupPooledAddress, DumpOpts); 628 } 629 630 if (shouldDump(ExplicitDWO, ".debug_rnglists.dwo", DIDT_ID_DebugRnglists, 631 DObj->getRnglistsDWOSection().Data)) { 632 DWARFDataExtractor RnglistData(*DObj, DObj->getRnglistsDWOSection(), 633 isLittleEndian(), 0); 634 dumpRnglistsSection(OS, RnglistData, LookupPooledAddress, DumpOpts); 635 } 636 637 if (shouldDump(Explicit, ".debug_pubnames", DIDT_ID_DebugPubnames, 638 DObj->getPubnamesSection().Data)) { 639 DWARFDataExtractor PubTableData(*DObj, DObj->getPubnamesSection(), 640 isLittleEndian(), 0); 641 dumpPubTableSection(OS, DumpOpts, PubTableData, /*GnuStyle=*/false); 642 } 643 644 if (shouldDump(Explicit, ".debug_pubtypes", DIDT_ID_DebugPubtypes, 645 DObj->getPubtypesSection().Data)) { 646 DWARFDataExtractor PubTableData(*DObj, DObj->getPubtypesSection(), 647 isLittleEndian(), 0); 648 dumpPubTableSection(OS, DumpOpts, PubTableData, /*GnuStyle=*/false); 649 } 650 651 if (shouldDump(Explicit, ".debug_gnu_pubnames", DIDT_ID_DebugGnuPubnames, 652 DObj->getGnuPubnamesSection().Data)) { 653 DWARFDataExtractor PubTableData(*DObj, DObj->getGnuPubnamesSection(), 654 isLittleEndian(), 0); 655 dumpPubTableSection(OS, DumpOpts, PubTableData, /*GnuStyle=*/true); 656 } 657 658 if (shouldDump(Explicit, ".debug_gnu_pubtypes", DIDT_ID_DebugGnuPubtypes, 659 DObj->getGnuPubtypesSection().Data)) { 660 DWARFDataExtractor PubTableData(*DObj, DObj->getGnuPubtypesSection(), 661 isLittleEndian(), 0); 662 dumpPubTableSection(OS, DumpOpts, PubTableData, /*GnuStyle=*/true); 663 } 664 665 if (shouldDump(Explicit, ".debug_str_offsets", DIDT_ID_DebugStrOffsets, 666 DObj->getStrOffsetsSection().Data)) 667 dumpStringOffsetsSection( 668 OS, DumpOpts, "debug_str_offsets", *DObj, DObj->getStrOffsetsSection(), 669 DObj->getStrSection(), normal_units(), isLittleEndian()); 670 if (shouldDump(ExplicitDWO, ".debug_str_offsets.dwo", DIDT_ID_DebugStrOffsets, 671 DObj->getStrOffsetsDWOSection().Data)) 672 dumpStringOffsetsSection(OS, DumpOpts, "debug_str_offsets.dwo", *DObj, 673 DObj->getStrOffsetsDWOSection(), 674 DObj->getStrDWOSection(), dwo_units(), 675 isLittleEndian()); 676 677 if (shouldDump(Explicit, ".gdb_index", DIDT_ID_GdbIndex, 678 DObj->getGdbIndexSection())) { 679 getGdbIndex().dump(OS); 680 } 681 682 if (shouldDump(Explicit, ".apple_names", DIDT_ID_AppleNames, 683 DObj->getAppleNamesSection().Data)) 684 getAppleNames().dump(OS); 685 686 if (shouldDump(Explicit, ".apple_types", DIDT_ID_AppleTypes, 687 DObj->getAppleTypesSection().Data)) 688 getAppleTypes().dump(OS); 689 690 if (shouldDump(Explicit, ".apple_namespaces", DIDT_ID_AppleNamespaces, 691 DObj->getAppleNamespacesSection().Data)) 692 getAppleNamespaces().dump(OS); 693 694 if (shouldDump(Explicit, ".apple_objc", DIDT_ID_AppleObjC, 695 DObj->getAppleObjCSection().Data)) 696 getAppleObjC().dump(OS); 697 if (shouldDump(Explicit, ".debug_names", DIDT_ID_DebugNames, 698 DObj->getNamesSection().Data)) 699 getDebugNames().dump(OS); 700 } 701 702 DWARFTypeUnit *DWARFContext::getTypeUnitForHash(uint16_t Version, uint64_t Hash, 703 bool IsDWO) { 704 parseDWOUnits(LazyParse); 705 706 if (const auto &TUI = getTUIndex()) { 707 if (const auto *R = TUI.getFromHash(Hash)) 708 return dyn_cast_or_null<DWARFTypeUnit>( 709 DWOUnits.getUnitForIndexEntry(*R)); 710 return nullptr; 711 } 712 713 struct UnitContainers { 714 const DWARFUnitVector &Units; 715 Optional<DenseMap<uint64_t, DWARFTypeUnit *>> ⤅ 716 }; 717 UnitContainers Units = IsDWO ? UnitContainers{DWOUnits, DWOTypeUnits} 718 : UnitContainers{NormalUnits, NormalTypeUnits}; 719 if (!Units.Map) { 720 Units.Map.emplace(); 721 for (const auto &U : IsDWO ? dwo_units() : normal_units()) { 722 if (DWARFTypeUnit *TU = dyn_cast<DWARFTypeUnit>(U.get())) 723 (*Units.Map)[TU->getTypeHash()] = TU; 724 } 725 } 726 727 return (*Units.Map)[Hash]; 728 } 729 730 DWARFCompileUnit *DWARFContext::getDWOCompileUnitForHash(uint64_t Hash) { 731 parseDWOUnits(LazyParse); 732 733 if (const auto &CUI = getCUIndex()) { 734 if (const auto *R = CUI.getFromHash(Hash)) 735 return dyn_cast_or_null<DWARFCompileUnit>( 736 DWOUnits.getUnitForIndexEntry(*R)); 737 return nullptr; 738 } 739 740 // If there's no index, just search through the CUs in the DWO - there's 741 // probably only one unless this is something like LTO - though an in-process 742 // built/cached lookup table could be used in that case to improve repeated 743 // lookups of different CUs in the DWO. 744 for (const auto &DWOCU : dwo_compile_units()) { 745 // Might not have parsed DWO ID yet. 746 if (!DWOCU->getDWOId()) { 747 if (Optional<uint64_t> DWOId = 748 toUnsigned(DWOCU->getUnitDIE().find(DW_AT_GNU_dwo_id))) 749 DWOCU->setDWOId(*DWOId); 750 else 751 // No DWO ID? 752 continue; 753 } 754 if (DWOCU->getDWOId() == Hash) 755 return dyn_cast<DWARFCompileUnit>(DWOCU.get()); 756 } 757 return nullptr; 758 } 759 760 DWARFDie DWARFContext::getDIEForOffset(uint64_t Offset) { 761 parseNormalUnits(); 762 if (auto *CU = NormalUnits.getUnitForOffset(Offset)) 763 return CU->getDIEForOffset(Offset); 764 return DWARFDie(); 765 } 766 767 bool DWARFContext::verify(raw_ostream &OS, DIDumpOptions DumpOpts) { 768 bool Success = true; 769 DWARFVerifier verifier(OS, *this, DumpOpts); 770 771 Success &= verifier.handleDebugAbbrev(); 772 if (DumpOpts.DumpType & DIDT_DebugCUIndex) 773 Success &= verifier.handleDebugCUIndex(); 774 if (DumpOpts.DumpType & DIDT_DebugTUIndex) 775 Success &= verifier.handleDebugTUIndex(); 776 if (DumpOpts.DumpType & DIDT_DebugInfo) 777 Success &= verifier.handleDebugInfo(); 778 if (DumpOpts.DumpType & DIDT_DebugLine) 779 Success &= verifier.handleDebugLine(); 780 Success &= verifier.handleAccelTables(); 781 return Success; 782 } 783 784 const DWARFUnitIndex &DWARFContext::getCUIndex() { 785 if (CUIndex) 786 return *CUIndex; 787 788 DataExtractor CUIndexData(DObj->getCUIndexSection(), isLittleEndian(), 0); 789 790 CUIndex = std::make_unique<DWARFUnitIndex>(DW_SECT_INFO); 791 CUIndex->parse(CUIndexData); 792 return *CUIndex; 793 } 794 795 const DWARFUnitIndex &DWARFContext::getTUIndex() { 796 if (TUIndex) 797 return *TUIndex; 798 799 DataExtractor TUIndexData(DObj->getTUIndexSection(), isLittleEndian(), 0); 800 801 TUIndex = std::make_unique<DWARFUnitIndex>(DW_SECT_EXT_TYPES); 802 TUIndex->parse(TUIndexData); 803 return *TUIndex; 804 } 805 806 DWARFGdbIndex &DWARFContext::getGdbIndex() { 807 if (GdbIndex) 808 return *GdbIndex; 809 810 DataExtractor GdbIndexData(DObj->getGdbIndexSection(), true /*LE*/, 0); 811 GdbIndex = std::make_unique<DWARFGdbIndex>(); 812 GdbIndex->parse(GdbIndexData); 813 return *GdbIndex; 814 } 815 816 const DWARFDebugAbbrev *DWARFContext::getDebugAbbrev() { 817 if (Abbrev) 818 return Abbrev.get(); 819 820 DataExtractor abbrData(DObj->getAbbrevSection(), isLittleEndian(), 0); 821 822 Abbrev.reset(new DWARFDebugAbbrev()); 823 Abbrev->extract(abbrData); 824 return Abbrev.get(); 825 } 826 827 const DWARFDebugAbbrev *DWARFContext::getDebugAbbrevDWO() { 828 if (AbbrevDWO) 829 return AbbrevDWO.get(); 830 831 DataExtractor abbrData(DObj->getAbbrevDWOSection(), isLittleEndian(), 0); 832 AbbrevDWO.reset(new DWARFDebugAbbrev()); 833 AbbrevDWO->extract(abbrData); 834 return AbbrevDWO.get(); 835 } 836 837 const DWARFDebugLoc *DWARFContext::getDebugLoc() { 838 if (Loc) 839 return Loc.get(); 840 841 // Assume all units have the same address byte size. 842 auto LocData = 843 getNumCompileUnits() 844 ? DWARFDataExtractor(*DObj, DObj->getLocSection(), isLittleEndian(), 845 getUnitAtIndex(0)->getAddressByteSize()) 846 : DWARFDataExtractor("", isLittleEndian(), 0); 847 Loc.reset(new DWARFDebugLoc(std::move(LocData))); 848 return Loc.get(); 849 } 850 851 const DWARFDebugAranges *DWARFContext::getDebugAranges() { 852 if (Aranges) 853 return Aranges.get(); 854 855 Aranges.reset(new DWARFDebugAranges()); 856 Aranges->generate(this); 857 return Aranges.get(); 858 } 859 860 Expected<const DWARFDebugFrame *> DWARFContext::getDebugFrame() { 861 if (DebugFrame) 862 return DebugFrame.get(); 863 864 const DWARFSection &DS = DObj->getFrameSection(); 865 866 // There's a "bug" in the DWARFv3 standard with respect to the target address 867 // size within debug frame sections. While DWARF is supposed to be independent 868 // of its container, FDEs have fields with size being "target address size", 869 // which isn't specified in DWARF in general. It's only specified for CUs, but 870 // .eh_frame can appear without a .debug_info section. Follow the example of 871 // other tools (libdwarf) and extract this from the container (ObjectFile 872 // provides this information). This problem is fixed in DWARFv4 873 // See this dwarf-discuss discussion for more details: 874 // http://lists.dwarfstd.org/htdig.cgi/dwarf-discuss-dwarfstd.org/2011-December/001173.html 875 DWARFDataExtractor DebugFrameData(*DObj, DS, isLittleEndian(), 876 DObj->getAddressSize()); 877 auto DF = 878 std::make_unique<DWARFDebugFrame>(getArch(), /*IsEH=*/false, DS.Address); 879 if (Error E = DF->parse(DebugFrameData)) 880 return std::move(E); 881 882 DebugFrame.swap(DF); 883 return DebugFrame.get(); 884 } 885 886 Expected<const DWARFDebugFrame *> DWARFContext::getEHFrame() { 887 if (EHFrame) 888 return EHFrame.get(); 889 890 const DWARFSection &DS = DObj->getEHFrameSection(); 891 DWARFDataExtractor DebugFrameData(*DObj, DS, isLittleEndian(), 892 DObj->getAddressSize()); 893 894 auto DF = 895 std::make_unique<DWARFDebugFrame>(getArch(), /*IsEH=*/true, DS.Address); 896 if (Error E = DF->parse(DebugFrameData)) 897 return std::move(E); 898 DebugFrame.swap(DF); 899 return DebugFrame.get(); 900 } 901 902 const DWARFDebugMacro *DWARFContext::getDebugMacro() { 903 if (!Macro) 904 Macro = parseMacroOrMacinfo(MacroSection); 905 return Macro.get(); 906 } 907 908 const DWARFDebugMacro *DWARFContext::getDebugMacroDWO() { 909 if (!MacroDWO) 910 MacroDWO = parseMacroOrMacinfo(MacroDwoSection); 911 return MacroDWO.get(); 912 } 913 914 const DWARFDebugMacro *DWARFContext::getDebugMacinfo() { 915 if (!Macinfo) 916 Macinfo = parseMacroOrMacinfo(MacinfoSection); 917 return Macinfo.get(); 918 } 919 920 const DWARFDebugMacro *DWARFContext::getDebugMacinfoDWO() { 921 if (!MacinfoDWO) 922 MacinfoDWO = parseMacroOrMacinfo(MacinfoDwoSection); 923 return MacinfoDWO.get(); 924 } 925 926 template <typename T> 927 static T &getAccelTable(std::unique_ptr<T> &Cache, const DWARFObject &Obj, 928 const DWARFSection &Section, StringRef StringSection, 929 bool IsLittleEndian) { 930 if (Cache) 931 return *Cache; 932 DWARFDataExtractor AccelSection(Obj, Section, IsLittleEndian, 0); 933 DataExtractor StrData(StringSection, IsLittleEndian, 0); 934 Cache.reset(new T(AccelSection, StrData)); 935 if (Error E = Cache->extract()) 936 llvm::consumeError(std::move(E)); 937 return *Cache; 938 } 939 940 const DWARFDebugNames &DWARFContext::getDebugNames() { 941 return getAccelTable(Names, *DObj, DObj->getNamesSection(), 942 DObj->getStrSection(), isLittleEndian()); 943 } 944 945 const AppleAcceleratorTable &DWARFContext::getAppleNames() { 946 return getAccelTable(AppleNames, *DObj, DObj->getAppleNamesSection(), 947 DObj->getStrSection(), isLittleEndian()); 948 } 949 950 const AppleAcceleratorTable &DWARFContext::getAppleTypes() { 951 return getAccelTable(AppleTypes, *DObj, DObj->getAppleTypesSection(), 952 DObj->getStrSection(), isLittleEndian()); 953 } 954 955 const AppleAcceleratorTable &DWARFContext::getAppleNamespaces() { 956 return getAccelTable(AppleNamespaces, *DObj, 957 DObj->getAppleNamespacesSection(), 958 DObj->getStrSection(), isLittleEndian()); 959 } 960 961 const AppleAcceleratorTable &DWARFContext::getAppleObjC() { 962 return getAccelTable(AppleObjC, *DObj, DObj->getAppleObjCSection(), 963 DObj->getStrSection(), isLittleEndian()); 964 } 965 966 const DWARFDebugLine::LineTable * 967 DWARFContext::getLineTableForUnit(DWARFUnit *U) { 968 Expected<const DWARFDebugLine::LineTable *> ExpectedLineTable = 969 getLineTableForUnit(U, WarningHandler); 970 if (!ExpectedLineTable) { 971 WarningHandler(ExpectedLineTable.takeError()); 972 return nullptr; 973 } 974 return *ExpectedLineTable; 975 } 976 977 Expected<const DWARFDebugLine::LineTable *> DWARFContext::getLineTableForUnit( 978 DWARFUnit *U, function_ref<void(Error)> RecoverableErrorHandler) { 979 if (!Line) 980 Line.reset(new DWARFDebugLine); 981 982 auto UnitDIE = U->getUnitDIE(); 983 if (!UnitDIE) 984 return nullptr; 985 986 auto Offset = toSectionOffset(UnitDIE.find(DW_AT_stmt_list)); 987 if (!Offset) 988 return nullptr; // No line table for this compile unit. 989 990 uint64_t stmtOffset = *Offset + U->getLineTableOffset(); 991 // See if the line table is cached. 992 if (const DWARFLineTable *lt = Line->getLineTable(stmtOffset)) 993 return lt; 994 995 // Make sure the offset is good before we try to parse. 996 if (stmtOffset >= U->getLineSection().Data.size()) 997 return nullptr; 998 999 // We have to parse it first. 1000 DWARFDataExtractor lineData(*DObj, U->getLineSection(), isLittleEndian(), 1001 U->getAddressByteSize()); 1002 return Line->getOrParseLineTable(lineData, stmtOffset, *this, U, 1003 RecoverableErrorHandler); 1004 } 1005 1006 void DWARFContext::parseNormalUnits() { 1007 if (!NormalUnits.empty()) 1008 return; 1009 DObj->forEachInfoSections([&](const DWARFSection &S) { 1010 NormalUnits.addUnitsForSection(*this, S, DW_SECT_INFO); 1011 }); 1012 NormalUnits.finishedInfoUnits(); 1013 DObj->forEachTypesSections([&](const DWARFSection &S) { 1014 NormalUnits.addUnitsForSection(*this, S, DW_SECT_EXT_TYPES); 1015 }); 1016 } 1017 1018 void DWARFContext::parseDWOUnits(bool Lazy) { 1019 if (!DWOUnits.empty()) 1020 return; 1021 DObj->forEachInfoDWOSections([&](const DWARFSection &S) { 1022 DWOUnits.addUnitsForDWOSection(*this, S, DW_SECT_INFO, Lazy); 1023 }); 1024 DWOUnits.finishedInfoUnits(); 1025 DObj->forEachTypesDWOSections([&](const DWARFSection &S) { 1026 DWOUnits.addUnitsForDWOSection(*this, S, DW_SECT_EXT_TYPES, Lazy); 1027 }); 1028 } 1029 1030 DWARFCompileUnit *DWARFContext::getCompileUnitForOffset(uint64_t Offset) { 1031 parseNormalUnits(); 1032 return dyn_cast_or_null<DWARFCompileUnit>( 1033 NormalUnits.getUnitForOffset(Offset)); 1034 } 1035 1036 DWARFCompileUnit *DWARFContext::getCompileUnitForAddress(uint64_t Address) { 1037 // First, get the offset of the compile unit. 1038 uint64_t CUOffset = getDebugAranges()->findAddress(Address); 1039 // Retrieve the compile unit. 1040 return getCompileUnitForOffset(CUOffset); 1041 } 1042 1043 DWARFContext::DIEsForAddress DWARFContext::getDIEsForAddress(uint64_t Address) { 1044 DIEsForAddress Result; 1045 1046 DWARFCompileUnit *CU = getCompileUnitForAddress(Address); 1047 if (!CU) 1048 return Result; 1049 1050 Result.CompileUnit = CU; 1051 Result.FunctionDIE = CU->getSubroutineForAddress(Address); 1052 1053 std::vector<DWARFDie> Worklist; 1054 Worklist.push_back(Result.FunctionDIE); 1055 while (!Worklist.empty()) { 1056 DWARFDie DIE = Worklist.back(); 1057 Worklist.pop_back(); 1058 1059 if (!DIE.isValid()) 1060 continue; 1061 1062 if (DIE.getTag() == DW_TAG_lexical_block && 1063 DIE.addressRangeContainsAddress(Address)) { 1064 Result.BlockDIE = DIE; 1065 break; 1066 } 1067 1068 append_range(Worklist, DIE); 1069 } 1070 1071 return Result; 1072 } 1073 1074 /// TODO: change input parameter from "uint64_t Address" 1075 /// into "SectionedAddress Address" 1076 static bool getFunctionNameAndStartLineForAddress( 1077 DWARFCompileUnit *CU, uint64_t Address, FunctionNameKind Kind, 1078 DILineInfoSpecifier::FileLineInfoKind FileNameKind, 1079 std::string &FunctionName, std::string &StartFile, uint32_t &StartLine, 1080 Optional<uint64_t> &StartAddress) { 1081 // The address may correspond to instruction in some inlined function, 1082 // so we have to build the chain of inlined functions and take the 1083 // name of the topmost function in it. 1084 SmallVector<DWARFDie, 4> InlinedChain; 1085 CU->getInlinedChainForAddress(Address, InlinedChain); 1086 if (InlinedChain.empty()) 1087 return false; 1088 1089 const DWARFDie &DIE = InlinedChain[0]; 1090 bool FoundResult = false; 1091 const char *Name = nullptr; 1092 if (Kind != FunctionNameKind::None && (Name = DIE.getSubroutineName(Kind))) { 1093 FunctionName = Name; 1094 FoundResult = true; 1095 } 1096 std::string DeclFile = DIE.getDeclFile(FileNameKind); 1097 if (!DeclFile.empty()) { 1098 StartFile = DeclFile; 1099 FoundResult = true; 1100 } 1101 if (auto DeclLineResult = DIE.getDeclLine()) { 1102 StartLine = DeclLineResult; 1103 FoundResult = true; 1104 } 1105 if (auto LowPcAddr = toSectionedAddress(DIE.find(DW_AT_low_pc))) 1106 StartAddress = LowPcAddr->Address; 1107 return FoundResult; 1108 } 1109 1110 static Optional<uint64_t> getTypeSize(DWARFDie Type, uint64_t PointerSize) { 1111 if (auto SizeAttr = Type.find(DW_AT_byte_size)) 1112 if (Optional<uint64_t> Size = SizeAttr->getAsUnsignedConstant()) 1113 return Size; 1114 1115 switch (Type.getTag()) { 1116 case DW_TAG_pointer_type: 1117 case DW_TAG_reference_type: 1118 case DW_TAG_rvalue_reference_type: 1119 return PointerSize; 1120 case DW_TAG_ptr_to_member_type: { 1121 if (DWARFDie BaseType = Type.getAttributeValueAsReferencedDie(DW_AT_type)) 1122 if (BaseType.getTag() == DW_TAG_subroutine_type) 1123 return 2 * PointerSize; 1124 return PointerSize; 1125 } 1126 case DW_TAG_const_type: 1127 case DW_TAG_immutable_type: 1128 case DW_TAG_volatile_type: 1129 case DW_TAG_restrict_type: 1130 case DW_TAG_typedef: { 1131 if (DWARFDie BaseType = Type.getAttributeValueAsReferencedDie(DW_AT_type)) 1132 return getTypeSize(BaseType, PointerSize); 1133 break; 1134 } 1135 case DW_TAG_array_type: { 1136 DWARFDie BaseType = Type.getAttributeValueAsReferencedDie(DW_AT_type); 1137 if (!BaseType) 1138 return Optional<uint64_t>(); 1139 Optional<uint64_t> BaseSize = getTypeSize(BaseType, PointerSize); 1140 if (!BaseSize) 1141 return Optional<uint64_t>(); 1142 uint64_t Size = *BaseSize; 1143 for (DWARFDie Child : Type) { 1144 if (Child.getTag() != DW_TAG_subrange_type) 1145 continue; 1146 1147 if (auto ElemCountAttr = Child.find(DW_AT_count)) 1148 if (Optional<uint64_t> ElemCount = 1149 ElemCountAttr->getAsUnsignedConstant()) 1150 Size *= *ElemCount; 1151 if (auto UpperBoundAttr = Child.find(DW_AT_upper_bound)) 1152 if (Optional<int64_t> UpperBound = 1153 UpperBoundAttr->getAsSignedConstant()) { 1154 int64_t LowerBound = 0; 1155 if (auto LowerBoundAttr = Child.find(DW_AT_lower_bound)) 1156 LowerBound = LowerBoundAttr->getAsSignedConstant().getValueOr(0); 1157 Size *= *UpperBound - LowerBound + 1; 1158 } 1159 } 1160 return Size; 1161 } 1162 default: 1163 break; 1164 } 1165 return Optional<uint64_t>(); 1166 } 1167 1168 static Optional<int64_t> 1169 getExpressionFrameOffset(ArrayRef<uint8_t> Expr, 1170 Optional<unsigned> FrameBaseReg) { 1171 if (!Expr.empty() && 1172 (Expr[0] == DW_OP_fbreg || 1173 (FrameBaseReg && Expr[0] == DW_OP_breg0 + *FrameBaseReg))) { 1174 unsigned Count; 1175 int64_t Offset = decodeSLEB128(Expr.data() + 1, &Count, Expr.end()); 1176 // A single DW_OP_fbreg or DW_OP_breg. 1177 if (Expr.size() == Count + 1) 1178 return Offset; 1179 // Same + DW_OP_deref (Fortran arrays look like this). 1180 if (Expr.size() == Count + 2 && Expr[Count + 1] == DW_OP_deref) 1181 return Offset; 1182 // Fallthrough. Do not accept ex. (DW_OP_breg W29, DW_OP_stack_value) 1183 } 1184 return None; 1185 } 1186 1187 void DWARFContext::addLocalsForDie(DWARFCompileUnit *CU, DWARFDie Subprogram, 1188 DWARFDie Die, std::vector<DILocal> &Result) { 1189 if (Die.getTag() == DW_TAG_variable || 1190 Die.getTag() == DW_TAG_formal_parameter) { 1191 DILocal Local; 1192 if (const char *Name = Subprogram.getSubroutineName(DINameKind::ShortName)) 1193 Local.FunctionName = Name; 1194 1195 Optional<unsigned> FrameBaseReg; 1196 if (auto FrameBase = Subprogram.find(DW_AT_frame_base)) 1197 if (Optional<ArrayRef<uint8_t>> Expr = FrameBase->getAsBlock()) 1198 if (!Expr->empty() && (*Expr)[0] >= DW_OP_reg0 && 1199 (*Expr)[0] <= DW_OP_reg31) { 1200 FrameBaseReg = (*Expr)[0] - DW_OP_reg0; 1201 } 1202 1203 if (Expected<std::vector<DWARFLocationExpression>> Loc = 1204 Die.getLocations(DW_AT_location)) { 1205 for (const auto &Entry : *Loc) { 1206 if (Optional<int64_t> FrameOffset = 1207 getExpressionFrameOffset(Entry.Expr, FrameBaseReg)) { 1208 Local.FrameOffset = *FrameOffset; 1209 break; 1210 } 1211 } 1212 } else { 1213 // FIXME: missing DW_AT_location is OK here, but other errors should be 1214 // reported to the user. 1215 consumeError(Loc.takeError()); 1216 } 1217 1218 if (auto TagOffsetAttr = Die.find(DW_AT_LLVM_tag_offset)) 1219 Local.TagOffset = TagOffsetAttr->getAsUnsignedConstant(); 1220 1221 if (auto Origin = 1222 Die.getAttributeValueAsReferencedDie(DW_AT_abstract_origin)) 1223 Die = Origin; 1224 if (auto NameAttr = Die.find(DW_AT_name)) 1225 if (Optional<const char *> Name = dwarf::toString(*NameAttr)) 1226 Local.Name = *Name; 1227 if (auto Type = Die.getAttributeValueAsReferencedDie(DW_AT_type)) 1228 Local.Size = getTypeSize(Type, getCUAddrSize()); 1229 if (auto DeclFileAttr = Die.find(DW_AT_decl_file)) { 1230 if (const auto *LT = CU->getContext().getLineTableForUnit(CU)) 1231 LT->getFileNameByIndex( 1232 DeclFileAttr->getAsUnsignedConstant().getValue(), 1233 CU->getCompilationDir(), 1234 DILineInfoSpecifier::FileLineInfoKind::AbsoluteFilePath, 1235 Local.DeclFile); 1236 } 1237 if (auto DeclLineAttr = Die.find(DW_AT_decl_line)) 1238 Local.DeclLine = DeclLineAttr->getAsUnsignedConstant().getValue(); 1239 1240 Result.push_back(Local); 1241 return; 1242 } 1243 1244 if (Die.getTag() == DW_TAG_inlined_subroutine) 1245 if (auto Origin = 1246 Die.getAttributeValueAsReferencedDie(DW_AT_abstract_origin)) 1247 Subprogram = Origin; 1248 1249 for (auto Child : Die) 1250 addLocalsForDie(CU, Subprogram, Child, Result); 1251 } 1252 1253 std::vector<DILocal> 1254 DWARFContext::getLocalsForAddress(object::SectionedAddress Address) { 1255 std::vector<DILocal> Result; 1256 DWARFCompileUnit *CU = getCompileUnitForAddress(Address.Address); 1257 if (!CU) 1258 return Result; 1259 1260 DWARFDie Subprogram = CU->getSubroutineForAddress(Address.Address); 1261 if (Subprogram.isValid()) 1262 addLocalsForDie(CU, Subprogram, Subprogram, Result); 1263 return Result; 1264 } 1265 1266 DILineInfo DWARFContext::getLineInfoForAddress(object::SectionedAddress Address, 1267 DILineInfoSpecifier Spec) { 1268 DILineInfo Result; 1269 1270 DWARFCompileUnit *CU = getCompileUnitForAddress(Address.Address); 1271 if (!CU) 1272 return Result; 1273 1274 getFunctionNameAndStartLineForAddress( 1275 CU, Address.Address, Spec.FNKind, Spec.FLIKind, Result.FunctionName, 1276 Result.StartFileName, Result.StartLine, Result.StartAddress); 1277 if (Spec.FLIKind != FileLineInfoKind::None) { 1278 if (const DWARFLineTable *LineTable = getLineTableForUnit(CU)) { 1279 LineTable->getFileLineInfoForAddress( 1280 {Address.Address, Address.SectionIndex}, CU->getCompilationDir(), 1281 Spec.FLIKind, Result); 1282 } 1283 } 1284 return Result; 1285 } 1286 1287 DILineInfoTable DWARFContext::getLineInfoForAddressRange( 1288 object::SectionedAddress Address, uint64_t Size, DILineInfoSpecifier Spec) { 1289 DILineInfoTable Lines; 1290 DWARFCompileUnit *CU = getCompileUnitForAddress(Address.Address); 1291 if (!CU) 1292 return Lines; 1293 1294 uint32_t StartLine = 0; 1295 std::string StartFileName; 1296 std::string FunctionName(DILineInfo::BadString); 1297 Optional<uint64_t> StartAddress; 1298 getFunctionNameAndStartLineForAddress(CU, Address.Address, Spec.FNKind, 1299 Spec.FLIKind, FunctionName, 1300 StartFileName, StartLine, StartAddress); 1301 1302 // If the Specifier says we don't need FileLineInfo, just 1303 // return the top-most function at the starting address. 1304 if (Spec.FLIKind == FileLineInfoKind::None) { 1305 DILineInfo Result; 1306 Result.FunctionName = FunctionName; 1307 Result.StartFileName = StartFileName; 1308 Result.StartLine = StartLine; 1309 Result.StartAddress = StartAddress; 1310 Lines.push_back(std::make_pair(Address.Address, Result)); 1311 return Lines; 1312 } 1313 1314 const DWARFLineTable *LineTable = getLineTableForUnit(CU); 1315 1316 // Get the index of row we're looking for in the line table. 1317 std::vector<uint32_t> RowVector; 1318 if (!LineTable->lookupAddressRange({Address.Address, Address.SectionIndex}, 1319 Size, RowVector)) { 1320 return Lines; 1321 } 1322 1323 for (uint32_t RowIndex : RowVector) { 1324 // Take file number and line/column from the row. 1325 const DWARFDebugLine::Row &Row = LineTable->Rows[RowIndex]; 1326 DILineInfo Result; 1327 LineTable->getFileNameByIndex(Row.File, CU->getCompilationDir(), 1328 Spec.FLIKind, Result.FileName); 1329 Result.FunctionName = FunctionName; 1330 Result.Line = Row.Line; 1331 Result.Column = Row.Column; 1332 Result.StartFileName = StartFileName; 1333 Result.StartLine = StartLine; 1334 Result.StartAddress = StartAddress; 1335 Lines.push_back(std::make_pair(Row.Address.Address, Result)); 1336 } 1337 1338 return Lines; 1339 } 1340 1341 DIInliningInfo 1342 DWARFContext::getInliningInfoForAddress(object::SectionedAddress Address, 1343 DILineInfoSpecifier Spec) { 1344 DIInliningInfo InliningInfo; 1345 1346 DWARFCompileUnit *CU = getCompileUnitForAddress(Address.Address); 1347 if (!CU) 1348 return InliningInfo; 1349 1350 const DWARFLineTable *LineTable = nullptr; 1351 SmallVector<DWARFDie, 4> InlinedChain; 1352 CU->getInlinedChainForAddress(Address.Address, InlinedChain); 1353 if (InlinedChain.size() == 0) { 1354 // If there is no DIE for address (e.g. it is in unavailable .dwo file), 1355 // try to at least get file/line info from symbol table. 1356 if (Spec.FLIKind != FileLineInfoKind::None) { 1357 DILineInfo Frame; 1358 LineTable = getLineTableForUnit(CU); 1359 if (LineTable && LineTable->getFileLineInfoForAddress( 1360 {Address.Address, Address.SectionIndex}, 1361 CU->getCompilationDir(), Spec.FLIKind, Frame)) 1362 InliningInfo.addFrame(Frame); 1363 } 1364 return InliningInfo; 1365 } 1366 1367 uint32_t CallFile = 0, CallLine = 0, CallColumn = 0, CallDiscriminator = 0; 1368 for (uint32_t i = 0, n = InlinedChain.size(); i != n; i++) { 1369 DWARFDie &FunctionDIE = InlinedChain[i]; 1370 DILineInfo Frame; 1371 // Get function name if necessary. 1372 if (const char *Name = FunctionDIE.getSubroutineName(Spec.FNKind)) 1373 Frame.FunctionName = Name; 1374 if (auto DeclLineResult = FunctionDIE.getDeclLine()) 1375 Frame.StartLine = DeclLineResult; 1376 Frame.StartFileName = FunctionDIE.getDeclFile(Spec.FLIKind); 1377 if (auto LowPcAddr = toSectionedAddress(FunctionDIE.find(DW_AT_low_pc))) 1378 Frame.StartAddress = LowPcAddr->Address; 1379 if (Spec.FLIKind != FileLineInfoKind::None) { 1380 if (i == 0) { 1381 // For the topmost frame, initialize the line table of this 1382 // compile unit and fetch file/line info from it. 1383 LineTable = getLineTableForUnit(CU); 1384 // For the topmost routine, get file/line info from line table. 1385 if (LineTable) 1386 LineTable->getFileLineInfoForAddress( 1387 {Address.Address, Address.SectionIndex}, CU->getCompilationDir(), 1388 Spec.FLIKind, Frame); 1389 } else { 1390 // Otherwise, use call file, call line and call column from 1391 // previous DIE in inlined chain. 1392 if (LineTable) 1393 LineTable->getFileNameByIndex(CallFile, CU->getCompilationDir(), 1394 Spec.FLIKind, Frame.FileName); 1395 Frame.Line = CallLine; 1396 Frame.Column = CallColumn; 1397 Frame.Discriminator = CallDiscriminator; 1398 } 1399 // Get call file/line/column of a current DIE. 1400 if (i + 1 < n) { 1401 FunctionDIE.getCallerFrame(CallFile, CallLine, CallColumn, 1402 CallDiscriminator); 1403 } 1404 } 1405 InliningInfo.addFrame(Frame); 1406 } 1407 return InliningInfo; 1408 } 1409 1410 std::shared_ptr<DWARFContext> 1411 DWARFContext::getDWOContext(StringRef AbsolutePath) { 1412 if (auto S = DWP.lock()) { 1413 DWARFContext *Ctxt = S->Context.get(); 1414 return std::shared_ptr<DWARFContext>(std::move(S), Ctxt); 1415 } 1416 1417 std::weak_ptr<DWOFile> *Entry = &DWOFiles[AbsolutePath]; 1418 1419 if (auto S = Entry->lock()) { 1420 DWARFContext *Ctxt = S->Context.get(); 1421 return std::shared_ptr<DWARFContext>(std::move(S), Ctxt); 1422 } 1423 1424 Expected<OwningBinary<ObjectFile>> Obj = [&] { 1425 if (!CheckedForDWP) { 1426 SmallString<128> DWPName; 1427 auto Obj = object::ObjectFile::createObjectFile( 1428 this->DWPName.empty() 1429 ? (DObj->getFileName() + ".dwp").toStringRef(DWPName) 1430 : StringRef(this->DWPName)); 1431 if (Obj) { 1432 Entry = &DWP; 1433 return Obj; 1434 } else { 1435 CheckedForDWP = true; 1436 // TODO: Should this error be handled (maybe in a high verbosity mode) 1437 // before falling back to .dwo files? 1438 consumeError(Obj.takeError()); 1439 } 1440 } 1441 1442 return object::ObjectFile::createObjectFile(AbsolutePath); 1443 }(); 1444 1445 if (!Obj) { 1446 // TODO: Actually report errors helpfully. 1447 consumeError(Obj.takeError()); 1448 return nullptr; 1449 } 1450 1451 auto S = std::make_shared<DWOFile>(); 1452 S->File = std::move(Obj.get()); 1453 S->Context = DWARFContext::create(*S->File.getBinary(), 1454 ProcessDebugRelocations::Ignore); 1455 *Entry = S; 1456 auto *Ctxt = S->Context.get(); 1457 return std::shared_ptr<DWARFContext>(std::move(S), Ctxt); 1458 } 1459 1460 static Error createError(const Twine &Reason, llvm::Error E) { 1461 return make_error<StringError>(Reason + toString(std::move(E)), 1462 inconvertibleErrorCode()); 1463 } 1464 1465 /// SymInfo contains information about symbol: it's address 1466 /// and section index which is -1LL for absolute symbols. 1467 struct SymInfo { 1468 uint64_t Address; 1469 uint64_t SectionIndex; 1470 }; 1471 1472 /// Returns the address of symbol relocation used against and a section index. 1473 /// Used for futher relocations computation. Symbol's section load address is 1474 static Expected<SymInfo> getSymbolInfo(const object::ObjectFile &Obj, 1475 const RelocationRef &Reloc, 1476 const LoadedObjectInfo *L, 1477 std::map<SymbolRef, SymInfo> &Cache) { 1478 SymInfo Ret = {0, (uint64_t)-1LL}; 1479 object::section_iterator RSec = Obj.section_end(); 1480 object::symbol_iterator Sym = Reloc.getSymbol(); 1481 1482 std::map<SymbolRef, SymInfo>::iterator CacheIt = Cache.end(); 1483 // First calculate the address of the symbol or section as it appears 1484 // in the object file 1485 if (Sym != Obj.symbol_end()) { 1486 bool New; 1487 std::tie(CacheIt, New) = Cache.insert({*Sym, {0, 0}}); 1488 if (!New) 1489 return CacheIt->second; 1490 1491 Expected<uint64_t> SymAddrOrErr = Sym->getAddress(); 1492 if (!SymAddrOrErr) 1493 return createError("failed to compute symbol address: ", 1494 SymAddrOrErr.takeError()); 1495 1496 // Also remember what section this symbol is in for later 1497 auto SectOrErr = Sym->getSection(); 1498 if (!SectOrErr) 1499 return createError("failed to get symbol section: ", 1500 SectOrErr.takeError()); 1501 1502 RSec = *SectOrErr; 1503 Ret.Address = *SymAddrOrErr; 1504 } else if (auto *MObj = dyn_cast<MachOObjectFile>(&Obj)) { 1505 RSec = MObj->getRelocationSection(Reloc.getRawDataRefImpl()); 1506 Ret.Address = RSec->getAddress(); 1507 } 1508 1509 if (RSec != Obj.section_end()) 1510 Ret.SectionIndex = RSec->getIndex(); 1511 1512 // If we are given load addresses for the sections, we need to adjust: 1513 // SymAddr = (Address of Symbol Or Section in File) - 1514 // (Address of Section in File) + 1515 // (Load Address of Section) 1516 // RSec is now either the section being targeted or the section 1517 // containing the symbol being targeted. In either case, 1518 // we need to perform the same computation. 1519 if (L && RSec != Obj.section_end()) 1520 if (uint64_t SectionLoadAddress = L->getSectionLoadAddress(*RSec)) 1521 Ret.Address += SectionLoadAddress - RSec->getAddress(); 1522 1523 if (CacheIt != Cache.end()) 1524 CacheIt->second = Ret; 1525 1526 return Ret; 1527 } 1528 1529 static bool isRelocScattered(const object::ObjectFile &Obj, 1530 const RelocationRef &Reloc) { 1531 const MachOObjectFile *MachObj = dyn_cast<MachOObjectFile>(&Obj); 1532 if (!MachObj) 1533 return false; 1534 // MachO also has relocations that point to sections and 1535 // scattered relocations. 1536 auto RelocInfo = MachObj->getRelocation(Reloc.getRawDataRefImpl()); 1537 return MachObj->isRelocationScattered(RelocInfo); 1538 } 1539 1540 namespace { 1541 struct DWARFSectionMap final : public DWARFSection { 1542 RelocAddrMap Relocs; 1543 }; 1544 1545 class DWARFObjInMemory final : public DWARFObject { 1546 bool IsLittleEndian; 1547 uint8_t AddressSize; 1548 StringRef FileName; 1549 const object::ObjectFile *Obj = nullptr; 1550 std::vector<SectionName> SectionNames; 1551 1552 using InfoSectionMap = MapVector<object::SectionRef, DWARFSectionMap, 1553 std::map<object::SectionRef, unsigned>>; 1554 1555 InfoSectionMap InfoSections; 1556 InfoSectionMap TypesSections; 1557 InfoSectionMap InfoDWOSections; 1558 InfoSectionMap TypesDWOSections; 1559 1560 DWARFSectionMap LocSection; 1561 DWARFSectionMap LoclistsSection; 1562 DWARFSectionMap LoclistsDWOSection; 1563 DWARFSectionMap LineSection; 1564 DWARFSectionMap RangesSection; 1565 DWARFSectionMap RnglistsSection; 1566 DWARFSectionMap StrOffsetsSection; 1567 DWARFSectionMap LineDWOSection; 1568 DWARFSectionMap FrameSection; 1569 DWARFSectionMap EHFrameSection; 1570 DWARFSectionMap LocDWOSection; 1571 DWARFSectionMap StrOffsetsDWOSection; 1572 DWARFSectionMap RangesDWOSection; 1573 DWARFSectionMap RnglistsDWOSection; 1574 DWARFSectionMap AddrSection; 1575 DWARFSectionMap AppleNamesSection; 1576 DWARFSectionMap AppleTypesSection; 1577 DWARFSectionMap AppleNamespacesSection; 1578 DWARFSectionMap AppleObjCSection; 1579 DWARFSectionMap NamesSection; 1580 DWARFSectionMap PubnamesSection; 1581 DWARFSectionMap PubtypesSection; 1582 DWARFSectionMap GnuPubnamesSection; 1583 DWARFSectionMap GnuPubtypesSection; 1584 DWARFSectionMap MacroSection; 1585 1586 DWARFSectionMap *mapNameToDWARFSection(StringRef Name) { 1587 return StringSwitch<DWARFSectionMap *>(Name) 1588 .Case("debug_loc", &LocSection) 1589 .Case("debug_loclists", &LoclistsSection) 1590 .Case("debug_loclists.dwo", &LoclistsDWOSection) 1591 .Case("debug_line", &LineSection) 1592 .Case("debug_frame", &FrameSection) 1593 .Case("eh_frame", &EHFrameSection) 1594 .Case("debug_str_offsets", &StrOffsetsSection) 1595 .Case("debug_ranges", &RangesSection) 1596 .Case("debug_rnglists", &RnglistsSection) 1597 .Case("debug_loc.dwo", &LocDWOSection) 1598 .Case("debug_line.dwo", &LineDWOSection) 1599 .Case("debug_names", &NamesSection) 1600 .Case("debug_rnglists.dwo", &RnglistsDWOSection) 1601 .Case("debug_str_offsets.dwo", &StrOffsetsDWOSection) 1602 .Case("debug_addr", &AddrSection) 1603 .Case("apple_names", &AppleNamesSection) 1604 .Case("debug_pubnames", &PubnamesSection) 1605 .Case("debug_pubtypes", &PubtypesSection) 1606 .Case("debug_gnu_pubnames", &GnuPubnamesSection) 1607 .Case("debug_gnu_pubtypes", &GnuPubtypesSection) 1608 .Case("apple_types", &AppleTypesSection) 1609 .Case("apple_namespaces", &AppleNamespacesSection) 1610 .Case("apple_namespac", &AppleNamespacesSection) 1611 .Case("apple_objc", &AppleObjCSection) 1612 .Case("debug_macro", &MacroSection) 1613 .Default(nullptr); 1614 } 1615 1616 StringRef AbbrevSection; 1617 StringRef ArangesSection; 1618 StringRef StrSection; 1619 StringRef MacinfoSection; 1620 StringRef MacinfoDWOSection; 1621 StringRef MacroDWOSection; 1622 StringRef AbbrevDWOSection; 1623 StringRef StrDWOSection; 1624 StringRef CUIndexSection; 1625 StringRef GdbIndexSection; 1626 StringRef TUIndexSection; 1627 StringRef LineStrSection; 1628 1629 // A deque holding section data whose iterators are not invalidated when 1630 // new decompressed sections are inserted at the end. 1631 std::deque<SmallString<0>> UncompressedSections; 1632 1633 StringRef *mapSectionToMember(StringRef Name) { 1634 if (DWARFSection *Sec = mapNameToDWARFSection(Name)) 1635 return &Sec->Data; 1636 return StringSwitch<StringRef *>(Name) 1637 .Case("debug_abbrev", &AbbrevSection) 1638 .Case("debug_aranges", &ArangesSection) 1639 .Case("debug_str", &StrSection) 1640 .Case("debug_macinfo", &MacinfoSection) 1641 .Case("debug_macinfo.dwo", &MacinfoDWOSection) 1642 .Case("debug_macro.dwo", &MacroDWOSection) 1643 .Case("debug_abbrev.dwo", &AbbrevDWOSection) 1644 .Case("debug_str.dwo", &StrDWOSection) 1645 .Case("debug_cu_index", &CUIndexSection) 1646 .Case("debug_tu_index", &TUIndexSection) 1647 .Case("gdb_index", &GdbIndexSection) 1648 .Case("debug_line_str", &LineStrSection) 1649 // Any more debug info sections go here. 1650 .Default(nullptr); 1651 } 1652 1653 /// If Sec is compressed section, decompresses and updates its contents 1654 /// provided by Data. Otherwise leaves it unchanged. 1655 Error maybeDecompress(const object::SectionRef &Sec, StringRef Name, 1656 StringRef &Data) { 1657 if (!Decompressor::isCompressed(Sec)) 1658 return Error::success(); 1659 1660 Expected<Decompressor> Decompressor = 1661 Decompressor::create(Name, Data, IsLittleEndian, AddressSize == 8); 1662 if (!Decompressor) 1663 return Decompressor.takeError(); 1664 1665 SmallString<0> Out; 1666 if (auto Err = Decompressor->resizeAndDecompress(Out)) 1667 return Err; 1668 1669 UncompressedSections.push_back(std::move(Out)); 1670 Data = UncompressedSections.back(); 1671 1672 return Error::success(); 1673 } 1674 1675 public: 1676 DWARFObjInMemory(const StringMap<std::unique_ptr<MemoryBuffer>> &Sections, 1677 uint8_t AddrSize, bool IsLittleEndian) 1678 : IsLittleEndian(IsLittleEndian) { 1679 for (const auto &SecIt : Sections) { 1680 if (StringRef *SectionData = mapSectionToMember(SecIt.first())) 1681 *SectionData = SecIt.second->getBuffer(); 1682 else if (SecIt.first() == "debug_info") 1683 // Find debug_info and debug_types data by section rather than name as 1684 // there are multiple, comdat grouped, of these sections. 1685 InfoSections[SectionRef()].Data = SecIt.second->getBuffer(); 1686 else if (SecIt.first() == "debug_info.dwo") 1687 InfoDWOSections[SectionRef()].Data = SecIt.second->getBuffer(); 1688 else if (SecIt.first() == "debug_types") 1689 TypesSections[SectionRef()].Data = SecIt.second->getBuffer(); 1690 else if (SecIt.first() == "debug_types.dwo") 1691 TypesDWOSections[SectionRef()].Data = SecIt.second->getBuffer(); 1692 } 1693 } 1694 DWARFObjInMemory(const object::ObjectFile &Obj, const LoadedObjectInfo *L, 1695 function_ref<void(Error)> HandleError, 1696 function_ref<void(Error)> HandleWarning, 1697 DWARFContext::ProcessDebugRelocations RelocAction) 1698 : IsLittleEndian(Obj.isLittleEndian()), 1699 AddressSize(Obj.getBytesInAddress()), FileName(Obj.getFileName()), 1700 Obj(&Obj) { 1701 1702 StringMap<unsigned> SectionAmountMap; 1703 for (const SectionRef &Section : Obj.sections()) { 1704 StringRef Name; 1705 if (auto NameOrErr = Section.getName()) 1706 Name = *NameOrErr; 1707 else 1708 consumeError(NameOrErr.takeError()); 1709 1710 ++SectionAmountMap[Name]; 1711 SectionNames.push_back({ Name, true }); 1712 1713 // Skip BSS and Virtual sections, they aren't interesting. 1714 if (Section.isBSS() || Section.isVirtual()) 1715 continue; 1716 1717 // Skip sections stripped by dsymutil. 1718 if (Section.isStripped()) 1719 continue; 1720 1721 StringRef Data; 1722 Expected<section_iterator> SecOrErr = Section.getRelocatedSection(); 1723 if (!SecOrErr) { 1724 HandleError(createError("failed to get relocated section: ", 1725 SecOrErr.takeError())); 1726 continue; 1727 } 1728 1729 // Try to obtain an already relocated version of this section. 1730 // Else use the unrelocated section from the object file. We'll have to 1731 // apply relocations ourselves later. 1732 section_iterator RelocatedSection = 1733 Obj.isRelocatableObject() ? *SecOrErr : Obj.section_end(); 1734 if (!L || !L->getLoadedSectionContents(*RelocatedSection, Data)) { 1735 Expected<StringRef> E = Section.getContents(); 1736 if (E) 1737 Data = *E; 1738 else 1739 // maybeDecompress below will error. 1740 consumeError(E.takeError()); 1741 } 1742 1743 if (auto Err = maybeDecompress(Section, Name, Data)) { 1744 HandleError(createError("failed to decompress '" + Name + "', ", 1745 std::move(Err))); 1746 continue; 1747 } 1748 1749 // Compressed sections names in GNU style starts from ".z", 1750 // at this point section is decompressed and we drop compression prefix. 1751 Name = Name.substr( 1752 Name.find_first_not_of("._z")); // Skip ".", "z" and "_" prefixes. 1753 1754 // Map platform specific debug section names to DWARF standard section 1755 // names. 1756 Name = Obj.mapDebugSectionName(Name); 1757 1758 if (StringRef *SectionData = mapSectionToMember(Name)) { 1759 *SectionData = Data; 1760 if (Name == "debug_ranges") { 1761 // FIXME: Use the other dwo range section when we emit it. 1762 RangesDWOSection.Data = Data; 1763 } else if (Name == "debug_frame" || Name == "eh_frame") { 1764 if (DWARFSection *S = mapNameToDWARFSection(Name)) 1765 S->Address = Section.getAddress(); 1766 } 1767 } else if (InfoSectionMap *Sections = 1768 StringSwitch<InfoSectionMap *>(Name) 1769 .Case("debug_info", &InfoSections) 1770 .Case("debug_info.dwo", &InfoDWOSections) 1771 .Case("debug_types", &TypesSections) 1772 .Case("debug_types.dwo", &TypesDWOSections) 1773 .Default(nullptr)) { 1774 // Find debug_info and debug_types data by section rather than name as 1775 // there are multiple, comdat grouped, of these sections. 1776 DWARFSectionMap &S = (*Sections)[Section]; 1777 S.Data = Data; 1778 } 1779 1780 if (RelocatedSection != Obj.section_end() && Name.contains(".dwo")) 1781 HandleWarning( 1782 createError("Unexpected relocations for dwo section " + Name)); 1783 1784 if (RelocatedSection == Obj.section_end() || 1785 (RelocAction == DWARFContext::ProcessDebugRelocations::Ignore)) 1786 continue; 1787 1788 StringRef RelSecName; 1789 if (auto NameOrErr = RelocatedSection->getName()) 1790 RelSecName = *NameOrErr; 1791 else 1792 consumeError(NameOrErr.takeError()); 1793 1794 // If the section we're relocating was relocated already by the JIT, 1795 // then we used the relocated version above, so we do not need to process 1796 // relocations for it now. 1797 StringRef RelSecData; 1798 if (L && L->getLoadedSectionContents(*RelocatedSection, RelSecData)) 1799 continue; 1800 1801 // In Mach-o files, the relocations do not need to be applied if 1802 // there is no load offset to apply. The value read at the 1803 // relocation point already factors in the section address 1804 // (actually applying the relocations will produce wrong results 1805 // as the section address will be added twice). 1806 if (!L && isa<MachOObjectFile>(&Obj)) 1807 continue; 1808 1809 RelSecName = RelSecName.substr( 1810 RelSecName.find_first_not_of("._z")); // Skip . and _ prefixes. 1811 1812 // TODO: Add support for relocations in other sections as needed. 1813 // Record relocations for the debug_info and debug_line sections. 1814 DWARFSectionMap *Sec = mapNameToDWARFSection(RelSecName); 1815 RelocAddrMap *Map = Sec ? &Sec->Relocs : nullptr; 1816 if (!Map) { 1817 // Find debug_info and debug_types relocs by section rather than name 1818 // as there are multiple, comdat grouped, of these sections. 1819 if (RelSecName == "debug_info") 1820 Map = &static_cast<DWARFSectionMap &>(InfoSections[*RelocatedSection]) 1821 .Relocs; 1822 else if (RelSecName == "debug_types") 1823 Map = 1824 &static_cast<DWARFSectionMap &>(TypesSections[*RelocatedSection]) 1825 .Relocs; 1826 else 1827 continue; 1828 } 1829 1830 if (Section.relocation_begin() == Section.relocation_end()) 1831 continue; 1832 1833 // Symbol to [address, section index] cache mapping. 1834 std::map<SymbolRef, SymInfo> AddrCache; 1835 SupportsRelocation Supports; 1836 RelocationResolver Resolver; 1837 std::tie(Supports, Resolver) = getRelocationResolver(Obj); 1838 for (const RelocationRef &Reloc : Section.relocations()) { 1839 // FIXME: it's not clear how to correctly handle scattered 1840 // relocations. 1841 if (isRelocScattered(Obj, Reloc)) 1842 continue; 1843 1844 Expected<SymInfo> SymInfoOrErr = 1845 getSymbolInfo(Obj, Reloc, L, AddrCache); 1846 if (!SymInfoOrErr) { 1847 HandleError(SymInfoOrErr.takeError()); 1848 continue; 1849 } 1850 1851 // Check if Resolver can handle this relocation type early so as not to 1852 // handle invalid cases in DWARFDataExtractor. 1853 // 1854 // TODO Don't store Resolver in every RelocAddrEntry. 1855 if (Supports && Supports(Reloc.getType())) { 1856 auto I = Map->try_emplace( 1857 Reloc.getOffset(), 1858 RelocAddrEntry{SymInfoOrErr->SectionIndex, Reloc, 1859 SymInfoOrErr->Address, 1860 Optional<object::RelocationRef>(), 0, Resolver}); 1861 // If we didn't successfully insert that's because we already had a 1862 // relocation for that offset. Store it as a second relocation in the 1863 // same RelocAddrEntry instead. 1864 if (!I.second) { 1865 RelocAddrEntry &entry = I.first->getSecond(); 1866 if (entry.Reloc2) { 1867 HandleError(createError( 1868 "At most two relocations per offset are supported")); 1869 } 1870 entry.Reloc2 = Reloc; 1871 entry.SymbolValue2 = SymInfoOrErr->Address; 1872 } 1873 } else { 1874 SmallString<32> Type; 1875 Reloc.getTypeName(Type); 1876 // FIXME: Support more relocations & change this to an error 1877 HandleWarning( 1878 createError("failed to compute relocation: " + Type + ", ", 1879 errorCodeToError(object_error::parse_failed))); 1880 } 1881 } 1882 } 1883 1884 for (SectionName &S : SectionNames) 1885 if (SectionAmountMap[S.Name] > 1) 1886 S.IsNameUnique = false; 1887 } 1888 1889 Optional<RelocAddrEntry> find(const DWARFSection &S, 1890 uint64_t Pos) const override { 1891 auto &Sec = static_cast<const DWARFSectionMap &>(S); 1892 RelocAddrMap::const_iterator AI = Sec.Relocs.find(Pos); 1893 if (AI == Sec.Relocs.end()) 1894 return None; 1895 return AI->second; 1896 } 1897 1898 const object::ObjectFile *getFile() const override { return Obj; } 1899 1900 ArrayRef<SectionName> getSectionNames() const override { 1901 return SectionNames; 1902 } 1903 1904 bool isLittleEndian() const override { return IsLittleEndian; } 1905 StringRef getAbbrevDWOSection() const override { return AbbrevDWOSection; } 1906 const DWARFSection &getLineDWOSection() const override { 1907 return LineDWOSection; 1908 } 1909 const DWARFSection &getLocDWOSection() const override { 1910 return LocDWOSection; 1911 } 1912 StringRef getStrDWOSection() const override { return StrDWOSection; } 1913 const DWARFSection &getStrOffsetsDWOSection() const override { 1914 return StrOffsetsDWOSection; 1915 } 1916 const DWARFSection &getRangesDWOSection() const override { 1917 return RangesDWOSection; 1918 } 1919 const DWARFSection &getRnglistsDWOSection() const override { 1920 return RnglistsDWOSection; 1921 } 1922 const DWARFSection &getLoclistsDWOSection() const override { 1923 return LoclistsDWOSection; 1924 } 1925 const DWARFSection &getAddrSection() const override { return AddrSection; } 1926 StringRef getCUIndexSection() const override { return CUIndexSection; } 1927 StringRef getGdbIndexSection() const override { return GdbIndexSection; } 1928 StringRef getTUIndexSection() const override { return TUIndexSection; } 1929 1930 // DWARF v5 1931 const DWARFSection &getStrOffsetsSection() const override { 1932 return StrOffsetsSection; 1933 } 1934 StringRef getLineStrSection() const override { return LineStrSection; } 1935 1936 // Sections for DWARF5 split dwarf proposal. 1937 void forEachInfoDWOSections( 1938 function_ref<void(const DWARFSection &)> F) const override { 1939 for (auto &P : InfoDWOSections) 1940 F(P.second); 1941 } 1942 void forEachTypesDWOSections( 1943 function_ref<void(const DWARFSection &)> F) const override { 1944 for (auto &P : TypesDWOSections) 1945 F(P.second); 1946 } 1947 1948 StringRef getAbbrevSection() const override { return AbbrevSection; } 1949 const DWARFSection &getLocSection() const override { return LocSection; } 1950 const DWARFSection &getLoclistsSection() const override { return LoclistsSection; } 1951 StringRef getArangesSection() const override { return ArangesSection; } 1952 const DWARFSection &getFrameSection() const override { 1953 return FrameSection; 1954 } 1955 const DWARFSection &getEHFrameSection() const override { 1956 return EHFrameSection; 1957 } 1958 const DWARFSection &getLineSection() const override { return LineSection; } 1959 StringRef getStrSection() const override { return StrSection; } 1960 const DWARFSection &getRangesSection() const override { return RangesSection; } 1961 const DWARFSection &getRnglistsSection() const override { 1962 return RnglistsSection; 1963 } 1964 const DWARFSection &getMacroSection() const override { return MacroSection; } 1965 StringRef getMacroDWOSection() const override { return MacroDWOSection; } 1966 StringRef getMacinfoSection() const override { return MacinfoSection; } 1967 StringRef getMacinfoDWOSection() const override { return MacinfoDWOSection; } 1968 const DWARFSection &getPubnamesSection() const override { return PubnamesSection; } 1969 const DWARFSection &getPubtypesSection() const override { return PubtypesSection; } 1970 const DWARFSection &getGnuPubnamesSection() const override { 1971 return GnuPubnamesSection; 1972 } 1973 const DWARFSection &getGnuPubtypesSection() const override { 1974 return GnuPubtypesSection; 1975 } 1976 const DWARFSection &getAppleNamesSection() const override { 1977 return AppleNamesSection; 1978 } 1979 const DWARFSection &getAppleTypesSection() const override { 1980 return AppleTypesSection; 1981 } 1982 const DWARFSection &getAppleNamespacesSection() const override { 1983 return AppleNamespacesSection; 1984 } 1985 const DWARFSection &getAppleObjCSection() const override { 1986 return AppleObjCSection; 1987 } 1988 const DWARFSection &getNamesSection() const override { 1989 return NamesSection; 1990 } 1991 1992 StringRef getFileName() const override { return FileName; } 1993 uint8_t getAddressSize() const override { return AddressSize; } 1994 void forEachInfoSections( 1995 function_ref<void(const DWARFSection &)> F) const override { 1996 for (auto &P : InfoSections) 1997 F(P.second); 1998 } 1999 void forEachTypesSections( 2000 function_ref<void(const DWARFSection &)> F) const override { 2001 for (auto &P : TypesSections) 2002 F(P.second); 2003 } 2004 }; 2005 } // namespace 2006 2007 std::unique_ptr<DWARFContext> 2008 DWARFContext::create(const object::ObjectFile &Obj, 2009 ProcessDebugRelocations RelocAction, 2010 const LoadedObjectInfo *L, std::string DWPName, 2011 std::function<void(Error)> RecoverableErrorHandler, 2012 std::function<void(Error)> WarningHandler) { 2013 auto DObj = std::make_unique<DWARFObjInMemory>( 2014 Obj, L, RecoverableErrorHandler, WarningHandler, RelocAction); 2015 return std::make_unique<DWARFContext>(std::move(DObj), std::move(DWPName), 2016 RecoverableErrorHandler, 2017 WarningHandler); 2018 } 2019 2020 std::unique_ptr<DWARFContext> 2021 DWARFContext::create(const StringMap<std::unique_ptr<MemoryBuffer>> &Sections, 2022 uint8_t AddrSize, bool isLittleEndian, 2023 std::function<void(Error)> RecoverableErrorHandler, 2024 std::function<void(Error)> WarningHandler) { 2025 auto DObj = 2026 std::make_unique<DWARFObjInMemory>(Sections, AddrSize, isLittleEndian); 2027 return std::make_unique<DWARFContext>( 2028 std::move(DObj), "", RecoverableErrorHandler, WarningHandler); 2029 } 2030 2031 Error DWARFContext::loadRegisterInfo(const object::ObjectFile &Obj) { 2032 // Detect the architecture from the object file. We usually don't need OS 2033 // info to lookup a target and create register info. 2034 Triple TT; 2035 TT.setArch(Triple::ArchType(Obj.getArch())); 2036 TT.setVendor(Triple::UnknownVendor); 2037 TT.setOS(Triple::UnknownOS); 2038 std::string TargetLookupError; 2039 const Target *TheTarget = 2040 TargetRegistry::lookupTarget(TT.str(), TargetLookupError); 2041 if (!TargetLookupError.empty()) 2042 return createStringError(errc::invalid_argument, 2043 TargetLookupError.c_str()); 2044 RegInfo.reset(TheTarget->createMCRegInfo(TT.str())); 2045 return Error::success(); 2046 } 2047 2048 uint8_t DWARFContext::getCUAddrSize() { 2049 // In theory, different compile units may have different address byte 2050 // sizes, but for simplicity we just use the address byte size of the 2051 // first compile unit. In practice the address size field is repeated across 2052 // various DWARF headers (at least in version 5) to make it easier to dump 2053 // them independently, not to enable varying the address size. 2054 auto CUs = compile_units(); 2055 return CUs.empty() ? 0 : (*CUs.begin())->getAddressByteSize(); 2056 } 2057