1 //===-- llvm/lib/CodeGen/AsmPrinter/CodeViewDebug.cpp --*- C++ -*--===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file contains support for writing Microsoft CodeView debug info. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "CodeViewDebug.h" 15 #include "llvm/DebugInfo/CodeView/CodeView.h" 16 #include "llvm/DebugInfo/CodeView/FieldListRecordBuilder.h" 17 #include "llvm/DebugInfo/CodeView/Line.h" 18 #include "llvm/DebugInfo/CodeView/SymbolRecord.h" 19 #include "llvm/DebugInfo/CodeView/TypeDumper.h" 20 #include "llvm/DebugInfo/CodeView/TypeIndex.h" 21 #include "llvm/DebugInfo/CodeView/TypeRecord.h" 22 #include "llvm/MC/MCExpr.h" 23 #include "llvm/MC/MCSectionCOFF.h" 24 #include "llvm/MC/MCSymbol.h" 25 #include "llvm/Support/COFF.h" 26 #include "llvm/Support/ScopedPrinter.h" 27 #include "llvm/Target/TargetSubtargetInfo.h" 28 #include "llvm/Target/TargetRegisterInfo.h" 29 #include "llvm/Target/TargetFrameLowering.h" 30 31 using namespace llvm; 32 using namespace llvm::codeview; 33 34 CodeViewDebug::CodeViewDebug(AsmPrinter *AP) 35 : DebugHandlerBase(AP), OS(*Asm->OutStreamer), CurFn(nullptr) { 36 // If module doesn't have named metadata anchors or COFF debug section 37 // is not available, skip any debug info related stuff. 38 if (!MMI->getModule()->getNamedMetadata("llvm.dbg.cu") || 39 !AP->getObjFileLowering().getCOFFDebugSymbolsSection()) { 40 Asm = nullptr; 41 return; 42 } 43 44 // Tell MMI that we have debug info. 45 MMI->setDebugInfoAvailability(true); 46 } 47 48 StringRef CodeViewDebug::getFullFilepath(const DIFile *File) { 49 std::string &Filepath = FileToFilepathMap[File]; 50 if (!Filepath.empty()) 51 return Filepath; 52 53 StringRef Dir = File->getDirectory(), Filename = File->getFilename(); 54 55 // Clang emits directory and relative filename info into the IR, but CodeView 56 // operates on full paths. We could change Clang to emit full paths too, but 57 // that would increase the IR size and probably not needed for other users. 58 // For now, just concatenate and canonicalize the path here. 59 if (Filename.find(':') == 1) 60 Filepath = Filename; 61 else 62 Filepath = (Dir + "\\" + Filename).str(); 63 64 // Canonicalize the path. We have to do it textually because we may no longer 65 // have access the file in the filesystem. 66 // First, replace all slashes with backslashes. 67 std::replace(Filepath.begin(), Filepath.end(), '/', '\\'); 68 69 // Remove all "\.\" with "\". 70 size_t Cursor = 0; 71 while ((Cursor = Filepath.find("\\.\\", Cursor)) != std::string::npos) 72 Filepath.erase(Cursor, 2); 73 74 // Replace all "\XXX\..\" with "\". Don't try too hard though as the original 75 // path should be well-formatted, e.g. start with a drive letter, etc. 76 Cursor = 0; 77 while ((Cursor = Filepath.find("\\..\\", Cursor)) != std::string::npos) { 78 // Something's wrong if the path starts with "\..\", abort. 79 if (Cursor == 0) 80 break; 81 82 size_t PrevSlash = Filepath.rfind('\\', Cursor - 1); 83 if (PrevSlash == std::string::npos) 84 // Something's wrong, abort. 85 break; 86 87 Filepath.erase(PrevSlash, Cursor + 3 - PrevSlash); 88 // The next ".." might be following the one we've just erased. 89 Cursor = PrevSlash; 90 } 91 92 // Remove all duplicate backslashes. 93 Cursor = 0; 94 while ((Cursor = Filepath.find("\\\\", Cursor)) != std::string::npos) 95 Filepath.erase(Cursor, 1); 96 97 return Filepath; 98 } 99 100 unsigned CodeViewDebug::maybeRecordFile(const DIFile *F) { 101 unsigned NextId = FileIdMap.size() + 1; 102 auto Insertion = FileIdMap.insert(std::make_pair(F, NextId)); 103 if (Insertion.second) { 104 // We have to compute the full filepath and emit a .cv_file directive. 105 StringRef FullPath = getFullFilepath(F); 106 NextId = OS.EmitCVFileDirective(NextId, FullPath); 107 assert(NextId == FileIdMap.size() && ".cv_file directive failed"); 108 } 109 return Insertion.first->second; 110 } 111 112 CodeViewDebug::InlineSite & 113 CodeViewDebug::getInlineSite(const DILocation *InlinedAt, 114 const DISubprogram *Inlinee) { 115 auto SiteInsertion = CurFn->InlineSites.insert({InlinedAt, InlineSite()}); 116 InlineSite *Site = &SiteInsertion.first->second; 117 if (SiteInsertion.second) { 118 Site->SiteFuncId = NextFuncId++; 119 Site->Inlinee = Inlinee; 120 InlinedSubprograms.insert(Inlinee); 121 getFuncIdForSubprogram(Inlinee); 122 } 123 return *Site; 124 } 125 126 TypeIndex CodeViewDebug::getFuncIdForSubprogram(const DISubprogram *SP) { 127 // It's possible to ask for the FuncId of a function which doesn't have a 128 // subprogram: inlining a function with debug info into a function with none. 129 if (!SP) 130 return TypeIndex::None(); 131 132 // Check if we've already translated this subprogram. 133 auto I = TypeIndices.find(SP); 134 if (I != TypeIndices.end()) 135 return I->second; 136 137 TypeIndex ParentScope = TypeIndex(0); 138 StringRef DisplayName = SP->getDisplayName(); 139 FuncIdRecord FuncId(ParentScope, getTypeIndex(SP->getType()), DisplayName); 140 TypeIndex TI = TypeTable.writeFuncId(FuncId); 141 142 recordTypeIndexForDINode(SP, TI); 143 return TI; 144 } 145 146 void CodeViewDebug::recordTypeIndexForDINode(const DINode *Node, TypeIndex TI) { 147 auto InsertResult = TypeIndices.insert({Node, TI}); 148 (void)InsertResult; 149 assert(InsertResult.second && "DINode was already assigned a type index"); 150 } 151 152 void CodeViewDebug::recordLocalVariable(LocalVariable &&Var, 153 const DILocation *InlinedAt) { 154 if (InlinedAt) { 155 // This variable was inlined. Associate it with the InlineSite. 156 const DISubprogram *Inlinee = Var.DIVar->getScope()->getSubprogram(); 157 InlineSite &Site = getInlineSite(InlinedAt, Inlinee); 158 Site.InlinedLocals.emplace_back(Var); 159 } else { 160 // This variable goes in the main ProcSym. 161 CurFn->Locals.emplace_back(Var); 162 } 163 } 164 165 static void addLocIfNotPresent(SmallVectorImpl<const DILocation *> &Locs, 166 const DILocation *Loc) { 167 auto B = Locs.begin(), E = Locs.end(); 168 if (std::find(B, E, Loc) == E) 169 Locs.push_back(Loc); 170 } 171 172 void CodeViewDebug::maybeRecordLocation(const DebugLoc &DL, 173 const MachineFunction *MF) { 174 // Skip this instruction if it has the same location as the previous one. 175 if (DL == CurFn->LastLoc) 176 return; 177 178 const DIScope *Scope = DL.get()->getScope(); 179 if (!Scope) 180 return; 181 182 // Skip this line if it is longer than the maximum we can record. 183 LineInfo LI(DL.getLine(), DL.getLine(), /*IsStatement=*/true); 184 if (LI.getStartLine() != DL.getLine() || LI.isAlwaysStepInto() || 185 LI.isNeverStepInto()) 186 return; 187 188 ColumnInfo CI(DL.getCol(), /*EndColumn=*/0); 189 if (CI.getStartColumn() != DL.getCol()) 190 return; 191 192 if (!CurFn->HaveLineInfo) 193 CurFn->HaveLineInfo = true; 194 unsigned FileId = 0; 195 if (CurFn->LastLoc.get() && CurFn->LastLoc->getFile() == DL->getFile()) 196 FileId = CurFn->LastFileId; 197 else 198 FileId = CurFn->LastFileId = maybeRecordFile(DL->getFile()); 199 CurFn->LastLoc = DL; 200 201 unsigned FuncId = CurFn->FuncId; 202 if (const DILocation *SiteLoc = DL->getInlinedAt()) { 203 const DILocation *Loc = DL.get(); 204 205 // If this location was actually inlined from somewhere else, give it the ID 206 // of the inline call site. 207 FuncId = 208 getInlineSite(SiteLoc, Loc->getScope()->getSubprogram()).SiteFuncId; 209 210 // Ensure we have links in the tree of inline call sites. 211 bool FirstLoc = true; 212 while ((SiteLoc = Loc->getInlinedAt())) { 213 InlineSite &Site = 214 getInlineSite(SiteLoc, Loc->getScope()->getSubprogram()); 215 if (!FirstLoc) 216 addLocIfNotPresent(Site.ChildSites, Loc); 217 FirstLoc = false; 218 Loc = SiteLoc; 219 } 220 addLocIfNotPresent(CurFn->ChildSites, Loc); 221 } 222 223 OS.EmitCVLocDirective(FuncId, FileId, DL.getLine(), DL.getCol(), 224 /*PrologueEnd=*/false, 225 /*IsStmt=*/false, DL->getFilename()); 226 } 227 228 void CodeViewDebug::emitCodeViewMagicVersion() { 229 OS.EmitValueToAlignment(4); 230 OS.AddComment("Debug section magic"); 231 OS.EmitIntValue(COFF::DEBUG_SECTION_MAGIC, 4); 232 } 233 234 void CodeViewDebug::endModule() { 235 if (!Asm || !MMI->hasDebugInfo()) 236 return; 237 238 assert(Asm != nullptr); 239 240 // The COFF .debug$S section consists of several subsections, each starting 241 // with a 4-byte control code (e.g. 0xF1, 0xF2, etc) and then a 4-byte length 242 // of the payload followed by the payload itself. The subsections are 4-byte 243 // aligned. 244 245 // Use the generic .debug$S section, and make a subsection for all the inlined 246 // subprograms. 247 switchToDebugSectionForSymbol(nullptr); 248 emitInlineeLinesSubsection(); 249 250 // Emit per-function debug information. 251 for (auto &P : FnDebugInfo) 252 if (!P.first->isDeclarationForLinker()) 253 emitDebugInfoForFunction(P.first, P.second); 254 255 // Emit global variable debug information. 256 setCurrentSubprogram(nullptr); 257 emitDebugInfoForGlobals(); 258 259 // Switch back to the generic .debug$S section after potentially processing 260 // comdat symbol sections. 261 switchToDebugSectionForSymbol(nullptr); 262 263 // Emit UDT records for any types used by global variables. 264 if (!GlobalUDTs.empty()) { 265 MCSymbol *SymbolsEnd = beginCVSubsection(ModuleSubstreamKind::Symbols); 266 emitDebugInfoForUDTs(GlobalUDTs); 267 endCVSubsection(SymbolsEnd); 268 } 269 270 // This subsection holds a file index to offset in string table table. 271 OS.AddComment("File index to string table offset subsection"); 272 OS.EmitCVFileChecksumsDirective(); 273 274 // This subsection holds the string table. 275 OS.AddComment("String table"); 276 OS.EmitCVStringTableDirective(); 277 278 // Emit type information last, so that any types we translate while emitting 279 // function info are included. 280 emitTypeInformation(); 281 282 clear(); 283 } 284 285 static void emitNullTerminatedSymbolName(MCStreamer &OS, StringRef S) { 286 // Microsoft's linker seems to have trouble with symbol names longer than 287 // 0xffd8 bytes. 288 S = S.substr(0, 0xffd8); 289 SmallString<32> NullTerminatedString(S); 290 NullTerminatedString.push_back('\0'); 291 OS.EmitBytes(NullTerminatedString); 292 } 293 294 void CodeViewDebug::emitTypeInformation() { 295 // Do nothing if we have no debug info or if no non-trivial types were emitted 296 // to TypeTable during codegen. 297 NamedMDNode *CU_Nodes = 298 MMI->getModule()->getNamedMetadata("llvm.dbg.cu"); 299 if (!CU_Nodes) 300 return; 301 if (TypeTable.empty()) 302 return; 303 304 // Start the .debug$T section with 0x4. 305 OS.SwitchSection(Asm->getObjFileLowering().getCOFFDebugTypesSection()); 306 emitCodeViewMagicVersion(); 307 308 SmallString<8> CommentPrefix; 309 if (OS.isVerboseAsm()) { 310 CommentPrefix += '\t'; 311 CommentPrefix += Asm->MAI->getCommentString(); 312 CommentPrefix += ' '; 313 } 314 315 CVTypeDumper CVTD(nullptr, /*PrintRecordBytes=*/false); 316 TypeTable.ForEachRecord( 317 [&](TypeIndex Index, StringRef Record) { 318 if (OS.isVerboseAsm()) { 319 // Emit a block comment describing the type record for readability. 320 SmallString<512> CommentBlock; 321 raw_svector_ostream CommentOS(CommentBlock); 322 ScopedPrinter SP(CommentOS); 323 SP.setPrefix(CommentPrefix); 324 CVTD.setPrinter(&SP); 325 Error EC = CVTD.dump({Record.bytes_begin(), Record.bytes_end()}); 326 assert(!EC && "produced malformed type record"); 327 consumeError(std::move(EC)); 328 // emitRawComment will insert its own tab and comment string before 329 // the first line, so strip off our first one. It also prints its own 330 // newline. 331 OS.emitRawComment( 332 CommentOS.str().drop_front(CommentPrefix.size() - 1).rtrim()); 333 } 334 OS.EmitBinaryData(Record); 335 }); 336 } 337 338 void CodeViewDebug::emitInlineeLinesSubsection() { 339 if (InlinedSubprograms.empty()) 340 return; 341 342 343 OS.AddComment("Inlinee lines subsection"); 344 MCSymbol *InlineEnd = beginCVSubsection(ModuleSubstreamKind::InlineeLines); 345 346 // We don't provide any extra file info. 347 // FIXME: Find out if debuggers use this info. 348 OS.AddComment("Inlinee lines signature"); 349 OS.EmitIntValue(unsigned(InlineeLinesSignature::Normal), 4); 350 351 for (const DISubprogram *SP : InlinedSubprograms) { 352 assert(TypeIndices.count(SP)); 353 TypeIndex InlineeIdx = TypeIndices[SP]; 354 355 OS.AddBlankLine(); 356 unsigned FileId = maybeRecordFile(SP->getFile()); 357 OS.AddComment("Inlined function " + SP->getDisplayName() + " starts at " + 358 SP->getFilename() + Twine(':') + Twine(SP->getLine())); 359 OS.AddBlankLine(); 360 // The filechecksum table uses 8 byte entries for now, and file ids start at 361 // 1. 362 unsigned FileOffset = (FileId - 1) * 8; 363 OS.AddComment("Type index of inlined function"); 364 OS.EmitIntValue(InlineeIdx.getIndex(), 4); 365 OS.AddComment("Offset into filechecksum table"); 366 OS.EmitIntValue(FileOffset, 4); 367 OS.AddComment("Starting line number"); 368 OS.EmitIntValue(SP->getLine(), 4); 369 } 370 371 endCVSubsection(InlineEnd); 372 } 373 374 void CodeViewDebug::collectInlineSiteChildren( 375 SmallVectorImpl<unsigned> &Children, const FunctionInfo &FI, 376 const InlineSite &Site) { 377 for (const DILocation *ChildSiteLoc : Site.ChildSites) { 378 auto I = FI.InlineSites.find(ChildSiteLoc); 379 const InlineSite &ChildSite = I->second; 380 Children.push_back(ChildSite.SiteFuncId); 381 collectInlineSiteChildren(Children, FI, ChildSite); 382 } 383 } 384 385 void CodeViewDebug::emitInlinedCallSite(const FunctionInfo &FI, 386 const DILocation *InlinedAt, 387 const InlineSite &Site) { 388 MCSymbol *InlineBegin = MMI->getContext().createTempSymbol(), 389 *InlineEnd = MMI->getContext().createTempSymbol(); 390 391 assert(TypeIndices.count(Site.Inlinee)); 392 TypeIndex InlineeIdx = TypeIndices[Site.Inlinee]; 393 394 // SymbolRecord 395 OS.AddComment("Record length"); 396 OS.emitAbsoluteSymbolDiff(InlineEnd, InlineBegin, 2); // RecordLength 397 OS.EmitLabel(InlineBegin); 398 OS.AddComment("Record kind: S_INLINESITE"); 399 OS.EmitIntValue(SymbolKind::S_INLINESITE, 2); // RecordKind 400 401 OS.AddComment("PtrParent"); 402 OS.EmitIntValue(0, 4); 403 OS.AddComment("PtrEnd"); 404 OS.EmitIntValue(0, 4); 405 OS.AddComment("Inlinee type index"); 406 OS.EmitIntValue(InlineeIdx.getIndex(), 4); 407 408 unsigned FileId = maybeRecordFile(Site.Inlinee->getFile()); 409 unsigned StartLineNum = Site.Inlinee->getLine(); 410 SmallVector<unsigned, 3> SecondaryFuncIds; 411 collectInlineSiteChildren(SecondaryFuncIds, FI, Site); 412 413 OS.EmitCVInlineLinetableDirective(Site.SiteFuncId, FileId, StartLineNum, 414 FI.Begin, FI.End, SecondaryFuncIds); 415 416 OS.EmitLabel(InlineEnd); 417 418 for (const LocalVariable &Var : Site.InlinedLocals) 419 emitLocalVariable(Var); 420 421 // Recurse on child inlined call sites before closing the scope. 422 for (const DILocation *ChildSite : Site.ChildSites) { 423 auto I = FI.InlineSites.find(ChildSite); 424 assert(I != FI.InlineSites.end() && 425 "child site not in function inline site map"); 426 emitInlinedCallSite(FI, ChildSite, I->second); 427 } 428 429 // Close the scope. 430 OS.AddComment("Record length"); 431 OS.EmitIntValue(2, 2); // RecordLength 432 OS.AddComment("Record kind: S_INLINESITE_END"); 433 OS.EmitIntValue(SymbolKind::S_INLINESITE_END, 2); // RecordKind 434 } 435 436 void CodeViewDebug::switchToDebugSectionForSymbol(const MCSymbol *GVSym) { 437 // If we have a symbol, it may be in a section that is COMDAT. If so, find the 438 // comdat key. A section may be comdat because of -ffunction-sections or 439 // because it is comdat in the IR. 440 MCSectionCOFF *GVSec = 441 GVSym ? dyn_cast<MCSectionCOFF>(&GVSym->getSection()) : nullptr; 442 const MCSymbol *KeySym = GVSec ? GVSec->getCOMDATSymbol() : nullptr; 443 444 MCSectionCOFF *DebugSec = cast<MCSectionCOFF>( 445 Asm->getObjFileLowering().getCOFFDebugSymbolsSection()); 446 DebugSec = OS.getContext().getAssociativeCOFFSection(DebugSec, KeySym); 447 448 OS.SwitchSection(DebugSec); 449 450 // Emit the magic version number if this is the first time we've switched to 451 // this section. 452 if (ComdatDebugSections.insert(DebugSec).second) 453 emitCodeViewMagicVersion(); 454 } 455 456 void CodeViewDebug::emitDebugInfoForFunction(const Function *GV, 457 FunctionInfo &FI) { 458 // For each function there is a separate subsection 459 // which holds the PC to file:line table. 460 const MCSymbol *Fn = Asm->getSymbol(GV); 461 assert(Fn); 462 463 // Switch to the to a comdat section, if appropriate. 464 switchToDebugSectionForSymbol(Fn); 465 466 StringRef FuncName; 467 auto *SP = GV->getSubprogram(); 468 setCurrentSubprogram(SP); 469 if (SP != nullptr) 470 FuncName = SP->getDisplayName(); 471 472 // If our DISubprogram name is empty, use the mangled name. 473 if (FuncName.empty()) 474 FuncName = GlobalValue::getRealLinkageName(GV->getName()); 475 476 // Emit a symbol subsection, required by VS2012+ to find function boundaries. 477 OS.AddComment("Symbol subsection for " + Twine(FuncName)); 478 MCSymbol *SymbolsEnd = beginCVSubsection(ModuleSubstreamKind::Symbols); 479 { 480 MCSymbol *ProcRecordBegin = MMI->getContext().createTempSymbol(), 481 *ProcRecordEnd = MMI->getContext().createTempSymbol(); 482 OS.AddComment("Record length"); 483 OS.emitAbsoluteSymbolDiff(ProcRecordEnd, ProcRecordBegin, 2); 484 OS.EmitLabel(ProcRecordBegin); 485 486 OS.AddComment("Record kind: S_GPROC32_ID"); 487 OS.EmitIntValue(unsigned(SymbolKind::S_GPROC32_ID), 2); 488 489 // These fields are filled in by tools like CVPACK which run after the fact. 490 OS.AddComment("PtrParent"); 491 OS.EmitIntValue(0, 4); 492 OS.AddComment("PtrEnd"); 493 OS.EmitIntValue(0, 4); 494 OS.AddComment("PtrNext"); 495 OS.EmitIntValue(0, 4); 496 // This is the important bit that tells the debugger where the function 497 // code is located and what's its size: 498 OS.AddComment("Code size"); 499 OS.emitAbsoluteSymbolDiff(FI.End, Fn, 4); 500 OS.AddComment("Offset after prologue"); 501 OS.EmitIntValue(0, 4); 502 OS.AddComment("Offset before epilogue"); 503 OS.EmitIntValue(0, 4); 504 OS.AddComment("Function type index"); 505 OS.EmitIntValue(getFuncIdForSubprogram(GV->getSubprogram()).getIndex(), 4); 506 OS.AddComment("Function section relative address"); 507 OS.EmitCOFFSecRel32(Fn); 508 OS.AddComment("Function section index"); 509 OS.EmitCOFFSectionIndex(Fn); 510 OS.AddComment("Flags"); 511 OS.EmitIntValue(0, 1); 512 // Emit the function display name as a null-terminated string. 513 OS.AddComment("Function name"); 514 // Truncate the name so we won't overflow the record length field. 515 emitNullTerminatedSymbolName(OS, FuncName); 516 OS.EmitLabel(ProcRecordEnd); 517 518 for (const LocalVariable &Var : FI.Locals) 519 emitLocalVariable(Var); 520 521 // Emit inlined call site information. Only emit functions inlined directly 522 // into the parent function. We'll emit the other sites recursively as part 523 // of their parent inline site. 524 for (const DILocation *InlinedAt : FI.ChildSites) { 525 auto I = FI.InlineSites.find(InlinedAt); 526 assert(I != FI.InlineSites.end() && 527 "child site not in function inline site map"); 528 emitInlinedCallSite(FI, InlinedAt, I->second); 529 } 530 531 if (SP != nullptr) 532 emitDebugInfoForUDTs(LocalUDTs); 533 534 // We're done with this function. 535 OS.AddComment("Record length"); 536 OS.EmitIntValue(0x0002, 2); 537 OS.AddComment("Record kind: S_PROC_ID_END"); 538 OS.EmitIntValue(unsigned(SymbolKind::S_PROC_ID_END), 2); 539 } 540 endCVSubsection(SymbolsEnd); 541 542 // We have an assembler directive that takes care of the whole line table. 543 OS.EmitCVLinetableDirective(FI.FuncId, Fn, FI.End); 544 } 545 546 CodeViewDebug::LocalVarDefRange 547 CodeViewDebug::createDefRangeMem(uint16_t CVRegister, int Offset) { 548 LocalVarDefRange DR; 549 DR.InMemory = -1; 550 DR.DataOffset = Offset; 551 assert(DR.DataOffset == Offset && "truncation"); 552 DR.StructOffset = 0; 553 DR.CVRegister = CVRegister; 554 return DR; 555 } 556 557 CodeViewDebug::LocalVarDefRange 558 CodeViewDebug::createDefRangeReg(uint16_t CVRegister) { 559 LocalVarDefRange DR; 560 DR.InMemory = 0; 561 DR.DataOffset = 0; 562 DR.StructOffset = 0; 563 DR.CVRegister = CVRegister; 564 return DR; 565 } 566 567 void CodeViewDebug::collectVariableInfoFromMMITable( 568 DenseSet<InlinedVariable> &Processed) { 569 const TargetSubtargetInfo &TSI = Asm->MF->getSubtarget(); 570 const TargetFrameLowering *TFI = TSI.getFrameLowering(); 571 const TargetRegisterInfo *TRI = TSI.getRegisterInfo(); 572 573 for (const MachineModuleInfo::VariableDbgInfo &VI : 574 MMI->getVariableDbgInfo()) { 575 if (!VI.Var) 576 continue; 577 assert(VI.Var->isValidLocationForIntrinsic(VI.Loc) && 578 "Expected inlined-at fields to agree"); 579 580 Processed.insert(InlinedVariable(VI.Var, VI.Loc->getInlinedAt())); 581 LexicalScope *Scope = LScopes.findLexicalScope(VI.Loc); 582 583 // If variable scope is not found then skip this variable. 584 if (!Scope) 585 continue; 586 587 // Get the frame register used and the offset. 588 unsigned FrameReg = 0; 589 int FrameOffset = TFI->getFrameIndexReference(*Asm->MF, VI.Slot, FrameReg); 590 uint16_t CVReg = TRI->getCodeViewRegNum(FrameReg); 591 592 // Calculate the label ranges. 593 LocalVarDefRange DefRange = createDefRangeMem(CVReg, FrameOffset); 594 for (const InsnRange &Range : Scope->getRanges()) { 595 const MCSymbol *Begin = getLabelBeforeInsn(Range.first); 596 const MCSymbol *End = getLabelAfterInsn(Range.second); 597 End = End ? End : Asm->getFunctionEnd(); 598 DefRange.Ranges.emplace_back(Begin, End); 599 } 600 601 LocalVariable Var; 602 Var.DIVar = VI.Var; 603 Var.DefRanges.emplace_back(std::move(DefRange)); 604 recordLocalVariable(std::move(Var), VI.Loc->getInlinedAt()); 605 } 606 } 607 608 void CodeViewDebug::collectVariableInfo(const DISubprogram *SP) { 609 DenseSet<InlinedVariable> Processed; 610 // Grab the variable info that was squirreled away in the MMI side-table. 611 collectVariableInfoFromMMITable(Processed); 612 613 const TargetRegisterInfo *TRI = Asm->MF->getSubtarget().getRegisterInfo(); 614 615 for (const auto &I : DbgValues) { 616 InlinedVariable IV = I.first; 617 if (Processed.count(IV)) 618 continue; 619 const DILocalVariable *DIVar = IV.first; 620 const DILocation *InlinedAt = IV.second; 621 622 // Instruction ranges, specifying where IV is accessible. 623 const auto &Ranges = I.second; 624 625 LexicalScope *Scope = nullptr; 626 if (InlinedAt) 627 Scope = LScopes.findInlinedScope(DIVar->getScope(), InlinedAt); 628 else 629 Scope = LScopes.findLexicalScope(DIVar->getScope()); 630 // If variable scope is not found then skip this variable. 631 if (!Scope) 632 continue; 633 634 LocalVariable Var; 635 Var.DIVar = DIVar; 636 637 // Calculate the definition ranges. 638 for (auto I = Ranges.begin(), E = Ranges.end(); I != E; ++I) { 639 const InsnRange &Range = *I; 640 const MachineInstr *DVInst = Range.first; 641 assert(DVInst->isDebugValue() && "Invalid History entry"); 642 const DIExpression *DIExpr = DVInst->getDebugExpression(); 643 644 // Bail if there is a complex DWARF expression for now. 645 if (DIExpr && DIExpr->getNumElements() > 0) 646 continue; 647 648 // Bail if operand 0 is not a valid register. This means the variable is a 649 // simple constant, or is described by a complex expression. 650 // FIXME: Find a way to represent constant variables, since they are 651 // relatively common. 652 unsigned Reg = 653 DVInst->getOperand(0).isReg() ? DVInst->getOperand(0).getReg() : 0; 654 if (Reg == 0) 655 continue; 656 657 // Handle the two cases we can handle: indirect in memory and in register. 658 bool IsIndirect = DVInst->getOperand(1).isImm(); 659 unsigned CVReg = TRI->getCodeViewRegNum(DVInst->getOperand(0).getReg()); 660 { 661 LocalVarDefRange DefRange; 662 if (IsIndirect) { 663 int64_t Offset = DVInst->getOperand(1).getImm(); 664 DefRange = createDefRangeMem(CVReg, Offset); 665 } else { 666 DefRange = createDefRangeReg(CVReg); 667 } 668 if (Var.DefRanges.empty() || 669 Var.DefRanges.back().isDifferentLocation(DefRange)) { 670 Var.DefRanges.emplace_back(std::move(DefRange)); 671 } 672 } 673 674 // Compute the label range. 675 const MCSymbol *Begin = getLabelBeforeInsn(Range.first); 676 const MCSymbol *End = getLabelAfterInsn(Range.second); 677 if (!End) { 678 if (std::next(I) != E) 679 End = getLabelBeforeInsn(std::next(I)->first); 680 else 681 End = Asm->getFunctionEnd(); 682 } 683 684 // If the last range end is our begin, just extend the last range. 685 // Otherwise make a new range. 686 SmallVectorImpl<std::pair<const MCSymbol *, const MCSymbol *>> &Ranges = 687 Var.DefRanges.back().Ranges; 688 if (!Ranges.empty() && Ranges.back().second == Begin) 689 Ranges.back().second = End; 690 else 691 Ranges.emplace_back(Begin, End); 692 693 // FIXME: Do more range combining. 694 } 695 696 recordLocalVariable(std::move(Var), InlinedAt); 697 } 698 } 699 700 void CodeViewDebug::beginFunction(const MachineFunction *MF) { 701 assert(!CurFn && "Can't process two functions at once!"); 702 703 if (!Asm || !MMI->hasDebugInfo()) 704 return; 705 706 DebugHandlerBase::beginFunction(MF); 707 708 const Function *GV = MF->getFunction(); 709 assert(FnDebugInfo.count(GV) == false); 710 CurFn = &FnDebugInfo[GV]; 711 CurFn->FuncId = NextFuncId++; 712 CurFn->Begin = Asm->getFunctionBegin(); 713 714 // Find the end of the function prolog. First known non-DBG_VALUE and 715 // non-frame setup location marks the beginning of the function body. 716 // FIXME: is there a simpler a way to do this? Can we just search 717 // for the first instruction of the function, not the last of the prolog? 718 DebugLoc PrologEndLoc; 719 bool EmptyPrologue = true; 720 for (const auto &MBB : *MF) { 721 for (const auto &MI : MBB) { 722 if (!MI.isDebugValue() && !MI.getFlag(MachineInstr::FrameSetup) && 723 MI.getDebugLoc()) { 724 PrologEndLoc = MI.getDebugLoc(); 725 break; 726 } else if (!MI.isDebugValue()) { 727 EmptyPrologue = false; 728 } 729 } 730 } 731 732 // Record beginning of function if we have a non-empty prologue. 733 if (PrologEndLoc && !EmptyPrologue) { 734 DebugLoc FnStartDL = PrologEndLoc.getFnDebugLoc(); 735 maybeRecordLocation(FnStartDL, MF); 736 } 737 } 738 739 TypeIndex CodeViewDebug::lowerType(const DIType *Ty) { 740 // Generic dispatch for lowering an unknown type. 741 switch (Ty->getTag()) { 742 case dwarf::DW_TAG_array_type: 743 return lowerTypeArray(cast<DICompositeType>(Ty)); 744 case dwarf::DW_TAG_typedef: 745 return lowerTypeAlias(cast<DIDerivedType>(Ty)); 746 case dwarf::DW_TAG_base_type: 747 return lowerTypeBasic(cast<DIBasicType>(Ty)); 748 case dwarf::DW_TAG_pointer_type: 749 case dwarf::DW_TAG_reference_type: 750 case dwarf::DW_TAG_rvalue_reference_type: 751 return lowerTypePointer(cast<DIDerivedType>(Ty)); 752 case dwarf::DW_TAG_ptr_to_member_type: 753 return lowerTypeMemberPointer(cast<DIDerivedType>(Ty)); 754 case dwarf::DW_TAG_const_type: 755 case dwarf::DW_TAG_volatile_type: 756 return lowerTypeModifier(cast<DIDerivedType>(Ty)); 757 case dwarf::DW_TAG_subroutine_type: 758 return lowerTypeFunction(cast<DISubroutineType>(Ty)); 759 case dwarf::DW_TAG_class_type: 760 case dwarf::DW_TAG_structure_type: 761 return lowerTypeClass(cast<DICompositeType>(Ty)); 762 case dwarf::DW_TAG_union_type: 763 return lowerTypeUnion(cast<DICompositeType>(Ty)); 764 default: 765 // Use the null type index. 766 return TypeIndex(); 767 } 768 } 769 770 static const DISubprogram *getQualifiedNameComponents( 771 const DIScope *Scope, SmallVectorImpl<StringRef> &QualifiedNameComponents) { 772 const DISubprogram *ClosestSubprogram = nullptr; 773 while (Scope != nullptr) { 774 if (ClosestSubprogram == nullptr) 775 ClosestSubprogram = dyn_cast<DISubprogram>(Scope); 776 StringRef ScopeName = Scope->getName(); 777 if (!ScopeName.empty()) 778 QualifiedNameComponents.push_back(ScopeName); 779 Scope = Scope->getScope().resolve(); 780 } 781 return ClosestSubprogram; 782 } 783 784 static std::string getQualifiedName(ArrayRef<StringRef> QualifiedNameComponents, 785 StringRef TypeName) { 786 std::string FullyQualifiedName; 787 for (StringRef QualifiedNameComponent : reverse(QualifiedNameComponents)) { 788 FullyQualifiedName.append(QualifiedNameComponent); 789 FullyQualifiedName.append("::"); 790 } 791 FullyQualifiedName.append(TypeName); 792 return FullyQualifiedName; 793 } 794 795 TypeIndex CodeViewDebug::lowerTypeAlias(const DIDerivedType *Ty) { 796 DITypeRef UnderlyingTypeRef = Ty->getBaseType(); 797 TypeIndex UnderlyingTypeIndex = getTypeIndex(UnderlyingTypeRef); 798 StringRef TypeName = Ty->getName(); 799 800 SmallVector<StringRef, 5> QualifiedNameComponents; 801 const DISubprogram *ClosestSubprogram = getQualifiedNameComponents( 802 Ty->getScope().resolve(), QualifiedNameComponents); 803 804 if (ClosestSubprogram == nullptr) { 805 std::string FullyQualifiedName = 806 getQualifiedName(QualifiedNameComponents, TypeName); 807 GlobalUDTs.emplace_back(std::move(FullyQualifiedName), UnderlyingTypeIndex); 808 } else if (ClosestSubprogram == CurrentSubprogram) { 809 std::string FullyQualifiedName = 810 getQualifiedName(QualifiedNameComponents, TypeName); 811 LocalUDTs.emplace_back(std::move(FullyQualifiedName), UnderlyingTypeIndex); 812 } 813 // TODO: What if the ClosestSubprogram is neither null or the current 814 // subprogram? Currently, the UDT just gets dropped on the floor. 815 // 816 // The current behavior is not desirable. To get maximal fidelity, we would 817 // need to perform all type translation before beginning emission of .debug$S 818 // and then make LocalUDTs a member of FunctionInfo 819 820 if (UnderlyingTypeIndex == TypeIndex(SimpleTypeKind::Int32Long) && 821 TypeName == "HRESULT") 822 return TypeIndex(SimpleTypeKind::HResult); 823 if (UnderlyingTypeIndex == TypeIndex(SimpleTypeKind::UInt16Short) && 824 TypeName == "wchar_t") 825 return TypeIndex(SimpleTypeKind::WideCharacter); 826 return UnderlyingTypeIndex; 827 } 828 829 TypeIndex CodeViewDebug::lowerTypeArray(const DICompositeType *Ty) { 830 DITypeRef ElementTypeRef = Ty->getBaseType(); 831 TypeIndex ElementTypeIndex = getTypeIndex(ElementTypeRef); 832 // IndexType is size_t, which depends on the bitness of the target. 833 TypeIndex IndexType = Asm->MAI->getPointerSize() == 8 834 ? TypeIndex(SimpleTypeKind::UInt64Quad) 835 : TypeIndex(SimpleTypeKind::UInt32Long); 836 uint64_t Size = Ty->getSizeInBits() / 8; 837 ArrayRecord Record(ElementTypeIndex, IndexType, Size, Ty->getName()); 838 return TypeTable.writeArray(Record); 839 } 840 841 TypeIndex CodeViewDebug::lowerTypeBasic(const DIBasicType *Ty) { 842 TypeIndex Index; 843 dwarf::TypeKind Kind; 844 uint32_t ByteSize; 845 846 Kind = static_cast<dwarf::TypeKind>(Ty->getEncoding()); 847 ByteSize = Ty->getSizeInBits() / 8; 848 849 SimpleTypeKind STK = SimpleTypeKind::None; 850 switch (Kind) { 851 case dwarf::DW_ATE_address: 852 // FIXME: Translate 853 break; 854 case dwarf::DW_ATE_boolean: 855 switch (ByteSize) { 856 case 1: STK = SimpleTypeKind::Boolean8; break; 857 case 2: STK = SimpleTypeKind::Boolean16; break; 858 case 4: STK = SimpleTypeKind::Boolean32; break; 859 case 8: STK = SimpleTypeKind::Boolean64; break; 860 case 16: STK = SimpleTypeKind::Boolean128; break; 861 } 862 break; 863 case dwarf::DW_ATE_complex_float: 864 switch (ByteSize) { 865 case 2: STK = SimpleTypeKind::Complex16; break; 866 case 4: STK = SimpleTypeKind::Complex32; break; 867 case 8: STK = SimpleTypeKind::Complex64; break; 868 case 10: STK = SimpleTypeKind::Complex80; break; 869 case 16: STK = SimpleTypeKind::Complex128; break; 870 } 871 break; 872 case dwarf::DW_ATE_float: 873 switch (ByteSize) { 874 case 2: STK = SimpleTypeKind::Float16; break; 875 case 4: STK = SimpleTypeKind::Float32; break; 876 case 6: STK = SimpleTypeKind::Float48; break; 877 case 8: STK = SimpleTypeKind::Float64; break; 878 case 10: STK = SimpleTypeKind::Float80; break; 879 case 16: STK = SimpleTypeKind::Float128; break; 880 } 881 break; 882 case dwarf::DW_ATE_signed: 883 switch (ByteSize) { 884 case 1: STK = SimpleTypeKind::SByte; break; 885 case 2: STK = SimpleTypeKind::Int16Short; break; 886 case 4: STK = SimpleTypeKind::Int32; break; 887 case 8: STK = SimpleTypeKind::Int64Quad; break; 888 case 16: STK = SimpleTypeKind::Int128Oct; break; 889 } 890 break; 891 case dwarf::DW_ATE_unsigned: 892 switch (ByteSize) { 893 case 1: STK = SimpleTypeKind::Byte; break; 894 case 2: STK = SimpleTypeKind::UInt16Short; break; 895 case 4: STK = SimpleTypeKind::UInt32; break; 896 case 8: STK = SimpleTypeKind::UInt64Quad; break; 897 case 16: STK = SimpleTypeKind::UInt128Oct; break; 898 } 899 break; 900 case dwarf::DW_ATE_UTF: 901 switch (ByteSize) { 902 case 2: STK = SimpleTypeKind::Character16; break; 903 case 4: STK = SimpleTypeKind::Character32; break; 904 } 905 break; 906 case dwarf::DW_ATE_signed_char: 907 if (ByteSize == 1) 908 STK = SimpleTypeKind::SignedCharacter; 909 break; 910 case dwarf::DW_ATE_unsigned_char: 911 if (ByteSize == 1) 912 STK = SimpleTypeKind::UnsignedCharacter; 913 break; 914 default: 915 break; 916 } 917 918 // Apply some fixups based on the source-level type name. 919 if (STK == SimpleTypeKind::Int32 && Ty->getName() == "long int") 920 STK = SimpleTypeKind::Int32Long; 921 if (STK == SimpleTypeKind::UInt32 && Ty->getName() == "long unsigned int") 922 STK = SimpleTypeKind::UInt32Long; 923 if (STK == SimpleTypeKind::UInt16Short && 924 (Ty->getName() == "wchar_t" || Ty->getName() == "__wchar_t")) 925 STK = SimpleTypeKind::WideCharacter; 926 if ((STK == SimpleTypeKind::SignedCharacter || 927 STK == SimpleTypeKind::UnsignedCharacter) && 928 Ty->getName() == "char") 929 STK = SimpleTypeKind::NarrowCharacter; 930 931 return TypeIndex(STK); 932 } 933 934 TypeIndex CodeViewDebug::lowerTypePointer(const DIDerivedType *Ty) { 935 TypeIndex PointeeTI = getTypeIndex(Ty->getBaseType()); 936 937 // Pointers to simple types can use SimpleTypeMode, rather than having a 938 // dedicated pointer type record. 939 if (PointeeTI.isSimple() && 940 PointeeTI.getSimpleMode() == SimpleTypeMode::Direct && 941 Ty->getTag() == dwarf::DW_TAG_pointer_type) { 942 SimpleTypeMode Mode = Ty->getSizeInBits() == 64 943 ? SimpleTypeMode::NearPointer64 944 : SimpleTypeMode::NearPointer32; 945 return TypeIndex(PointeeTI.getSimpleKind(), Mode); 946 } 947 948 PointerKind PK = 949 Ty->getSizeInBits() == 64 ? PointerKind::Near64 : PointerKind::Near32; 950 PointerMode PM = PointerMode::Pointer; 951 switch (Ty->getTag()) { 952 default: llvm_unreachable("not a pointer tag type"); 953 case dwarf::DW_TAG_pointer_type: 954 PM = PointerMode::Pointer; 955 break; 956 case dwarf::DW_TAG_reference_type: 957 PM = PointerMode::LValueReference; 958 break; 959 case dwarf::DW_TAG_rvalue_reference_type: 960 PM = PointerMode::RValueReference; 961 break; 962 } 963 // FIXME: MSVC folds qualifiers into PointerOptions in the context of a method 964 // 'this' pointer, but not normal contexts. Figure out what we're supposed to 965 // do. 966 PointerOptions PO = PointerOptions::None; 967 PointerRecord PR(PointeeTI, PK, PM, PO, Ty->getSizeInBits() / 8); 968 return TypeTable.writePointer(PR); 969 } 970 971 TypeIndex CodeViewDebug::lowerTypeMemberPointer(const DIDerivedType *Ty) { 972 assert(Ty->getTag() == dwarf::DW_TAG_ptr_to_member_type); 973 TypeIndex ClassTI = getTypeIndex(Ty->getClassType()); 974 TypeIndex PointeeTI = getTypeIndex(Ty->getBaseType()); 975 PointerKind PK = Asm->MAI->getPointerSize() == 8 ? PointerKind::Near64 976 : PointerKind::Near32; 977 PointerMode PM = isa<DISubroutineType>(Ty->getBaseType()) 978 ? PointerMode::PointerToMemberFunction 979 : PointerMode::PointerToDataMember; 980 PointerOptions PO = PointerOptions::None; // FIXME 981 // FIXME: Thread this ABI info through metadata. 982 PointerToMemberRepresentation PMR = PointerToMemberRepresentation::Unknown; 983 MemberPointerInfo MPI(ClassTI, PMR); 984 PointerRecord PR(PointeeTI, PK, PM, PO, Ty->getSizeInBits() / 8, MPI); 985 return TypeTable.writePointer(PR); 986 } 987 988 /// Given a DWARF calling convention, get the CodeView equivalent. If we don't 989 /// have a translation, use the NearC convention. 990 static CallingConvention dwarfCCToCodeView(unsigned DwarfCC) { 991 switch (DwarfCC) { 992 case dwarf::DW_CC_normal: return CallingConvention::NearC; 993 case dwarf::DW_CC_BORLAND_msfastcall: return CallingConvention::NearFast; 994 case dwarf::DW_CC_BORLAND_thiscall: return CallingConvention::ThisCall; 995 case dwarf::DW_CC_BORLAND_stdcall: return CallingConvention::NearStdCall; 996 case dwarf::DW_CC_BORLAND_pascal: return CallingConvention::NearPascal; 997 case dwarf::DW_CC_LLVM_vectorcall: return CallingConvention::NearVector; 998 } 999 return CallingConvention::NearC; 1000 } 1001 1002 TypeIndex CodeViewDebug::lowerTypeModifier(const DIDerivedType *Ty) { 1003 ModifierOptions Mods = ModifierOptions::None; 1004 bool IsModifier = true; 1005 const DIType *BaseTy = Ty; 1006 while (IsModifier && BaseTy) { 1007 // FIXME: Need to add DWARF tag for __unaligned. 1008 switch (BaseTy->getTag()) { 1009 case dwarf::DW_TAG_const_type: 1010 Mods |= ModifierOptions::Const; 1011 break; 1012 case dwarf::DW_TAG_volatile_type: 1013 Mods |= ModifierOptions::Volatile; 1014 break; 1015 default: 1016 IsModifier = false; 1017 break; 1018 } 1019 if (IsModifier) 1020 BaseTy = cast<DIDerivedType>(BaseTy)->getBaseType().resolve(); 1021 } 1022 TypeIndex ModifiedTI = getTypeIndex(BaseTy); 1023 ModifierRecord MR(ModifiedTI, Mods); 1024 return TypeTable.writeModifier(MR); 1025 } 1026 1027 TypeIndex CodeViewDebug::lowerTypeFunction(const DISubroutineType *Ty) { 1028 SmallVector<TypeIndex, 8> ReturnAndArgTypeIndices; 1029 for (DITypeRef ArgTypeRef : Ty->getTypeArray()) 1030 ReturnAndArgTypeIndices.push_back(getTypeIndex(ArgTypeRef)); 1031 1032 TypeIndex ReturnTypeIndex = TypeIndex::Void(); 1033 ArrayRef<TypeIndex> ArgTypeIndices = None; 1034 if (!ReturnAndArgTypeIndices.empty()) { 1035 auto ReturnAndArgTypesRef = makeArrayRef(ReturnAndArgTypeIndices); 1036 ReturnTypeIndex = ReturnAndArgTypesRef.front(); 1037 ArgTypeIndices = ReturnAndArgTypesRef.drop_front(); 1038 } 1039 1040 ArgListRecord ArgListRec(TypeRecordKind::ArgList, ArgTypeIndices); 1041 TypeIndex ArgListIndex = TypeTable.writeArgList(ArgListRec); 1042 1043 CallingConvention CC = dwarfCCToCodeView(Ty->getCC()); 1044 1045 // TODO: Some functions are member functions, we should use a more appropriate 1046 // record for those. 1047 ProcedureRecord Procedure(ReturnTypeIndex, CC, FunctionOptions::None, 1048 ArgTypeIndices.size(), ArgListIndex); 1049 return TypeTable.writeProcedure(Procedure); 1050 } 1051 1052 static MemberAccess translateAccessFlags(unsigned RecordTag, 1053 const DIType *Member) { 1054 switch (Member->getFlags() & DINode::FlagAccessibility) { 1055 case DINode::FlagPrivate: return MemberAccess::Private; 1056 case DINode::FlagPublic: return MemberAccess::Public; 1057 case DINode::FlagProtected: return MemberAccess::Protected; 1058 case 0: 1059 // If there was no explicit access control, provide the default for the tag. 1060 return RecordTag == dwarf::DW_TAG_class_type ? MemberAccess::Private 1061 : MemberAccess::Public; 1062 } 1063 llvm_unreachable("access flags are exclusive"); 1064 } 1065 1066 static TypeRecordKind getRecordKind(const DICompositeType *Ty) { 1067 switch (Ty->getTag()) { 1068 case dwarf::DW_TAG_class_type: return TypeRecordKind::Class; 1069 case dwarf::DW_TAG_structure_type: return TypeRecordKind::Struct; 1070 } 1071 llvm_unreachable("unexpected tag"); 1072 } 1073 1074 /// Return the HasUniqueName option if it should be present in ClassOptions, or 1075 /// None otherwise. 1076 static ClassOptions getRecordUniqueNameOption(const DICompositeType *Ty) { 1077 // MSVC always sets this flag now, even for local types. Clang doesn't always 1078 // appear to give every type a linkage name, which may be problematic for us. 1079 // FIXME: Investigate the consequences of not following them here. 1080 return !Ty->getIdentifier().empty() ? ClassOptions::HasUniqueName 1081 : ClassOptions::None; 1082 } 1083 1084 TypeIndex CodeViewDebug::lowerTypeClass(const DICompositeType *Ty) { 1085 // First, construct the forward decl. Don't look into Ty to compute the 1086 // forward decl options, since it might not be available in all TUs. 1087 TypeRecordKind Kind = getRecordKind(Ty); 1088 ClassOptions CO = 1089 ClassOptions::ForwardReference | getRecordUniqueNameOption(Ty); 1090 TypeIndex FwdDeclTI = TypeTable.writeClass(ClassRecord( 1091 Kind, 0, CO, HfaKind::None, WindowsRTClassKind::None, TypeIndex(), 1092 TypeIndex(), TypeIndex(), 0, Ty->getName(), Ty->getIdentifier())); 1093 return FwdDeclTI; 1094 } 1095 1096 TypeIndex CodeViewDebug::lowerCompleteTypeClass(const DICompositeType *Ty) { 1097 // Construct the field list and complete type record. 1098 TypeRecordKind Kind = getRecordKind(Ty); 1099 // FIXME: Other ClassOptions, like ContainsNestedClass and NestedClass. 1100 ClassOptions CO = ClassOptions::None | getRecordUniqueNameOption(Ty); 1101 TypeIndex FTI; 1102 unsigned FieldCount; 1103 std::tie(FTI, FieldCount) = lowerRecordFieldList(Ty); 1104 1105 uint64_t SizeInBytes = Ty->getSizeInBits() / 8; 1106 return TypeTable.writeClass(ClassRecord(Kind, FieldCount, CO, HfaKind::None, 1107 WindowsRTClassKind::None, FTI, 1108 TypeIndex(), TypeIndex(), SizeInBytes, 1109 Ty->getName(), Ty->getIdentifier())); 1110 // FIXME: Make an LF_UDT_SRC_LINE record. 1111 } 1112 1113 TypeIndex CodeViewDebug::lowerTypeUnion(const DICompositeType *Ty) { 1114 ClassOptions CO = 1115 ClassOptions::ForwardReference | getRecordUniqueNameOption(Ty); 1116 TypeIndex FwdDeclTI = 1117 TypeTable.writeUnion(UnionRecord(0, CO, HfaKind::None, TypeIndex(), 0, 1118 Ty->getName(), Ty->getIdentifier())); 1119 return FwdDeclTI; 1120 } 1121 1122 TypeIndex CodeViewDebug::lowerCompleteTypeUnion(const DICompositeType *Ty) { 1123 ClassOptions CO = ClassOptions::None | getRecordUniqueNameOption(Ty); 1124 TypeIndex FTI; 1125 unsigned FieldCount; 1126 std::tie(FTI, FieldCount) = lowerRecordFieldList(Ty); 1127 uint64_t SizeInBytes = Ty->getSizeInBits() / 8; 1128 return TypeTable.writeUnion(UnionRecord(FieldCount, CO, HfaKind::None, FTI, 1129 SizeInBytes, Ty->getName(), 1130 Ty->getIdentifier())); 1131 // FIXME: Make an LF_UDT_SRC_LINE record. 1132 } 1133 1134 std::pair<TypeIndex, unsigned> 1135 CodeViewDebug::lowerRecordFieldList(const DICompositeType *Ty) { 1136 // Manually count members. MSVC appears to count everything that generates a 1137 // field list record. Each individual overload in a method overload group 1138 // contributes to this count, even though the overload group is a single field 1139 // list record. 1140 unsigned MemberCount = 0; 1141 FieldListRecordBuilder Fields; 1142 for (const DINode *Element : Ty->getElements()) { 1143 // We assume that the frontend provides all members in source declaration 1144 // order, which is what MSVC does. 1145 if (!Element) 1146 continue; 1147 if (auto *SP = dyn_cast<DISubprogram>(Element)) { 1148 // C++ method. 1149 // FIXME: Overloaded methods are grouped together, so we'll need two 1150 // passes to group them. 1151 (void)SP; 1152 } else if (auto *Member = dyn_cast<DIDerivedType>(Element)) { 1153 if (Member->getTag() == dwarf::DW_TAG_member) { 1154 if (Member->isStaticMember()) { 1155 // Static data member. 1156 Fields.writeStaticDataMember(StaticDataMemberRecord( 1157 translateAccessFlags(Ty->getTag(), Member), 1158 getTypeIndex(Member->getBaseType()), Member->getName())); 1159 MemberCount++; 1160 } else { 1161 // Data member. 1162 // FIXME: Make a BitFieldRecord for bitfields. 1163 Fields.writeDataMember(DataMemberRecord( 1164 translateAccessFlags(Ty->getTag(), Member), 1165 getTypeIndex(Member->getBaseType()), 1166 Member->getOffsetInBits() / 8, Member->getName())); 1167 MemberCount++; 1168 } 1169 } else if (Member->getTag() == dwarf::DW_TAG_friend) { 1170 // Ignore friend members. It appears that MSVC emitted info about 1171 // friends in the past, but modern versions do not. 1172 } 1173 // FIXME: Get clang to emit nested types here and do something with 1174 // them. 1175 } 1176 // Skip other unrecognized kinds of elements. 1177 } 1178 return {TypeTable.writeFieldList(Fields), MemberCount}; 1179 } 1180 1181 TypeIndex CodeViewDebug::getTypeIndex(DITypeRef TypeRef) { 1182 const DIType *Ty = TypeRef.resolve(); 1183 1184 // The null DIType is the void type. Don't try to hash it. 1185 if (!Ty) 1186 return TypeIndex::Void(); 1187 1188 // Check if we've already translated this type. Don't try to do a 1189 // get-or-create style insertion that caches the hash lookup across the 1190 // lowerType call. It will update the TypeIndices map. 1191 auto I = TypeIndices.find(Ty); 1192 if (I != TypeIndices.end()) 1193 return I->second; 1194 1195 TypeIndex TI = lowerType(Ty); 1196 1197 recordTypeIndexForDINode(Ty, TI); 1198 return TI; 1199 } 1200 1201 TypeIndex CodeViewDebug::getCompleteTypeIndex(DITypeRef TypeRef) { 1202 const DIType *Ty = TypeRef.resolve(); 1203 1204 // The null DIType is the void type. Don't try to hash it. 1205 if (!Ty) 1206 return TypeIndex::Void(); 1207 1208 // If this is a non-record type, the complete type index is the same as the 1209 // normal type index. Just call getTypeIndex. 1210 switch (Ty->getTag()) { 1211 case dwarf::DW_TAG_class_type: 1212 case dwarf::DW_TAG_structure_type: 1213 case dwarf::DW_TAG_union_type: 1214 break; 1215 default: 1216 return getTypeIndex(Ty); 1217 } 1218 1219 // Check if we've already translated the complete record type. Lowering a 1220 // complete type should never trigger lowering another complete type, so we 1221 // can reuse the hash table lookup result. 1222 const auto *CTy = cast<DICompositeType>(Ty); 1223 auto InsertResult = CompleteTypeIndices.insert({CTy, TypeIndex()}); 1224 if (!InsertResult.second) 1225 return InsertResult.first->second; 1226 1227 // Make sure the forward declaration is emitted first. It's unclear if this 1228 // is necessary, but MSVC does it, and we should follow suit until we can show 1229 // otherwise. 1230 TypeIndex FwdDeclTI = getTypeIndex(CTy); 1231 1232 // Just use the forward decl if we don't have complete type info. This might 1233 // happen if the frontend is using modules and expects the complete definition 1234 // to be emitted elsewhere. 1235 if (CTy->isForwardDecl()) 1236 return FwdDeclTI; 1237 1238 TypeIndex TI; 1239 switch (CTy->getTag()) { 1240 case dwarf::DW_TAG_class_type: 1241 case dwarf::DW_TAG_structure_type: 1242 TI = lowerCompleteTypeClass(CTy); 1243 break; 1244 case dwarf::DW_TAG_union_type: 1245 TI = lowerCompleteTypeUnion(CTy); 1246 break; 1247 default: 1248 llvm_unreachable("not a record"); 1249 } 1250 1251 InsertResult.first->second = TI; 1252 return TI; 1253 } 1254 1255 void CodeViewDebug::emitLocalVariable(const LocalVariable &Var) { 1256 // LocalSym record, see SymbolRecord.h for more info. 1257 MCSymbol *LocalBegin = MMI->getContext().createTempSymbol(), 1258 *LocalEnd = MMI->getContext().createTempSymbol(); 1259 OS.AddComment("Record length"); 1260 OS.emitAbsoluteSymbolDiff(LocalEnd, LocalBegin, 2); 1261 OS.EmitLabel(LocalBegin); 1262 1263 OS.AddComment("Record kind: S_LOCAL"); 1264 OS.EmitIntValue(unsigned(SymbolKind::S_LOCAL), 2); 1265 1266 LocalSymFlags Flags = LocalSymFlags::None; 1267 if (Var.DIVar->isParameter()) 1268 Flags |= LocalSymFlags::IsParameter; 1269 if (Var.DefRanges.empty()) 1270 Flags |= LocalSymFlags::IsOptimizedOut; 1271 1272 OS.AddComment("TypeIndex"); 1273 TypeIndex TI = getCompleteTypeIndex(Var.DIVar->getType()); 1274 OS.EmitIntValue(TI.getIndex(), 4); 1275 OS.AddComment("Flags"); 1276 OS.EmitIntValue(static_cast<uint16_t>(Flags), 2); 1277 // Truncate the name so we won't overflow the record length field. 1278 emitNullTerminatedSymbolName(OS, Var.DIVar->getName()); 1279 OS.EmitLabel(LocalEnd); 1280 1281 // Calculate the on disk prefix of the appropriate def range record. The 1282 // records and on disk formats are described in SymbolRecords.h. BytePrefix 1283 // should be big enough to hold all forms without memory allocation. 1284 SmallString<20> BytePrefix; 1285 for (const LocalVarDefRange &DefRange : Var.DefRanges) { 1286 BytePrefix.clear(); 1287 // FIXME: Handle bitpieces. 1288 if (DefRange.StructOffset != 0) 1289 continue; 1290 1291 if (DefRange.InMemory) { 1292 DefRangeRegisterRelSym Sym(DefRange.CVRegister, 0, DefRange.DataOffset, 0, 1293 0, 0, ArrayRef<LocalVariableAddrGap>()); 1294 ulittle16_t SymKind = ulittle16_t(S_DEFRANGE_REGISTER_REL); 1295 BytePrefix += 1296 StringRef(reinterpret_cast<const char *>(&SymKind), sizeof(SymKind)); 1297 BytePrefix += 1298 StringRef(reinterpret_cast<const char *>(&Sym.Header), 1299 sizeof(Sym.Header) - sizeof(LocalVariableAddrRange)); 1300 } else { 1301 assert(DefRange.DataOffset == 0 && "unexpected offset into register"); 1302 // Unclear what matters here. 1303 DefRangeRegisterSym Sym(DefRange.CVRegister, 0, 0, 0, 0, 1304 ArrayRef<LocalVariableAddrGap>()); 1305 ulittle16_t SymKind = ulittle16_t(S_DEFRANGE_REGISTER); 1306 BytePrefix += 1307 StringRef(reinterpret_cast<const char *>(&SymKind), sizeof(SymKind)); 1308 BytePrefix += 1309 StringRef(reinterpret_cast<const char *>(&Sym.Header), 1310 sizeof(Sym.Header) - sizeof(LocalVariableAddrRange)); 1311 } 1312 OS.EmitCVDefRangeDirective(DefRange.Ranges, BytePrefix); 1313 } 1314 } 1315 1316 void CodeViewDebug::endFunction(const MachineFunction *MF) { 1317 if (!Asm || !CurFn) // We haven't created any debug info for this function. 1318 return; 1319 1320 const Function *GV = MF->getFunction(); 1321 assert(FnDebugInfo.count(GV)); 1322 assert(CurFn == &FnDebugInfo[GV]); 1323 1324 collectVariableInfo(GV->getSubprogram()); 1325 1326 DebugHandlerBase::endFunction(MF); 1327 1328 // Don't emit anything if we don't have any line tables. 1329 if (!CurFn->HaveLineInfo) { 1330 FnDebugInfo.erase(GV); 1331 CurFn = nullptr; 1332 return; 1333 } 1334 1335 CurFn->End = Asm->getFunctionEnd(); 1336 1337 CurFn = nullptr; 1338 } 1339 1340 void CodeViewDebug::beginInstruction(const MachineInstr *MI) { 1341 DebugHandlerBase::beginInstruction(MI); 1342 1343 // Ignore DBG_VALUE locations and function prologue. 1344 if (!Asm || MI->isDebugValue() || MI->getFlag(MachineInstr::FrameSetup)) 1345 return; 1346 DebugLoc DL = MI->getDebugLoc(); 1347 if (DL == PrevInstLoc || !DL) 1348 return; 1349 maybeRecordLocation(DL, Asm->MF); 1350 } 1351 1352 MCSymbol *CodeViewDebug::beginCVSubsection(ModuleSubstreamKind Kind) { 1353 MCSymbol *BeginLabel = MMI->getContext().createTempSymbol(), 1354 *EndLabel = MMI->getContext().createTempSymbol(); 1355 OS.EmitIntValue(unsigned(Kind), 4); 1356 OS.AddComment("Subsection size"); 1357 OS.emitAbsoluteSymbolDiff(EndLabel, BeginLabel, 4); 1358 OS.EmitLabel(BeginLabel); 1359 return EndLabel; 1360 } 1361 1362 void CodeViewDebug::endCVSubsection(MCSymbol *EndLabel) { 1363 OS.EmitLabel(EndLabel); 1364 // Every subsection must be aligned to a 4-byte boundary. 1365 OS.EmitValueToAlignment(4); 1366 } 1367 1368 void CodeViewDebug::emitDebugInfoForUDTs( 1369 ArrayRef<std::pair<std::string, TypeIndex>> UDTs) { 1370 for (const std::pair<std::string, codeview::TypeIndex> &UDT : UDTs) { 1371 MCSymbol *UDTRecordBegin = MMI->getContext().createTempSymbol(), 1372 *UDTRecordEnd = MMI->getContext().createTempSymbol(); 1373 OS.AddComment("Record length"); 1374 OS.emitAbsoluteSymbolDiff(UDTRecordEnd, UDTRecordBegin, 2); 1375 OS.EmitLabel(UDTRecordBegin); 1376 1377 OS.AddComment("Record kind: S_UDT"); 1378 OS.EmitIntValue(unsigned(SymbolKind::S_UDT), 2); 1379 1380 OS.AddComment("Type"); 1381 OS.EmitIntValue(UDT.second.getIndex(), 4); 1382 1383 emitNullTerminatedSymbolName(OS, UDT.first); 1384 OS.EmitLabel(UDTRecordEnd); 1385 } 1386 } 1387 1388 void CodeViewDebug::emitDebugInfoForGlobals() { 1389 NamedMDNode *CUs = MMI->getModule()->getNamedMetadata("llvm.dbg.cu"); 1390 for (const MDNode *Node : CUs->operands()) { 1391 const auto *CU = cast<DICompileUnit>(Node); 1392 1393 // First, emit all globals that are not in a comdat in a single symbol 1394 // substream. MSVC doesn't like it if the substream is empty, so only open 1395 // it if we have at least one global to emit. 1396 switchToDebugSectionForSymbol(nullptr); 1397 MCSymbol *EndLabel = nullptr; 1398 for (const DIGlobalVariable *G : CU->getGlobalVariables()) { 1399 if (const auto *GV = dyn_cast_or_null<GlobalVariable>(G->getVariable())) { 1400 if (!GV->hasComdat() && !GV->isDeclarationForLinker()) { 1401 if (!EndLabel) { 1402 OS.AddComment("Symbol subsection for globals"); 1403 EndLabel = beginCVSubsection(ModuleSubstreamKind::Symbols); 1404 } 1405 emitDebugInfoForGlobal(G, Asm->getSymbol(GV)); 1406 } 1407 } 1408 } 1409 if (EndLabel) 1410 endCVSubsection(EndLabel); 1411 1412 // Second, emit each global that is in a comdat into its own .debug$S 1413 // section along with its own symbol substream. 1414 for (const DIGlobalVariable *G : CU->getGlobalVariables()) { 1415 if (const auto *GV = dyn_cast_or_null<GlobalVariable>(G->getVariable())) { 1416 if (GV->hasComdat()) { 1417 MCSymbol *GVSym = Asm->getSymbol(GV); 1418 OS.AddComment("Symbol subsection for " + 1419 Twine(GlobalValue::getRealLinkageName(GV->getName()))); 1420 switchToDebugSectionForSymbol(GVSym); 1421 EndLabel = beginCVSubsection(ModuleSubstreamKind::Symbols); 1422 emitDebugInfoForGlobal(G, GVSym); 1423 endCVSubsection(EndLabel); 1424 } 1425 } 1426 } 1427 } 1428 } 1429 1430 void CodeViewDebug::emitDebugInfoForGlobal(const DIGlobalVariable *DIGV, 1431 MCSymbol *GVSym) { 1432 // DataSym record, see SymbolRecord.h for more info. 1433 // FIXME: Thread local data, etc 1434 MCSymbol *DataBegin = MMI->getContext().createTempSymbol(), 1435 *DataEnd = MMI->getContext().createTempSymbol(); 1436 OS.AddComment("Record length"); 1437 OS.emitAbsoluteSymbolDiff(DataEnd, DataBegin, 2); 1438 OS.EmitLabel(DataBegin); 1439 OS.AddComment("Record kind: S_GDATA32"); 1440 OS.EmitIntValue(unsigned(SymbolKind::S_GDATA32), 2); 1441 OS.AddComment("Type"); 1442 OS.EmitIntValue(getCompleteTypeIndex(DIGV->getType()).getIndex(), 4); 1443 OS.AddComment("DataOffset"); 1444 OS.EmitCOFFSecRel32(GVSym); 1445 OS.AddComment("Segment"); 1446 OS.EmitCOFFSectionIndex(GVSym); 1447 OS.AddComment("Name"); 1448 emitNullTerminatedSymbolName(OS, DIGV->getName()); 1449 OS.EmitLabel(DataEnd); 1450 } 1451