1 //===-- llvm/lib/CodeGen/AsmPrinter/CodeViewDebug.cpp --*- C++ -*--===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file contains support for writing Microsoft CodeView debug info. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "CodeViewDebug.h" 15 #include "llvm/DebugInfo/CodeView/CodeView.h" 16 #include "llvm/DebugInfo/CodeView/Line.h" 17 #include "llvm/DebugInfo/CodeView/SymbolRecord.h" 18 #include "llvm/DebugInfo/CodeView/TypeDumper.h" 19 #include "llvm/DebugInfo/CodeView/TypeIndex.h" 20 #include "llvm/DebugInfo/CodeView/TypeRecord.h" 21 #include "llvm/MC/MCExpr.h" 22 #include "llvm/MC/MCSectionCOFF.h" 23 #include "llvm/MC/MCSymbol.h" 24 #include "llvm/Support/COFF.h" 25 #include "llvm/Support/ScopedPrinter.h" 26 #include "llvm/Target/TargetSubtargetInfo.h" 27 #include "llvm/Target/TargetRegisterInfo.h" 28 #include "llvm/Target/TargetFrameLowering.h" 29 30 using namespace llvm; 31 using namespace llvm::codeview; 32 33 CodeViewDebug::CodeViewDebug(AsmPrinter *AP) 34 : DebugHandlerBase(AP), OS(*Asm->OutStreamer), CurFn(nullptr) { 35 // If module doesn't have named metadata anchors or COFF debug section 36 // is not available, skip any debug info related stuff. 37 if (!MMI->getModule()->getNamedMetadata("llvm.dbg.cu") || 38 !AP->getObjFileLowering().getCOFFDebugSymbolsSection()) { 39 Asm = nullptr; 40 return; 41 } 42 43 // Tell MMI that we have debug info. 44 MMI->setDebugInfoAvailability(true); 45 } 46 47 StringRef CodeViewDebug::getFullFilepath(const DIFile *File) { 48 std::string &Filepath = FileToFilepathMap[File]; 49 if (!Filepath.empty()) 50 return Filepath; 51 52 StringRef Dir = File->getDirectory(), Filename = File->getFilename(); 53 54 // Clang emits directory and relative filename info into the IR, but CodeView 55 // operates on full paths. We could change Clang to emit full paths too, but 56 // that would increase the IR size and probably not needed for other users. 57 // For now, just concatenate and canonicalize the path here. 58 if (Filename.find(':') == 1) 59 Filepath = Filename; 60 else 61 Filepath = (Dir + "\\" + Filename).str(); 62 63 // Canonicalize the path. We have to do it textually because we may no longer 64 // have access the file in the filesystem. 65 // First, replace all slashes with backslashes. 66 std::replace(Filepath.begin(), Filepath.end(), '/', '\\'); 67 68 // Remove all "\.\" with "\". 69 size_t Cursor = 0; 70 while ((Cursor = Filepath.find("\\.\\", Cursor)) != std::string::npos) 71 Filepath.erase(Cursor, 2); 72 73 // Replace all "\XXX\..\" with "\". Don't try too hard though as the original 74 // path should be well-formatted, e.g. start with a drive letter, etc. 75 Cursor = 0; 76 while ((Cursor = Filepath.find("\\..\\", Cursor)) != std::string::npos) { 77 // Something's wrong if the path starts with "\..\", abort. 78 if (Cursor == 0) 79 break; 80 81 size_t PrevSlash = Filepath.rfind('\\', Cursor - 1); 82 if (PrevSlash == std::string::npos) 83 // Something's wrong, abort. 84 break; 85 86 Filepath.erase(PrevSlash, Cursor + 3 - PrevSlash); 87 // The next ".." might be following the one we've just erased. 88 Cursor = PrevSlash; 89 } 90 91 // Remove all duplicate backslashes. 92 Cursor = 0; 93 while ((Cursor = Filepath.find("\\\\", Cursor)) != std::string::npos) 94 Filepath.erase(Cursor, 1); 95 96 return Filepath; 97 } 98 99 unsigned CodeViewDebug::maybeRecordFile(const DIFile *F) { 100 unsigned NextId = FileIdMap.size() + 1; 101 auto Insertion = FileIdMap.insert(std::make_pair(F, NextId)); 102 if (Insertion.second) { 103 // We have to compute the full filepath and emit a .cv_file directive. 104 StringRef FullPath = getFullFilepath(F); 105 NextId = OS.EmitCVFileDirective(NextId, FullPath); 106 assert(NextId == FileIdMap.size() && ".cv_file directive failed"); 107 } 108 return Insertion.first->second; 109 } 110 111 CodeViewDebug::InlineSite & 112 CodeViewDebug::getInlineSite(const DILocation *InlinedAt, 113 const DISubprogram *Inlinee) { 114 auto SiteInsertion = CurFn->InlineSites.insert({InlinedAt, InlineSite()}); 115 InlineSite *Site = &SiteInsertion.first->second; 116 if (SiteInsertion.second) { 117 Site->SiteFuncId = NextFuncId++; 118 Site->Inlinee = Inlinee; 119 InlinedSubprograms.insert(Inlinee); 120 getFuncIdForSubprogram(Inlinee); 121 } 122 return *Site; 123 } 124 125 TypeIndex CodeViewDebug::getFuncIdForSubprogram(const DISubprogram *SP) { 126 // It's possible to ask for the FuncId of a function which doesn't have a 127 // subprogram: inlining a function with debug info into a function with none. 128 if (!SP) 129 return TypeIndex::Void(); 130 131 // Check if we've already translated this subprogram. 132 auto I = TypeIndices.find(SP); 133 if (I != TypeIndices.end()) 134 return I->second; 135 136 TypeIndex ParentScope = TypeIndex(0); 137 StringRef DisplayName = SP->getDisplayName(); 138 FuncIdRecord FuncId(ParentScope, getTypeIndex(SP->getType()), DisplayName); 139 TypeIndex TI = TypeTable.writeFuncId(FuncId); 140 141 auto InsertResult = TypeIndices.insert({SP, TI}); 142 (void)InsertResult; 143 assert(InsertResult.second && "DISubprogram lowered twice"); 144 return TI; 145 } 146 147 void CodeViewDebug::recordLocalVariable(LocalVariable &&Var, 148 const DILocation *InlinedAt) { 149 if (InlinedAt) { 150 // This variable was inlined. Associate it with the InlineSite. 151 const DISubprogram *Inlinee = Var.DIVar->getScope()->getSubprogram(); 152 InlineSite &Site = getInlineSite(InlinedAt, Inlinee); 153 Site.InlinedLocals.emplace_back(Var); 154 } else { 155 // This variable goes in the main ProcSym. 156 CurFn->Locals.emplace_back(Var); 157 } 158 } 159 160 static void addLocIfNotPresent(SmallVectorImpl<const DILocation *> &Locs, 161 const DILocation *Loc) { 162 auto B = Locs.begin(), E = Locs.end(); 163 if (std::find(B, E, Loc) == E) 164 Locs.push_back(Loc); 165 } 166 167 void CodeViewDebug::maybeRecordLocation(DebugLoc DL, 168 const MachineFunction *MF) { 169 // Skip this instruction if it has the same location as the previous one. 170 if (DL == CurFn->LastLoc) 171 return; 172 173 const DIScope *Scope = DL.get()->getScope(); 174 if (!Scope) 175 return; 176 177 // Skip this line if it is longer than the maximum we can record. 178 LineInfo LI(DL.getLine(), DL.getLine(), /*IsStatement=*/true); 179 if (LI.getStartLine() != DL.getLine() || LI.isAlwaysStepInto() || 180 LI.isNeverStepInto()) 181 return; 182 183 ColumnInfo CI(DL.getCol(), /*EndColumn=*/0); 184 if (CI.getStartColumn() != DL.getCol()) 185 return; 186 187 if (!CurFn->HaveLineInfo) 188 CurFn->HaveLineInfo = true; 189 unsigned FileId = 0; 190 if (CurFn->LastLoc.get() && CurFn->LastLoc->getFile() == DL->getFile()) 191 FileId = CurFn->LastFileId; 192 else 193 FileId = CurFn->LastFileId = maybeRecordFile(DL->getFile()); 194 CurFn->LastLoc = DL; 195 196 unsigned FuncId = CurFn->FuncId; 197 if (const DILocation *SiteLoc = DL->getInlinedAt()) { 198 const DILocation *Loc = DL.get(); 199 200 // If this location was actually inlined from somewhere else, give it the ID 201 // of the inline call site. 202 FuncId = 203 getInlineSite(SiteLoc, Loc->getScope()->getSubprogram()).SiteFuncId; 204 205 // Ensure we have links in the tree of inline call sites. 206 bool FirstLoc = true; 207 while ((SiteLoc = Loc->getInlinedAt())) { 208 InlineSite &Site = 209 getInlineSite(SiteLoc, Loc->getScope()->getSubprogram()); 210 if (!FirstLoc) 211 addLocIfNotPresent(Site.ChildSites, Loc); 212 FirstLoc = false; 213 Loc = SiteLoc; 214 } 215 addLocIfNotPresent(CurFn->ChildSites, Loc); 216 } 217 218 OS.EmitCVLocDirective(FuncId, FileId, DL.getLine(), DL.getCol(), 219 /*PrologueEnd=*/false, 220 /*IsStmt=*/false, DL->getFilename()); 221 } 222 223 void CodeViewDebug::emitCodeViewMagicVersion() { 224 OS.EmitValueToAlignment(4); 225 OS.AddComment("Debug section magic"); 226 OS.EmitIntValue(COFF::DEBUG_SECTION_MAGIC, 4); 227 } 228 229 void CodeViewDebug::endModule() { 230 if (FnDebugInfo.empty()) 231 return; 232 233 assert(Asm != nullptr); 234 235 // The COFF .debug$S section consists of several subsections, each starting 236 // with a 4-byte control code (e.g. 0xF1, 0xF2, etc) and then a 4-byte length 237 // of the payload followed by the payload itself. The subsections are 4-byte 238 // aligned. 239 240 // Make a subsection for all the inlined subprograms. 241 emitInlineeLinesSubsection(); 242 243 // Emit per-function debug information. 244 for (auto &P : FnDebugInfo) 245 emitDebugInfoForFunction(P.first, P.second); 246 247 // Switch back to the generic .debug$S section after potentially processing 248 // comdat symbol sections. 249 switchToDebugSectionForSymbol(nullptr); 250 251 // This subsection holds a file index to offset in string table table. 252 OS.AddComment("File index to string table offset subsection"); 253 OS.EmitCVFileChecksumsDirective(); 254 255 // This subsection holds the string table. 256 OS.AddComment("String table"); 257 OS.EmitCVStringTableDirective(); 258 259 // Emit type information last, so that any types we translate while emitting 260 // function info are included. 261 emitTypeInformation(); 262 263 clear(); 264 } 265 266 static void emitNullTerminatedSymbolName(MCStreamer &OS, StringRef S) { 267 // Microsoft's linker seems to have trouble with symbol names longer than 268 // 0xffd8 bytes. 269 S = S.substr(0, 0xffd8); 270 SmallString<32> NullTerminatedString(S); 271 NullTerminatedString.push_back('\0'); 272 OS.EmitBytes(NullTerminatedString); 273 } 274 275 void CodeViewDebug::emitTypeInformation() { 276 // Do nothing if we have no debug info or if no non-trivial types were emitted 277 // to TypeTable during codegen. 278 NamedMDNode *CU_Nodes = 279 MMI->getModule()->getNamedMetadata("llvm.dbg.cu"); 280 if (!CU_Nodes) 281 return; 282 if (TypeTable.empty()) 283 return; 284 285 // Start the .debug$T section with 0x4. 286 OS.SwitchSection(Asm->getObjFileLowering().getCOFFDebugTypesSection()); 287 emitCodeViewMagicVersion(); 288 289 SmallString<8> CommentPrefix; 290 if (OS.isVerboseAsm()) { 291 CommentPrefix += '\t'; 292 CommentPrefix += Asm->MAI->getCommentString(); 293 CommentPrefix += ' '; 294 } 295 296 CVTypeDumper CVTD(nullptr, /*PrintRecordBytes=*/false); 297 TypeTable.ForEachRecord( 298 [&](TypeIndex Index, StringRef Record) { 299 if (OS.isVerboseAsm()) { 300 // Emit a block comment describing the type record for readability. 301 SmallString<512> CommentBlock; 302 raw_svector_ostream CommentOS(CommentBlock); 303 ScopedPrinter SP(CommentOS); 304 SP.setPrefix(CommentPrefix); 305 CVTD.setPrinter(&SP); 306 bool DumpSuccess = 307 CVTD.dump({Record.bytes_begin(), Record.bytes_end()}); 308 (void)DumpSuccess; 309 assert(DumpSuccess && "produced malformed type record"); 310 // emitRawComment will insert its own tab and comment string before 311 // the first line, so strip off our first one. It also prints its own 312 // newline. 313 OS.emitRawComment( 314 CommentOS.str().drop_front(CommentPrefix.size() - 1).rtrim()); 315 } 316 OS.EmitBinaryData(Record); 317 }); 318 } 319 320 void CodeViewDebug::emitInlineeLinesSubsection() { 321 if (InlinedSubprograms.empty()) 322 return; 323 324 // Use the generic .debug$S section. 325 switchToDebugSectionForSymbol(nullptr); 326 327 MCSymbol *InlineBegin = MMI->getContext().createTempSymbol(), 328 *InlineEnd = MMI->getContext().createTempSymbol(); 329 330 OS.AddComment("Inlinee lines subsection"); 331 OS.EmitIntValue(unsigned(ModuleSubstreamKind::InlineeLines), 4); 332 OS.AddComment("Subsection size"); 333 OS.emitAbsoluteSymbolDiff(InlineEnd, InlineBegin, 4); 334 OS.EmitLabel(InlineBegin); 335 336 // We don't provide any extra file info. 337 // FIXME: Find out if debuggers use this info. 338 OS.AddComment("Inlinee lines signature"); 339 OS.EmitIntValue(unsigned(InlineeLinesSignature::Normal), 4); 340 341 for (const DISubprogram *SP : InlinedSubprograms) { 342 assert(TypeIndices.count(SP)); 343 TypeIndex InlineeIdx = TypeIndices[SP]; 344 345 OS.AddBlankLine(); 346 unsigned FileId = maybeRecordFile(SP->getFile()); 347 OS.AddComment("Inlined function " + SP->getDisplayName() + " starts at " + 348 SP->getFilename() + Twine(':') + Twine(SP->getLine())); 349 OS.AddBlankLine(); 350 // The filechecksum table uses 8 byte entries for now, and file ids start at 351 // 1. 352 unsigned FileOffset = (FileId - 1) * 8; 353 OS.AddComment("Type index of inlined function"); 354 OS.EmitIntValue(InlineeIdx.getIndex(), 4); 355 OS.AddComment("Offset into filechecksum table"); 356 OS.EmitIntValue(FileOffset, 4); 357 OS.AddComment("Starting line number"); 358 OS.EmitIntValue(SP->getLine(), 4); 359 } 360 361 OS.EmitLabel(InlineEnd); 362 } 363 364 void CodeViewDebug::collectInlineSiteChildren( 365 SmallVectorImpl<unsigned> &Children, const FunctionInfo &FI, 366 const InlineSite &Site) { 367 for (const DILocation *ChildSiteLoc : Site.ChildSites) { 368 auto I = FI.InlineSites.find(ChildSiteLoc); 369 const InlineSite &ChildSite = I->second; 370 Children.push_back(ChildSite.SiteFuncId); 371 collectInlineSiteChildren(Children, FI, ChildSite); 372 } 373 } 374 375 void CodeViewDebug::emitInlinedCallSite(const FunctionInfo &FI, 376 const DILocation *InlinedAt, 377 const InlineSite &Site) { 378 MCSymbol *InlineBegin = MMI->getContext().createTempSymbol(), 379 *InlineEnd = MMI->getContext().createTempSymbol(); 380 381 assert(TypeIndices.count(Site.Inlinee)); 382 TypeIndex InlineeIdx = TypeIndices[Site.Inlinee]; 383 384 // SymbolRecord 385 OS.AddComment("Record length"); 386 OS.emitAbsoluteSymbolDiff(InlineEnd, InlineBegin, 2); // RecordLength 387 OS.EmitLabel(InlineBegin); 388 OS.AddComment("Record kind: S_INLINESITE"); 389 OS.EmitIntValue(SymbolKind::S_INLINESITE, 2); // RecordKind 390 391 OS.AddComment("PtrParent"); 392 OS.EmitIntValue(0, 4); 393 OS.AddComment("PtrEnd"); 394 OS.EmitIntValue(0, 4); 395 OS.AddComment("Inlinee type index"); 396 OS.EmitIntValue(InlineeIdx.getIndex(), 4); 397 398 unsigned FileId = maybeRecordFile(Site.Inlinee->getFile()); 399 unsigned StartLineNum = Site.Inlinee->getLine(); 400 SmallVector<unsigned, 3> SecondaryFuncIds; 401 collectInlineSiteChildren(SecondaryFuncIds, FI, Site); 402 403 OS.EmitCVInlineLinetableDirective(Site.SiteFuncId, FileId, StartLineNum, 404 FI.Begin, FI.End, SecondaryFuncIds); 405 406 OS.EmitLabel(InlineEnd); 407 408 for (const LocalVariable &Var : Site.InlinedLocals) 409 emitLocalVariable(Var); 410 411 // Recurse on child inlined call sites before closing the scope. 412 for (const DILocation *ChildSite : Site.ChildSites) { 413 auto I = FI.InlineSites.find(ChildSite); 414 assert(I != FI.InlineSites.end() && 415 "child site not in function inline site map"); 416 emitInlinedCallSite(FI, ChildSite, I->second); 417 } 418 419 // Close the scope. 420 OS.AddComment("Record length"); 421 OS.EmitIntValue(2, 2); // RecordLength 422 OS.AddComment("Record kind: S_INLINESITE_END"); 423 OS.EmitIntValue(SymbolKind::S_INLINESITE_END, 2); // RecordKind 424 } 425 426 void CodeViewDebug::switchToDebugSectionForSymbol(const MCSymbol *GVSym) { 427 // If we have a symbol, it may be in a section that is COMDAT. If so, find the 428 // comdat key. A section may be comdat because of -ffunction-sections or 429 // because it is comdat in the IR. 430 MCSectionCOFF *GVSec = 431 GVSym ? dyn_cast<MCSectionCOFF>(&GVSym->getSection()) : nullptr; 432 const MCSymbol *KeySym = GVSec ? GVSec->getCOMDATSymbol() : nullptr; 433 434 MCSectionCOFF *DebugSec = cast<MCSectionCOFF>( 435 Asm->getObjFileLowering().getCOFFDebugSymbolsSection()); 436 DebugSec = OS.getContext().getAssociativeCOFFSection(DebugSec, KeySym); 437 438 OS.SwitchSection(DebugSec); 439 440 // Emit the magic version number if this is the first time we've switched to 441 // this section. 442 if (ComdatDebugSections.insert(DebugSec).second) 443 emitCodeViewMagicVersion(); 444 } 445 446 void CodeViewDebug::emitDebugInfoForFunction(const Function *GV, 447 FunctionInfo &FI) { 448 // For each function there is a separate subsection 449 // which holds the PC to file:line table. 450 const MCSymbol *Fn = Asm->getSymbol(GV); 451 assert(Fn); 452 453 // Switch to the to a comdat section, if appropriate. 454 switchToDebugSectionForSymbol(Fn); 455 456 StringRef FuncName; 457 if (auto *SP = GV->getSubprogram()) 458 FuncName = SP->getDisplayName(); 459 460 // If our DISubprogram name is empty, use the mangled name. 461 if (FuncName.empty()) 462 FuncName = GlobalValue::getRealLinkageName(GV->getName()); 463 464 // Emit a symbol subsection, required by VS2012+ to find function boundaries. 465 MCSymbol *SymbolsBegin = MMI->getContext().createTempSymbol(), 466 *SymbolsEnd = MMI->getContext().createTempSymbol(); 467 OS.AddComment("Symbol subsection for " + Twine(FuncName)); 468 OS.EmitIntValue(unsigned(ModuleSubstreamKind::Symbols), 4); 469 OS.AddComment("Subsection size"); 470 OS.emitAbsoluteSymbolDiff(SymbolsEnd, SymbolsBegin, 4); 471 OS.EmitLabel(SymbolsBegin); 472 { 473 MCSymbol *ProcRecordBegin = MMI->getContext().createTempSymbol(), 474 *ProcRecordEnd = MMI->getContext().createTempSymbol(); 475 OS.AddComment("Record length"); 476 OS.emitAbsoluteSymbolDiff(ProcRecordEnd, ProcRecordBegin, 2); 477 OS.EmitLabel(ProcRecordBegin); 478 479 OS.AddComment("Record kind: S_GPROC32_ID"); 480 OS.EmitIntValue(unsigned(SymbolKind::S_GPROC32_ID), 2); 481 482 // These fields are filled in by tools like CVPACK which run after the fact. 483 OS.AddComment("PtrParent"); 484 OS.EmitIntValue(0, 4); 485 OS.AddComment("PtrEnd"); 486 OS.EmitIntValue(0, 4); 487 OS.AddComment("PtrNext"); 488 OS.EmitIntValue(0, 4); 489 // This is the important bit that tells the debugger where the function 490 // code is located and what's its size: 491 OS.AddComment("Code size"); 492 OS.emitAbsoluteSymbolDiff(FI.End, Fn, 4); 493 OS.AddComment("Offset after prologue"); 494 OS.EmitIntValue(0, 4); 495 OS.AddComment("Offset before epilogue"); 496 OS.EmitIntValue(0, 4); 497 OS.AddComment("Function type index"); 498 OS.EmitIntValue(getFuncIdForSubprogram(GV->getSubprogram()).getIndex(), 4); 499 OS.AddComment("Function section relative address"); 500 OS.EmitCOFFSecRel32(Fn); 501 OS.AddComment("Function section index"); 502 OS.EmitCOFFSectionIndex(Fn); 503 OS.AddComment("Flags"); 504 OS.EmitIntValue(0, 1); 505 // Emit the function display name as a null-terminated string. 506 OS.AddComment("Function name"); 507 // Truncate the name so we won't overflow the record length field. 508 emitNullTerminatedSymbolName(OS, FuncName); 509 OS.EmitLabel(ProcRecordEnd); 510 511 for (const LocalVariable &Var : FI.Locals) 512 emitLocalVariable(Var); 513 514 // Emit inlined call site information. Only emit functions inlined directly 515 // into the parent function. We'll emit the other sites recursively as part 516 // of their parent inline site. 517 for (const DILocation *InlinedAt : FI.ChildSites) { 518 auto I = FI.InlineSites.find(InlinedAt); 519 assert(I != FI.InlineSites.end() && 520 "child site not in function inline site map"); 521 emitInlinedCallSite(FI, InlinedAt, I->second); 522 } 523 524 // We're done with this function. 525 OS.AddComment("Record length"); 526 OS.EmitIntValue(0x0002, 2); 527 OS.AddComment("Record kind: S_PROC_ID_END"); 528 OS.EmitIntValue(unsigned(SymbolKind::S_PROC_ID_END), 2); 529 } 530 OS.EmitLabel(SymbolsEnd); 531 // Every subsection must be aligned to a 4-byte boundary. 532 OS.EmitValueToAlignment(4); 533 534 // We have an assembler directive that takes care of the whole line table. 535 OS.EmitCVLinetableDirective(FI.FuncId, Fn, FI.End); 536 } 537 538 CodeViewDebug::LocalVarDefRange 539 CodeViewDebug::createDefRangeMem(uint16_t CVRegister, int Offset) { 540 LocalVarDefRange DR; 541 DR.InMemory = -1; 542 DR.DataOffset = Offset; 543 assert(DR.DataOffset == Offset && "truncation"); 544 DR.StructOffset = 0; 545 DR.CVRegister = CVRegister; 546 return DR; 547 } 548 549 CodeViewDebug::LocalVarDefRange 550 CodeViewDebug::createDefRangeReg(uint16_t CVRegister) { 551 LocalVarDefRange DR; 552 DR.InMemory = 0; 553 DR.DataOffset = 0; 554 DR.StructOffset = 0; 555 DR.CVRegister = CVRegister; 556 return DR; 557 } 558 559 void CodeViewDebug::collectVariableInfoFromMMITable( 560 DenseSet<InlinedVariable> &Processed) { 561 const TargetSubtargetInfo &TSI = Asm->MF->getSubtarget(); 562 const TargetFrameLowering *TFI = TSI.getFrameLowering(); 563 const TargetRegisterInfo *TRI = TSI.getRegisterInfo(); 564 565 for (const MachineModuleInfo::VariableDbgInfo &VI : 566 MMI->getVariableDbgInfo()) { 567 if (!VI.Var) 568 continue; 569 assert(VI.Var->isValidLocationForIntrinsic(VI.Loc) && 570 "Expected inlined-at fields to agree"); 571 572 Processed.insert(InlinedVariable(VI.Var, VI.Loc->getInlinedAt())); 573 LexicalScope *Scope = LScopes.findLexicalScope(VI.Loc); 574 575 // If variable scope is not found then skip this variable. 576 if (!Scope) 577 continue; 578 579 // Get the frame register used and the offset. 580 unsigned FrameReg = 0; 581 int FrameOffset = TFI->getFrameIndexReference(*Asm->MF, VI.Slot, FrameReg); 582 uint16_t CVReg = TRI->getCodeViewRegNum(FrameReg); 583 584 // Calculate the label ranges. 585 LocalVarDefRange DefRange = createDefRangeMem(CVReg, FrameOffset); 586 for (const InsnRange &Range : Scope->getRanges()) { 587 const MCSymbol *Begin = getLabelBeforeInsn(Range.first); 588 const MCSymbol *End = getLabelAfterInsn(Range.second); 589 End = End ? End : Asm->getFunctionEnd(); 590 DefRange.Ranges.emplace_back(Begin, End); 591 } 592 593 LocalVariable Var; 594 Var.DIVar = VI.Var; 595 Var.DefRanges.emplace_back(std::move(DefRange)); 596 recordLocalVariable(std::move(Var), VI.Loc->getInlinedAt()); 597 } 598 } 599 600 void CodeViewDebug::collectVariableInfo(const DISubprogram *SP) { 601 DenseSet<InlinedVariable> Processed; 602 // Grab the variable info that was squirreled away in the MMI side-table. 603 collectVariableInfoFromMMITable(Processed); 604 605 const TargetRegisterInfo *TRI = Asm->MF->getSubtarget().getRegisterInfo(); 606 607 for (const auto &I : DbgValues) { 608 InlinedVariable IV = I.first; 609 if (Processed.count(IV)) 610 continue; 611 const DILocalVariable *DIVar = IV.first; 612 const DILocation *InlinedAt = IV.second; 613 614 // Instruction ranges, specifying where IV is accessible. 615 const auto &Ranges = I.second; 616 617 LexicalScope *Scope = nullptr; 618 if (InlinedAt) 619 Scope = LScopes.findInlinedScope(DIVar->getScope(), InlinedAt); 620 else 621 Scope = LScopes.findLexicalScope(DIVar->getScope()); 622 // If variable scope is not found then skip this variable. 623 if (!Scope) 624 continue; 625 626 LocalVariable Var; 627 Var.DIVar = DIVar; 628 629 // Calculate the definition ranges. 630 for (auto I = Ranges.begin(), E = Ranges.end(); I != E; ++I) { 631 const InsnRange &Range = *I; 632 const MachineInstr *DVInst = Range.first; 633 assert(DVInst->isDebugValue() && "Invalid History entry"); 634 const DIExpression *DIExpr = DVInst->getDebugExpression(); 635 636 // Bail if there is a complex DWARF expression for now. 637 if (DIExpr && DIExpr->getNumElements() > 0) 638 continue; 639 640 // Bail if operand 0 is not a valid register. This means the variable is a 641 // simple constant, or is described by a complex expression. 642 // FIXME: Find a way to represent constant variables, since they are 643 // relatively common. 644 unsigned Reg = 645 DVInst->getOperand(0).isReg() ? DVInst->getOperand(0).getReg() : 0; 646 if (Reg == 0) 647 continue; 648 649 // Handle the two cases we can handle: indirect in memory and in register. 650 bool IsIndirect = DVInst->getOperand(1).isImm(); 651 unsigned CVReg = TRI->getCodeViewRegNum(DVInst->getOperand(0).getReg()); 652 { 653 LocalVarDefRange DefRange; 654 if (IsIndirect) { 655 int64_t Offset = DVInst->getOperand(1).getImm(); 656 DefRange = createDefRangeMem(CVReg, Offset); 657 } else { 658 DefRange = createDefRangeReg(CVReg); 659 } 660 if (Var.DefRanges.empty() || 661 Var.DefRanges.back().isDifferentLocation(DefRange)) { 662 Var.DefRanges.emplace_back(std::move(DefRange)); 663 } 664 } 665 666 // Compute the label range. 667 const MCSymbol *Begin = getLabelBeforeInsn(Range.first); 668 const MCSymbol *End = getLabelAfterInsn(Range.second); 669 if (!End) { 670 if (std::next(I) != E) 671 End = getLabelBeforeInsn(std::next(I)->first); 672 else 673 End = Asm->getFunctionEnd(); 674 } 675 676 // If the last range end is our begin, just extend the last range. 677 // Otherwise make a new range. 678 SmallVectorImpl<std::pair<const MCSymbol *, const MCSymbol *>> &Ranges = 679 Var.DefRanges.back().Ranges; 680 if (!Ranges.empty() && Ranges.back().second == Begin) 681 Ranges.back().second = End; 682 else 683 Ranges.emplace_back(Begin, End); 684 685 // FIXME: Do more range combining. 686 } 687 688 recordLocalVariable(std::move(Var), InlinedAt); 689 } 690 } 691 692 void CodeViewDebug::beginFunction(const MachineFunction *MF) { 693 assert(!CurFn && "Can't process two functions at once!"); 694 695 if (!Asm || !MMI->hasDebugInfo()) 696 return; 697 698 DebugHandlerBase::beginFunction(MF); 699 700 const Function *GV = MF->getFunction(); 701 assert(FnDebugInfo.count(GV) == false); 702 CurFn = &FnDebugInfo[GV]; 703 CurFn->FuncId = NextFuncId++; 704 CurFn->Begin = Asm->getFunctionBegin(); 705 706 // Find the end of the function prolog. First known non-DBG_VALUE and 707 // non-frame setup location marks the beginning of the function body. 708 // FIXME: is there a simpler a way to do this? Can we just search 709 // for the first instruction of the function, not the last of the prolog? 710 DebugLoc PrologEndLoc; 711 bool EmptyPrologue = true; 712 for (const auto &MBB : *MF) { 713 for (const auto &MI : MBB) { 714 if (!MI.isDebugValue() && !MI.getFlag(MachineInstr::FrameSetup) && 715 MI.getDebugLoc()) { 716 PrologEndLoc = MI.getDebugLoc(); 717 break; 718 } else if (!MI.isDebugValue()) { 719 EmptyPrologue = false; 720 } 721 } 722 } 723 724 // Record beginning of function if we have a non-empty prologue. 725 if (PrologEndLoc && !EmptyPrologue) { 726 DebugLoc FnStartDL = PrologEndLoc.getFnDebugLoc(); 727 maybeRecordLocation(FnStartDL, MF); 728 } 729 } 730 731 TypeIndex CodeViewDebug::lowerType(const DIType *Ty) { 732 // Generic dispatch for lowering an unknown type. 733 switch (Ty->getTag()) { 734 case dwarf::DW_TAG_typedef: 735 return lowerTypeAlias(cast<DIDerivedType>(Ty)); 736 case dwarf::DW_TAG_base_type: 737 return lowerTypeBasic(cast<DIBasicType>(Ty)); 738 case dwarf::DW_TAG_pointer_type: 739 case dwarf::DW_TAG_reference_type: 740 case dwarf::DW_TAG_rvalue_reference_type: 741 return lowerTypePointer(cast<DIDerivedType>(Ty)); 742 case dwarf::DW_TAG_ptr_to_member_type: 743 return lowerTypeMemberPointer(cast<DIDerivedType>(Ty)); 744 case dwarf::DW_TAG_const_type: 745 case dwarf::DW_TAG_volatile_type: 746 return lowerTypeModifier(cast<DIDerivedType>(Ty)); 747 case dwarf::DW_TAG_subroutine_type: 748 return lowerTypeFunction(cast<DISubroutineType>(Ty)); 749 default: 750 // Use the null type index. 751 return TypeIndex(); 752 } 753 } 754 755 TypeIndex CodeViewDebug::lowerTypeAlias(const DIDerivedType *Ty) { 756 // TODO: MSVC emits a S_UDT record. 757 DITypeRef UnderlyingTypeRef = Ty->getBaseType(); 758 TypeIndex UnderlyingTypeIndex = getTypeIndex(UnderlyingTypeRef); 759 if (UnderlyingTypeIndex == TypeIndex(SimpleTypeKind::Int32Long) && 760 Ty->getName() == "HRESULT") 761 return TypeIndex(SimpleTypeKind::HResult); 762 return UnderlyingTypeIndex; 763 } 764 765 TypeIndex CodeViewDebug::lowerTypeBasic(const DIBasicType *Ty) { 766 TypeIndex Index; 767 dwarf::TypeKind Kind; 768 uint32_t ByteSize; 769 770 Kind = static_cast<dwarf::TypeKind>(Ty->getEncoding()); 771 ByteSize = Ty->getSizeInBits() / 8; 772 773 SimpleTypeKind STK = SimpleTypeKind::None; 774 switch (Kind) { 775 case dwarf::DW_ATE_address: 776 // FIXME: Translate 777 break; 778 case dwarf::DW_ATE_boolean: 779 switch (ByteSize) { 780 case 1: STK = SimpleTypeKind::Boolean8; break; 781 case 2: STK = SimpleTypeKind::Boolean16; break; 782 case 4: STK = SimpleTypeKind::Boolean32; break; 783 case 8: STK = SimpleTypeKind::Boolean64; break; 784 case 16: STK = SimpleTypeKind::Boolean128; break; 785 } 786 break; 787 case dwarf::DW_ATE_complex_float: 788 switch (ByteSize) { 789 case 2: STK = SimpleTypeKind::Complex16; break; 790 case 4: STK = SimpleTypeKind::Complex32; break; 791 case 8: STK = SimpleTypeKind::Complex64; break; 792 case 10: STK = SimpleTypeKind::Complex80; break; 793 case 16: STK = SimpleTypeKind::Complex128; break; 794 } 795 break; 796 case dwarf::DW_ATE_float: 797 switch (ByteSize) { 798 case 2: STK = SimpleTypeKind::Float16; break; 799 case 4: STK = SimpleTypeKind::Float32; break; 800 case 6: STK = SimpleTypeKind::Float48; break; 801 case 8: STK = SimpleTypeKind::Float64; break; 802 case 10: STK = SimpleTypeKind::Float80; break; 803 case 16: STK = SimpleTypeKind::Float128; break; 804 } 805 break; 806 case dwarf::DW_ATE_signed: 807 switch (ByteSize) { 808 case 1: STK = SimpleTypeKind::SByte; break; 809 case 2: STK = SimpleTypeKind::Int16Short; break; 810 case 4: STK = SimpleTypeKind::Int32; break; 811 case 8: STK = SimpleTypeKind::Int64Quad; break; 812 case 16: STK = SimpleTypeKind::Int128Oct; break; 813 } 814 break; 815 case dwarf::DW_ATE_unsigned: 816 switch (ByteSize) { 817 case 1: STK = SimpleTypeKind::Byte; break; 818 case 2: STK = SimpleTypeKind::UInt16Short; break; 819 case 4: STK = SimpleTypeKind::UInt32; break; 820 case 8: STK = SimpleTypeKind::UInt64Quad; break; 821 case 16: STK = SimpleTypeKind::UInt128Oct; break; 822 } 823 break; 824 case dwarf::DW_ATE_UTF: 825 switch (ByteSize) { 826 case 2: STK = SimpleTypeKind::Character16; break; 827 case 4: STK = SimpleTypeKind::Character32; break; 828 } 829 break; 830 case dwarf::DW_ATE_signed_char: 831 if (ByteSize == 1) 832 STK = SimpleTypeKind::SignedCharacter; 833 break; 834 case dwarf::DW_ATE_unsigned_char: 835 if (ByteSize == 1) 836 STK = SimpleTypeKind::UnsignedCharacter; 837 break; 838 default: 839 break; 840 } 841 842 // Apply some fixups based on the source-level type name. 843 if (STK == SimpleTypeKind::Int32 && Ty->getName() == "long int") 844 STK = SimpleTypeKind::Int32Long; 845 if (STK == SimpleTypeKind::UInt32 && Ty->getName() == "long unsigned int") 846 STK = SimpleTypeKind::UInt32Long; 847 if ((STK == SimpleTypeKind::Int16Short || 848 STK == SimpleTypeKind::UInt16Short) && 849 Ty->getName() == "wchar_t") 850 STK = SimpleTypeKind::WideCharacter; 851 if ((STK == SimpleTypeKind::SignedCharacter || 852 STK == SimpleTypeKind::UnsignedCharacter) && 853 Ty->getName() == "char") 854 STK = SimpleTypeKind::NarrowCharacter; 855 856 return TypeIndex(STK); 857 } 858 859 TypeIndex CodeViewDebug::lowerTypePointer(const DIDerivedType *Ty) { 860 TypeIndex PointeeTI = getTypeIndex(Ty->getBaseType()); 861 862 // Pointers to simple types can use SimpleTypeMode, rather than having a 863 // dedicated pointer type record. 864 if (PointeeTI.isSimple() && 865 PointeeTI.getSimpleMode() == SimpleTypeMode::Direct && 866 Ty->getTag() == dwarf::DW_TAG_pointer_type) { 867 SimpleTypeMode Mode = Ty->getSizeInBits() == 64 868 ? SimpleTypeMode::NearPointer64 869 : SimpleTypeMode::NearPointer32; 870 return TypeIndex(PointeeTI.getSimpleKind(), Mode); 871 } 872 873 PointerKind PK = 874 Ty->getSizeInBits() == 64 ? PointerKind::Near64 : PointerKind::Near32; 875 PointerMode PM = PointerMode::Pointer; 876 switch (Ty->getTag()) { 877 default: llvm_unreachable("not a pointer tag type"); 878 case dwarf::DW_TAG_pointer_type: 879 PM = PointerMode::Pointer; 880 break; 881 case dwarf::DW_TAG_reference_type: 882 PM = PointerMode::LValueReference; 883 break; 884 case dwarf::DW_TAG_rvalue_reference_type: 885 PM = PointerMode::RValueReference; 886 break; 887 } 888 // FIXME: MSVC folds qualifiers into PointerOptions in the context of a method 889 // 'this' pointer, but not normal contexts. Figure out what we're supposed to 890 // do. 891 PointerOptions PO = PointerOptions::None; 892 PointerRecord PR(PointeeTI, PK, PM, PO, Ty->getSizeInBits() / 8); 893 return TypeTable.writePointer(PR); 894 } 895 896 TypeIndex CodeViewDebug::lowerTypeMemberPointer(const DIDerivedType *Ty) { 897 assert(Ty->getTag() == dwarf::DW_TAG_ptr_to_member_type); 898 TypeIndex ClassTI = getTypeIndex(Ty->getClassType()); 899 TypeIndex PointeeTI = getTypeIndex(Ty->getBaseType()); 900 PointerKind PK = Asm->MAI->getPointerSize() == 8 ? PointerKind::Near64 901 : PointerKind::Near32; 902 PointerMode PM = isa<DISubroutineType>(Ty->getBaseType()) 903 ? PointerMode::PointerToMemberFunction 904 : PointerMode::PointerToDataMember; 905 PointerOptions PO = PointerOptions::None; // FIXME 906 // FIXME: Thread this ABI info through metadata. 907 PointerToMemberRepresentation PMR = PointerToMemberRepresentation::Unknown; 908 MemberPointerInfo MPI(ClassTI, PMR); 909 PointerRecord PR(PointeeTI, PK, PM, PO, Ty->getSizeInBits() / 8, MPI); 910 return TypeTable.writePointer(PR); 911 } 912 913 TypeIndex CodeViewDebug::lowerTypeModifier(const DIDerivedType *Ty) { 914 ModifierOptions Mods = ModifierOptions::None; 915 bool IsModifier = true; 916 const DIType *BaseTy = Ty; 917 while (IsModifier && BaseTy) { 918 // FIXME: Need to add DWARF tag for __unaligned. 919 switch (BaseTy->getTag()) { 920 case dwarf::DW_TAG_const_type: 921 Mods |= ModifierOptions::Const; 922 break; 923 case dwarf::DW_TAG_volatile_type: 924 Mods |= ModifierOptions::Volatile; 925 break; 926 default: 927 IsModifier = false; 928 break; 929 } 930 if (IsModifier) 931 BaseTy = cast<DIDerivedType>(BaseTy)->getBaseType().resolve(); 932 } 933 TypeIndex ModifiedTI = getTypeIndex(BaseTy); 934 ModifierRecord MR(ModifiedTI, Mods); 935 return TypeTable.writeModifier(MR); 936 } 937 938 TypeIndex CodeViewDebug::lowerTypeFunction(const DISubroutineType *Ty) { 939 SmallVector<TypeIndex, 8> ReturnAndArgTypeIndices; 940 for (DITypeRef ArgTypeRef : Ty->getTypeArray()) 941 ReturnAndArgTypeIndices.push_back(getTypeIndex(ArgTypeRef)); 942 943 TypeIndex ReturnTypeIndex = TypeIndex::Void(); 944 ArrayRef<TypeIndex> ArgTypeIndices = None; 945 if (!ReturnAndArgTypeIndices.empty()) { 946 auto ReturnAndArgTypesRef = makeArrayRef(ReturnAndArgTypeIndices); 947 ReturnTypeIndex = ReturnAndArgTypesRef.front(); 948 ArgTypeIndices = ReturnAndArgTypesRef.drop_front(); 949 } 950 951 ArgListRecord ArgListRec(TypeRecordKind::ArgList, ArgTypeIndices); 952 TypeIndex ArgListIndex = TypeTable.writeArgList(ArgListRec); 953 954 // TODO: We should use DW_AT_calling_convention to determine what CC this 955 // procedure record should have. 956 // TODO: Some functions are member functions, we should use a more appropriate 957 // record for those. 958 ProcedureRecord Procedure(ReturnTypeIndex, CallingConvention::NearC, 959 FunctionOptions::None, ArgTypeIndices.size(), 960 ArgListIndex); 961 return TypeTable.writeProcedure(Procedure); 962 } 963 964 TypeIndex CodeViewDebug::getTypeIndex(DITypeRef TypeRef) { 965 const DIType *Ty = TypeRef.resolve(); 966 967 // The null DIType is the void type. Don't try to hash it. 968 if (!Ty) 969 return TypeIndex::Void(); 970 971 // Check if we've already translated this type. 972 auto I = TypeIndices.find(Ty); 973 if (I != TypeIndices.end()) 974 return I->second; 975 976 TypeIndex TI = lowerType(Ty); 977 978 auto InsertResult = TypeIndices.insert({Ty, TI}); 979 (void)InsertResult; 980 assert(InsertResult.second && "DIType lowered twice"); 981 return TI; 982 } 983 984 void CodeViewDebug::emitLocalVariable(const LocalVariable &Var) { 985 // LocalSym record, see SymbolRecord.h for more info. 986 MCSymbol *LocalBegin = MMI->getContext().createTempSymbol(), 987 *LocalEnd = MMI->getContext().createTempSymbol(); 988 OS.AddComment("Record length"); 989 OS.emitAbsoluteSymbolDiff(LocalEnd, LocalBegin, 2); 990 OS.EmitLabel(LocalBegin); 991 992 OS.AddComment("Record kind: S_LOCAL"); 993 OS.EmitIntValue(unsigned(SymbolKind::S_LOCAL), 2); 994 995 LocalSymFlags Flags = LocalSymFlags::None; 996 if (Var.DIVar->isParameter()) 997 Flags |= LocalSymFlags::IsParameter; 998 if (Var.DefRanges.empty()) 999 Flags |= LocalSymFlags::IsOptimizedOut; 1000 1001 OS.AddComment("TypeIndex"); 1002 TypeIndex TI = getTypeIndex(Var.DIVar->getType()); 1003 OS.EmitIntValue(TI.getIndex(), 4); 1004 OS.AddComment("Flags"); 1005 OS.EmitIntValue(static_cast<uint16_t>(Flags), 2); 1006 // Truncate the name so we won't overflow the record length field. 1007 emitNullTerminatedSymbolName(OS, Var.DIVar->getName()); 1008 OS.EmitLabel(LocalEnd); 1009 1010 // Calculate the on disk prefix of the appropriate def range record. The 1011 // records and on disk formats are described in SymbolRecords.h. BytePrefix 1012 // should be big enough to hold all forms without memory allocation. 1013 SmallString<20> BytePrefix; 1014 for (const LocalVarDefRange &DefRange : Var.DefRanges) { 1015 BytePrefix.clear(); 1016 // FIXME: Handle bitpieces. 1017 if (DefRange.StructOffset != 0) 1018 continue; 1019 1020 if (DefRange.InMemory) { 1021 DefRangeRegisterRelSym Sym(DefRange.CVRegister, 0, DefRange.DataOffset, 0, 1022 0, 0, ArrayRef<LocalVariableAddrGap>()); 1023 ulittle16_t SymKind = ulittle16_t(S_DEFRANGE_REGISTER_REL); 1024 BytePrefix += 1025 StringRef(reinterpret_cast<const char *>(&SymKind), sizeof(SymKind)); 1026 BytePrefix += 1027 StringRef(reinterpret_cast<const char *>(&Sym.Header), 1028 sizeof(Sym.Header) - sizeof(LocalVariableAddrRange)); 1029 } else { 1030 assert(DefRange.DataOffset == 0 && "unexpected offset into register"); 1031 // Unclear what matters here. 1032 DefRangeRegisterSym Sym(DefRange.CVRegister, 0, 0, 0, 0, 1033 ArrayRef<LocalVariableAddrGap>()); 1034 ulittle16_t SymKind = ulittle16_t(S_DEFRANGE_REGISTER); 1035 BytePrefix += 1036 StringRef(reinterpret_cast<const char *>(&SymKind), sizeof(SymKind)); 1037 BytePrefix += 1038 StringRef(reinterpret_cast<const char *>(&Sym.Header), 1039 sizeof(Sym.Header) - sizeof(LocalVariableAddrRange)); 1040 } 1041 OS.EmitCVDefRangeDirective(DefRange.Ranges, BytePrefix); 1042 } 1043 } 1044 1045 void CodeViewDebug::endFunction(const MachineFunction *MF) { 1046 if (!Asm || !CurFn) // We haven't created any debug info for this function. 1047 return; 1048 1049 const Function *GV = MF->getFunction(); 1050 assert(FnDebugInfo.count(GV)); 1051 assert(CurFn == &FnDebugInfo[GV]); 1052 1053 collectVariableInfo(GV->getSubprogram()); 1054 1055 DebugHandlerBase::endFunction(MF); 1056 1057 // Don't emit anything if we don't have any line tables. 1058 if (!CurFn->HaveLineInfo) { 1059 FnDebugInfo.erase(GV); 1060 CurFn = nullptr; 1061 return; 1062 } 1063 1064 CurFn->End = Asm->getFunctionEnd(); 1065 1066 CurFn = nullptr; 1067 } 1068 1069 void CodeViewDebug::beginInstruction(const MachineInstr *MI) { 1070 DebugHandlerBase::beginInstruction(MI); 1071 1072 // Ignore DBG_VALUE locations and function prologue. 1073 if (!Asm || MI->isDebugValue() || MI->getFlag(MachineInstr::FrameSetup)) 1074 return; 1075 DebugLoc DL = MI->getDebugLoc(); 1076 if (DL == PrevInstLoc || !DL) 1077 return; 1078 maybeRecordLocation(DL, Asm->MF); 1079 } 1080