1 //===-- llvm/lib/CodeGen/AsmPrinter/CodeViewDebug.cpp --*- C++ -*--===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file contains support for writing Microsoft CodeView debug info. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "CodeViewDebug.h" 15 #include "llvm/DebugInfo/CodeView/CodeView.h" 16 #include "llvm/DebugInfo/CodeView/Line.h" 17 #include "llvm/DebugInfo/CodeView/SymbolRecord.h" 18 #include "llvm/DebugInfo/CodeView/TypeDumper.h" 19 #include "llvm/DebugInfo/CodeView/TypeIndex.h" 20 #include "llvm/DebugInfo/CodeView/TypeRecord.h" 21 #include "llvm/MC/MCExpr.h" 22 #include "llvm/MC/MCSectionCOFF.h" 23 #include "llvm/MC/MCSymbol.h" 24 #include "llvm/Support/COFF.h" 25 #include "llvm/Support/ScopedPrinter.h" 26 #include "llvm/Target/TargetSubtargetInfo.h" 27 #include "llvm/Target/TargetRegisterInfo.h" 28 #include "llvm/Target/TargetFrameLowering.h" 29 30 using namespace llvm; 31 using namespace llvm::codeview; 32 33 CodeViewDebug::CodeViewDebug(AsmPrinter *AP) 34 : DebugHandlerBase(AP), OS(*Asm->OutStreamer), CurFn(nullptr) { 35 // If module doesn't have named metadata anchors or COFF debug section 36 // is not available, skip any debug info related stuff. 37 if (!MMI->getModule()->getNamedMetadata("llvm.dbg.cu") || 38 !AP->getObjFileLowering().getCOFFDebugSymbolsSection()) { 39 Asm = nullptr; 40 return; 41 } 42 43 // Tell MMI that we have debug info. 44 MMI->setDebugInfoAvailability(true); 45 } 46 47 StringRef CodeViewDebug::getFullFilepath(const DIFile *File) { 48 std::string &Filepath = FileToFilepathMap[File]; 49 if (!Filepath.empty()) 50 return Filepath; 51 52 StringRef Dir = File->getDirectory(), Filename = File->getFilename(); 53 54 // Clang emits directory and relative filename info into the IR, but CodeView 55 // operates on full paths. We could change Clang to emit full paths too, but 56 // that would increase the IR size and probably not needed for other users. 57 // For now, just concatenate and canonicalize the path here. 58 if (Filename.find(':') == 1) 59 Filepath = Filename; 60 else 61 Filepath = (Dir + "\\" + Filename).str(); 62 63 // Canonicalize the path. We have to do it textually because we may no longer 64 // have access the file in the filesystem. 65 // First, replace all slashes with backslashes. 66 std::replace(Filepath.begin(), Filepath.end(), '/', '\\'); 67 68 // Remove all "\.\" with "\". 69 size_t Cursor = 0; 70 while ((Cursor = Filepath.find("\\.\\", Cursor)) != std::string::npos) 71 Filepath.erase(Cursor, 2); 72 73 // Replace all "\XXX\..\" with "\". Don't try too hard though as the original 74 // path should be well-formatted, e.g. start with a drive letter, etc. 75 Cursor = 0; 76 while ((Cursor = Filepath.find("\\..\\", Cursor)) != std::string::npos) { 77 // Something's wrong if the path starts with "\..\", abort. 78 if (Cursor == 0) 79 break; 80 81 size_t PrevSlash = Filepath.rfind('\\', Cursor - 1); 82 if (PrevSlash == std::string::npos) 83 // Something's wrong, abort. 84 break; 85 86 Filepath.erase(PrevSlash, Cursor + 3 - PrevSlash); 87 // The next ".." might be following the one we've just erased. 88 Cursor = PrevSlash; 89 } 90 91 // Remove all duplicate backslashes. 92 Cursor = 0; 93 while ((Cursor = Filepath.find("\\\\", Cursor)) != std::string::npos) 94 Filepath.erase(Cursor, 1); 95 96 return Filepath; 97 } 98 99 unsigned CodeViewDebug::maybeRecordFile(const DIFile *F) { 100 unsigned NextId = FileIdMap.size() + 1; 101 auto Insertion = FileIdMap.insert(std::make_pair(F, NextId)); 102 if (Insertion.second) { 103 // We have to compute the full filepath and emit a .cv_file directive. 104 StringRef FullPath = getFullFilepath(F); 105 NextId = OS.EmitCVFileDirective(NextId, FullPath); 106 assert(NextId == FileIdMap.size() && ".cv_file directive failed"); 107 } 108 return Insertion.first->second; 109 } 110 111 CodeViewDebug::InlineSite & 112 CodeViewDebug::getInlineSite(const DILocation *InlinedAt, 113 const DISubprogram *Inlinee) { 114 auto SiteInsertion = CurFn->InlineSites.insert({InlinedAt, InlineSite()}); 115 InlineSite *Site = &SiteInsertion.first->second; 116 if (SiteInsertion.second) { 117 Site->SiteFuncId = NextFuncId++; 118 Site->Inlinee = Inlinee; 119 InlinedSubprograms.insert(Inlinee); 120 recordFuncIdForSubprogram(Inlinee); 121 } 122 return *Site; 123 } 124 125 TypeIndex CodeViewDebug::getGenericFunctionTypeIndex() { 126 if (VoidFnTyIdx.getIndex() != 0) 127 return VoidFnTyIdx; 128 129 ArrayRef<TypeIndex> NoArgs; 130 ArgListRecord ArgListRec(TypeRecordKind::ArgList, NoArgs); 131 TypeIndex ArgListIndex = TypeTable.writeArgList(ArgListRec); 132 133 ProcedureRecord Procedure(TypeIndex::Void(), CallingConvention::NearC, 134 FunctionOptions::None, 0, ArgListIndex); 135 VoidFnTyIdx = TypeTable.writeProcedure(Procedure); 136 return VoidFnTyIdx; 137 } 138 139 void CodeViewDebug::recordFuncIdForSubprogram(const DISubprogram *SP) { 140 TypeIndex ParentScope = TypeIndex(0); 141 StringRef DisplayName = SP->getDisplayName(); 142 FuncIdRecord FuncId(ParentScope, getGenericFunctionTypeIndex(), DisplayName); 143 TypeIndex TI = TypeTable.writeFuncId(FuncId); 144 TypeIndices[SP] = TI; 145 } 146 147 void CodeViewDebug::recordLocalVariable(LocalVariable &&Var, 148 const DILocation *InlinedAt) { 149 if (InlinedAt) { 150 // This variable was inlined. Associate it with the InlineSite. 151 const DISubprogram *Inlinee = Var.DIVar->getScope()->getSubprogram(); 152 InlineSite &Site = getInlineSite(InlinedAt, Inlinee); 153 Site.InlinedLocals.emplace_back(Var); 154 } else { 155 // This variable goes in the main ProcSym. 156 CurFn->Locals.emplace_back(Var); 157 } 158 } 159 160 static void addLocIfNotPresent(SmallVectorImpl<const DILocation *> &Locs, 161 const DILocation *Loc) { 162 auto B = Locs.begin(), E = Locs.end(); 163 if (std::find(B, E, Loc) == E) 164 Locs.push_back(Loc); 165 } 166 167 void CodeViewDebug::maybeRecordLocation(DebugLoc DL, 168 const MachineFunction *MF) { 169 // Skip this instruction if it has the same location as the previous one. 170 if (DL == CurFn->LastLoc) 171 return; 172 173 const DIScope *Scope = DL.get()->getScope(); 174 if (!Scope) 175 return; 176 177 // Skip this line if it is longer than the maximum we can record. 178 LineInfo LI(DL.getLine(), DL.getLine(), /*IsStatement=*/true); 179 if (LI.getStartLine() != DL.getLine() || LI.isAlwaysStepInto() || 180 LI.isNeverStepInto()) 181 return; 182 183 ColumnInfo CI(DL.getCol(), /*EndColumn=*/0); 184 if (CI.getStartColumn() != DL.getCol()) 185 return; 186 187 if (!CurFn->HaveLineInfo) 188 CurFn->HaveLineInfo = true; 189 unsigned FileId = 0; 190 if (CurFn->LastLoc.get() && CurFn->LastLoc->getFile() == DL->getFile()) 191 FileId = CurFn->LastFileId; 192 else 193 FileId = CurFn->LastFileId = maybeRecordFile(DL->getFile()); 194 CurFn->LastLoc = DL; 195 196 unsigned FuncId = CurFn->FuncId; 197 if (const DILocation *SiteLoc = DL->getInlinedAt()) { 198 const DILocation *Loc = DL.get(); 199 200 // If this location was actually inlined from somewhere else, give it the ID 201 // of the inline call site. 202 FuncId = 203 getInlineSite(SiteLoc, Loc->getScope()->getSubprogram()).SiteFuncId; 204 205 // Ensure we have links in the tree of inline call sites. 206 bool FirstLoc = true; 207 while ((SiteLoc = Loc->getInlinedAt())) { 208 InlineSite &Site = 209 getInlineSite(SiteLoc, Loc->getScope()->getSubprogram()); 210 if (!FirstLoc) 211 addLocIfNotPresent(Site.ChildSites, Loc); 212 FirstLoc = false; 213 Loc = SiteLoc; 214 } 215 addLocIfNotPresent(CurFn->ChildSites, Loc); 216 } 217 218 OS.EmitCVLocDirective(FuncId, FileId, DL.getLine(), DL.getCol(), 219 /*PrologueEnd=*/false, 220 /*IsStmt=*/false, DL->getFilename()); 221 } 222 223 void CodeViewDebug::emitCodeViewMagicVersion() { 224 OS.EmitValueToAlignment(4); 225 OS.AddComment("Debug section magic"); 226 OS.EmitIntValue(COFF::DEBUG_SECTION_MAGIC, 4); 227 } 228 229 void CodeViewDebug::endModule() { 230 if (FnDebugInfo.empty()) 231 return; 232 233 assert(Asm != nullptr); 234 235 // The COFF .debug$S section consists of several subsections, each starting 236 // with a 4-byte control code (e.g. 0xF1, 0xF2, etc) and then a 4-byte length 237 // of the payload followed by the payload itself. The subsections are 4-byte 238 // aligned. 239 240 // Make a subsection for all the inlined subprograms. 241 emitInlineeLinesSubsection(); 242 243 // Emit per-function debug information. 244 for (auto &P : FnDebugInfo) 245 emitDebugInfoForFunction(P.first, P.second); 246 247 // Switch back to the generic .debug$S section after potentially processing 248 // comdat symbol sections. 249 switchToDebugSectionForSymbol(nullptr); 250 251 // This subsection holds a file index to offset in string table table. 252 OS.AddComment("File index to string table offset subsection"); 253 OS.EmitCVFileChecksumsDirective(); 254 255 // This subsection holds the string table. 256 OS.AddComment("String table"); 257 OS.EmitCVStringTableDirective(); 258 259 // Emit type information last, so that any types we translate while emitting 260 // function info are included. 261 emitTypeInformation(); 262 263 clear(); 264 } 265 266 static void emitNullTerminatedSymbolName(MCStreamer &OS, StringRef S) { 267 // Microsoft's linker seems to have trouble with symbol names longer than 268 // 0xffd8 bytes. 269 S = S.substr(0, 0xffd8); 270 SmallString<32> NullTerminatedString(S); 271 NullTerminatedString.push_back('\0'); 272 OS.EmitBytes(NullTerminatedString); 273 } 274 275 void CodeViewDebug::emitTypeInformation() { 276 // Do nothing if we have no debug info or if no non-trivial types were emitted 277 // to TypeTable during codegen. 278 NamedMDNode *CU_Nodes = 279 MMI->getModule()->getNamedMetadata("llvm.dbg.cu"); 280 if (!CU_Nodes) 281 return; 282 if (TypeTable.empty()) 283 return; 284 285 // Start the .debug$T section with 0x4. 286 OS.SwitchSection(Asm->getObjFileLowering().getCOFFDebugTypesSection()); 287 emitCodeViewMagicVersion(); 288 289 SmallString<8> CommentPrefix; 290 if (OS.isVerboseAsm()) { 291 CommentPrefix += '\t'; 292 CommentPrefix += Asm->MAI->getCommentString(); 293 CommentPrefix += ' '; 294 } 295 296 CVTypeDumper CVTD(nullptr, /*PrintRecordBytes=*/false); 297 TypeTable.ForEachRecord( 298 [&](TypeIndex Index, StringRef Record) { 299 if (OS.isVerboseAsm()) { 300 // Emit a block comment describing the type record for readability. 301 SmallString<512> CommentBlock; 302 raw_svector_ostream CommentOS(CommentBlock); 303 ScopedPrinter SP(CommentOS); 304 SP.setPrefix(CommentPrefix); 305 CVTD.setPrinter(&SP); 306 bool DumpSuccess = 307 CVTD.dump({Record.bytes_begin(), Record.bytes_end()}); 308 (void)DumpSuccess; 309 assert(DumpSuccess && "produced malformed type record"); 310 // emitRawComment will insert its own tab and comment string before 311 // the first line, so strip off our first one. It also prints its own 312 // newline. 313 OS.emitRawComment( 314 CommentOS.str().drop_front(CommentPrefix.size() - 1).rtrim()); 315 } 316 OS.EmitBinaryData(Record); 317 }); 318 } 319 320 void CodeViewDebug::emitInlineeLinesSubsection() { 321 if (InlinedSubprograms.empty()) 322 return; 323 324 // Use the generic .debug$S section. 325 switchToDebugSectionForSymbol(nullptr); 326 327 MCSymbol *InlineBegin = MMI->getContext().createTempSymbol(), 328 *InlineEnd = MMI->getContext().createTempSymbol(); 329 330 OS.AddComment("Inlinee lines subsection"); 331 OS.EmitIntValue(unsigned(ModuleSubstreamKind::InlineeLines), 4); 332 OS.AddComment("Subsection size"); 333 OS.emitAbsoluteSymbolDiff(InlineEnd, InlineBegin, 4); 334 OS.EmitLabel(InlineBegin); 335 336 // We don't provide any extra file info. 337 // FIXME: Find out if debuggers use this info. 338 OS.AddComment("Inlinee lines signature"); 339 OS.EmitIntValue(unsigned(InlineeLinesSignature::Normal), 4); 340 341 for (const DISubprogram *SP : InlinedSubprograms) { 342 assert(TypeIndices.count(SP)); 343 TypeIndex InlineeIdx = TypeIndices[SP]; 344 345 OS.AddBlankLine(); 346 unsigned FileId = maybeRecordFile(SP->getFile()); 347 OS.AddComment("Inlined function " + SP->getDisplayName() + " starts at " + 348 SP->getFilename() + Twine(':') + Twine(SP->getLine())); 349 OS.AddBlankLine(); 350 // The filechecksum table uses 8 byte entries for now, and file ids start at 351 // 1. 352 unsigned FileOffset = (FileId - 1) * 8; 353 OS.AddComment("Type index of inlined function"); 354 OS.EmitIntValue(InlineeIdx.getIndex(), 4); 355 OS.AddComment("Offset into filechecksum table"); 356 OS.EmitIntValue(FileOffset, 4); 357 OS.AddComment("Starting line number"); 358 OS.EmitIntValue(SP->getLine(), 4); 359 } 360 361 OS.EmitLabel(InlineEnd); 362 } 363 364 void CodeViewDebug::collectInlineSiteChildren( 365 SmallVectorImpl<unsigned> &Children, const FunctionInfo &FI, 366 const InlineSite &Site) { 367 for (const DILocation *ChildSiteLoc : Site.ChildSites) { 368 auto I = FI.InlineSites.find(ChildSiteLoc); 369 const InlineSite &ChildSite = I->second; 370 Children.push_back(ChildSite.SiteFuncId); 371 collectInlineSiteChildren(Children, FI, ChildSite); 372 } 373 } 374 375 void CodeViewDebug::emitInlinedCallSite(const FunctionInfo &FI, 376 const DILocation *InlinedAt, 377 const InlineSite &Site) { 378 MCSymbol *InlineBegin = MMI->getContext().createTempSymbol(), 379 *InlineEnd = MMI->getContext().createTempSymbol(); 380 381 assert(TypeIndices.count(Site.Inlinee)); 382 TypeIndex InlineeIdx = TypeIndices[Site.Inlinee]; 383 384 // SymbolRecord 385 OS.AddComment("Record length"); 386 OS.emitAbsoluteSymbolDiff(InlineEnd, InlineBegin, 2); // RecordLength 387 OS.EmitLabel(InlineBegin); 388 OS.AddComment("Record kind: S_INLINESITE"); 389 OS.EmitIntValue(SymbolKind::S_INLINESITE, 2); // RecordKind 390 391 OS.AddComment("PtrParent"); 392 OS.EmitIntValue(0, 4); 393 OS.AddComment("PtrEnd"); 394 OS.EmitIntValue(0, 4); 395 OS.AddComment("Inlinee type index"); 396 OS.EmitIntValue(InlineeIdx.getIndex(), 4); 397 398 unsigned FileId = maybeRecordFile(Site.Inlinee->getFile()); 399 unsigned StartLineNum = Site.Inlinee->getLine(); 400 SmallVector<unsigned, 3> SecondaryFuncIds; 401 collectInlineSiteChildren(SecondaryFuncIds, FI, Site); 402 403 OS.EmitCVInlineLinetableDirective(Site.SiteFuncId, FileId, StartLineNum, 404 FI.Begin, FI.End, SecondaryFuncIds); 405 406 OS.EmitLabel(InlineEnd); 407 408 for (const LocalVariable &Var : Site.InlinedLocals) 409 emitLocalVariable(Var); 410 411 // Recurse on child inlined call sites before closing the scope. 412 for (const DILocation *ChildSite : Site.ChildSites) { 413 auto I = FI.InlineSites.find(ChildSite); 414 assert(I != FI.InlineSites.end() && 415 "child site not in function inline site map"); 416 emitInlinedCallSite(FI, ChildSite, I->second); 417 } 418 419 // Close the scope. 420 OS.AddComment("Record length"); 421 OS.EmitIntValue(2, 2); // RecordLength 422 OS.AddComment("Record kind: S_INLINESITE_END"); 423 OS.EmitIntValue(SymbolKind::S_INLINESITE_END, 2); // RecordKind 424 } 425 426 void CodeViewDebug::switchToDebugSectionForSymbol(const MCSymbol *GVSym) { 427 // If we have a symbol, it may be in a section that is COMDAT. If so, find the 428 // comdat key. A section may be comdat because of -ffunction-sections or 429 // because it is comdat in the IR. 430 MCSectionCOFF *GVSec = 431 GVSym ? dyn_cast<MCSectionCOFF>(&GVSym->getSection()) : nullptr; 432 const MCSymbol *KeySym = GVSec ? GVSec->getCOMDATSymbol() : nullptr; 433 434 MCSectionCOFF *DebugSec = cast<MCSectionCOFF>( 435 Asm->getObjFileLowering().getCOFFDebugSymbolsSection()); 436 DebugSec = OS.getContext().getAssociativeCOFFSection(DebugSec, KeySym); 437 438 OS.SwitchSection(DebugSec); 439 440 // Emit the magic version number if this is the first time we've switched to 441 // this section. 442 if (ComdatDebugSections.insert(DebugSec).second) 443 emitCodeViewMagicVersion(); 444 } 445 446 void CodeViewDebug::emitDebugInfoForFunction(const Function *GV, 447 FunctionInfo &FI) { 448 // For each function there is a separate subsection 449 // which holds the PC to file:line table. 450 const MCSymbol *Fn = Asm->getSymbol(GV); 451 assert(Fn); 452 453 // Switch to the to a comdat section, if appropriate. 454 switchToDebugSectionForSymbol(Fn); 455 456 StringRef FuncName; 457 if (auto *SP = GV->getSubprogram()) 458 FuncName = SP->getDisplayName(); 459 460 // If our DISubprogram name is empty, use the mangled name. 461 if (FuncName.empty()) 462 FuncName = GlobalValue::getRealLinkageName(GV->getName()); 463 464 // Emit a symbol subsection, required by VS2012+ to find function boundaries. 465 MCSymbol *SymbolsBegin = MMI->getContext().createTempSymbol(), 466 *SymbolsEnd = MMI->getContext().createTempSymbol(); 467 OS.AddComment("Symbol subsection for " + Twine(FuncName)); 468 OS.EmitIntValue(unsigned(ModuleSubstreamKind::Symbols), 4); 469 OS.AddComment("Subsection size"); 470 OS.emitAbsoluteSymbolDiff(SymbolsEnd, SymbolsBegin, 4); 471 OS.EmitLabel(SymbolsBegin); 472 { 473 MCSymbol *ProcRecordBegin = MMI->getContext().createTempSymbol(), 474 *ProcRecordEnd = MMI->getContext().createTempSymbol(); 475 OS.AddComment("Record length"); 476 OS.emitAbsoluteSymbolDiff(ProcRecordEnd, ProcRecordBegin, 2); 477 OS.EmitLabel(ProcRecordBegin); 478 479 OS.AddComment("Record kind: S_GPROC32_ID"); 480 OS.EmitIntValue(unsigned(SymbolKind::S_GPROC32_ID), 2); 481 482 // These fields are filled in by tools like CVPACK which run after the fact. 483 OS.AddComment("PtrParent"); 484 OS.EmitIntValue(0, 4); 485 OS.AddComment("PtrEnd"); 486 OS.EmitIntValue(0, 4); 487 OS.AddComment("PtrNext"); 488 OS.EmitIntValue(0, 4); 489 // This is the important bit that tells the debugger where the function 490 // code is located and what's its size: 491 OS.AddComment("Code size"); 492 OS.emitAbsoluteSymbolDiff(FI.End, Fn, 4); 493 OS.AddComment("Offset after prologue"); 494 OS.EmitIntValue(0, 4); 495 OS.AddComment("Offset before epilogue"); 496 OS.EmitIntValue(0, 4); 497 OS.AddComment("Function type index"); 498 OS.EmitIntValue(0, 4); 499 OS.AddComment("Function section relative address"); 500 OS.EmitCOFFSecRel32(Fn); 501 OS.AddComment("Function section index"); 502 OS.EmitCOFFSectionIndex(Fn); 503 OS.AddComment("Flags"); 504 OS.EmitIntValue(0, 1); 505 // Emit the function display name as a null-terminated string. 506 OS.AddComment("Function name"); 507 // Truncate the name so we won't overflow the record length field. 508 emitNullTerminatedSymbolName(OS, FuncName); 509 OS.EmitLabel(ProcRecordEnd); 510 511 for (const LocalVariable &Var : FI.Locals) 512 emitLocalVariable(Var); 513 514 // Emit inlined call site information. Only emit functions inlined directly 515 // into the parent function. We'll emit the other sites recursively as part 516 // of their parent inline site. 517 for (const DILocation *InlinedAt : FI.ChildSites) { 518 auto I = FI.InlineSites.find(InlinedAt); 519 assert(I != FI.InlineSites.end() && 520 "child site not in function inline site map"); 521 emitInlinedCallSite(FI, InlinedAt, I->second); 522 } 523 524 // We're done with this function. 525 OS.AddComment("Record length"); 526 OS.EmitIntValue(0x0002, 2); 527 OS.AddComment("Record kind: S_PROC_ID_END"); 528 OS.EmitIntValue(unsigned(SymbolKind::S_PROC_ID_END), 2); 529 } 530 OS.EmitLabel(SymbolsEnd); 531 // Every subsection must be aligned to a 4-byte boundary. 532 OS.EmitValueToAlignment(4); 533 534 // We have an assembler directive that takes care of the whole line table. 535 OS.EmitCVLinetableDirective(FI.FuncId, Fn, FI.End); 536 } 537 538 CodeViewDebug::LocalVarDefRange 539 CodeViewDebug::createDefRangeMem(uint16_t CVRegister, int Offset) { 540 LocalVarDefRange DR; 541 DR.InMemory = -1; 542 DR.DataOffset = Offset; 543 assert(DR.DataOffset == Offset && "truncation"); 544 DR.StructOffset = 0; 545 DR.CVRegister = CVRegister; 546 return DR; 547 } 548 549 CodeViewDebug::LocalVarDefRange 550 CodeViewDebug::createDefRangeReg(uint16_t CVRegister) { 551 LocalVarDefRange DR; 552 DR.InMemory = 0; 553 DR.DataOffset = 0; 554 DR.StructOffset = 0; 555 DR.CVRegister = CVRegister; 556 return DR; 557 } 558 559 void CodeViewDebug::collectVariableInfoFromMMITable( 560 DenseSet<InlinedVariable> &Processed) { 561 const TargetSubtargetInfo &TSI = Asm->MF->getSubtarget(); 562 const TargetFrameLowering *TFI = TSI.getFrameLowering(); 563 const TargetRegisterInfo *TRI = TSI.getRegisterInfo(); 564 565 for (const MachineModuleInfo::VariableDbgInfo &VI : 566 MMI->getVariableDbgInfo()) { 567 if (!VI.Var) 568 continue; 569 assert(VI.Var->isValidLocationForIntrinsic(VI.Loc) && 570 "Expected inlined-at fields to agree"); 571 572 Processed.insert(InlinedVariable(VI.Var, VI.Loc->getInlinedAt())); 573 LexicalScope *Scope = LScopes.findLexicalScope(VI.Loc); 574 575 // If variable scope is not found then skip this variable. 576 if (!Scope) 577 continue; 578 579 // Get the frame register used and the offset. 580 unsigned FrameReg = 0; 581 int FrameOffset = TFI->getFrameIndexReference(*Asm->MF, VI.Slot, FrameReg); 582 uint16_t CVReg = TRI->getCodeViewRegNum(FrameReg); 583 584 // Calculate the label ranges. 585 LocalVarDefRange DefRange = createDefRangeMem(CVReg, FrameOffset); 586 for (const InsnRange &Range : Scope->getRanges()) { 587 const MCSymbol *Begin = getLabelBeforeInsn(Range.first); 588 const MCSymbol *End = getLabelAfterInsn(Range.second); 589 End = End ? End : Asm->getFunctionEnd(); 590 DefRange.Ranges.emplace_back(Begin, End); 591 } 592 593 LocalVariable Var; 594 Var.DIVar = VI.Var; 595 Var.DefRanges.emplace_back(std::move(DefRange)); 596 recordLocalVariable(std::move(Var), VI.Loc->getInlinedAt()); 597 } 598 } 599 600 void CodeViewDebug::collectVariableInfo(const DISubprogram *SP) { 601 DenseSet<InlinedVariable> Processed; 602 // Grab the variable info that was squirreled away in the MMI side-table. 603 collectVariableInfoFromMMITable(Processed); 604 605 const TargetRegisterInfo *TRI = Asm->MF->getSubtarget().getRegisterInfo(); 606 607 for (const auto &I : DbgValues) { 608 InlinedVariable IV = I.first; 609 if (Processed.count(IV)) 610 continue; 611 const DILocalVariable *DIVar = IV.first; 612 const DILocation *InlinedAt = IV.second; 613 614 // Instruction ranges, specifying where IV is accessible. 615 const auto &Ranges = I.second; 616 617 LexicalScope *Scope = nullptr; 618 if (InlinedAt) 619 Scope = LScopes.findInlinedScope(DIVar->getScope(), InlinedAt); 620 else 621 Scope = LScopes.findLexicalScope(DIVar->getScope()); 622 // If variable scope is not found then skip this variable. 623 if (!Scope) 624 continue; 625 626 LocalVariable Var; 627 Var.DIVar = DIVar; 628 629 // Calculate the definition ranges. 630 for (auto I = Ranges.begin(), E = Ranges.end(); I != E; ++I) { 631 const InsnRange &Range = *I; 632 const MachineInstr *DVInst = Range.first; 633 assert(DVInst->isDebugValue() && "Invalid History entry"); 634 const DIExpression *DIExpr = DVInst->getDebugExpression(); 635 636 // Bail if there is a complex DWARF expression for now. 637 if (DIExpr && DIExpr->getNumElements() > 0) 638 continue; 639 640 // Bail if operand 0 is not a valid register. This means the variable is a 641 // simple constant, or is described by a complex expression. 642 // FIXME: Find a way to represent constant variables, since they are 643 // relatively common. 644 unsigned Reg = 645 DVInst->getOperand(0).isReg() ? DVInst->getOperand(0).getReg() : 0; 646 if (Reg == 0) 647 continue; 648 649 // Handle the two cases we can handle: indirect in memory and in register. 650 bool IsIndirect = DVInst->getOperand(1).isImm(); 651 unsigned CVReg = TRI->getCodeViewRegNum(DVInst->getOperand(0).getReg()); 652 { 653 LocalVarDefRange DefRange; 654 if (IsIndirect) { 655 int64_t Offset = DVInst->getOperand(1).getImm(); 656 DefRange = createDefRangeMem(CVReg, Offset); 657 } else { 658 DefRange = createDefRangeReg(CVReg); 659 } 660 if (Var.DefRanges.empty() || 661 Var.DefRanges.back().isDifferentLocation(DefRange)) { 662 Var.DefRanges.emplace_back(std::move(DefRange)); 663 } 664 } 665 666 // Compute the label range. 667 const MCSymbol *Begin = getLabelBeforeInsn(Range.first); 668 const MCSymbol *End = getLabelAfterInsn(Range.second); 669 if (!End) { 670 if (std::next(I) != E) 671 End = getLabelBeforeInsn(std::next(I)->first); 672 else 673 End = Asm->getFunctionEnd(); 674 } 675 676 // If the last range end is our begin, just extend the last range. 677 // Otherwise make a new range. 678 SmallVectorImpl<std::pair<const MCSymbol *, const MCSymbol *>> &Ranges = 679 Var.DefRanges.back().Ranges; 680 if (!Ranges.empty() && Ranges.back().second == Begin) 681 Ranges.back().second = End; 682 else 683 Ranges.emplace_back(Begin, End); 684 685 // FIXME: Do more range combining. 686 } 687 688 recordLocalVariable(std::move(Var), InlinedAt); 689 } 690 } 691 692 void CodeViewDebug::beginFunction(const MachineFunction *MF) { 693 assert(!CurFn && "Can't process two functions at once!"); 694 695 if (!Asm || !MMI->hasDebugInfo()) 696 return; 697 698 DebugHandlerBase::beginFunction(MF); 699 700 const Function *GV = MF->getFunction(); 701 assert(FnDebugInfo.count(GV) == false); 702 CurFn = &FnDebugInfo[GV]; 703 CurFn->FuncId = NextFuncId++; 704 CurFn->Begin = Asm->getFunctionBegin(); 705 706 // Find the end of the function prolog. First known non-DBG_VALUE and 707 // non-frame setup location marks the beginning of the function body. 708 // FIXME: is there a simpler a way to do this? Can we just search 709 // for the first instruction of the function, not the last of the prolog? 710 DebugLoc PrologEndLoc; 711 bool EmptyPrologue = true; 712 for (const auto &MBB : *MF) { 713 for (const auto &MI : MBB) { 714 if (!MI.isDebugValue() && !MI.getFlag(MachineInstr::FrameSetup) && 715 MI.getDebugLoc()) { 716 PrologEndLoc = MI.getDebugLoc(); 717 break; 718 } else if (!MI.isDebugValue()) { 719 EmptyPrologue = false; 720 } 721 } 722 } 723 724 // Record beginning of function if we have a non-empty prologue. 725 if (PrologEndLoc && !EmptyPrologue) { 726 DebugLoc FnStartDL = PrologEndLoc.getFnDebugLoc(); 727 maybeRecordLocation(FnStartDL, MF); 728 } 729 } 730 731 TypeIndex CodeViewDebug::lowerType(const DIType *Ty) { 732 // Generic dispatch for lowering an unknown type. 733 switch (Ty->getTag()) { 734 case dwarf::DW_TAG_base_type: 735 return lowerTypeBasic(cast<DIBasicType>(Ty)); 736 case dwarf::DW_TAG_pointer_type: 737 case dwarf::DW_TAG_reference_type: 738 case dwarf::DW_TAG_rvalue_reference_type: 739 return lowerTypePointer(cast<DIDerivedType>(Ty)); 740 case dwarf::DW_TAG_ptr_to_member_type: 741 return lowerTypeMemberPointer(cast<DIDerivedType>(Ty)); 742 case dwarf::DW_TAG_const_type: 743 case dwarf::DW_TAG_volatile_type: 744 return lowerTypeModifier(cast<DIDerivedType>(Ty)); 745 default: 746 // Use the null type index. 747 return TypeIndex(); 748 } 749 } 750 751 TypeIndex CodeViewDebug::lowerTypeBasic(const DIBasicType *Ty) { 752 TypeIndex Index; 753 dwarf::TypeKind Kind; 754 uint32_t ByteSize; 755 756 Kind = static_cast<dwarf::TypeKind>(Ty->getEncoding()); 757 ByteSize = Ty->getSizeInBits() >> 3; 758 759 SimpleTypeKind STK = SimpleTypeKind::None; 760 switch (Kind) { 761 case dwarf::DW_ATE_address: 762 // FIXME: Translate 763 break; 764 case dwarf::DW_ATE_boolean: 765 switch (ByteSize) { 766 case 1: STK = SimpleTypeKind::Boolean8; break; 767 case 2: STK = SimpleTypeKind::Boolean16; break; 768 case 4: STK = SimpleTypeKind::Boolean32; break; 769 case 8: STK = SimpleTypeKind::Boolean64; break; 770 } 771 break; 772 case dwarf::DW_ATE_complex_float: 773 switch (ByteSize) { 774 case 4: STK = SimpleTypeKind::Complex32; break; 775 case 8: STK = SimpleTypeKind::Complex64; break; 776 case 10: STK = SimpleTypeKind::Complex80; break; 777 case 16: STK = SimpleTypeKind::Complex128; break; 778 } 779 break; 780 case dwarf::DW_ATE_float: 781 switch (ByteSize) { 782 case 4: STK = SimpleTypeKind::Float32; break; 783 case 6: STK = SimpleTypeKind::Float48; break; 784 case 8: STK = SimpleTypeKind::Float64; break; 785 case 10: STK = SimpleTypeKind::Float80; break; 786 case 16: STK = SimpleTypeKind::Float128; break; 787 } 788 break; 789 case dwarf::DW_ATE_signed: 790 switch (ByteSize) { 791 case 1: STK = SimpleTypeKind::SByte; break; 792 case 2: STK = SimpleTypeKind::Int16Short; break; 793 case 4: STK = SimpleTypeKind::Int32; break; 794 case 8: STK = SimpleTypeKind::Int64; break; 795 } 796 break; 797 case dwarf::DW_ATE_unsigned: 798 switch (ByteSize) { 799 case 1: STK = SimpleTypeKind::Byte; break; 800 case 2: STK = SimpleTypeKind::UInt16Short; break; 801 case 4: STK = SimpleTypeKind::UInt32; break; 802 case 8: STK = SimpleTypeKind::UInt64; break; 803 } 804 break; 805 case dwarf::DW_ATE_UTF: 806 switch (ByteSize) { 807 case 2: STK = SimpleTypeKind::Character16; break; 808 case 4: STK = SimpleTypeKind::Character32; break; 809 } 810 break; 811 case dwarf::DW_ATE_signed_char: 812 if (ByteSize == 1) 813 STK = SimpleTypeKind::SignedCharacter; 814 break; 815 case dwarf::DW_ATE_unsigned_char: 816 if (ByteSize == 1) 817 STK = SimpleTypeKind::UnsignedCharacter; 818 break; 819 default: 820 break; 821 } 822 823 // Apply some fixups based on the source-level type name. 824 if (STK == SimpleTypeKind::Int32 && Ty->getName() == "long int") 825 STK = SimpleTypeKind::Int32Long; 826 if (STK == SimpleTypeKind::UInt32 && Ty->getName() == "long unsigned int") 827 STK = SimpleTypeKind::UInt32Long; 828 if ((STK == SimpleTypeKind::Int16Short || 829 STK == SimpleTypeKind::UInt16Short) && 830 Ty->getName() == "wchar_t") 831 STK = SimpleTypeKind::WideCharacter; 832 if ((STK == SimpleTypeKind::SignedCharacter || 833 STK == SimpleTypeKind::UnsignedCharacter) && 834 Ty->getName() == "char") 835 STK = SimpleTypeKind::NarrowCharacter; 836 837 return TypeIndex(STK); 838 } 839 840 TypeIndex CodeViewDebug::lowerTypePointer(const DIDerivedType *Ty) { 841 TypeIndex PointeeTI = getTypeIndex(Ty->getBaseType()); 842 843 // Pointers to simple types can use SimpleTypeMode, rather than having a 844 // dedicated pointer type record. 845 if (PointeeTI.isSimple() && 846 PointeeTI.getSimpleMode() == SimpleTypeMode::Direct && 847 Ty->getTag() == dwarf::DW_TAG_pointer_type) { 848 SimpleTypeMode Mode = Ty->getSizeInBits() == 64 849 ? SimpleTypeMode::NearPointer64 850 : SimpleTypeMode::NearPointer32; 851 return TypeIndex(PointeeTI.getSimpleKind(), Mode); 852 } 853 854 PointerKind PK = 855 Ty->getSizeInBits() == 64 ? PointerKind::Near64 : PointerKind::Near32; 856 PointerMode PM = PointerMode::Pointer; 857 switch (Ty->getTag()) { 858 default: llvm_unreachable("not a pointer tag type"); 859 case dwarf::DW_TAG_pointer_type: 860 PM = PointerMode::Pointer; 861 break; 862 case dwarf::DW_TAG_reference_type: 863 PM = PointerMode::LValueReference; 864 break; 865 case dwarf::DW_TAG_rvalue_reference_type: 866 PM = PointerMode::RValueReference; 867 break; 868 } 869 // FIXME: MSVC folds qualifiers into PointerOptions in the context of a method 870 // 'this' pointer, but not normal contexts. Figure out what we're supposed to 871 // do. 872 PointerOptions PO = PointerOptions::None; 873 PointerRecord PR(PointeeTI, PK, PM, PO, Ty->getSizeInBits() / 8); 874 return TypeTable.writePointer(PR); 875 } 876 877 TypeIndex CodeViewDebug::lowerTypeMemberPointer(const DIDerivedType *Ty) { 878 assert(Ty->getTag() == dwarf::DW_TAG_ptr_to_member_type); 879 TypeIndex ClassTI = getTypeIndex(Ty->getClassType()); 880 TypeIndex PointeeTI = getTypeIndex(Ty->getBaseType()); 881 PointerKind PK = Asm->MAI->getPointerSize() == 8 ? PointerKind::Near64 882 : PointerKind::Near32; 883 PointerMode PM = isa<DISubroutineType>(Ty->getBaseType()) 884 ? PointerMode::PointerToMemberFunction 885 : PointerMode::PointerToDataMember; 886 PointerOptions PO = PointerOptions::None; // FIXME 887 // FIXME: Thread this ABI info through metadata. 888 PointerToMemberRepresentation PMR = PointerToMemberRepresentation::Unknown; 889 MemberPointerInfo MPI(ClassTI, PMR); 890 PointerRecord PR(PointeeTI, PK, PM, PO, Ty->getSizeInBits() / 8, MPI); 891 return TypeTable.writePointer(PR); 892 } 893 894 TypeIndex CodeViewDebug::lowerTypeModifier(const DIDerivedType *Ty) { 895 ModifierOptions Mods = ModifierOptions::None; 896 bool IsModifier = true; 897 const DIType *BaseTy = Ty; 898 while (IsModifier) { 899 assert(BaseTy); 900 // FIXME: Need to add DWARF tag for __unaligned. 901 switch (BaseTy->getTag()) { 902 case dwarf::DW_TAG_const_type: 903 Mods |= ModifierOptions::Const; 904 break; 905 case dwarf::DW_TAG_volatile_type: 906 Mods |= ModifierOptions::Volatile; 907 break; 908 default: 909 IsModifier = false; 910 break; 911 } 912 if (IsModifier) 913 BaseTy = cast<DIDerivedType>(BaseTy)->getBaseType().resolve(); 914 } 915 TypeIndex ModifiedTI = getTypeIndex(BaseTy); 916 ModifierRecord MR(ModifiedTI, Mods); 917 return TypeTable.writeModifier(MR); 918 } 919 920 TypeIndex CodeViewDebug::getTypeIndex(DITypeRef TypeRef) { 921 const DIType *Ty = TypeRef.resolve(); 922 923 // The null DIType is the void type. Don't try to hash it. 924 if (!Ty) 925 return TypeIndex::Void(); 926 927 // Check if we've already translated this type. 928 auto I = TypeIndices.find(Ty); 929 if (I != TypeIndices.end()) 930 return I->second; 931 932 TypeIndex TI = lowerType(Ty); 933 934 auto InsertResult = TypeIndices.insert({Ty, TI}); 935 (void)InsertResult; 936 assert(InsertResult.second && "DIType lowered twice"); 937 return TI; 938 } 939 940 void CodeViewDebug::emitLocalVariable(const LocalVariable &Var) { 941 // LocalSym record, see SymbolRecord.h for more info. 942 MCSymbol *LocalBegin = MMI->getContext().createTempSymbol(), 943 *LocalEnd = MMI->getContext().createTempSymbol(); 944 OS.AddComment("Record length"); 945 OS.emitAbsoluteSymbolDiff(LocalEnd, LocalBegin, 2); 946 OS.EmitLabel(LocalBegin); 947 948 OS.AddComment("Record kind: S_LOCAL"); 949 OS.EmitIntValue(unsigned(SymbolKind::S_LOCAL), 2); 950 951 LocalSymFlags Flags = LocalSymFlags::None; 952 if (Var.DIVar->isParameter()) 953 Flags |= LocalSymFlags::IsParameter; 954 if (Var.DefRanges.empty()) 955 Flags |= LocalSymFlags::IsOptimizedOut; 956 957 OS.AddComment("TypeIndex"); 958 TypeIndex TI = getTypeIndex(Var.DIVar->getType()); 959 OS.EmitIntValue(TI.getIndex(), 4); 960 OS.AddComment("Flags"); 961 OS.EmitIntValue(static_cast<uint16_t>(Flags), 2); 962 // Truncate the name so we won't overflow the record length field. 963 emitNullTerminatedSymbolName(OS, Var.DIVar->getName()); 964 OS.EmitLabel(LocalEnd); 965 966 // Calculate the on disk prefix of the appropriate def range record. The 967 // records and on disk formats are described in SymbolRecords.h. BytePrefix 968 // should be big enough to hold all forms without memory allocation. 969 SmallString<20> BytePrefix; 970 for (const LocalVarDefRange &DefRange : Var.DefRanges) { 971 BytePrefix.clear(); 972 // FIXME: Handle bitpieces. 973 if (DefRange.StructOffset != 0) 974 continue; 975 976 if (DefRange.InMemory) { 977 DefRangeRegisterRelSym Sym(DefRange.CVRegister, 0, DefRange.DataOffset, 0, 978 0, 0, ArrayRef<LocalVariableAddrGap>()); 979 ulittle16_t SymKind = ulittle16_t(S_DEFRANGE_REGISTER_REL); 980 BytePrefix += 981 StringRef(reinterpret_cast<const char *>(&SymKind), sizeof(SymKind)); 982 BytePrefix += 983 StringRef(reinterpret_cast<const char *>(&Sym.Header), 984 sizeof(Sym.Header) - sizeof(LocalVariableAddrRange)); 985 } else { 986 assert(DefRange.DataOffset == 0 && "unexpected offset into register"); 987 // Unclear what matters here. 988 DefRangeRegisterSym Sym(DefRange.CVRegister, 0, 0, 0, 0, 989 ArrayRef<LocalVariableAddrGap>()); 990 ulittle16_t SymKind = ulittle16_t(S_DEFRANGE_REGISTER); 991 BytePrefix += 992 StringRef(reinterpret_cast<const char *>(&SymKind), sizeof(SymKind)); 993 BytePrefix += 994 StringRef(reinterpret_cast<const char *>(&Sym.Header), 995 sizeof(Sym.Header) - sizeof(LocalVariableAddrRange)); 996 } 997 OS.EmitCVDefRangeDirective(DefRange.Ranges, BytePrefix); 998 } 999 } 1000 1001 void CodeViewDebug::endFunction(const MachineFunction *MF) { 1002 if (!Asm || !CurFn) // We haven't created any debug info for this function. 1003 return; 1004 1005 const Function *GV = MF->getFunction(); 1006 assert(FnDebugInfo.count(GV)); 1007 assert(CurFn == &FnDebugInfo[GV]); 1008 1009 collectVariableInfo(GV->getSubprogram()); 1010 1011 DebugHandlerBase::endFunction(MF); 1012 1013 // Don't emit anything if we don't have any line tables. 1014 if (!CurFn->HaveLineInfo) { 1015 FnDebugInfo.erase(GV); 1016 CurFn = nullptr; 1017 return; 1018 } 1019 1020 CurFn->End = Asm->getFunctionEnd(); 1021 1022 CurFn = nullptr; 1023 } 1024 1025 void CodeViewDebug::beginInstruction(const MachineInstr *MI) { 1026 DebugHandlerBase::beginInstruction(MI); 1027 1028 // Ignore DBG_VALUE locations and function prologue. 1029 if (!Asm || MI->isDebugValue() || MI->getFlag(MachineInstr::FrameSetup)) 1030 return; 1031 DebugLoc DL = MI->getDebugLoc(); 1032 if (DL == PrevInstLoc || !DL) 1033 return; 1034 maybeRecordLocation(DL, Asm->MF); 1035 } 1036