1 //===-- llvm/lib/CodeGen/AsmPrinter/CodeViewDebug.cpp --*- C++ -*--===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file contains support for writing Microsoft CodeView debug info.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "CodeViewDebug.h"
15 #include "llvm/DebugInfo/CodeView/CodeView.h"
16 #include "llvm/DebugInfo/CodeView/Line.h"
17 #include "llvm/DebugInfo/CodeView/SymbolRecord.h"
18 #include "llvm/DebugInfo/CodeView/TypeDumper.h"
19 #include "llvm/DebugInfo/CodeView/TypeIndex.h"
20 #include "llvm/DebugInfo/CodeView/TypeRecord.h"
21 #include "llvm/MC/MCExpr.h"
22 #include "llvm/MC/MCSectionCOFF.h"
23 #include "llvm/MC/MCSymbol.h"
24 #include "llvm/Support/COFF.h"
25 #include "llvm/Support/ScopedPrinter.h"
26 #include "llvm/Target/TargetSubtargetInfo.h"
27 #include "llvm/Target/TargetRegisterInfo.h"
28 #include "llvm/Target/TargetFrameLowering.h"
29 
30 using namespace llvm;
31 using namespace llvm::codeview;
32 
33 CodeViewDebug::CodeViewDebug(AsmPrinter *AP)
34     : DebugHandlerBase(AP), OS(*Asm->OutStreamer), CurFn(nullptr) {
35   // If module doesn't have named metadata anchors or COFF debug section
36   // is not available, skip any debug info related stuff.
37   if (!MMI->getModule()->getNamedMetadata("llvm.dbg.cu") ||
38       !AP->getObjFileLowering().getCOFFDebugSymbolsSection()) {
39     Asm = nullptr;
40     return;
41   }
42 
43   // Tell MMI that we have debug info.
44   MMI->setDebugInfoAvailability(true);
45 }
46 
47 StringRef CodeViewDebug::getFullFilepath(const DIFile *File) {
48   std::string &Filepath = FileToFilepathMap[File];
49   if (!Filepath.empty())
50     return Filepath;
51 
52   StringRef Dir = File->getDirectory(), Filename = File->getFilename();
53 
54   // Clang emits directory and relative filename info into the IR, but CodeView
55   // operates on full paths.  We could change Clang to emit full paths too, but
56   // that would increase the IR size and probably not needed for other users.
57   // For now, just concatenate and canonicalize the path here.
58   if (Filename.find(':') == 1)
59     Filepath = Filename;
60   else
61     Filepath = (Dir + "\\" + Filename).str();
62 
63   // Canonicalize the path.  We have to do it textually because we may no longer
64   // have access the file in the filesystem.
65   // First, replace all slashes with backslashes.
66   std::replace(Filepath.begin(), Filepath.end(), '/', '\\');
67 
68   // Remove all "\.\" with "\".
69   size_t Cursor = 0;
70   while ((Cursor = Filepath.find("\\.\\", Cursor)) != std::string::npos)
71     Filepath.erase(Cursor, 2);
72 
73   // Replace all "\XXX\..\" with "\".  Don't try too hard though as the original
74   // path should be well-formatted, e.g. start with a drive letter, etc.
75   Cursor = 0;
76   while ((Cursor = Filepath.find("\\..\\", Cursor)) != std::string::npos) {
77     // Something's wrong if the path starts with "\..\", abort.
78     if (Cursor == 0)
79       break;
80 
81     size_t PrevSlash = Filepath.rfind('\\', Cursor - 1);
82     if (PrevSlash == std::string::npos)
83       // Something's wrong, abort.
84       break;
85 
86     Filepath.erase(PrevSlash, Cursor + 3 - PrevSlash);
87     // The next ".." might be following the one we've just erased.
88     Cursor = PrevSlash;
89   }
90 
91   // Remove all duplicate backslashes.
92   Cursor = 0;
93   while ((Cursor = Filepath.find("\\\\", Cursor)) != std::string::npos)
94     Filepath.erase(Cursor, 1);
95 
96   return Filepath;
97 }
98 
99 unsigned CodeViewDebug::maybeRecordFile(const DIFile *F) {
100   unsigned NextId = FileIdMap.size() + 1;
101   auto Insertion = FileIdMap.insert(std::make_pair(F, NextId));
102   if (Insertion.second) {
103     // We have to compute the full filepath and emit a .cv_file directive.
104     StringRef FullPath = getFullFilepath(F);
105     NextId = OS.EmitCVFileDirective(NextId, FullPath);
106     assert(NextId == FileIdMap.size() && ".cv_file directive failed");
107   }
108   return Insertion.first->second;
109 }
110 
111 CodeViewDebug::InlineSite &
112 CodeViewDebug::getInlineSite(const DILocation *InlinedAt,
113                              const DISubprogram *Inlinee) {
114   auto SiteInsertion = CurFn->InlineSites.insert({InlinedAt, InlineSite()});
115   InlineSite *Site = &SiteInsertion.first->second;
116   if (SiteInsertion.second) {
117     Site->SiteFuncId = NextFuncId++;
118     Site->Inlinee = Inlinee;
119     InlinedSubprograms.insert(Inlinee);
120     recordFuncIdForSubprogram(Inlinee);
121   }
122   return *Site;
123 }
124 
125 TypeIndex CodeViewDebug::getGenericFunctionTypeIndex() {
126   if (VoidFnTyIdx.getIndex() != 0)
127     return VoidFnTyIdx;
128 
129   ArrayRef<TypeIndex> NoArgs;
130   ArgListRecord ArgListRec(TypeRecordKind::ArgList, NoArgs);
131   TypeIndex ArgListIndex = TypeTable.writeArgList(ArgListRec);
132 
133   ProcedureRecord Procedure(TypeIndex::Void(), CallingConvention::NearC,
134                             FunctionOptions::None, 0, ArgListIndex);
135   VoidFnTyIdx = TypeTable.writeProcedure(Procedure);
136   return VoidFnTyIdx;
137 }
138 
139 void CodeViewDebug::recordFuncIdForSubprogram(const DISubprogram *SP) {
140   TypeIndex ParentScope = TypeIndex(0);
141   StringRef DisplayName = SP->getDisplayName();
142   FuncIdRecord FuncId(ParentScope, getGenericFunctionTypeIndex(), DisplayName);
143   TypeIndex TI = TypeTable.writeFuncId(FuncId);
144   TypeIndices[SP] = TI;
145 }
146 
147 void CodeViewDebug::recordLocalVariable(LocalVariable &&Var,
148                                         const DILocation *InlinedAt) {
149   if (InlinedAt) {
150     // This variable was inlined. Associate it with the InlineSite.
151     const DISubprogram *Inlinee = Var.DIVar->getScope()->getSubprogram();
152     InlineSite &Site = getInlineSite(InlinedAt, Inlinee);
153     Site.InlinedLocals.emplace_back(Var);
154   } else {
155     // This variable goes in the main ProcSym.
156     CurFn->Locals.emplace_back(Var);
157   }
158 }
159 
160 static void addLocIfNotPresent(SmallVectorImpl<const DILocation *> &Locs,
161                                const DILocation *Loc) {
162   auto B = Locs.begin(), E = Locs.end();
163   if (std::find(B, E, Loc) == E)
164     Locs.push_back(Loc);
165 }
166 
167 void CodeViewDebug::maybeRecordLocation(DebugLoc DL,
168                                         const MachineFunction *MF) {
169   // Skip this instruction if it has the same location as the previous one.
170   if (DL == CurFn->LastLoc)
171     return;
172 
173   const DIScope *Scope = DL.get()->getScope();
174   if (!Scope)
175     return;
176 
177   // Skip this line if it is longer than the maximum we can record.
178   LineInfo LI(DL.getLine(), DL.getLine(), /*IsStatement=*/true);
179   if (LI.getStartLine() != DL.getLine() || LI.isAlwaysStepInto() ||
180       LI.isNeverStepInto())
181     return;
182 
183   ColumnInfo CI(DL.getCol(), /*EndColumn=*/0);
184   if (CI.getStartColumn() != DL.getCol())
185     return;
186 
187   if (!CurFn->HaveLineInfo)
188     CurFn->HaveLineInfo = true;
189   unsigned FileId = 0;
190   if (CurFn->LastLoc.get() && CurFn->LastLoc->getFile() == DL->getFile())
191     FileId = CurFn->LastFileId;
192   else
193     FileId = CurFn->LastFileId = maybeRecordFile(DL->getFile());
194   CurFn->LastLoc = DL;
195 
196   unsigned FuncId = CurFn->FuncId;
197   if (const DILocation *SiteLoc = DL->getInlinedAt()) {
198     const DILocation *Loc = DL.get();
199 
200     // If this location was actually inlined from somewhere else, give it the ID
201     // of the inline call site.
202     FuncId =
203         getInlineSite(SiteLoc, Loc->getScope()->getSubprogram()).SiteFuncId;
204 
205     // Ensure we have links in the tree of inline call sites.
206     bool FirstLoc = true;
207     while ((SiteLoc = Loc->getInlinedAt())) {
208       InlineSite &Site =
209           getInlineSite(SiteLoc, Loc->getScope()->getSubprogram());
210       if (!FirstLoc)
211         addLocIfNotPresent(Site.ChildSites, Loc);
212       FirstLoc = false;
213       Loc = SiteLoc;
214     }
215     addLocIfNotPresent(CurFn->ChildSites, Loc);
216   }
217 
218   OS.EmitCVLocDirective(FuncId, FileId, DL.getLine(), DL.getCol(),
219                         /*PrologueEnd=*/false,
220                         /*IsStmt=*/false, DL->getFilename());
221 }
222 
223 void CodeViewDebug::emitCodeViewMagicVersion() {
224   OS.EmitValueToAlignment(4);
225   OS.AddComment("Debug section magic");
226   OS.EmitIntValue(COFF::DEBUG_SECTION_MAGIC, 4);
227 }
228 
229 void CodeViewDebug::endModule() {
230   if (FnDebugInfo.empty())
231     return;
232 
233   assert(Asm != nullptr);
234 
235   // The COFF .debug$S section consists of several subsections, each starting
236   // with a 4-byte control code (e.g. 0xF1, 0xF2, etc) and then a 4-byte length
237   // of the payload followed by the payload itself.  The subsections are 4-byte
238   // aligned.
239 
240   // Make a subsection for all the inlined subprograms.
241   emitInlineeLinesSubsection();
242 
243   // Emit per-function debug information.
244   for (auto &P : FnDebugInfo)
245     emitDebugInfoForFunction(P.first, P.second);
246 
247   // Switch back to the generic .debug$S section after potentially processing
248   // comdat symbol sections.
249   switchToDebugSectionForSymbol(nullptr);
250 
251   // This subsection holds a file index to offset in string table table.
252   OS.AddComment("File index to string table offset subsection");
253   OS.EmitCVFileChecksumsDirective();
254 
255   // This subsection holds the string table.
256   OS.AddComment("String table");
257   OS.EmitCVStringTableDirective();
258 
259   // Emit type information last, so that any types we translate while emitting
260   // function info are included.
261   emitTypeInformation();
262 
263   clear();
264 }
265 
266 static void emitNullTerminatedSymbolName(MCStreamer &OS, StringRef S) {
267   // Microsoft's linker seems to have trouble with symbol names longer than
268   // 0xffd8 bytes.
269   S = S.substr(0, 0xffd8);
270   SmallString<32> NullTerminatedString(S);
271   NullTerminatedString.push_back('\0');
272   OS.EmitBytes(NullTerminatedString);
273 }
274 
275 void CodeViewDebug::emitTypeInformation() {
276   // Do nothing if we have no debug info or if no non-trivial types were emitted
277   // to TypeTable during codegen.
278   NamedMDNode *CU_Nodes =
279       MMI->getModule()->getNamedMetadata("llvm.dbg.cu");
280   if (!CU_Nodes)
281     return;
282   if (TypeTable.empty())
283     return;
284 
285   // Start the .debug$T section with 0x4.
286   OS.SwitchSection(Asm->getObjFileLowering().getCOFFDebugTypesSection());
287   emitCodeViewMagicVersion();
288 
289   SmallString<8> CommentPrefix;
290   if (OS.isVerboseAsm()) {
291     CommentPrefix += '\t';
292     CommentPrefix += Asm->MAI->getCommentString();
293     CommentPrefix += ' ';
294   }
295 
296   CVTypeDumper CVTD(nullptr, /*PrintRecordBytes=*/false);
297   TypeTable.ForEachRecord(
298       [&](TypeIndex Index, StringRef Record) {
299         if (OS.isVerboseAsm()) {
300           // Emit a block comment describing the type record for readability.
301           SmallString<512> CommentBlock;
302           raw_svector_ostream CommentOS(CommentBlock);
303           ScopedPrinter SP(CommentOS);
304           SP.setPrefix(CommentPrefix);
305           CVTD.setPrinter(&SP);
306           bool DumpSuccess =
307               CVTD.dump({Record.bytes_begin(), Record.bytes_end()});
308           (void)DumpSuccess;
309           assert(DumpSuccess && "produced malformed type record");
310           // emitRawComment will insert its own tab and comment string before
311           // the first line, so strip off our first one. It also prints its own
312           // newline.
313           OS.emitRawComment(
314               CommentOS.str().drop_front(CommentPrefix.size() - 1).rtrim());
315         }
316         OS.EmitBinaryData(Record);
317       });
318 }
319 
320 void CodeViewDebug::emitInlineeLinesSubsection() {
321   if (InlinedSubprograms.empty())
322     return;
323 
324   // Use the generic .debug$S section.
325   switchToDebugSectionForSymbol(nullptr);
326 
327   MCSymbol *InlineBegin = MMI->getContext().createTempSymbol(),
328            *InlineEnd = MMI->getContext().createTempSymbol();
329 
330   OS.AddComment("Inlinee lines subsection");
331   OS.EmitIntValue(unsigned(ModuleSubstreamKind::InlineeLines), 4);
332   OS.AddComment("Subsection size");
333   OS.emitAbsoluteSymbolDiff(InlineEnd, InlineBegin, 4);
334   OS.EmitLabel(InlineBegin);
335 
336   // We don't provide any extra file info.
337   // FIXME: Find out if debuggers use this info.
338   OS.AddComment("Inlinee lines signature");
339   OS.EmitIntValue(unsigned(InlineeLinesSignature::Normal), 4);
340 
341   for (const DISubprogram *SP : InlinedSubprograms) {
342     assert(TypeIndices.count(SP));
343     TypeIndex InlineeIdx = TypeIndices[SP];
344 
345     OS.AddBlankLine();
346     unsigned FileId = maybeRecordFile(SP->getFile());
347     OS.AddComment("Inlined function " + SP->getDisplayName() + " starts at " +
348                   SP->getFilename() + Twine(':') + Twine(SP->getLine()));
349     OS.AddBlankLine();
350     // The filechecksum table uses 8 byte entries for now, and file ids start at
351     // 1.
352     unsigned FileOffset = (FileId - 1) * 8;
353     OS.AddComment("Type index of inlined function");
354     OS.EmitIntValue(InlineeIdx.getIndex(), 4);
355     OS.AddComment("Offset into filechecksum table");
356     OS.EmitIntValue(FileOffset, 4);
357     OS.AddComment("Starting line number");
358     OS.EmitIntValue(SP->getLine(), 4);
359   }
360 
361   OS.EmitLabel(InlineEnd);
362 }
363 
364 void CodeViewDebug::collectInlineSiteChildren(
365     SmallVectorImpl<unsigned> &Children, const FunctionInfo &FI,
366     const InlineSite &Site) {
367   for (const DILocation *ChildSiteLoc : Site.ChildSites) {
368     auto I = FI.InlineSites.find(ChildSiteLoc);
369     const InlineSite &ChildSite = I->second;
370     Children.push_back(ChildSite.SiteFuncId);
371     collectInlineSiteChildren(Children, FI, ChildSite);
372   }
373 }
374 
375 void CodeViewDebug::emitInlinedCallSite(const FunctionInfo &FI,
376                                         const DILocation *InlinedAt,
377                                         const InlineSite &Site) {
378   MCSymbol *InlineBegin = MMI->getContext().createTempSymbol(),
379            *InlineEnd = MMI->getContext().createTempSymbol();
380 
381   assert(TypeIndices.count(Site.Inlinee));
382   TypeIndex InlineeIdx = TypeIndices[Site.Inlinee];
383 
384   // SymbolRecord
385   OS.AddComment("Record length");
386   OS.emitAbsoluteSymbolDiff(InlineEnd, InlineBegin, 2);   // RecordLength
387   OS.EmitLabel(InlineBegin);
388   OS.AddComment("Record kind: S_INLINESITE");
389   OS.EmitIntValue(SymbolKind::S_INLINESITE, 2); // RecordKind
390 
391   OS.AddComment("PtrParent");
392   OS.EmitIntValue(0, 4);
393   OS.AddComment("PtrEnd");
394   OS.EmitIntValue(0, 4);
395   OS.AddComment("Inlinee type index");
396   OS.EmitIntValue(InlineeIdx.getIndex(), 4);
397 
398   unsigned FileId = maybeRecordFile(Site.Inlinee->getFile());
399   unsigned StartLineNum = Site.Inlinee->getLine();
400   SmallVector<unsigned, 3> SecondaryFuncIds;
401   collectInlineSiteChildren(SecondaryFuncIds, FI, Site);
402 
403   OS.EmitCVInlineLinetableDirective(Site.SiteFuncId, FileId, StartLineNum,
404                                     FI.Begin, FI.End, SecondaryFuncIds);
405 
406   OS.EmitLabel(InlineEnd);
407 
408   for (const LocalVariable &Var : Site.InlinedLocals)
409     emitLocalVariable(Var);
410 
411   // Recurse on child inlined call sites before closing the scope.
412   for (const DILocation *ChildSite : Site.ChildSites) {
413     auto I = FI.InlineSites.find(ChildSite);
414     assert(I != FI.InlineSites.end() &&
415            "child site not in function inline site map");
416     emitInlinedCallSite(FI, ChildSite, I->second);
417   }
418 
419   // Close the scope.
420   OS.AddComment("Record length");
421   OS.EmitIntValue(2, 2);                                  // RecordLength
422   OS.AddComment("Record kind: S_INLINESITE_END");
423   OS.EmitIntValue(SymbolKind::S_INLINESITE_END, 2); // RecordKind
424 }
425 
426 void CodeViewDebug::switchToDebugSectionForSymbol(const MCSymbol *GVSym) {
427   // If we have a symbol, it may be in a section that is COMDAT. If so, find the
428   // comdat key. A section may be comdat because of -ffunction-sections or
429   // because it is comdat in the IR.
430   MCSectionCOFF *GVSec =
431       GVSym ? dyn_cast<MCSectionCOFF>(&GVSym->getSection()) : nullptr;
432   const MCSymbol *KeySym = GVSec ? GVSec->getCOMDATSymbol() : nullptr;
433 
434   MCSectionCOFF *DebugSec = cast<MCSectionCOFF>(
435       Asm->getObjFileLowering().getCOFFDebugSymbolsSection());
436   DebugSec = OS.getContext().getAssociativeCOFFSection(DebugSec, KeySym);
437 
438   OS.SwitchSection(DebugSec);
439 
440   // Emit the magic version number if this is the first time we've switched to
441   // this section.
442   if (ComdatDebugSections.insert(DebugSec).second)
443     emitCodeViewMagicVersion();
444 }
445 
446 void CodeViewDebug::emitDebugInfoForFunction(const Function *GV,
447                                              FunctionInfo &FI) {
448   // For each function there is a separate subsection
449   // which holds the PC to file:line table.
450   const MCSymbol *Fn = Asm->getSymbol(GV);
451   assert(Fn);
452 
453   // Switch to the to a comdat section, if appropriate.
454   switchToDebugSectionForSymbol(Fn);
455 
456   StringRef FuncName;
457   if (auto *SP = GV->getSubprogram())
458     FuncName = SP->getDisplayName();
459 
460   // If our DISubprogram name is empty, use the mangled name.
461   if (FuncName.empty())
462     FuncName = GlobalValue::getRealLinkageName(GV->getName());
463 
464   // Emit a symbol subsection, required by VS2012+ to find function boundaries.
465   MCSymbol *SymbolsBegin = MMI->getContext().createTempSymbol(),
466            *SymbolsEnd = MMI->getContext().createTempSymbol();
467   OS.AddComment("Symbol subsection for " + Twine(FuncName));
468   OS.EmitIntValue(unsigned(ModuleSubstreamKind::Symbols), 4);
469   OS.AddComment("Subsection size");
470   OS.emitAbsoluteSymbolDiff(SymbolsEnd, SymbolsBegin, 4);
471   OS.EmitLabel(SymbolsBegin);
472   {
473     MCSymbol *ProcRecordBegin = MMI->getContext().createTempSymbol(),
474              *ProcRecordEnd = MMI->getContext().createTempSymbol();
475     OS.AddComment("Record length");
476     OS.emitAbsoluteSymbolDiff(ProcRecordEnd, ProcRecordBegin, 2);
477     OS.EmitLabel(ProcRecordBegin);
478 
479     OS.AddComment("Record kind: S_GPROC32_ID");
480     OS.EmitIntValue(unsigned(SymbolKind::S_GPROC32_ID), 2);
481 
482     // These fields are filled in by tools like CVPACK which run after the fact.
483     OS.AddComment("PtrParent");
484     OS.EmitIntValue(0, 4);
485     OS.AddComment("PtrEnd");
486     OS.EmitIntValue(0, 4);
487     OS.AddComment("PtrNext");
488     OS.EmitIntValue(0, 4);
489     // This is the important bit that tells the debugger where the function
490     // code is located and what's its size:
491     OS.AddComment("Code size");
492     OS.emitAbsoluteSymbolDiff(FI.End, Fn, 4);
493     OS.AddComment("Offset after prologue");
494     OS.EmitIntValue(0, 4);
495     OS.AddComment("Offset before epilogue");
496     OS.EmitIntValue(0, 4);
497     OS.AddComment("Function type index");
498     OS.EmitIntValue(0, 4);
499     OS.AddComment("Function section relative address");
500     OS.EmitCOFFSecRel32(Fn);
501     OS.AddComment("Function section index");
502     OS.EmitCOFFSectionIndex(Fn);
503     OS.AddComment("Flags");
504     OS.EmitIntValue(0, 1);
505     // Emit the function display name as a null-terminated string.
506     OS.AddComment("Function name");
507     // Truncate the name so we won't overflow the record length field.
508     emitNullTerminatedSymbolName(OS, FuncName);
509     OS.EmitLabel(ProcRecordEnd);
510 
511     for (const LocalVariable &Var : FI.Locals)
512       emitLocalVariable(Var);
513 
514     // Emit inlined call site information. Only emit functions inlined directly
515     // into the parent function. We'll emit the other sites recursively as part
516     // of their parent inline site.
517     for (const DILocation *InlinedAt : FI.ChildSites) {
518       auto I = FI.InlineSites.find(InlinedAt);
519       assert(I != FI.InlineSites.end() &&
520              "child site not in function inline site map");
521       emitInlinedCallSite(FI, InlinedAt, I->second);
522     }
523 
524     // We're done with this function.
525     OS.AddComment("Record length");
526     OS.EmitIntValue(0x0002, 2);
527     OS.AddComment("Record kind: S_PROC_ID_END");
528     OS.EmitIntValue(unsigned(SymbolKind::S_PROC_ID_END), 2);
529   }
530   OS.EmitLabel(SymbolsEnd);
531   // Every subsection must be aligned to a 4-byte boundary.
532   OS.EmitValueToAlignment(4);
533 
534   // We have an assembler directive that takes care of the whole line table.
535   OS.EmitCVLinetableDirective(FI.FuncId, Fn, FI.End);
536 }
537 
538 CodeViewDebug::LocalVarDefRange
539 CodeViewDebug::createDefRangeMem(uint16_t CVRegister, int Offset) {
540   LocalVarDefRange DR;
541   DR.InMemory = -1;
542   DR.DataOffset = Offset;
543   assert(DR.DataOffset == Offset && "truncation");
544   DR.StructOffset = 0;
545   DR.CVRegister = CVRegister;
546   return DR;
547 }
548 
549 CodeViewDebug::LocalVarDefRange
550 CodeViewDebug::createDefRangeReg(uint16_t CVRegister) {
551   LocalVarDefRange DR;
552   DR.InMemory = 0;
553   DR.DataOffset = 0;
554   DR.StructOffset = 0;
555   DR.CVRegister = CVRegister;
556   return DR;
557 }
558 
559 void CodeViewDebug::collectVariableInfoFromMMITable(
560     DenseSet<InlinedVariable> &Processed) {
561   const TargetSubtargetInfo &TSI = Asm->MF->getSubtarget();
562   const TargetFrameLowering *TFI = TSI.getFrameLowering();
563   const TargetRegisterInfo *TRI = TSI.getRegisterInfo();
564 
565   for (const MachineModuleInfo::VariableDbgInfo &VI :
566        MMI->getVariableDbgInfo()) {
567     if (!VI.Var)
568       continue;
569     assert(VI.Var->isValidLocationForIntrinsic(VI.Loc) &&
570            "Expected inlined-at fields to agree");
571 
572     Processed.insert(InlinedVariable(VI.Var, VI.Loc->getInlinedAt()));
573     LexicalScope *Scope = LScopes.findLexicalScope(VI.Loc);
574 
575     // If variable scope is not found then skip this variable.
576     if (!Scope)
577       continue;
578 
579     // Get the frame register used and the offset.
580     unsigned FrameReg = 0;
581     int FrameOffset = TFI->getFrameIndexReference(*Asm->MF, VI.Slot, FrameReg);
582     uint16_t CVReg = TRI->getCodeViewRegNum(FrameReg);
583 
584     // Calculate the label ranges.
585     LocalVarDefRange DefRange = createDefRangeMem(CVReg, FrameOffset);
586     for (const InsnRange &Range : Scope->getRanges()) {
587       const MCSymbol *Begin = getLabelBeforeInsn(Range.first);
588       const MCSymbol *End = getLabelAfterInsn(Range.second);
589       End = End ? End : Asm->getFunctionEnd();
590       DefRange.Ranges.emplace_back(Begin, End);
591     }
592 
593     LocalVariable Var;
594     Var.DIVar = VI.Var;
595     Var.DefRanges.emplace_back(std::move(DefRange));
596     recordLocalVariable(std::move(Var), VI.Loc->getInlinedAt());
597   }
598 }
599 
600 void CodeViewDebug::collectVariableInfo(const DISubprogram *SP) {
601   DenseSet<InlinedVariable> Processed;
602   // Grab the variable info that was squirreled away in the MMI side-table.
603   collectVariableInfoFromMMITable(Processed);
604 
605   const TargetRegisterInfo *TRI = Asm->MF->getSubtarget().getRegisterInfo();
606 
607   for (const auto &I : DbgValues) {
608     InlinedVariable IV = I.first;
609     if (Processed.count(IV))
610       continue;
611     const DILocalVariable *DIVar = IV.first;
612     const DILocation *InlinedAt = IV.second;
613 
614     // Instruction ranges, specifying where IV is accessible.
615     const auto &Ranges = I.second;
616 
617     LexicalScope *Scope = nullptr;
618     if (InlinedAt)
619       Scope = LScopes.findInlinedScope(DIVar->getScope(), InlinedAt);
620     else
621       Scope = LScopes.findLexicalScope(DIVar->getScope());
622     // If variable scope is not found then skip this variable.
623     if (!Scope)
624       continue;
625 
626     LocalVariable Var;
627     Var.DIVar = DIVar;
628 
629     // Calculate the definition ranges.
630     for (auto I = Ranges.begin(), E = Ranges.end(); I != E; ++I) {
631       const InsnRange &Range = *I;
632       const MachineInstr *DVInst = Range.first;
633       assert(DVInst->isDebugValue() && "Invalid History entry");
634       const DIExpression *DIExpr = DVInst->getDebugExpression();
635 
636       // Bail if there is a complex DWARF expression for now.
637       if (DIExpr && DIExpr->getNumElements() > 0)
638         continue;
639 
640       // Bail if operand 0 is not a valid register. This means the variable is a
641       // simple constant, or is described by a complex expression.
642       // FIXME: Find a way to represent constant variables, since they are
643       // relatively common.
644       unsigned Reg =
645           DVInst->getOperand(0).isReg() ? DVInst->getOperand(0).getReg() : 0;
646       if (Reg == 0)
647         continue;
648 
649       // Handle the two cases we can handle: indirect in memory and in register.
650       bool IsIndirect = DVInst->getOperand(1).isImm();
651       unsigned CVReg = TRI->getCodeViewRegNum(DVInst->getOperand(0).getReg());
652       {
653         LocalVarDefRange DefRange;
654         if (IsIndirect) {
655           int64_t Offset = DVInst->getOperand(1).getImm();
656           DefRange = createDefRangeMem(CVReg, Offset);
657         } else {
658           DefRange = createDefRangeReg(CVReg);
659         }
660         if (Var.DefRanges.empty() ||
661             Var.DefRanges.back().isDifferentLocation(DefRange)) {
662           Var.DefRanges.emplace_back(std::move(DefRange));
663         }
664       }
665 
666       // Compute the label range.
667       const MCSymbol *Begin = getLabelBeforeInsn(Range.first);
668       const MCSymbol *End = getLabelAfterInsn(Range.second);
669       if (!End) {
670         if (std::next(I) != E)
671           End = getLabelBeforeInsn(std::next(I)->first);
672         else
673           End = Asm->getFunctionEnd();
674       }
675 
676       // If the last range end is our begin, just extend the last range.
677       // Otherwise make a new range.
678       SmallVectorImpl<std::pair<const MCSymbol *, const MCSymbol *>> &Ranges =
679           Var.DefRanges.back().Ranges;
680       if (!Ranges.empty() && Ranges.back().second == Begin)
681         Ranges.back().second = End;
682       else
683         Ranges.emplace_back(Begin, End);
684 
685       // FIXME: Do more range combining.
686     }
687 
688     recordLocalVariable(std::move(Var), InlinedAt);
689   }
690 }
691 
692 void CodeViewDebug::beginFunction(const MachineFunction *MF) {
693   assert(!CurFn && "Can't process two functions at once!");
694 
695   if (!Asm || !MMI->hasDebugInfo())
696     return;
697 
698   DebugHandlerBase::beginFunction(MF);
699 
700   const Function *GV = MF->getFunction();
701   assert(FnDebugInfo.count(GV) == false);
702   CurFn = &FnDebugInfo[GV];
703   CurFn->FuncId = NextFuncId++;
704   CurFn->Begin = Asm->getFunctionBegin();
705 
706   // Find the end of the function prolog.  First known non-DBG_VALUE and
707   // non-frame setup location marks the beginning of the function body.
708   // FIXME: is there a simpler a way to do this? Can we just search
709   // for the first instruction of the function, not the last of the prolog?
710   DebugLoc PrologEndLoc;
711   bool EmptyPrologue = true;
712   for (const auto &MBB : *MF) {
713     for (const auto &MI : MBB) {
714       if (!MI.isDebugValue() && !MI.getFlag(MachineInstr::FrameSetup) &&
715           MI.getDebugLoc()) {
716         PrologEndLoc = MI.getDebugLoc();
717         break;
718       } else if (!MI.isDebugValue()) {
719         EmptyPrologue = false;
720       }
721     }
722   }
723 
724   // Record beginning of function if we have a non-empty prologue.
725   if (PrologEndLoc && !EmptyPrologue) {
726     DebugLoc FnStartDL = PrologEndLoc.getFnDebugLoc();
727     maybeRecordLocation(FnStartDL, MF);
728   }
729 }
730 
731 TypeIndex CodeViewDebug::lowerType(const DIType *Ty) {
732   // Generic dispatch for lowering an unknown type.
733   switch (Ty->getTag()) {
734   case dwarf::DW_TAG_base_type:
735     return lowerTypeBasic(cast<DIBasicType>(Ty));
736   case dwarf::DW_TAG_pointer_type:
737   case dwarf::DW_TAG_reference_type:
738   case dwarf::DW_TAG_rvalue_reference_type:
739     return lowerTypePointer(cast<DIDerivedType>(Ty));
740   case dwarf::DW_TAG_ptr_to_member_type:
741     return lowerTypeMemberPointer(cast<DIDerivedType>(Ty));
742   case dwarf::DW_TAG_const_type:
743   case dwarf::DW_TAG_volatile_type:
744     return lowerTypeModifier(cast<DIDerivedType>(Ty));
745   default:
746     // Use the null type index.
747     return TypeIndex();
748   }
749 }
750 
751 TypeIndex CodeViewDebug::lowerTypeBasic(const DIBasicType *Ty) {
752   TypeIndex Index;
753   dwarf::TypeKind Kind;
754   uint32_t ByteSize;
755 
756   Kind = static_cast<dwarf::TypeKind>(Ty->getEncoding());
757   ByteSize = Ty->getSizeInBits() >> 3;
758 
759   SimpleTypeKind STK = SimpleTypeKind::None;
760   switch (Kind) {
761   case dwarf::DW_ATE_address:
762     // FIXME: Translate
763     break;
764   case dwarf::DW_ATE_boolean:
765     switch (ByteSize) {
766     case 1: STK = SimpleTypeKind::Boolean8;  break;
767     case 2: STK = SimpleTypeKind::Boolean16; break;
768     case 4: STK = SimpleTypeKind::Boolean32; break;
769     case 8: STK = SimpleTypeKind::Boolean64; break;
770     }
771     break;
772   case dwarf::DW_ATE_complex_float:
773     switch (ByteSize) {
774     case 4:  STK = SimpleTypeKind::Complex32;  break;
775     case 8:  STK = SimpleTypeKind::Complex64;  break;
776     case 10: STK = SimpleTypeKind::Complex80;  break;
777     case 16: STK = SimpleTypeKind::Complex128; break;
778     }
779     break;
780   case dwarf::DW_ATE_float:
781     switch (ByteSize) {
782     case 4:  STK = SimpleTypeKind::Float32;  break;
783     case 6:  STK = SimpleTypeKind::Float48;  break;
784     case 8:  STK = SimpleTypeKind::Float64;  break;
785     case 10: STK = SimpleTypeKind::Float80;  break;
786     case 16: STK = SimpleTypeKind::Float128; break;
787     }
788     break;
789   case dwarf::DW_ATE_signed:
790     switch (ByteSize) {
791     case 1: STK = SimpleTypeKind::SByte;      break;
792     case 2: STK = SimpleTypeKind::Int16Short; break;
793     case 4: STK = SimpleTypeKind::Int32;      break;
794     case 8: STK = SimpleTypeKind::Int64;      break;
795     }
796     break;
797   case dwarf::DW_ATE_unsigned:
798     switch (ByteSize) {
799     case 1: STK = SimpleTypeKind::Byte;        break;
800     case 2: STK = SimpleTypeKind::UInt16Short; break;
801     case 4: STK = SimpleTypeKind::UInt32;      break;
802     case 8: STK = SimpleTypeKind::UInt64;      break;
803     }
804     break;
805   case dwarf::DW_ATE_UTF:
806     switch (ByteSize) {
807     case 2: STK = SimpleTypeKind::Character16; break;
808     case 4: STK = SimpleTypeKind::Character32; break;
809     }
810     break;
811   case dwarf::DW_ATE_signed_char:
812     if (ByteSize == 1)
813       STK = SimpleTypeKind::SignedCharacter;
814     break;
815   case dwarf::DW_ATE_unsigned_char:
816     if (ByteSize == 1)
817       STK = SimpleTypeKind::UnsignedCharacter;
818     break;
819   default:
820     break;
821   }
822 
823   // Apply some fixups based on the source-level type name.
824   if (STK == SimpleTypeKind::Int32 && Ty->getName() == "long int")
825     STK = SimpleTypeKind::Int32Long;
826   if (STK == SimpleTypeKind::UInt32 && Ty->getName() == "long unsigned int")
827     STK = SimpleTypeKind::UInt32Long;
828   if ((STK == SimpleTypeKind::Int16Short ||
829        STK == SimpleTypeKind::UInt16Short) &&
830       Ty->getName() == "wchar_t")
831     STK = SimpleTypeKind::WideCharacter;
832   if ((STK == SimpleTypeKind::SignedCharacter ||
833        STK == SimpleTypeKind::UnsignedCharacter) &&
834       Ty->getName() == "char")
835     STK = SimpleTypeKind::NarrowCharacter;
836 
837   return TypeIndex(STK);
838 }
839 
840 TypeIndex CodeViewDebug::lowerTypePointer(const DIDerivedType *Ty) {
841   TypeIndex PointeeTI = getTypeIndex(Ty->getBaseType());
842 
843   // Pointers to simple types can use SimpleTypeMode, rather than having a
844   // dedicated pointer type record.
845   if (PointeeTI.isSimple() &&
846       PointeeTI.getSimpleMode() == SimpleTypeMode::Direct &&
847       Ty->getTag() == dwarf::DW_TAG_pointer_type) {
848     SimpleTypeMode Mode = Ty->getSizeInBits() == 64
849                               ? SimpleTypeMode::NearPointer64
850                               : SimpleTypeMode::NearPointer32;
851     return TypeIndex(PointeeTI.getSimpleKind(), Mode);
852   }
853 
854   PointerKind PK =
855       Ty->getSizeInBits() == 64 ? PointerKind::Near64 : PointerKind::Near32;
856   PointerMode PM = PointerMode::Pointer;
857   switch (Ty->getTag()) {
858   default: llvm_unreachable("not a pointer tag type");
859   case dwarf::DW_TAG_pointer_type:
860     PM = PointerMode::Pointer;
861     break;
862   case dwarf::DW_TAG_reference_type:
863     PM = PointerMode::LValueReference;
864     break;
865   case dwarf::DW_TAG_rvalue_reference_type:
866     PM = PointerMode::RValueReference;
867     break;
868   }
869   // FIXME: MSVC folds qualifiers into PointerOptions in the context of a method
870   // 'this' pointer, but not normal contexts. Figure out what we're supposed to
871   // do.
872   PointerOptions PO = PointerOptions::None;
873   PointerRecord PR(PointeeTI, PK, PM, PO, Ty->getSizeInBits() / 8);
874   return TypeTable.writePointer(PR);
875 }
876 
877 TypeIndex CodeViewDebug::lowerTypeMemberPointer(const DIDerivedType *Ty) {
878   assert(Ty->getTag() == dwarf::DW_TAG_ptr_to_member_type);
879   TypeIndex ClassTI = getTypeIndex(Ty->getClassType());
880   TypeIndex PointeeTI = getTypeIndex(Ty->getBaseType());
881   PointerKind PK = Asm->MAI->getPointerSize() == 8 ? PointerKind::Near64
882                                                    : PointerKind::Near32;
883   PointerMode PM = isa<DISubroutineType>(Ty->getBaseType())
884                        ? PointerMode::PointerToMemberFunction
885                        : PointerMode::PointerToDataMember;
886   PointerOptions PO = PointerOptions::None; // FIXME
887   // FIXME: Thread this ABI info through metadata.
888   PointerToMemberRepresentation PMR = PointerToMemberRepresentation::Unknown;
889   MemberPointerInfo MPI(ClassTI, PMR);
890   PointerRecord PR(PointeeTI, PK, PM, PO, Ty->getSizeInBits() / 8, MPI);
891   return TypeTable.writePointer(PR);
892 }
893 
894 TypeIndex CodeViewDebug::lowerTypeModifier(const DIDerivedType *Ty) {
895   ModifierOptions Mods = ModifierOptions::None;
896   bool IsModifier = true;
897   const DIType *BaseTy = Ty;
898   while (IsModifier) {
899     assert(BaseTy);
900     // FIXME: Need to add DWARF tag for __unaligned.
901     switch (BaseTy->getTag()) {
902     case dwarf::DW_TAG_const_type:
903       Mods |= ModifierOptions::Const;
904       break;
905     case dwarf::DW_TAG_volatile_type:
906       Mods |= ModifierOptions::Volatile;
907       break;
908     default:
909       IsModifier = false;
910       break;
911     }
912     if (IsModifier)
913       BaseTy = cast<DIDerivedType>(BaseTy)->getBaseType().resolve();
914   }
915   TypeIndex ModifiedTI = getTypeIndex(BaseTy);
916   ModifierRecord MR(ModifiedTI, Mods);
917   return TypeTable.writeModifier(MR);
918 }
919 
920 TypeIndex CodeViewDebug::getTypeIndex(DITypeRef TypeRef) {
921   const DIType *Ty = TypeRef.resolve();
922 
923   // The null DIType is the void type. Don't try to hash it.
924   if (!Ty)
925     return TypeIndex::Void();
926 
927   // Check if we've already translated this type.
928   auto I = TypeIndices.find(Ty);
929   if (I != TypeIndices.end())
930     return I->second;
931 
932   TypeIndex TI = lowerType(Ty);
933 
934   auto InsertResult = TypeIndices.insert({Ty, TI});
935   (void)InsertResult;
936   assert(InsertResult.second && "DIType lowered twice");
937   return TI;
938 }
939 
940 void CodeViewDebug::emitLocalVariable(const LocalVariable &Var) {
941   // LocalSym record, see SymbolRecord.h for more info.
942   MCSymbol *LocalBegin = MMI->getContext().createTempSymbol(),
943            *LocalEnd = MMI->getContext().createTempSymbol();
944   OS.AddComment("Record length");
945   OS.emitAbsoluteSymbolDiff(LocalEnd, LocalBegin, 2);
946   OS.EmitLabel(LocalBegin);
947 
948   OS.AddComment("Record kind: S_LOCAL");
949   OS.EmitIntValue(unsigned(SymbolKind::S_LOCAL), 2);
950 
951   LocalSymFlags Flags = LocalSymFlags::None;
952   if (Var.DIVar->isParameter())
953     Flags |= LocalSymFlags::IsParameter;
954   if (Var.DefRanges.empty())
955     Flags |= LocalSymFlags::IsOptimizedOut;
956 
957   OS.AddComment("TypeIndex");
958   TypeIndex TI = getTypeIndex(Var.DIVar->getType());
959   OS.EmitIntValue(TI.getIndex(), 4);
960   OS.AddComment("Flags");
961   OS.EmitIntValue(static_cast<uint16_t>(Flags), 2);
962   // Truncate the name so we won't overflow the record length field.
963   emitNullTerminatedSymbolName(OS, Var.DIVar->getName());
964   OS.EmitLabel(LocalEnd);
965 
966   // Calculate the on disk prefix of the appropriate def range record. The
967   // records and on disk formats are described in SymbolRecords.h. BytePrefix
968   // should be big enough to hold all forms without memory allocation.
969   SmallString<20> BytePrefix;
970   for (const LocalVarDefRange &DefRange : Var.DefRanges) {
971     BytePrefix.clear();
972     // FIXME: Handle bitpieces.
973     if (DefRange.StructOffset != 0)
974       continue;
975 
976     if (DefRange.InMemory) {
977       DefRangeRegisterRelSym Sym(DefRange.CVRegister, 0, DefRange.DataOffset, 0,
978                                  0, 0, ArrayRef<LocalVariableAddrGap>());
979       ulittle16_t SymKind = ulittle16_t(S_DEFRANGE_REGISTER_REL);
980       BytePrefix +=
981           StringRef(reinterpret_cast<const char *>(&SymKind), sizeof(SymKind));
982       BytePrefix +=
983           StringRef(reinterpret_cast<const char *>(&Sym.Header),
984                     sizeof(Sym.Header) - sizeof(LocalVariableAddrRange));
985     } else {
986       assert(DefRange.DataOffset == 0 && "unexpected offset into register");
987       // Unclear what matters here.
988       DefRangeRegisterSym Sym(DefRange.CVRegister, 0, 0, 0, 0,
989                               ArrayRef<LocalVariableAddrGap>());
990       ulittle16_t SymKind = ulittle16_t(S_DEFRANGE_REGISTER);
991       BytePrefix +=
992           StringRef(reinterpret_cast<const char *>(&SymKind), sizeof(SymKind));
993       BytePrefix +=
994           StringRef(reinterpret_cast<const char *>(&Sym.Header),
995                     sizeof(Sym.Header) - sizeof(LocalVariableAddrRange));
996     }
997     OS.EmitCVDefRangeDirective(DefRange.Ranges, BytePrefix);
998   }
999 }
1000 
1001 void CodeViewDebug::endFunction(const MachineFunction *MF) {
1002   if (!Asm || !CurFn)  // We haven't created any debug info for this function.
1003     return;
1004 
1005   const Function *GV = MF->getFunction();
1006   assert(FnDebugInfo.count(GV));
1007   assert(CurFn == &FnDebugInfo[GV]);
1008 
1009   collectVariableInfo(GV->getSubprogram());
1010 
1011   DebugHandlerBase::endFunction(MF);
1012 
1013   // Don't emit anything if we don't have any line tables.
1014   if (!CurFn->HaveLineInfo) {
1015     FnDebugInfo.erase(GV);
1016     CurFn = nullptr;
1017     return;
1018   }
1019 
1020   CurFn->End = Asm->getFunctionEnd();
1021 
1022   CurFn = nullptr;
1023 }
1024 
1025 void CodeViewDebug::beginInstruction(const MachineInstr *MI) {
1026   DebugHandlerBase::beginInstruction(MI);
1027 
1028   // Ignore DBG_VALUE locations and function prologue.
1029   if (!Asm || MI->isDebugValue() || MI->getFlag(MachineInstr::FrameSetup))
1030     return;
1031   DebugLoc DL = MI->getDebugLoc();
1032   if (DL == PrevInstLoc || !DL)
1033     return;
1034   maybeRecordLocation(DL, Asm->MF);
1035 }
1036