1 //===-- llvm/lib/CodeGen/AsmPrinter/CodeViewDebug.cpp --*- C++ -*--===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file contains support for writing Microsoft CodeView debug info.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "CodeViewDebug.h"
15 #include "llvm/DebugInfo/CodeView/CodeView.h"
16 #include "llvm/DebugInfo/CodeView/FieldListRecordBuilder.h"
17 #include "llvm/DebugInfo/CodeView/Line.h"
18 #include "llvm/DebugInfo/CodeView/SymbolRecord.h"
19 #include "llvm/DebugInfo/CodeView/TypeDumper.h"
20 #include "llvm/DebugInfo/CodeView/TypeIndex.h"
21 #include "llvm/DebugInfo/CodeView/TypeRecord.h"
22 #include "llvm/MC/MCExpr.h"
23 #include "llvm/MC/MCSectionCOFF.h"
24 #include "llvm/MC/MCSymbol.h"
25 #include "llvm/Support/COFF.h"
26 #include "llvm/Support/ScopedPrinter.h"
27 #include "llvm/Target/TargetSubtargetInfo.h"
28 #include "llvm/Target/TargetRegisterInfo.h"
29 #include "llvm/Target/TargetFrameLowering.h"
30 
31 using namespace llvm;
32 using namespace llvm::codeview;
33 
34 CodeViewDebug::CodeViewDebug(AsmPrinter *AP)
35     : DebugHandlerBase(AP), OS(*Asm->OutStreamer), CurFn(nullptr) {
36   // If module doesn't have named metadata anchors or COFF debug section
37   // is not available, skip any debug info related stuff.
38   if (!MMI->getModule()->getNamedMetadata("llvm.dbg.cu") ||
39       !AP->getObjFileLowering().getCOFFDebugSymbolsSection()) {
40     Asm = nullptr;
41     return;
42   }
43 
44   // Tell MMI that we have debug info.
45   MMI->setDebugInfoAvailability(true);
46 }
47 
48 StringRef CodeViewDebug::getFullFilepath(const DIFile *File) {
49   std::string &Filepath = FileToFilepathMap[File];
50   if (!Filepath.empty())
51     return Filepath;
52 
53   StringRef Dir = File->getDirectory(), Filename = File->getFilename();
54 
55   // Clang emits directory and relative filename info into the IR, but CodeView
56   // operates on full paths.  We could change Clang to emit full paths too, but
57   // that would increase the IR size and probably not needed for other users.
58   // For now, just concatenate and canonicalize the path here.
59   if (Filename.find(':') == 1)
60     Filepath = Filename;
61   else
62     Filepath = (Dir + "\\" + Filename).str();
63 
64   // Canonicalize the path.  We have to do it textually because we may no longer
65   // have access the file in the filesystem.
66   // First, replace all slashes with backslashes.
67   std::replace(Filepath.begin(), Filepath.end(), '/', '\\');
68 
69   // Remove all "\.\" with "\".
70   size_t Cursor = 0;
71   while ((Cursor = Filepath.find("\\.\\", Cursor)) != std::string::npos)
72     Filepath.erase(Cursor, 2);
73 
74   // Replace all "\XXX\..\" with "\".  Don't try too hard though as the original
75   // path should be well-formatted, e.g. start with a drive letter, etc.
76   Cursor = 0;
77   while ((Cursor = Filepath.find("\\..\\", Cursor)) != std::string::npos) {
78     // Something's wrong if the path starts with "\..\", abort.
79     if (Cursor == 0)
80       break;
81 
82     size_t PrevSlash = Filepath.rfind('\\', Cursor - 1);
83     if (PrevSlash == std::string::npos)
84       // Something's wrong, abort.
85       break;
86 
87     Filepath.erase(PrevSlash, Cursor + 3 - PrevSlash);
88     // The next ".." might be following the one we've just erased.
89     Cursor = PrevSlash;
90   }
91 
92   // Remove all duplicate backslashes.
93   Cursor = 0;
94   while ((Cursor = Filepath.find("\\\\", Cursor)) != std::string::npos)
95     Filepath.erase(Cursor, 1);
96 
97   return Filepath;
98 }
99 
100 unsigned CodeViewDebug::maybeRecordFile(const DIFile *F) {
101   unsigned NextId = FileIdMap.size() + 1;
102   auto Insertion = FileIdMap.insert(std::make_pair(F, NextId));
103   if (Insertion.second) {
104     // We have to compute the full filepath and emit a .cv_file directive.
105     StringRef FullPath = getFullFilepath(F);
106     NextId = OS.EmitCVFileDirective(NextId, FullPath);
107     assert(NextId == FileIdMap.size() && ".cv_file directive failed");
108   }
109   return Insertion.first->second;
110 }
111 
112 CodeViewDebug::InlineSite &
113 CodeViewDebug::getInlineSite(const DILocation *InlinedAt,
114                              const DISubprogram *Inlinee) {
115   auto SiteInsertion = CurFn->InlineSites.insert({InlinedAt, InlineSite()});
116   InlineSite *Site = &SiteInsertion.first->second;
117   if (SiteInsertion.second) {
118     Site->SiteFuncId = NextFuncId++;
119     Site->Inlinee = Inlinee;
120     InlinedSubprograms.insert(Inlinee);
121     getFuncIdForSubprogram(Inlinee);
122   }
123   return *Site;
124 }
125 
126 TypeIndex CodeViewDebug::getFuncIdForSubprogram(const DISubprogram *SP) {
127   // It's possible to ask for the FuncId of a function which doesn't have a
128   // subprogram: inlining a function with debug info into a function with none.
129   if (!SP)
130     return TypeIndex::None();
131 
132   // Check if we've already translated this subprogram.
133   auto I = TypeIndices.find(SP);
134   if (I != TypeIndices.end())
135     return I->second;
136 
137   TypeIndex ParentScope = TypeIndex(0);
138   StringRef DisplayName = SP->getDisplayName();
139   FuncIdRecord FuncId(ParentScope, getTypeIndex(SP->getType()), DisplayName);
140   TypeIndex TI = TypeTable.writeFuncId(FuncId);
141 
142   recordTypeIndexForDINode(SP, TI);
143   return TI;
144 }
145 
146 void CodeViewDebug::recordTypeIndexForDINode(const DINode *Node, TypeIndex TI) {
147   auto InsertResult = TypeIndices.insert({Node, TI});
148   (void)InsertResult;
149   assert(InsertResult.second && "DINode was already assigned a type index");
150 }
151 
152 void CodeViewDebug::recordLocalVariable(LocalVariable &&Var,
153                                         const DILocation *InlinedAt) {
154   if (InlinedAt) {
155     // This variable was inlined. Associate it with the InlineSite.
156     const DISubprogram *Inlinee = Var.DIVar->getScope()->getSubprogram();
157     InlineSite &Site = getInlineSite(InlinedAt, Inlinee);
158     Site.InlinedLocals.emplace_back(Var);
159   } else {
160     // This variable goes in the main ProcSym.
161     CurFn->Locals.emplace_back(Var);
162   }
163 }
164 
165 static void addLocIfNotPresent(SmallVectorImpl<const DILocation *> &Locs,
166                                const DILocation *Loc) {
167   auto B = Locs.begin(), E = Locs.end();
168   if (std::find(B, E, Loc) == E)
169     Locs.push_back(Loc);
170 }
171 
172 void CodeViewDebug::maybeRecordLocation(const DebugLoc &DL,
173                                         const MachineFunction *MF) {
174   // Skip this instruction if it has the same location as the previous one.
175   if (DL == CurFn->LastLoc)
176     return;
177 
178   const DIScope *Scope = DL.get()->getScope();
179   if (!Scope)
180     return;
181 
182   // Skip this line if it is longer than the maximum we can record.
183   LineInfo LI(DL.getLine(), DL.getLine(), /*IsStatement=*/true);
184   if (LI.getStartLine() != DL.getLine() || LI.isAlwaysStepInto() ||
185       LI.isNeverStepInto())
186     return;
187 
188   ColumnInfo CI(DL.getCol(), /*EndColumn=*/0);
189   if (CI.getStartColumn() != DL.getCol())
190     return;
191 
192   if (!CurFn->HaveLineInfo)
193     CurFn->HaveLineInfo = true;
194   unsigned FileId = 0;
195   if (CurFn->LastLoc.get() && CurFn->LastLoc->getFile() == DL->getFile())
196     FileId = CurFn->LastFileId;
197   else
198     FileId = CurFn->LastFileId = maybeRecordFile(DL->getFile());
199   CurFn->LastLoc = DL;
200 
201   unsigned FuncId = CurFn->FuncId;
202   if (const DILocation *SiteLoc = DL->getInlinedAt()) {
203     const DILocation *Loc = DL.get();
204 
205     // If this location was actually inlined from somewhere else, give it the ID
206     // of the inline call site.
207     FuncId =
208         getInlineSite(SiteLoc, Loc->getScope()->getSubprogram()).SiteFuncId;
209 
210     // Ensure we have links in the tree of inline call sites.
211     bool FirstLoc = true;
212     while ((SiteLoc = Loc->getInlinedAt())) {
213       InlineSite &Site =
214           getInlineSite(SiteLoc, Loc->getScope()->getSubprogram());
215       if (!FirstLoc)
216         addLocIfNotPresent(Site.ChildSites, Loc);
217       FirstLoc = false;
218       Loc = SiteLoc;
219     }
220     addLocIfNotPresent(CurFn->ChildSites, Loc);
221   }
222 
223   OS.EmitCVLocDirective(FuncId, FileId, DL.getLine(), DL.getCol(),
224                         /*PrologueEnd=*/false,
225                         /*IsStmt=*/false, DL->getFilename());
226 }
227 
228 void CodeViewDebug::emitCodeViewMagicVersion() {
229   OS.EmitValueToAlignment(4);
230   OS.AddComment("Debug section magic");
231   OS.EmitIntValue(COFF::DEBUG_SECTION_MAGIC, 4);
232 }
233 
234 void CodeViewDebug::endModule() {
235   if (!Asm || !MMI->hasDebugInfo())
236     return;
237 
238   assert(Asm != nullptr);
239 
240   // The COFF .debug$S section consists of several subsections, each starting
241   // with a 4-byte control code (e.g. 0xF1, 0xF2, etc) and then a 4-byte length
242   // of the payload followed by the payload itself.  The subsections are 4-byte
243   // aligned.
244 
245   // Use the generic .debug$S section, and make a subsection for all the inlined
246   // subprograms.
247   switchToDebugSectionForSymbol(nullptr);
248   emitInlineeLinesSubsection();
249 
250   // Emit per-function debug information.
251   for (auto &P : FnDebugInfo)
252     if (!P.first->isDeclarationForLinker())
253       emitDebugInfoForFunction(P.first, P.second);
254 
255   // Emit global variable debug information.
256   setCurrentSubprogram(nullptr);
257   emitDebugInfoForGlobals();
258 
259   // Switch back to the generic .debug$S section after potentially processing
260   // comdat symbol sections.
261   switchToDebugSectionForSymbol(nullptr);
262 
263   // Emit UDT records for any types used by global variables.
264   if (!GlobalUDTs.empty()) {
265     MCSymbol *SymbolsEnd = beginCVSubsection(ModuleSubstreamKind::Symbols);
266     emitDebugInfoForUDTs(GlobalUDTs);
267     endCVSubsection(SymbolsEnd);
268   }
269 
270   // This subsection holds a file index to offset in string table table.
271   OS.AddComment("File index to string table offset subsection");
272   OS.EmitCVFileChecksumsDirective();
273 
274   // This subsection holds the string table.
275   OS.AddComment("String table");
276   OS.EmitCVStringTableDirective();
277 
278   // Emit type information last, so that any types we translate while emitting
279   // function info are included.
280   emitTypeInformation();
281 
282   clear();
283 }
284 
285 static void emitNullTerminatedSymbolName(MCStreamer &OS, StringRef S) {
286   // Microsoft's linker seems to have trouble with symbol names longer than
287   // 0xffd8 bytes.
288   S = S.substr(0, 0xffd8);
289   SmallString<32> NullTerminatedString(S);
290   NullTerminatedString.push_back('\0');
291   OS.EmitBytes(NullTerminatedString);
292 }
293 
294 void CodeViewDebug::emitTypeInformation() {
295   // Do nothing if we have no debug info or if no non-trivial types were emitted
296   // to TypeTable during codegen.
297   NamedMDNode *CU_Nodes =
298       MMI->getModule()->getNamedMetadata("llvm.dbg.cu");
299   if (!CU_Nodes)
300     return;
301   if (TypeTable.empty())
302     return;
303 
304   // Start the .debug$T section with 0x4.
305   OS.SwitchSection(Asm->getObjFileLowering().getCOFFDebugTypesSection());
306   emitCodeViewMagicVersion();
307 
308   SmallString<8> CommentPrefix;
309   if (OS.isVerboseAsm()) {
310     CommentPrefix += '\t';
311     CommentPrefix += Asm->MAI->getCommentString();
312     CommentPrefix += ' ';
313   }
314 
315   CVTypeDumper CVTD(nullptr, /*PrintRecordBytes=*/false);
316   TypeTable.ForEachRecord(
317       [&](TypeIndex Index, StringRef Record) {
318         if (OS.isVerboseAsm()) {
319           // Emit a block comment describing the type record for readability.
320           SmallString<512> CommentBlock;
321           raw_svector_ostream CommentOS(CommentBlock);
322           ScopedPrinter SP(CommentOS);
323           SP.setPrefix(CommentPrefix);
324           CVTD.setPrinter(&SP);
325           Error EC = CVTD.dump({Record.bytes_begin(), Record.bytes_end()});
326           assert(!EC && "produced malformed type record");
327           consumeError(std::move(EC));
328           // emitRawComment will insert its own tab and comment string before
329           // the first line, so strip off our first one. It also prints its own
330           // newline.
331           OS.emitRawComment(
332               CommentOS.str().drop_front(CommentPrefix.size() - 1).rtrim());
333         }
334         OS.EmitBinaryData(Record);
335       });
336 }
337 
338 void CodeViewDebug::emitInlineeLinesSubsection() {
339   if (InlinedSubprograms.empty())
340     return;
341 
342 
343   OS.AddComment("Inlinee lines subsection");
344   MCSymbol *InlineEnd = beginCVSubsection(ModuleSubstreamKind::InlineeLines);
345 
346   // We don't provide any extra file info.
347   // FIXME: Find out if debuggers use this info.
348   OS.AddComment("Inlinee lines signature");
349   OS.EmitIntValue(unsigned(InlineeLinesSignature::Normal), 4);
350 
351   for (const DISubprogram *SP : InlinedSubprograms) {
352     assert(TypeIndices.count(SP));
353     TypeIndex InlineeIdx = TypeIndices[SP];
354 
355     OS.AddBlankLine();
356     unsigned FileId = maybeRecordFile(SP->getFile());
357     OS.AddComment("Inlined function " + SP->getDisplayName() + " starts at " +
358                   SP->getFilename() + Twine(':') + Twine(SP->getLine()));
359     OS.AddBlankLine();
360     // The filechecksum table uses 8 byte entries for now, and file ids start at
361     // 1.
362     unsigned FileOffset = (FileId - 1) * 8;
363     OS.AddComment("Type index of inlined function");
364     OS.EmitIntValue(InlineeIdx.getIndex(), 4);
365     OS.AddComment("Offset into filechecksum table");
366     OS.EmitIntValue(FileOffset, 4);
367     OS.AddComment("Starting line number");
368     OS.EmitIntValue(SP->getLine(), 4);
369   }
370 
371   endCVSubsection(InlineEnd);
372 }
373 
374 void CodeViewDebug::collectInlineSiteChildren(
375     SmallVectorImpl<unsigned> &Children, const FunctionInfo &FI,
376     const InlineSite &Site) {
377   for (const DILocation *ChildSiteLoc : Site.ChildSites) {
378     auto I = FI.InlineSites.find(ChildSiteLoc);
379     const InlineSite &ChildSite = I->second;
380     Children.push_back(ChildSite.SiteFuncId);
381     collectInlineSiteChildren(Children, FI, ChildSite);
382   }
383 }
384 
385 void CodeViewDebug::emitInlinedCallSite(const FunctionInfo &FI,
386                                         const DILocation *InlinedAt,
387                                         const InlineSite &Site) {
388   MCSymbol *InlineBegin = MMI->getContext().createTempSymbol(),
389            *InlineEnd = MMI->getContext().createTempSymbol();
390 
391   assert(TypeIndices.count(Site.Inlinee));
392   TypeIndex InlineeIdx = TypeIndices[Site.Inlinee];
393 
394   // SymbolRecord
395   OS.AddComment("Record length");
396   OS.emitAbsoluteSymbolDiff(InlineEnd, InlineBegin, 2);   // RecordLength
397   OS.EmitLabel(InlineBegin);
398   OS.AddComment("Record kind: S_INLINESITE");
399   OS.EmitIntValue(SymbolKind::S_INLINESITE, 2); // RecordKind
400 
401   OS.AddComment("PtrParent");
402   OS.EmitIntValue(0, 4);
403   OS.AddComment("PtrEnd");
404   OS.EmitIntValue(0, 4);
405   OS.AddComment("Inlinee type index");
406   OS.EmitIntValue(InlineeIdx.getIndex(), 4);
407 
408   unsigned FileId = maybeRecordFile(Site.Inlinee->getFile());
409   unsigned StartLineNum = Site.Inlinee->getLine();
410   SmallVector<unsigned, 3> SecondaryFuncIds;
411   collectInlineSiteChildren(SecondaryFuncIds, FI, Site);
412 
413   OS.EmitCVInlineLinetableDirective(Site.SiteFuncId, FileId, StartLineNum,
414                                     FI.Begin, FI.End, SecondaryFuncIds);
415 
416   OS.EmitLabel(InlineEnd);
417 
418   for (const LocalVariable &Var : Site.InlinedLocals)
419     emitLocalVariable(Var);
420 
421   // Recurse on child inlined call sites before closing the scope.
422   for (const DILocation *ChildSite : Site.ChildSites) {
423     auto I = FI.InlineSites.find(ChildSite);
424     assert(I != FI.InlineSites.end() &&
425            "child site not in function inline site map");
426     emitInlinedCallSite(FI, ChildSite, I->second);
427   }
428 
429   // Close the scope.
430   OS.AddComment("Record length");
431   OS.EmitIntValue(2, 2);                                  // RecordLength
432   OS.AddComment("Record kind: S_INLINESITE_END");
433   OS.EmitIntValue(SymbolKind::S_INLINESITE_END, 2); // RecordKind
434 }
435 
436 void CodeViewDebug::switchToDebugSectionForSymbol(const MCSymbol *GVSym) {
437   // If we have a symbol, it may be in a section that is COMDAT. If so, find the
438   // comdat key. A section may be comdat because of -ffunction-sections or
439   // because it is comdat in the IR.
440   MCSectionCOFF *GVSec =
441       GVSym ? dyn_cast<MCSectionCOFF>(&GVSym->getSection()) : nullptr;
442   const MCSymbol *KeySym = GVSec ? GVSec->getCOMDATSymbol() : nullptr;
443 
444   MCSectionCOFF *DebugSec = cast<MCSectionCOFF>(
445       Asm->getObjFileLowering().getCOFFDebugSymbolsSection());
446   DebugSec = OS.getContext().getAssociativeCOFFSection(DebugSec, KeySym);
447 
448   OS.SwitchSection(DebugSec);
449 
450   // Emit the magic version number if this is the first time we've switched to
451   // this section.
452   if (ComdatDebugSections.insert(DebugSec).second)
453     emitCodeViewMagicVersion();
454 }
455 
456 void CodeViewDebug::emitDebugInfoForFunction(const Function *GV,
457                                              FunctionInfo &FI) {
458   // For each function there is a separate subsection
459   // which holds the PC to file:line table.
460   const MCSymbol *Fn = Asm->getSymbol(GV);
461   assert(Fn);
462 
463   // Switch to the to a comdat section, if appropriate.
464   switchToDebugSectionForSymbol(Fn);
465 
466   StringRef FuncName;
467   auto *SP = GV->getSubprogram();
468   setCurrentSubprogram(SP);
469   if (SP != nullptr)
470     FuncName = SP->getDisplayName();
471 
472   // If our DISubprogram name is empty, use the mangled name.
473   if (FuncName.empty())
474     FuncName = GlobalValue::getRealLinkageName(GV->getName());
475 
476   // Emit a symbol subsection, required by VS2012+ to find function boundaries.
477   OS.AddComment("Symbol subsection for " + Twine(FuncName));
478   MCSymbol *SymbolsEnd = beginCVSubsection(ModuleSubstreamKind::Symbols);
479   {
480     MCSymbol *ProcRecordBegin = MMI->getContext().createTempSymbol(),
481              *ProcRecordEnd = MMI->getContext().createTempSymbol();
482     OS.AddComment("Record length");
483     OS.emitAbsoluteSymbolDiff(ProcRecordEnd, ProcRecordBegin, 2);
484     OS.EmitLabel(ProcRecordBegin);
485 
486     OS.AddComment("Record kind: S_GPROC32_ID");
487     OS.EmitIntValue(unsigned(SymbolKind::S_GPROC32_ID), 2);
488 
489     // These fields are filled in by tools like CVPACK which run after the fact.
490     OS.AddComment("PtrParent");
491     OS.EmitIntValue(0, 4);
492     OS.AddComment("PtrEnd");
493     OS.EmitIntValue(0, 4);
494     OS.AddComment("PtrNext");
495     OS.EmitIntValue(0, 4);
496     // This is the important bit that tells the debugger where the function
497     // code is located and what's its size:
498     OS.AddComment("Code size");
499     OS.emitAbsoluteSymbolDiff(FI.End, Fn, 4);
500     OS.AddComment("Offset after prologue");
501     OS.EmitIntValue(0, 4);
502     OS.AddComment("Offset before epilogue");
503     OS.EmitIntValue(0, 4);
504     OS.AddComment("Function type index");
505     OS.EmitIntValue(getFuncIdForSubprogram(GV->getSubprogram()).getIndex(), 4);
506     OS.AddComment("Function section relative address");
507     OS.EmitCOFFSecRel32(Fn);
508     OS.AddComment("Function section index");
509     OS.EmitCOFFSectionIndex(Fn);
510     OS.AddComment("Flags");
511     OS.EmitIntValue(0, 1);
512     // Emit the function display name as a null-terminated string.
513     OS.AddComment("Function name");
514     // Truncate the name so we won't overflow the record length field.
515     emitNullTerminatedSymbolName(OS, FuncName);
516     OS.EmitLabel(ProcRecordEnd);
517 
518     for (const LocalVariable &Var : FI.Locals)
519       emitLocalVariable(Var);
520 
521     // Emit inlined call site information. Only emit functions inlined directly
522     // into the parent function. We'll emit the other sites recursively as part
523     // of their parent inline site.
524     for (const DILocation *InlinedAt : FI.ChildSites) {
525       auto I = FI.InlineSites.find(InlinedAt);
526       assert(I != FI.InlineSites.end() &&
527              "child site not in function inline site map");
528       emitInlinedCallSite(FI, InlinedAt, I->second);
529     }
530 
531     if (SP != nullptr)
532       emitDebugInfoForUDTs(LocalUDTs);
533 
534     // We're done with this function.
535     OS.AddComment("Record length");
536     OS.EmitIntValue(0x0002, 2);
537     OS.AddComment("Record kind: S_PROC_ID_END");
538     OS.EmitIntValue(unsigned(SymbolKind::S_PROC_ID_END), 2);
539   }
540   endCVSubsection(SymbolsEnd);
541 
542   // We have an assembler directive that takes care of the whole line table.
543   OS.EmitCVLinetableDirective(FI.FuncId, Fn, FI.End);
544 }
545 
546 CodeViewDebug::LocalVarDefRange
547 CodeViewDebug::createDefRangeMem(uint16_t CVRegister, int Offset) {
548   LocalVarDefRange DR;
549   DR.InMemory = -1;
550   DR.DataOffset = Offset;
551   assert(DR.DataOffset == Offset && "truncation");
552   DR.StructOffset = 0;
553   DR.CVRegister = CVRegister;
554   return DR;
555 }
556 
557 CodeViewDebug::LocalVarDefRange
558 CodeViewDebug::createDefRangeReg(uint16_t CVRegister) {
559   LocalVarDefRange DR;
560   DR.InMemory = 0;
561   DR.DataOffset = 0;
562   DR.StructOffset = 0;
563   DR.CVRegister = CVRegister;
564   return DR;
565 }
566 
567 void CodeViewDebug::collectVariableInfoFromMMITable(
568     DenseSet<InlinedVariable> &Processed) {
569   const TargetSubtargetInfo &TSI = Asm->MF->getSubtarget();
570   const TargetFrameLowering *TFI = TSI.getFrameLowering();
571   const TargetRegisterInfo *TRI = TSI.getRegisterInfo();
572 
573   for (const MachineModuleInfo::VariableDbgInfo &VI :
574        MMI->getVariableDbgInfo()) {
575     if (!VI.Var)
576       continue;
577     assert(VI.Var->isValidLocationForIntrinsic(VI.Loc) &&
578            "Expected inlined-at fields to agree");
579 
580     Processed.insert(InlinedVariable(VI.Var, VI.Loc->getInlinedAt()));
581     LexicalScope *Scope = LScopes.findLexicalScope(VI.Loc);
582 
583     // If variable scope is not found then skip this variable.
584     if (!Scope)
585       continue;
586 
587     // Get the frame register used and the offset.
588     unsigned FrameReg = 0;
589     int FrameOffset = TFI->getFrameIndexReference(*Asm->MF, VI.Slot, FrameReg);
590     uint16_t CVReg = TRI->getCodeViewRegNum(FrameReg);
591 
592     // Calculate the label ranges.
593     LocalVarDefRange DefRange = createDefRangeMem(CVReg, FrameOffset);
594     for (const InsnRange &Range : Scope->getRanges()) {
595       const MCSymbol *Begin = getLabelBeforeInsn(Range.first);
596       const MCSymbol *End = getLabelAfterInsn(Range.second);
597       End = End ? End : Asm->getFunctionEnd();
598       DefRange.Ranges.emplace_back(Begin, End);
599     }
600 
601     LocalVariable Var;
602     Var.DIVar = VI.Var;
603     Var.DefRanges.emplace_back(std::move(DefRange));
604     recordLocalVariable(std::move(Var), VI.Loc->getInlinedAt());
605   }
606 }
607 
608 void CodeViewDebug::collectVariableInfo(const DISubprogram *SP) {
609   DenseSet<InlinedVariable> Processed;
610   // Grab the variable info that was squirreled away in the MMI side-table.
611   collectVariableInfoFromMMITable(Processed);
612 
613   const TargetRegisterInfo *TRI = Asm->MF->getSubtarget().getRegisterInfo();
614 
615   for (const auto &I : DbgValues) {
616     InlinedVariable IV = I.first;
617     if (Processed.count(IV))
618       continue;
619     const DILocalVariable *DIVar = IV.first;
620     const DILocation *InlinedAt = IV.second;
621 
622     // Instruction ranges, specifying where IV is accessible.
623     const auto &Ranges = I.second;
624 
625     LexicalScope *Scope = nullptr;
626     if (InlinedAt)
627       Scope = LScopes.findInlinedScope(DIVar->getScope(), InlinedAt);
628     else
629       Scope = LScopes.findLexicalScope(DIVar->getScope());
630     // If variable scope is not found then skip this variable.
631     if (!Scope)
632       continue;
633 
634     LocalVariable Var;
635     Var.DIVar = DIVar;
636 
637     // Calculate the definition ranges.
638     for (auto I = Ranges.begin(), E = Ranges.end(); I != E; ++I) {
639       const InsnRange &Range = *I;
640       const MachineInstr *DVInst = Range.first;
641       assert(DVInst->isDebugValue() && "Invalid History entry");
642       const DIExpression *DIExpr = DVInst->getDebugExpression();
643 
644       // Bail if there is a complex DWARF expression for now.
645       if (DIExpr && DIExpr->getNumElements() > 0)
646         continue;
647 
648       // Bail if operand 0 is not a valid register. This means the variable is a
649       // simple constant, or is described by a complex expression.
650       // FIXME: Find a way to represent constant variables, since they are
651       // relatively common.
652       unsigned Reg =
653           DVInst->getOperand(0).isReg() ? DVInst->getOperand(0).getReg() : 0;
654       if (Reg == 0)
655         continue;
656 
657       // Handle the two cases we can handle: indirect in memory and in register.
658       bool IsIndirect = DVInst->getOperand(1).isImm();
659       unsigned CVReg = TRI->getCodeViewRegNum(DVInst->getOperand(0).getReg());
660       {
661         LocalVarDefRange DefRange;
662         if (IsIndirect) {
663           int64_t Offset = DVInst->getOperand(1).getImm();
664           DefRange = createDefRangeMem(CVReg, Offset);
665         } else {
666           DefRange = createDefRangeReg(CVReg);
667         }
668         if (Var.DefRanges.empty() ||
669             Var.DefRanges.back().isDifferentLocation(DefRange)) {
670           Var.DefRanges.emplace_back(std::move(DefRange));
671         }
672       }
673 
674       // Compute the label range.
675       const MCSymbol *Begin = getLabelBeforeInsn(Range.first);
676       const MCSymbol *End = getLabelAfterInsn(Range.second);
677       if (!End) {
678         if (std::next(I) != E)
679           End = getLabelBeforeInsn(std::next(I)->first);
680         else
681           End = Asm->getFunctionEnd();
682       }
683 
684       // If the last range end is our begin, just extend the last range.
685       // Otherwise make a new range.
686       SmallVectorImpl<std::pair<const MCSymbol *, const MCSymbol *>> &Ranges =
687           Var.DefRanges.back().Ranges;
688       if (!Ranges.empty() && Ranges.back().second == Begin)
689         Ranges.back().second = End;
690       else
691         Ranges.emplace_back(Begin, End);
692 
693       // FIXME: Do more range combining.
694     }
695 
696     recordLocalVariable(std::move(Var), InlinedAt);
697   }
698 }
699 
700 void CodeViewDebug::beginFunction(const MachineFunction *MF) {
701   assert(!CurFn && "Can't process two functions at once!");
702 
703   if (!Asm || !MMI->hasDebugInfo())
704     return;
705 
706   DebugHandlerBase::beginFunction(MF);
707 
708   const Function *GV = MF->getFunction();
709   assert(FnDebugInfo.count(GV) == false);
710   CurFn = &FnDebugInfo[GV];
711   CurFn->FuncId = NextFuncId++;
712   CurFn->Begin = Asm->getFunctionBegin();
713 
714   // Find the end of the function prolog.  First known non-DBG_VALUE and
715   // non-frame setup location marks the beginning of the function body.
716   // FIXME: is there a simpler a way to do this? Can we just search
717   // for the first instruction of the function, not the last of the prolog?
718   DebugLoc PrologEndLoc;
719   bool EmptyPrologue = true;
720   for (const auto &MBB : *MF) {
721     for (const auto &MI : MBB) {
722       if (!MI.isDebugValue() && !MI.getFlag(MachineInstr::FrameSetup) &&
723           MI.getDebugLoc()) {
724         PrologEndLoc = MI.getDebugLoc();
725         break;
726       } else if (!MI.isDebugValue()) {
727         EmptyPrologue = false;
728       }
729     }
730   }
731 
732   // Record beginning of function if we have a non-empty prologue.
733   if (PrologEndLoc && !EmptyPrologue) {
734     DebugLoc FnStartDL = PrologEndLoc.getFnDebugLoc();
735     maybeRecordLocation(FnStartDL, MF);
736   }
737 }
738 
739 TypeIndex CodeViewDebug::lowerType(const DIType *Ty) {
740   // Generic dispatch for lowering an unknown type.
741   switch (Ty->getTag()) {
742   case dwarf::DW_TAG_array_type:
743     return lowerTypeArray(cast<DICompositeType>(Ty));
744   case dwarf::DW_TAG_typedef:
745     return lowerTypeAlias(cast<DIDerivedType>(Ty));
746   case dwarf::DW_TAG_base_type:
747     return lowerTypeBasic(cast<DIBasicType>(Ty));
748   case dwarf::DW_TAG_pointer_type:
749   case dwarf::DW_TAG_reference_type:
750   case dwarf::DW_TAG_rvalue_reference_type:
751     return lowerTypePointer(cast<DIDerivedType>(Ty));
752   case dwarf::DW_TAG_ptr_to_member_type:
753     return lowerTypeMemberPointer(cast<DIDerivedType>(Ty));
754   case dwarf::DW_TAG_const_type:
755   case dwarf::DW_TAG_volatile_type:
756     return lowerTypeModifier(cast<DIDerivedType>(Ty));
757   case dwarf::DW_TAG_subroutine_type:
758     return lowerTypeFunction(cast<DISubroutineType>(Ty));
759   case dwarf::DW_TAG_class_type:
760   case dwarf::DW_TAG_structure_type:
761     return lowerTypeClass(cast<DICompositeType>(Ty));
762   case dwarf::DW_TAG_union_type:
763     return lowerTypeUnion(cast<DICompositeType>(Ty));
764   default:
765     // Use the null type index.
766     return TypeIndex();
767   }
768 }
769 
770 static const DISubprogram *getQualifiedNameComponents(
771     const DIScope *Scope, SmallVectorImpl<StringRef> &QualifiedNameComponents) {
772   const DISubprogram *ClosestSubprogram = nullptr;
773   while (Scope != nullptr) {
774     if (ClosestSubprogram == nullptr)
775       ClosestSubprogram = dyn_cast<DISubprogram>(Scope);
776     StringRef ScopeName = Scope->getName();
777     if (!ScopeName.empty())
778       QualifiedNameComponents.push_back(ScopeName);
779     Scope = Scope->getScope().resolve();
780   }
781   return ClosestSubprogram;
782 }
783 
784 static std::string getQualifiedName(ArrayRef<StringRef> QualifiedNameComponents,
785                                     StringRef TypeName) {
786   std::string FullyQualifiedName;
787   for (StringRef QualifiedNameComponent : reverse(QualifiedNameComponents)) {
788     FullyQualifiedName.append(QualifiedNameComponent);
789     FullyQualifiedName.append("::");
790   }
791   FullyQualifiedName.append(TypeName);
792   return FullyQualifiedName;
793 }
794 
795 TypeIndex CodeViewDebug::lowerTypeAlias(const DIDerivedType *Ty) {
796   DITypeRef UnderlyingTypeRef = Ty->getBaseType();
797   TypeIndex UnderlyingTypeIndex = getTypeIndex(UnderlyingTypeRef);
798   StringRef TypeName = Ty->getName();
799 
800   SmallVector<StringRef, 5> QualifiedNameComponents;
801   const DISubprogram *ClosestSubprogram = getQualifiedNameComponents(
802       Ty->getScope().resolve(), QualifiedNameComponents);
803 
804   if (ClosestSubprogram == nullptr) {
805     std::string FullyQualifiedName =
806         getQualifiedName(QualifiedNameComponents, TypeName);
807     GlobalUDTs.emplace_back(std::move(FullyQualifiedName), UnderlyingTypeIndex);
808   } else if (ClosestSubprogram == CurrentSubprogram) {
809     std::string FullyQualifiedName =
810         getQualifiedName(QualifiedNameComponents, TypeName);
811     LocalUDTs.emplace_back(std::move(FullyQualifiedName), UnderlyingTypeIndex);
812   }
813   // TODO: What if the ClosestSubprogram is neither null or the current
814   // subprogram?  Currently, the UDT just gets dropped on the floor.
815   //
816   // The current behavior is not desirable.  To get maximal fidelity, we would
817   // need to perform all type translation before beginning emission of .debug$S
818   // and then make LocalUDTs a member of FunctionInfo
819 
820   if (UnderlyingTypeIndex == TypeIndex(SimpleTypeKind::Int32Long) &&
821       TypeName == "HRESULT")
822     return TypeIndex(SimpleTypeKind::HResult);
823   if (UnderlyingTypeIndex == TypeIndex(SimpleTypeKind::UInt16Short) &&
824       TypeName == "wchar_t")
825     return TypeIndex(SimpleTypeKind::WideCharacter);
826   return UnderlyingTypeIndex;
827 }
828 
829 TypeIndex CodeViewDebug::lowerTypeArray(const DICompositeType *Ty) {
830   DITypeRef ElementTypeRef = Ty->getBaseType();
831   TypeIndex ElementTypeIndex = getTypeIndex(ElementTypeRef);
832   // IndexType is size_t, which depends on the bitness of the target.
833   TypeIndex IndexType = Asm->MAI->getPointerSize() == 8
834                             ? TypeIndex(SimpleTypeKind::UInt64Quad)
835                             : TypeIndex(SimpleTypeKind::UInt32Long);
836   uint64_t Size = Ty->getSizeInBits() / 8;
837   ArrayRecord Record(ElementTypeIndex, IndexType, Size, Ty->getName());
838   return TypeTable.writeArray(Record);
839 }
840 
841 TypeIndex CodeViewDebug::lowerTypeBasic(const DIBasicType *Ty) {
842   TypeIndex Index;
843   dwarf::TypeKind Kind;
844   uint32_t ByteSize;
845 
846   Kind = static_cast<dwarf::TypeKind>(Ty->getEncoding());
847   ByteSize = Ty->getSizeInBits() / 8;
848 
849   SimpleTypeKind STK = SimpleTypeKind::None;
850   switch (Kind) {
851   case dwarf::DW_ATE_address:
852     // FIXME: Translate
853     break;
854   case dwarf::DW_ATE_boolean:
855     switch (ByteSize) {
856     case 1:  STK = SimpleTypeKind::Boolean8;   break;
857     case 2:  STK = SimpleTypeKind::Boolean16;  break;
858     case 4:  STK = SimpleTypeKind::Boolean32;  break;
859     case 8:  STK = SimpleTypeKind::Boolean64;  break;
860     case 16: STK = SimpleTypeKind::Boolean128; break;
861     }
862     break;
863   case dwarf::DW_ATE_complex_float:
864     switch (ByteSize) {
865     case 2:  STK = SimpleTypeKind::Complex16;  break;
866     case 4:  STK = SimpleTypeKind::Complex32;  break;
867     case 8:  STK = SimpleTypeKind::Complex64;  break;
868     case 10: STK = SimpleTypeKind::Complex80;  break;
869     case 16: STK = SimpleTypeKind::Complex128; break;
870     }
871     break;
872   case dwarf::DW_ATE_float:
873     switch (ByteSize) {
874     case 2:  STK = SimpleTypeKind::Float16;  break;
875     case 4:  STK = SimpleTypeKind::Float32;  break;
876     case 6:  STK = SimpleTypeKind::Float48;  break;
877     case 8:  STK = SimpleTypeKind::Float64;  break;
878     case 10: STK = SimpleTypeKind::Float80;  break;
879     case 16: STK = SimpleTypeKind::Float128; break;
880     }
881     break;
882   case dwarf::DW_ATE_signed:
883     switch (ByteSize) {
884     case 1:  STK = SimpleTypeKind::SByte;      break;
885     case 2:  STK = SimpleTypeKind::Int16Short; break;
886     case 4:  STK = SimpleTypeKind::Int32;      break;
887     case 8:  STK = SimpleTypeKind::Int64Quad;  break;
888     case 16: STK = SimpleTypeKind::Int128Oct;  break;
889     }
890     break;
891   case dwarf::DW_ATE_unsigned:
892     switch (ByteSize) {
893     case 1:  STK = SimpleTypeKind::Byte;        break;
894     case 2:  STK = SimpleTypeKind::UInt16Short; break;
895     case 4:  STK = SimpleTypeKind::UInt32;      break;
896     case 8:  STK = SimpleTypeKind::UInt64Quad;  break;
897     case 16: STK = SimpleTypeKind::UInt128Oct;  break;
898     }
899     break;
900   case dwarf::DW_ATE_UTF:
901     switch (ByteSize) {
902     case 2: STK = SimpleTypeKind::Character16; break;
903     case 4: STK = SimpleTypeKind::Character32; break;
904     }
905     break;
906   case dwarf::DW_ATE_signed_char:
907     if (ByteSize == 1)
908       STK = SimpleTypeKind::SignedCharacter;
909     break;
910   case dwarf::DW_ATE_unsigned_char:
911     if (ByteSize == 1)
912       STK = SimpleTypeKind::UnsignedCharacter;
913     break;
914   default:
915     break;
916   }
917 
918   // Apply some fixups based on the source-level type name.
919   if (STK == SimpleTypeKind::Int32 && Ty->getName() == "long int")
920     STK = SimpleTypeKind::Int32Long;
921   if (STK == SimpleTypeKind::UInt32 && Ty->getName() == "long unsigned int")
922     STK = SimpleTypeKind::UInt32Long;
923   if (STK == SimpleTypeKind::UInt16Short &&
924       (Ty->getName() == "wchar_t" || Ty->getName() == "__wchar_t"))
925     STK = SimpleTypeKind::WideCharacter;
926   if ((STK == SimpleTypeKind::SignedCharacter ||
927        STK == SimpleTypeKind::UnsignedCharacter) &&
928       Ty->getName() == "char")
929     STK = SimpleTypeKind::NarrowCharacter;
930 
931   return TypeIndex(STK);
932 }
933 
934 TypeIndex CodeViewDebug::lowerTypePointer(const DIDerivedType *Ty) {
935   TypeIndex PointeeTI = getTypeIndex(Ty->getBaseType());
936 
937   // Pointers to simple types can use SimpleTypeMode, rather than having a
938   // dedicated pointer type record.
939   if (PointeeTI.isSimple() &&
940       PointeeTI.getSimpleMode() == SimpleTypeMode::Direct &&
941       Ty->getTag() == dwarf::DW_TAG_pointer_type) {
942     SimpleTypeMode Mode = Ty->getSizeInBits() == 64
943                               ? SimpleTypeMode::NearPointer64
944                               : SimpleTypeMode::NearPointer32;
945     return TypeIndex(PointeeTI.getSimpleKind(), Mode);
946   }
947 
948   PointerKind PK =
949       Ty->getSizeInBits() == 64 ? PointerKind::Near64 : PointerKind::Near32;
950   PointerMode PM = PointerMode::Pointer;
951   switch (Ty->getTag()) {
952   default: llvm_unreachable("not a pointer tag type");
953   case dwarf::DW_TAG_pointer_type:
954     PM = PointerMode::Pointer;
955     break;
956   case dwarf::DW_TAG_reference_type:
957     PM = PointerMode::LValueReference;
958     break;
959   case dwarf::DW_TAG_rvalue_reference_type:
960     PM = PointerMode::RValueReference;
961     break;
962   }
963   // FIXME: MSVC folds qualifiers into PointerOptions in the context of a method
964   // 'this' pointer, but not normal contexts. Figure out what we're supposed to
965   // do.
966   PointerOptions PO = PointerOptions::None;
967   PointerRecord PR(PointeeTI, PK, PM, PO, Ty->getSizeInBits() / 8);
968   return TypeTable.writePointer(PR);
969 }
970 
971 TypeIndex CodeViewDebug::lowerTypeMemberPointer(const DIDerivedType *Ty) {
972   assert(Ty->getTag() == dwarf::DW_TAG_ptr_to_member_type);
973   TypeIndex ClassTI = getTypeIndex(Ty->getClassType());
974   TypeIndex PointeeTI = getTypeIndex(Ty->getBaseType());
975   PointerKind PK = Asm->MAI->getPointerSize() == 8 ? PointerKind::Near64
976                                                    : PointerKind::Near32;
977   PointerMode PM = isa<DISubroutineType>(Ty->getBaseType())
978                        ? PointerMode::PointerToMemberFunction
979                        : PointerMode::PointerToDataMember;
980   PointerOptions PO = PointerOptions::None; // FIXME
981   // FIXME: Thread this ABI info through metadata.
982   PointerToMemberRepresentation PMR = PointerToMemberRepresentation::Unknown;
983   MemberPointerInfo MPI(ClassTI, PMR);
984   PointerRecord PR(PointeeTI, PK, PM, PO, Ty->getSizeInBits() / 8, MPI);
985   return TypeTable.writePointer(PR);
986 }
987 
988 /// Given a DWARF calling convention, get the CodeView equivalent. If we don't
989 /// have a translation, use the NearC convention.
990 static CallingConvention dwarfCCToCodeView(unsigned DwarfCC) {
991   switch (DwarfCC) {
992   case dwarf::DW_CC_normal:             return CallingConvention::NearC;
993   case dwarf::DW_CC_BORLAND_msfastcall: return CallingConvention::NearFast;
994   case dwarf::DW_CC_BORLAND_thiscall:   return CallingConvention::ThisCall;
995   case dwarf::DW_CC_BORLAND_stdcall:    return CallingConvention::NearStdCall;
996   case dwarf::DW_CC_BORLAND_pascal:     return CallingConvention::NearPascal;
997   case dwarf::DW_CC_LLVM_vectorcall:    return CallingConvention::NearVector;
998   }
999   return CallingConvention::NearC;
1000 }
1001 
1002 TypeIndex CodeViewDebug::lowerTypeModifier(const DIDerivedType *Ty) {
1003   ModifierOptions Mods = ModifierOptions::None;
1004   bool IsModifier = true;
1005   const DIType *BaseTy = Ty;
1006   while (IsModifier && BaseTy) {
1007     // FIXME: Need to add DWARF tag for __unaligned.
1008     switch (BaseTy->getTag()) {
1009     case dwarf::DW_TAG_const_type:
1010       Mods |= ModifierOptions::Const;
1011       break;
1012     case dwarf::DW_TAG_volatile_type:
1013       Mods |= ModifierOptions::Volatile;
1014       break;
1015     default:
1016       IsModifier = false;
1017       break;
1018     }
1019     if (IsModifier)
1020       BaseTy = cast<DIDerivedType>(BaseTy)->getBaseType().resolve();
1021   }
1022   TypeIndex ModifiedTI = getTypeIndex(BaseTy);
1023   ModifierRecord MR(ModifiedTI, Mods);
1024   return TypeTable.writeModifier(MR);
1025 }
1026 
1027 TypeIndex CodeViewDebug::lowerTypeFunction(const DISubroutineType *Ty) {
1028   SmallVector<TypeIndex, 8> ReturnAndArgTypeIndices;
1029   for (DITypeRef ArgTypeRef : Ty->getTypeArray())
1030     ReturnAndArgTypeIndices.push_back(getTypeIndex(ArgTypeRef));
1031 
1032   TypeIndex ReturnTypeIndex = TypeIndex::Void();
1033   ArrayRef<TypeIndex> ArgTypeIndices = None;
1034   if (!ReturnAndArgTypeIndices.empty()) {
1035     auto ReturnAndArgTypesRef = makeArrayRef(ReturnAndArgTypeIndices);
1036     ReturnTypeIndex = ReturnAndArgTypesRef.front();
1037     ArgTypeIndices = ReturnAndArgTypesRef.drop_front();
1038   }
1039 
1040   ArgListRecord ArgListRec(TypeRecordKind::ArgList, ArgTypeIndices);
1041   TypeIndex ArgListIndex = TypeTable.writeArgList(ArgListRec);
1042 
1043   CallingConvention CC = dwarfCCToCodeView(Ty->getCC());
1044 
1045   // TODO: Some functions are member functions, we should use a more appropriate
1046   // record for those.
1047   ProcedureRecord Procedure(ReturnTypeIndex, CC, FunctionOptions::None,
1048                             ArgTypeIndices.size(), ArgListIndex);
1049   return TypeTable.writeProcedure(Procedure);
1050 }
1051 
1052 static MemberAccess translateAccessFlags(unsigned RecordTag,
1053                                          const DIType *Member) {
1054   switch (Member->getFlags() & DINode::FlagAccessibility) {
1055   case DINode::FlagPrivate:   return MemberAccess::Private;
1056   case DINode::FlagPublic:    return MemberAccess::Public;
1057   case DINode::FlagProtected: return MemberAccess::Protected;
1058   case 0:
1059     // If there was no explicit access control, provide the default for the tag.
1060     return RecordTag == dwarf::DW_TAG_class_type ? MemberAccess::Private
1061                                                  : MemberAccess::Public;
1062   }
1063   llvm_unreachable("access flags are exclusive");
1064 }
1065 
1066 static TypeRecordKind getRecordKind(const DICompositeType *Ty) {
1067   switch (Ty->getTag()) {
1068   case dwarf::DW_TAG_class_type:     return TypeRecordKind::Class;
1069   case dwarf::DW_TAG_structure_type: return TypeRecordKind::Struct;
1070   }
1071   llvm_unreachable("unexpected tag");
1072 }
1073 
1074 /// Return the HasUniqueName option if it should be present in ClassOptions, or
1075 /// None otherwise.
1076 static ClassOptions getRecordUniqueNameOption(const DICompositeType *Ty) {
1077   // MSVC always sets this flag now, even for local types. Clang doesn't always
1078   // appear to give every type a linkage name, which may be problematic for us.
1079   // FIXME: Investigate the consequences of not following them here.
1080   return !Ty->getIdentifier().empty() ? ClassOptions::HasUniqueName
1081                                       : ClassOptions::None;
1082 }
1083 
1084 TypeIndex CodeViewDebug::lowerTypeClass(const DICompositeType *Ty) {
1085   // First, construct the forward decl.  Don't look into Ty to compute the
1086   // forward decl options, since it might not be available in all TUs.
1087   TypeRecordKind Kind = getRecordKind(Ty);
1088   ClassOptions CO =
1089       ClassOptions::ForwardReference | getRecordUniqueNameOption(Ty);
1090   TypeIndex FwdDeclTI = TypeTable.writeClass(ClassRecord(
1091       Kind, 0, CO, HfaKind::None, WindowsRTClassKind::None, TypeIndex(),
1092       TypeIndex(), TypeIndex(), 0, Ty->getName(), Ty->getIdentifier()));
1093   return FwdDeclTI;
1094 }
1095 
1096 TypeIndex CodeViewDebug::lowerCompleteTypeClass(const DICompositeType *Ty) {
1097   // Construct the field list and complete type record.
1098   TypeRecordKind Kind = getRecordKind(Ty);
1099   // FIXME: Other ClassOptions, like ContainsNestedClass and NestedClass.
1100   ClassOptions CO = ClassOptions::None | getRecordUniqueNameOption(Ty);
1101   TypeIndex FTI;
1102   unsigned FieldCount;
1103   std::tie(FTI, FieldCount) = lowerRecordFieldList(Ty);
1104 
1105   uint64_t SizeInBytes = Ty->getSizeInBits() / 8;
1106   return TypeTable.writeClass(ClassRecord(Kind, FieldCount, CO, HfaKind::None,
1107                                           WindowsRTClassKind::None, FTI,
1108                                           TypeIndex(), TypeIndex(), SizeInBytes,
1109                                           Ty->getName(), Ty->getIdentifier()));
1110   // FIXME: Make an LF_UDT_SRC_LINE record.
1111 }
1112 
1113 TypeIndex CodeViewDebug::lowerTypeUnion(const DICompositeType *Ty) {
1114   ClassOptions CO =
1115       ClassOptions::ForwardReference | getRecordUniqueNameOption(Ty);
1116   TypeIndex FwdDeclTI =
1117       TypeTable.writeUnion(UnionRecord(0, CO, HfaKind::None, TypeIndex(), 0,
1118                                        Ty->getName(), Ty->getIdentifier()));
1119   return FwdDeclTI;
1120 }
1121 
1122 TypeIndex CodeViewDebug::lowerCompleteTypeUnion(const DICompositeType *Ty) {
1123   ClassOptions CO = ClassOptions::None | getRecordUniqueNameOption(Ty);
1124   TypeIndex FTI;
1125   unsigned FieldCount;
1126   std::tie(FTI, FieldCount) = lowerRecordFieldList(Ty);
1127   uint64_t SizeInBytes = Ty->getSizeInBits() / 8;
1128   return TypeTable.writeUnion(UnionRecord(FieldCount, CO, HfaKind::None, FTI,
1129                                           SizeInBytes, Ty->getName(),
1130                                           Ty->getIdentifier()));
1131   // FIXME: Make an LF_UDT_SRC_LINE record.
1132 }
1133 
1134 std::pair<TypeIndex, unsigned>
1135 CodeViewDebug::lowerRecordFieldList(const DICompositeType *Ty) {
1136   // Manually count members. MSVC appears to count everything that generates a
1137   // field list record. Each individual overload in a method overload group
1138   // contributes to this count, even though the overload group is a single field
1139   // list record.
1140   unsigned MemberCount = 0;
1141   FieldListRecordBuilder Fields;
1142   for (const DINode *Element : Ty->getElements()) {
1143     // We assume that the frontend provides all members in source declaration
1144     // order, which is what MSVC does.
1145     if (!Element)
1146       continue;
1147     if (auto *SP = dyn_cast<DISubprogram>(Element)) {
1148       // C++ method.
1149       // FIXME: Overloaded methods are grouped together, so we'll need two
1150       // passes to group them.
1151       (void)SP;
1152     } else if (auto *Member = dyn_cast<DIDerivedType>(Element)) {
1153       if (Member->getTag() == dwarf::DW_TAG_member) {
1154         if (Member->isStaticMember()) {
1155           // Static data member.
1156           Fields.writeStaticDataMember(StaticDataMemberRecord(
1157               translateAccessFlags(Ty->getTag(), Member),
1158               getTypeIndex(Member->getBaseType()), Member->getName()));
1159           MemberCount++;
1160         } else {
1161           // Data member.
1162           // FIXME: Make a BitFieldRecord for bitfields.
1163           Fields.writeDataMember(DataMemberRecord(
1164               translateAccessFlags(Ty->getTag(), Member),
1165               getTypeIndex(Member->getBaseType()),
1166               Member->getOffsetInBits() / 8, Member->getName()));
1167           MemberCount++;
1168         }
1169       } else if (Member->getTag() == dwarf::DW_TAG_friend) {
1170         // Ignore friend members. It appears that MSVC emitted info about
1171         // friends in the past, but modern versions do not.
1172       }
1173       // FIXME: Get clang to emit nested types here and do something with
1174       // them.
1175     }
1176     // Skip other unrecognized kinds of elements.
1177   }
1178   return {TypeTable.writeFieldList(Fields), MemberCount};
1179 }
1180 
1181 TypeIndex CodeViewDebug::getTypeIndex(DITypeRef TypeRef) {
1182   const DIType *Ty = TypeRef.resolve();
1183 
1184   // The null DIType is the void type. Don't try to hash it.
1185   if (!Ty)
1186     return TypeIndex::Void();
1187 
1188   // Check if we've already translated this type. Don't try to do a
1189   // get-or-create style insertion that caches the hash lookup across the
1190   // lowerType call. It will update the TypeIndices map.
1191   auto I = TypeIndices.find(Ty);
1192   if (I != TypeIndices.end())
1193     return I->second;
1194 
1195   TypeIndex TI = lowerType(Ty);
1196 
1197   recordTypeIndexForDINode(Ty, TI);
1198   return TI;
1199 }
1200 
1201 TypeIndex CodeViewDebug::getCompleteTypeIndex(DITypeRef TypeRef) {
1202   const DIType *Ty = TypeRef.resolve();
1203 
1204   // The null DIType is the void type. Don't try to hash it.
1205   if (!Ty)
1206     return TypeIndex::Void();
1207 
1208   // If this is a non-record type, the complete type index is the same as the
1209   // normal type index. Just call getTypeIndex.
1210   switch (Ty->getTag()) {
1211   case dwarf::DW_TAG_class_type:
1212   case dwarf::DW_TAG_structure_type:
1213   case dwarf::DW_TAG_union_type:
1214     break;
1215   default:
1216     return getTypeIndex(Ty);
1217   }
1218 
1219   // Check if we've already translated the complete record type.  Lowering a
1220   // complete type should never trigger lowering another complete type, so we
1221   // can reuse the hash table lookup result.
1222   const auto *CTy = cast<DICompositeType>(Ty);
1223   auto InsertResult = CompleteTypeIndices.insert({CTy, TypeIndex()});
1224   if (!InsertResult.second)
1225     return InsertResult.first->second;
1226 
1227   // Make sure the forward declaration is emitted first. It's unclear if this
1228   // is necessary, but MSVC does it, and we should follow suit until we can show
1229   // otherwise.
1230   TypeIndex FwdDeclTI = getTypeIndex(CTy);
1231 
1232   // Just use the forward decl if we don't have complete type info. This might
1233   // happen if the frontend is using modules and expects the complete definition
1234   // to be emitted elsewhere.
1235   if (CTy->isForwardDecl())
1236     return FwdDeclTI;
1237 
1238   TypeIndex TI;
1239   switch (CTy->getTag()) {
1240   case dwarf::DW_TAG_class_type:
1241   case dwarf::DW_TAG_structure_type:
1242     TI = lowerCompleteTypeClass(CTy);
1243     break;
1244   case dwarf::DW_TAG_union_type:
1245     TI = lowerCompleteTypeUnion(CTy);
1246     break;
1247   default:
1248     llvm_unreachable("not a record");
1249   }
1250 
1251   InsertResult.first->second = TI;
1252   return TI;
1253 }
1254 
1255 void CodeViewDebug::emitLocalVariable(const LocalVariable &Var) {
1256   // LocalSym record, see SymbolRecord.h for more info.
1257   MCSymbol *LocalBegin = MMI->getContext().createTempSymbol(),
1258            *LocalEnd = MMI->getContext().createTempSymbol();
1259   OS.AddComment("Record length");
1260   OS.emitAbsoluteSymbolDiff(LocalEnd, LocalBegin, 2);
1261   OS.EmitLabel(LocalBegin);
1262 
1263   OS.AddComment("Record kind: S_LOCAL");
1264   OS.EmitIntValue(unsigned(SymbolKind::S_LOCAL), 2);
1265 
1266   LocalSymFlags Flags = LocalSymFlags::None;
1267   if (Var.DIVar->isParameter())
1268     Flags |= LocalSymFlags::IsParameter;
1269   if (Var.DefRanges.empty())
1270     Flags |= LocalSymFlags::IsOptimizedOut;
1271 
1272   OS.AddComment("TypeIndex");
1273   TypeIndex TI = getCompleteTypeIndex(Var.DIVar->getType());
1274   OS.EmitIntValue(TI.getIndex(), 4);
1275   OS.AddComment("Flags");
1276   OS.EmitIntValue(static_cast<uint16_t>(Flags), 2);
1277   // Truncate the name so we won't overflow the record length field.
1278   emitNullTerminatedSymbolName(OS, Var.DIVar->getName());
1279   OS.EmitLabel(LocalEnd);
1280 
1281   // Calculate the on disk prefix of the appropriate def range record. The
1282   // records and on disk formats are described in SymbolRecords.h. BytePrefix
1283   // should be big enough to hold all forms without memory allocation.
1284   SmallString<20> BytePrefix;
1285   for (const LocalVarDefRange &DefRange : Var.DefRanges) {
1286     BytePrefix.clear();
1287     // FIXME: Handle bitpieces.
1288     if (DefRange.StructOffset != 0)
1289       continue;
1290 
1291     if (DefRange.InMemory) {
1292       DefRangeRegisterRelSym Sym(DefRange.CVRegister, 0, DefRange.DataOffset, 0,
1293                                  0, 0, ArrayRef<LocalVariableAddrGap>());
1294       ulittle16_t SymKind = ulittle16_t(S_DEFRANGE_REGISTER_REL);
1295       BytePrefix +=
1296           StringRef(reinterpret_cast<const char *>(&SymKind), sizeof(SymKind));
1297       BytePrefix +=
1298           StringRef(reinterpret_cast<const char *>(&Sym.Header),
1299                     sizeof(Sym.Header) - sizeof(LocalVariableAddrRange));
1300     } else {
1301       assert(DefRange.DataOffset == 0 && "unexpected offset into register");
1302       // Unclear what matters here.
1303       DefRangeRegisterSym Sym(DefRange.CVRegister, 0, 0, 0, 0,
1304                               ArrayRef<LocalVariableAddrGap>());
1305       ulittle16_t SymKind = ulittle16_t(S_DEFRANGE_REGISTER);
1306       BytePrefix +=
1307           StringRef(reinterpret_cast<const char *>(&SymKind), sizeof(SymKind));
1308       BytePrefix +=
1309           StringRef(reinterpret_cast<const char *>(&Sym.Header),
1310                     sizeof(Sym.Header) - sizeof(LocalVariableAddrRange));
1311     }
1312     OS.EmitCVDefRangeDirective(DefRange.Ranges, BytePrefix);
1313   }
1314 }
1315 
1316 void CodeViewDebug::endFunction(const MachineFunction *MF) {
1317   if (!Asm || !CurFn)  // We haven't created any debug info for this function.
1318     return;
1319 
1320   const Function *GV = MF->getFunction();
1321   assert(FnDebugInfo.count(GV));
1322   assert(CurFn == &FnDebugInfo[GV]);
1323 
1324   collectVariableInfo(GV->getSubprogram());
1325 
1326   DebugHandlerBase::endFunction(MF);
1327 
1328   // Don't emit anything if we don't have any line tables.
1329   if (!CurFn->HaveLineInfo) {
1330     FnDebugInfo.erase(GV);
1331     CurFn = nullptr;
1332     return;
1333   }
1334 
1335   CurFn->End = Asm->getFunctionEnd();
1336 
1337   CurFn = nullptr;
1338 }
1339 
1340 void CodeViewDebug::beginInstruction(const MachineInstr *MI) {
1341   DebugHandlerBase::beginInstruction(MI);
1342 
1343   // Ignore DBG_VALUE locations and function prologue.
1344   if (!Asm || MI->isDebugValue() || MI->getFlag(MachineInstr::FrameSetup))
1345     return;
1346   DebugLoc DL = MI->getDebugLoc();
1347   if (DL == PrevInstLoc || !DL)
1348     return;
1349   maybeRecordLocation(DL, Asm->MF);
1350 }
1351 
1352 MCSymbol *CodeViewDebug::beginCVSubsection(ModuleSubstreamKind Kind) {
1353   MCSymbol *BeginLabel = MMI->getContext().createTempSymbol(),
1354            *EndLabel = MMI->getContext().createTempSymbol();
1355   OS.EmitIntValue(unsigned(Kind), 4);
1356   OS.AddComment("Subsection size");
1357   OS.emitAbsoluteSymbolDiff(EndLabel, BeginLabel, 4);
1358   OS.EmitLabel(BeginLabel);
1359   return EndLabel;
1360 }
1361 
1362 void CodeViewDebug::endCVSubsection(MCSymbol *EndLabel) {
1363   OS.EmitLabel(EndLabel);
1364   // Every subsection must be aligned to a 4-byte boundary.
1365   OS.EmitValueToAlignment(4);
1366 }
1367 
1368 void CodeViewDebug::emitDebugInfoForUDTs(
1369     ArrayRef<std::pair<std::string, TypeIndex>> UDTs) {
1370   for (const std::pair<std::string, codeview::TypeIndex> &UDT : UDTs) {
1371     MCSymbol *UDTRecordBegin = MMI->getContext().createTempSymbol(),
1372              *UDTRecordEnd = MMI->getContext().createTempSymbol();
1373     OS.AddComment("Record length");
1374     OS.emitAbsoluteSymbolDiff(UDTRecordEnd, UDTRecordBegin, 2);
1375     OS.EmitLabel(UDTRecordBegin);
1376 
1377     OS.AddComment("Record kind: S_UDT");
1378     OS.EmitIntValue(unsigned(SymbolKind::S_UDT), 2);
1379 
1380     OS.AddComment("Type");
1381     OS.EmitIntValue(UDT.second.getIndex(), 4);
1382 
1383     emitNullTerminatedSymbolName(OS, UDT.first);
1384     OS.EmitLabel(UDTRecordEnd);
1385   }
1386 }
1387 
1388 void CodeViewDebug::emitDebugInfoForGlobals() {
1389   NamedMDNode *CUs = MMI->getModule()->getNamedMetadata("llvm.dbg.cu");
1390   for (const MDNode *Node : CUs->operands()) {
1391     const auto *CU = cast<DICompileUnit>(Node);
1392 
1393     // First, emit all globals that are not in a comdat in a single symbol
1394     // substream. MSVC doesn't like it if the substream is empty, so only open
1395     // it if we have at least one global to emit.
1396     switchToDebugSectionForSymbol(nullptr);
1397     MCSymbol *EndLabel = nullptr;
1398     for (const DIGlobalVariable *G : CU->getGlobalVariables()) {
1399       if (const auto *GV = dyn_cast_or_null<GlobalVariable>(G->getVariable())) {
1400         if (!GV->hasComdat() && !GV->isDeclarationForLinker()) {
1401           if (!EndLabel) {
1402             OS.AddComment("Symbol subsection for globals");
1403             EndLabel = beginCVSubsection(ModuleSubstreamKind::Symbols);
1404           }
1405           emitDebugInfoForGlobal(G, Asm->getSymbol(GV));
1406         }
1407       }
1408     }
1409     if (EndLabel)
1410       endCVSubsection(EndLabel);
1411 
1412     // Second, emit each global that is in a comdat into its own .debug$S
1413     // section along with its own symbol substream.
1414     for (const DIGlobalVariable *G : CU->getGlobalVariables()) {
1415       if (const auto *GV = dyn_cast_or_null<GlobalVariable>(G->getVariable())) {
1416         if (GV->hasComdat()) {
1417           MCSymbol *GVSym = Asm->getSymbol(GV);
1418           OS.AddComment("Symbol subsection for " +
1419                         Twine(GlobalValue::getRealLinkageName(GV->getName())));
1420           switchToDebugSectionForSymbol(GVSym);
1421           EndLabel = beginCVSubsection(ModuleSubstreamKind::Symbols);
1422           emitDebugInfoForGlobal(G, GVSym);
1423           endCVSubsection(EndLabel);
1424         }
1425       }
1426     }
1427   }
1428 }
1429 
1430 void CodeViewDebug::emitDebugInfoForGlobal(const DIGlobalVariable *DIGV,
1431                                            MCSymbol *GVSym) {
1432   // DataSym record, see SymbolRecord.h for more info.
1433   // FIXME: Thread local data, etc
1434   MCSymbol *DataBegin = MMI->getContext().createTempSymbol(),
1435            *DataEnd = MMI->getContext().createTempSymbol();
1436   OS.AddComment("Record length");
1437   OS.emitAbsoluteSymbolDiff(DataEnd, DataBegin, 2);
1438   OS.EmitLabel(DataBegin);
1439   OS.AddComment("Record kind: S_GDATA32");
1440   OS.EmitIntValue(unsigned(SymbolKind::S_GDATA32), 2);
1441   OS.AddComment("Type");
1442   OS.EmitIntValue(getCompleteTypeIndex(DIGV->getType()).getIndex(), 4);
1443   OS.AddComment("DataOffset");
1444   OS.EmitCOFFSecRel32(GVSym);
1445   OS.AddComment("Segment");
1446   OS.EmitCOFFSectionIndex(GVSym);
1447   OS.AddComment("Name");
1448   emitNullTerminatedSymbolName(OS, DIGV->getName());
1449   OS.EmitLabel(DataEnd);
1450 }
1451