1 //===-- llvm/CodeGen/DwarfDebug.h - Dwarf Debug Framework ------*- C++ -*--===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file contains support for writing dwarf debug info into asm files.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #ifndef LLVM_LIB_CODEGEN_ASMPRINTER_DWARFDEBUG_H
15 #define LLVM_LIB_CODEGEN_ASMPRINTER_DWARFDEBUG_H
16 
17 #include "DbgValueHistoryCalculator.h"
18 #include "DebugHandlerBase.h"
19 #include "DebugLocStream.h"
20 #include "DwarfAccelTable.h"
21 #include "DwarfFile.h"
22 #include "llvm/ADT/DenseMap.h"
23 #include "llvm/ADT/DenseSet.h"
24 #include "llvm/ADT/MapVector.h"
25 #include "llvm/ADT/SetVector.h"
26 #include "llvm/ADT/SmallPtrSet.h"
27 #include "llvm/ADT/StringMap.h"
28 #include "llvm/CodeGen/DIE.h"
29 #include "llvm/CodeGen/LexicalScopes.h"
30 #include "llvm/CodeGen/MachineInstr.h"
31 #include "llvm/IR/DebugInfo.h"
32 #include "llvm/IR/DebugLoc.h"
33 #include "llvm/MC/MCDwarf.h"
34 #include "llvm/MC/MachineLocation.h"
35 #include "llvm/Support/Allocator.h"
36 #include "llvm/Target/TargetOptions.h"
37 #include <memory>
38 
39 namespace llvm {
40 
41 class AsmPrinter;
42 class ByteStreamer;
43 class ConstantInt;
44 class ConstantFP;
45 class DebugLocEntry;
46 class DwarfCompileUnit;
47 class DwarfDebug;
48 class DwarfTypeUnit;
49 class DwarfUnit;
50 class MachineModuleInfo;
51 
52 //===----------------------------------------------------------------------===//
53 /// This class is used to track local variable information.
54 ///
55 /// Variables can be created from allocas, in which case they're generated from
56 /// the MMI table.  Such variables can have multiple expressions and frame
/// indices.  The \a Expr and \a FrameIndex arrays must have matching sizes.
58 ///
59 /// Variables can be created from \c DBG_VALUE instructions.  Those whose
60 /// location changes over time use \a DebugLocListIndex, while those with a
61 /// single instruction use \a MInsn and (optionally) a single entry of \a Expr.
62 ///
63 /// Variables that have been optimized out use none of these fields.
64 class DbgVariable {
65   const DILocalVariable *Var;                /// Variable Descriptor.
66   const DILocation *IA;                      /// Inlined at location.
67   SmallVector<const DIExpression *, 1> Expr; /// Complex address.
68   DIE *TheDIE = nullptr;                     /// Variable DIE.
69   unsigned DebugLocListIndex = ~0u;          /// Offset in DebugLocs.
70   const MachineInstr *MInsn = nullptr;       /// DBG_VALUE instruction.
71   SmallVector<int, 1> FrameIndex;            /// Frame index.
72 
73 public:
74   /// Construct a DbgVariable.
75   ///
76   /// Creates a variable without any DW_AT_location.  Call \a initializeMMI()
77   /// for MMI entries, or \a initializeDbgValue() for DBG_VALUE instructions.
78   DbgVariable(const DILocalVariable *V, const DILocation *IA)
79       : Var(V), IA(IA) {}
80 
81   /// Initialize from the MMI table.
82   void initializeMMI(const DIExpression *E, int FI) {
83     assert(Expr.empty() && "Already initialized?");
84     assert(FrameIndex.empty() && "Already initialized?");
85     assert(!MInsn && "Already initialized?");
86 
87     assert((!E || E->isValid()) && "Expected valid expression");
88     assert(~FI && "Expected valid index");
89 
90     Expr.push_back(E);
91     FrameIndex.push_back(FI);
92   }
93 
94   /// Initialize from a DBG_VALUE instruction.
95   void initializeDbgValue(const MachineInstr *DbgValue) {
96     assert(Expr.empty() && "Already initialized?");
97     assert(FrameIndex.empty() && "Already initialized?");
98     assert(!MInsn && "Already initialized?");
99 
100     assert(Var == DbgValue->getDebugVariable() && "Wrong variable");
101     assert(IA == DbgValue->getDebugLoc()->getInlinedAt() && "Wrong inlined-at");
102 
103     MInsn = DbgValue;
104     if (auto *E = DbgValue->getDebugExpression())
105       if (E->getNumElements())
106         Expr.push_back(E);
107   }
108 
109   // Accessors.
110   const DILocalVariable *getVariable() const { return Var; }
111   const DILocation *getInlinedAt() const { return IA; }
112   ArrayRef<const DIExpression *> getExpression() const { return Expr; }
113   const DIExpression *getSingleExpression() const {
114     assert(MInsn && Expr.size() <= 1);
115     return Expr.size() ? Expr[0] : nullptr;
116   }
117   void setDIE(DIE &D) { TheDIE = &D; }
118   DIE *getDIE() const { return TheDIE; }
119   void setDebugLocListIndex(unsigned O) { DebugLocListIndex = O; }
120   unsigned getDebugLocListIndex() const { return DebugLocListIndex; }
121   StringRef getName() const { return Var->getName(); }
122   const MachineInstr *getMInsn() const { return MInsn; }
123   ArrayRef<int> getFrameIndex() const { return FrameIndex; }
124 
125   void addMMIEntry(const DbgVariable &V) {
126     assert(DebugLocListIndex == ~0U && !MInsn && "not an MMI entry");
127     assert(V.DebugLocListIndex == ~0U && !V.MInsn && "not an MMI entry");
128     assert(V.Var == Var && "conflicting variable");
129     assert(V.IA == IA && "conflicting inlined-at location");
130 
131     assert(!FrameIndex.empty() && "Expected an MMI entry");
132     assert(!V.FrameIndex.empty() && "Expected an MMI entry");
133     assert(Expr.size() == FrameIndex.size() && "Mismatched expressions");
134     assert(V.Expr.size() == V.FrameIndex.size() && "Mismatched expressions");
135 
136     Expr.append(V.Expr.begin(), V.Expr.end());
137     FrameIndex.append(V.FrameIndex.begin(), V.FrameIndex.end());
138     assert(all_of(Expr, [](const DIExpression *E) {
139              return E && E->isFragment();
140            }) && "conflicting locations for variable");
141   }
142 
143   // Translate tag to proper Dwarf tag.
144   dwarf::Tag getTag() const {
145     // FIXME: Why don't we just infer this tag and store it all along?
146     if (Var->isParameter())
147       return dwarf::DW_TAG_formal_parameter;
148 
149     return dwarf::DW_TAG_variable;
150   }
151   /// Return true if DbgVariable is artificial.
152   bool isArtificial() const {
153     if (Var->isArtificial())
154       return true;
155     if (getType()->isArtificial())
156       return true;
157     return false;
158   }
159 
160   bool isObjectPointer() const {
161     if (Var->isObjectPointer())
162       return true;
163     if (getType()->isObjectPointer())
164       return true;
165     return false;
166   }
167 
168   bool hasComplexAddress() const {
169     assert(MInsn && "Expected DBG_VALUE, not MMI variable");
170     assert(FrameIndex.empty() && "Expected DBG_VALUE, not MMI variable");
171     assert(
172         (Expr.empty() || (Expr.size() == 1 && Expr.back()->getNumElements())) &&
173         "Invalid Expr for DBG_VALUE");
174     return !Expr.empty();
175   }
176   bool isBlockByrefVariable() const;
177   const DIType *getType() const;
178 
179 private:
180   template <typename T> T *resolve(TypedDINodeRef<T> Ref) const {
181     return Ref.resolve();
182   }
183 };
184 
185 
186 /// Helper used to pair up a symbol and its DWARF compile unit.
187 struct SymbolCU {
188   SymbolCU(DwarfCompileUnit *CU, const MCSymbol *Sym) : Sym(Sym), CU(CU) {}
189   const MCSymbol *Sym;
190   DwarfCompileUnit *CU;
191 };
192 
193 /// Collects and handles dwarf debug information.
194 class DwarfDebug : public DebugHandlerBase {
195   /// All DIEValues are allocated through this allocator.
196   BumpPtrAllocator DIEValueAllocator;
197 
198   /// Maps MDNode with its corresponding DwarfCompileUnit.
199   MapVector<const MDNode *, DwarfCompileUnit *> CUMap;
200 
201   /// Maps a CU DIE with its corresponding DwarfCompileUnit.
202   DenseMap<const DIE *, DwarfCompileUnit *> CUDieMap;
203 
204   /// List of all labels used in aranges generation.
205   std::vector<SymbolCU> ArangeLabels;
206 
207   /// Size of each symbol emitted (for those symbols that have a specific size).
208   DenseMap<const MCSymbol *, uint64_t> SymSize;
209 
210   /// Collection of abstract variables.
211   DenseMap<const MDNode *, std::unique_ptr<DbgVariable>> AbstractVariables;
212   SmallVector<std::unique_ptr<DbgVariable>, 64> ConcreteVariables;
213 
214   /// Collection of DebugLocEntry. Stored in a linked list so that DIELocLists
215   /// can refer to them in spite of insertions into this list.
216   DebugLocStream DebugLocs;
217 
218   /// This is a collection of subprogram MDNodes that are processed to
219   /// create DIEs.
220   SetVector<const DISubprogram *, SmallVector<const DISubprogram *, 16>,
221             SmallPtrSet<const DISubprogram *, 16>>
222       ProcessedSPNodes;
223 
224   /// If nonnull, stores the current machine function we're processing.
225   const MachineFunction *CurFn;
226 
227   /// If nonnull, stores the CU in which the previous subprogram was contained.
228   const DwarfCompileUnit *PrevCU;
229 
230   /// As an optimization, there is no need to emit an entry in the directory
231   /// table for the same directory as DW_AT_comp_dir.
232   StringRef CompilationDir;
233 
234   /// Holder for the file specific debug information.
235   DwarfFile InfoHolder;
236 
237   /// Holders for the various debug information flags that we might need to
238   /// have exposed. See accessor functions below for description.
239 
240   /// Map from MDNodes for user-defined types to their type signatures. Also
241   /// used to keep track of which types we have emitted type units for.
242   DenseMap<const MDNode *, uint64_t> TypeSignatures;
243 
244   SmallVector<
245       std::pair<std::unique_ptr<DwarfTypeUnit>, const DICompositeType *>, 1>
246       TypeUnitsUnderConstruction;
247 
248   /// Whether to emit the pubnames/pubtypes sections.
249   bool HasDwarfPubSections;
250 
251   /// Whether to use the GNU TLS opcode (instead of the standard opcode).
252   bool UseGNUTLSOpcode;
253 
254   /// Whether to use DWARF 2 bitfields (instead of the DWARF 4 format).
255   bool UseDWARF2Bitfields;
256 
257   /// Whether to emit all linkage names, or just abstract subprograms.
258   bool UseAllLinkageNames;
259 
260   /// DWARF5 Experimental Options
261   /// @{
262   bool HasDwarfAccelTables;
263   bool HasAppleExtensionAttributes;
264   bool HasSplitDwarf;
265 
266   /// Separated Dwarf Variables
267   /// In general these will all be for bits that are left in the
268   /// original object file, rather than things that are meant
269   /// to be in the .dwo sections.
270 
271   /// Holder for the skeleton information.
272   DwarfFile SkeletonHolder;
273 
274   /// Store file names for type units under fission in a line table
275   /// header that will be emitted into debug_line.dwo.
276   // FIXME: replace this with a map from comp_dir to table so that we
277   // can emit multiple tables during LTO each of which uses directory
278   // 0, referencing the comp_dir of all the type units that use it.
279   MCDwarfDwoLineTable SplitTypeUnitFileTable;
280   /// @}
281 
282   /// True iff there are multiple CUs in this module.
283   bool SingleCU;
284   bool IsDarwin;
285 
286   AddressPool AddrPool;
287 
288   DwarfAccelTable AccelNames;
289   DwarfAccelTable AccelObjC;
290   DwarfAccelTable AccelNamespace;
291   DwarfAccelTable AccelTypes;
292 
293   // Identify a debugger for "tuning" the debug info.
294   DebuggerKind DebuggerTuning;
295 
296   /// \defgroup DebuggerTuning Predicates to tune DWARF for a given debugger.
297   ///
298   /// Returns whether we are "tuning" for a given debugger.
299   /// Should be used only within the constructor, to set feature flags.
300   /// @{
301   bool tuneForGDB() const { return DebuggerTuning == DebuggerKind::GDB; }
302   bool tuneForLLDB() const { return DebuggerTuning == DebuggerKind::LLDB; }
303   bool tuneForSCE() const { return DebuggerTuning == DebuggerKind::SCE; }
304   /// @}
305 
306   MCDwarfDwoLineTable *getDwoLineTable(const DwarfCompileUnit &);
307 
308   const SmallVectorImpl<std::unique_ptr<DwarfCompileUnit>> &getUnits() {
309     return InfoHolder.getUnits();
310   }
311 
312   typedef DbgValueHistoryMap::InlinedVariable InlinedVariable;
313 
314   /// Find abstract variable associated with Var.
315   DbgVariable *getExistingAbstractVariable(InlinedVariable IV,
316                                            const DILocalVariable *&Cleansed);
317   DbgVariable *getExistingAbstractVariable(InlinedVariable IV);
318   void createAbstractVariable(const DILocalVariable *DV, LexicalScope *Scope);
319   void ensureAbstractVariableIsCreated(InlinedVariable Var,
320                                        const MDNode *Scope);
321   void ensureAbstractVariableIsCreatedIfScoped(InlinedVariable Var,
322                                                const MDNode *Scope);
323 
324   DbgVariable *createConcreteVariable(LexicalScope &Scope, InlinedVariable IV);
325 
326   /// Construct a DIE for this abstract scope.
327   void constructAbstractSubprogramScopeDIE(LexicalScope *Scope);
328 
329   void finishVariableDefinitions();
330 
331   void finishSubprogramDefinitions();
332 
333   /// Finish off debug information after all functions have been
334   /// processed.
335   void finalizeModuleInfo();
336 
337   /// Emit the debug info section.
338   void emitDebugInfo();
339 
340   /// Emit the abbreviation section.
341   void emitAbbreviations();
342 
343   /// Emit a specified accelerator table.
344   void emitAccel(DwarfAccelTable &Accel, MCSection *Section,
345                  StringRef TableName);
346 
347   /// Emit visible names into a hashed accelerator table section.
348   void emitAccelNames();
349 
350   /// Emit objective C classes and categories into a hashed
351   /// accelerator table section.
352   void emitAccelObjC();
353 
354   /// Emit namespace dies into a hashed accelerator table.
355   void emitAccelNamespaces();
356 
357   /// Emit type dies into a hashed accelerator table.
358   void emitAccelTypes();
359 
360   /// Emit visible names into a debug pubnames section.
361   /// \param GnuStyle determines whether or not we want to emit
362   /// additional information into the table ala newer gcc for gdb
363   /// index.
364   void emitDebugPubNames(bool GnuStyle = false);
365 
366   /// Emit visible types into a debug pubtypes section.
367   /// \param GnuStyle determines whether or not we want to emit
368   /// additional information into the table ala newer gcc for gdb
369   /// index.
370   void emitDebugPubTypes(bool GnuStyle = false);
371 
372   void emitDebugPubSection(
373       bool GnuStyle, MCSection *PSec, StringRef Name,
374       const StringMap<const DIE *> &(DwarfCompileUnit::*Accessor)() const);
375 
376   /// Emit null-terminated strings into a debug str section.
377   void emitDebugStr();
378 
379   /// Emit variable locations into a debug loc section.
380   void emitDebugLoc();
381 
382   /// Emit variable locations into a debug loc dwo section.
383   void emitDebugLocDWO();
384 
385   /// Emit address ranges into a debug aranges section.
386   void emitDebugARanges();
387 
388   /// Emit address ranges into a debug ranges section.
389   void emitDebugRanges();
390 
391   /// Emit macros into a debug macinfo section.
392   void emitDebugMacinfo();
393   void emitMacro(DIMacro &M);
394   void emitMacroFile(DIMacroFile &F, DwarfCompileUnit &U);
395   void handleMacroNodes(DIMacroNodeArray Nodes, DwarfCompileUnit &U);
396 
397   /// DWARF 5 Experimental Split Dwarf Emitters
398 
399   /// Initialize common features of skeleton units.
400   void initSkeletonUnit(const DwarfUnit &U, DIE &Die,
401                         std::unique_ptr<DwarfCompileUnit> NewU);
402 
403   /// Construct the split debug info compile unit for the debug info
404   /// section.
405   DwarfCompileUnit &constructSkeletonCU(const DwarfCompileUnit &CU);
406 
407   /// Emit the debug info dwo section.
408   void emitDebugInfoDWO();
409 
410   /// Emit the debug abbrev dwo section.
411   void emitDebugAbbrevDWO();
412 
413   /// Emit the debug line dwo section.
414   void emitDebugLineDWO();
415 
416   /// Emit the debug str dwo section.
417   void emitDebugStrDWO();
418 
419   /// Flags to let the linker know we have emitted new style pubnames. Only
420   /// emit it here if we don't have a skeleton CU for split dwarf.
421   void addGnuPubAttributes(DwarfUnit &U, DIE &D) const;
422 
423   /// Create new DwarfCompileUnit for the given metadata node with tag
424   /// DW_TAG_compile_unit.
425   DwarfCompileUnit &constructDwarfCompileUnit(const DICompileUnit *DIUnit);
426 
427   /// Construct imported_module or imported_declaration DIE.
428   void constructAndAddImportedEntityDIE(DwarfCompileUnit &TheCU,
429                                         const DIImportedEntity *N);
430 
431   /// Register a source line with debug info. Returns the unique
432   /// label that was emitted and which provides correspondence to the
433   /// source line list.
434   void recordSourceLine(unsigned Line, unsigned Col, const MDNode *Scope,
435                         unsigned Flags);
436 
437   /// Populate LexicalScope entries with variables' info.
438   void collectVariableInfo(DwarfCompileUnit &TheCU, const DISubprogram *SP,
439                            DenseSet<InlinedVariable> &ProcessedVars);
440 
441   /// Build the location list for all DBG_VALUEs in the
442   /// function that describe the same variable.
443   void buildLocationList(SmallVectorImpl<DebugLocEntry> &DebugLoc,
444                          const DbgValueHistoryMap::InstrRanges &Ranges);
445 
446   /// Collect variable information from the side table maintained by MF.
447   void collectVariableInfoFromMFTable(DenseSet<InlinedVariable> &P);
448 
449 public:
450   //===--------------------------------------------------------------------===//
451   // Main entry points.
452   //
453   DwarfDebug(AsmPrinter *A, Module *M);
454 
455   ~DwarfDebug() override;
456 
457   /// Emit all Dwarf sections that should come prior to the
458   /// content.
459   void beginModule();
460 
461   /// Emit all Dwarf sections that should come after the content.
462   void endModule() override;
463 
464   /// Gather pre-function debug information.
465   void beginFunction(const MachineFunction *MF) override;
466 
467   /// Gather and emit post-function debug information.
468   void endFunction(const MachineFunction *MF) override;
469 
470   /// Process beginning of an instruction.
471   void beginInstruction(const MachineInstr *MI) override;
472 
473   /// Perform an MD5 checksum of \p Identifier and return the lower 64 bits.
474   static uint64_t makeTypeSignature(StringRef Identifier);
475 
476   /// Add a DIE to the set of types that we're going to pull into
477   /// type units.
478   void addDwarfTypeUnitType(DwarfCompileUnit &CU, StringRef Identifier,
479                             DIE &Die, const DICompositeType *CTy);
480 
481   /// Add a label so that arange data can be generated for it.
482   void addArangeLabel(SymbolCU SCU) { ArangeLabels.push_back(SCU); }
483 
484   /// For symbols that have a size designated (e.g. common symbols),
485   /// this tracks that size.
486   void setSymbolSize(const MCSymbol *Sym, uint64_t Size) override {
487     SymSize[Sym] = Size;
488   }
489 
490   /// Returns whether we should emit all DW_AT_[MIPS_]linkage_name.
491   /// If not, we still might emit certain cases.
492   bool useAllLinkageNames() const { return UseAllLinkageNames; }
493 
494   /// Returns whether to use DW_OP_GNU_push_tls_address, instead of the
495   /// standard DW_OP_form_tls_address opcode
496   bool useGNUTLSOpcode() const { return UseGNUTLSOpcode; }
497 
498   /// Returns whether to use the DWARF2 format for bitfields instyead of the
499   /// DWARF4 format.
500   bool useDWARF2Bitfields() const { return UseDWARF2Bitfields; }
501 
502   // Experimental DWARF5 features.
503 
504   /// Returns whether or not to emit tables that dwarf consumers can
505   /// use to accelerate lookup.
506   bool useDwarfAccelTables() const { return HasDwarfAccelTables; }
507 
508   bool useAppleExtensionAttributes() const {
509     return HasAppleExtensionAttributes;
510   }
511 
512   /// Returns whether or not to change the current debug info for the
513   /// split dwarf proposal support.
514   bool useSplitDwarf() const { return HasSplitDwarf; }
515 
516   /// Returns the Dwarf Version.
517   uint16_t getDwarfVersion() const;
518 
519   /// Returns the previous CU that was being updated
520   const DwarfCompileUnit *getPrevCU() const { return PrevCU; }
521   void setPrevCU(const DwarfCompileUnit *PrevCU) { this->PrevCU = PrevCU; }
522 
523   /// Returns the entries for the .debug_loc section.
524   const DebugLocStream &getDebugLocs() const { return DebugLocs; }
525 
526   /// Emit an entry for the debug loc section. This can be used to
527   /// handle an entry that's going to be emitted into the debug loc section.
528   void emitDebugLocEntry(ByteStreamer &Streamer,
529                          const DebugLocStream::Entry &Entry);
530 
531   /// Emit the location for a debug loc entry, including the size header.
532   void emitDebugLocEntryLocation(const DebugLocStream::Entry &Entry);
533 
534   /// Find the MDNode for the given reference.
535   template <typename T> T *resolve(TypedDINodeRef<T> Ref) const {
536     return Ref.resolve();
537   }
538 
539   void addSubprogramNames(const DISubprogram *SP, DIE &Die);
540 
541   AddressPool &getAddressPool() { return AddrPool; }
542 
543   void addAccelName(StringRef Name, const DIE &Die);
544 
545   void addAccelObjC(StringRef Name, const DIE &Die);
546 
547   void addAccelNamespace(StringRef Name, const DIE &Die);
548 
549   void addAccelType(StringRef Name, const DIE &Die, char Flags);
550 
551   const MachineFunction *getCurrentFunction() const { return CurFn; }
552 
553   /// A helper function to check whether the DIE for a given Scope is
554   /// going to be null.
555   bool isLexicalScopeDIENull(LexicalScope *Scope);
556 };
557 } // End of namespace llvm
558 
559 #endif
560