1 //===- llvm/CodeGen/DwarfExpression.cpp - Dwarf Debug Framework -----------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file contains support for writing dwarf debug info into asm files.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "DwarfExpression.h"
14 #include "DwarfCompileUnit.h"
15 #include "llvm/ADT/APInt.h"
16 #include "llvm/ADT/SmallBitVector.h"
17 #include "llvm/BinaryFormat/Dwarf.h"
18 #include "llvm/CodeGen/Register.h"
19 #include "llvm/CodeGen/TargetRegisterInfo.h"
20 #include "llvm/IR/DebugInfoMetadata.h"
21 #include "llvm/Support/ErrorHandling.h"
22 #include <algorithm>
23 #include <cassert>
24 #include <cstdint>
25 
26 using namespace llvm;
27 
28 void DwarfExpression::emitConstu(uint64_t Value) {
29   if (Value < 32)
30     emitOp(dwarf::DW_OP_lit0 + Value);
31   else if (Value == std::numeric_limits<uint64_t>::max()) {
32     // Only do this for 64-bit values as the DWARF expression stack uses
33     // target-address-size values.
34     emitOp(dwarf::DW_OP_lit0);
35     emitOp(dwarf::DW_OP_not);
36   } else {
37     emitOp(dwarf::DW_OP_constu);
38     emitUnsigned(Value);
39   }
40 }
41 
42 void DwarfExpression::addReg(int DwarfReg, const char *Comment) {
43  assert(DwarfReg >= 0 && "invalid negative dwarf register number");
44  assert((isUnknownLocation() || isRegisterLocation()) &&
45         "location description already locked down");
46  LocationKind = Register;
47  if (DwarfReg < 32) {
48    emitOp(dwarf::DW_OP_reg0 + DwarfReg, Comment);
49   } else {
50     emitOp(dwarf::DW_OP_regx, Comment);
51     emitUnsigned(DwarfReg);
52   }
53 }
54 
55 void DwarfExpression::addBReg(int DwarfReg, int Offset) {
56   assert(DwarfReg >= 0 && "invalid negative dwarf register number");
57   assert(!isRegisterLocation() && "location description already locked down");
58   if (DwarfReg < 32) {
59     emitOp(dwarf::DW_OP_breg0 + DwarfReg);
60   } else {
61     emitOp(dwarf::DW_OP_bregx);
62     emitUnsigned(DwarfReg);
63   }
64   emitSigned(Offset);
65 }
66 
/// Emit a DW_OP_fbreg operation with the signed operand \p Offset.
void DwarfExpression::addFBReg(int Offset) {
  emitOp(dwarf::DW_OP_fbreg);
  emitSigned(Offset);
}
71 
72 void DwarfExpression::addOpPiece(unsigned SizeInBits, unsigned OffsetInBits) {
73   if (!SizeInBits)
74     return;
75 
76   const unsigned SizeOfByte = 8;
77   if (OffsetInBits > 0 || SizeInBits % SizeOfByte) {
78     emitOp(dwarf::DW_OP_bit_piece);
79     emitUnsigned(SizeInBits);
80     emitUnsigned(OffsetInBits);
81   } else {
82     emitOp(dwarf::DW_OP_piece);
83     unsigned ByteSize = SizeInBits / SizeOfByte;
84     emitUnsigned(ByteSize);
85   }
86   this->OffsetInBits += SizeInBits;
87 }
88 
/// Emit a logical shift right of the value on top of the stack: pushes
/// \p ShiftBy via emitConstu and then emits DW_OP_shr.
void DwarfExpression::addShr(unsigned ShiftBy) {
  emitConstu(ShiftBy);
  emitOp(dwarf::DW_OP_shr);
}
93 
/// Emit a bitwise AND of the value on top of the stack with \p Mask: pushes
/// \p Mask via emitConstu and then emits DW_OP_and.
///
/// The parameter is an 'unsigned', so a wider mask passed by a caller is
/// converted to that type before it is emitted.
void DwarfExpression::addAnd(unsigned Mask) {
  emitConstu(Mask);
  emitOp(dwarf::DW_OP_and);
}
98 
/// Queue the DWARF register(s) that describe \p MachineReg in DwarfRegs.
///
/// Each queued entry is a {DWARF register number, size in bits, comment}
/// triple; a register number of -1 stands for bits without a DWARF register.
/// Three strategies are tried in order:
///   1. the DWARF number of \p MachineReg itself,
///   2. a super-register that has a DWARF number, with the sub-register's
///      size and offset recorded through setSubRegisterPiece, and
///   3. a greedy cover assembled from sub-registers that have DWARF numbers.
///
/// \param TRI        register info used for DWARF numbers and sub-register
///                   sizes/offsets.
/// \param MachineReg the register to describe.
/// \param MaxSize    bit limit used in strategy 3 to clamp a piece's size and
///                   to stop the scan.
/// \returns true if a description was queued, false if no DWARF encoding was
///          found.
bool DwarfExpression::addMachineReg(const TargetRegisterInfo &TRI,
                                    unsigned MachineReg, unsigned MaxSize) {
  // A non-physical register is only accepted when it is the frame register;
  // it is queued without a DWARF number.
  if (!llvm::Register::isPhysicalRegister(MachineReg)) {
    if (isFrameRegister(TRI, MachineReg)) {
      DwarfRegs.push_back({-1, 0, nullptr});
      return true;
    }
    return false;
  }

  int Reg = TRI.getDwarfRegNum(MachineReg, false);

  // If this is a valid register number, emit it.
  if (Reg >= 0) {
    DwarfRegs.push_back({Reg, 0, nullptr});
    return true;
  }

  // Walk up the super-register chain until we find a valid number.
  // For example, EAX on x86_64 is a 32-bit fragment of RAX with offset 0.
  for (MCSuperRegIterator SR(MachineReg, &TRI); SR.isValid(); ++SR) {
    Reg = TRI.getDwarfRegNum(*SR, false);
    if (Reg >= 0) {
      unsigned Idx = TRI.getSubRegIndex(*SR, MachineReg);
      unsigned Size = TRI.getSubRegIdxSize(Idx);
      unsigned RegOffset = TRI.getSubRegIdxOffset(Idx);
      DwarfRegs.push_back({Reg, 0, "super-register"});
      // Use a DW_OP_bit_piece to describe the sub-register.
      setSubRegisterPiece(Size, RegOffset);
      return true;
    }
  }

  // Otherwise, attempt to find a covering set of sub-register numbers.
  // For example, Q0 on ARM is a composition of D0+D1.
  // CurPos is the bit position just past the last piece queued so far.
  unsigned CurPos = 0;
  // The size of the register in bits.
  const TargetRegisterClass *RC = TRI.getMinimalPhysRegClass(MachineReg);
  unsigned RegSize = TRI.getRegSizeInBits(*RC);
  // Keep track of the bits in the register we already emitted, so we
  // can avoid emitting redundant aliasing subregs. Because this is
  // just doing a greedy scan of all subregisters, it is possible that
  // this doesn't find a combination of subregisters that fully cover
  // the register (even though one may exist).
  SmallBitVector Coverage(RegSize, false);
  for (MCSubRegIterator SR(MachineReg, &TRI); SR.isValid(); ++SR) {
    unsigned Idx = TRI.getSubRegIndex(MachineReg, *SR);
    unsigned Size = TRI.getSubRegIdxSize(Idx);
    unsigned Offset = TRI.getSubRegIdxOffset(Idx);
    Reg = TRI.getDwarfRegNum(*SR, false);
    // Sub-registers without a DWARF number cannot contribute a piece.
    if (Reg < 0)
      continue;

    // Intersection between the bits we already emitted and the bits
    // covered by this subregister.
    SmallBitVector CurSubReg(RegSize, false);
    CurSubReg.set(Offset, Offset + Size);

    // If this sub-register has a DWARF number and we haven't covered
    // its range, emit a DWARF piece for it.
    if (CurSubReg.test(Coverage)) {
      // Emit a piece for any gap in the coverage.
      if (Offset > CurPos)
        DwarfRegs.push_back({-1, Offset - CurPos, "no DWARF register encoding"});
      // NOTE(review): the piece is queued before the Offset >= MaxSize check
      // below. When Offset == MaxSize the queued size is 0, and when
      // Offset > MaxSize the unsigned subtraction wraps so std::min yields
      // Size. Confirm whether queuing a piece in those cases is intended.
      DwarfRegs.push_back(
          {Reg, std::min<unsigned>(Size, MaxSize - Offset), "sub-register"});
      if (Offset >= MaxSize)
        break;

      // Mark it as emitted.
      Coverage.set(Offset, Offset + Size);
      CurPos = Offset + Size;
    }
  }
  // Failed to find any DWARF encoding.
  if (CurPos == 0)
    return false;
  // Found a partial or complete DWARF encoding.
  // Pad the tail of the register that no sub-register described.
  if (CurPos < RegSize)
    DwarfRegs.push_back({-1, RegSize - CurPos, "no DWARF register encoding"});
  return true;
}
181 
182 void DwarfExpression::addStackValue() {
183   if (DwarfVersion >= 4)
184     emitOp(dwarf::DW_OP_stack_value);
185 }
186 
/// Emit the signed constant \p Value as DW_OP_consts and mark this expression
/// as an implicit location. The location kind must still be unknown or
/// already implicit.
void DwarfExpression::addSignedConstant(int64_t Value) {
  assert(isImplicitLocation() || isUnknownLocation());
  LocationKind = Implicit;
  emitOp(dwarf::DW_OP_consts);
  emitSigned(Value);
}
193 
/// Emit the unsigned constant \p Value through emitConstu and mark this
/// expression as an implicit location. The location kind must still be
/// unknown or already implicit.
void DwarfExpression::addUnsignedConstant(uint64_t Value) {
  assert(isImplicitLocation() || isUnknownLocation());
  LocationKind = Implicit;
  emitConstu(Value);
}
199 
200 void DwarfExpression::addUnsignedConstant(const APInt &Value) {
201   assert(isImplicitLocation() || isUnknownLocation());
202   LocationKind = Implicit;
203 
204   unsigned Size = Value.getBitWidth();
205   const uint64_t *Data = Value.getRawData();
206 
207   // Chop it up into 64-bit pieces, because that's the maximum that
208   // addUnsignedConstant takes.
209   unsigned Offset = 0;
210   while (Offset < Size) {
211     addUnsignedConstant(*Data++);
212     if (Offset == 0 && Size <= 64)
213       break;
214     addStackValue();
215     addOpPiece(std::min(Size - Offset, 64u), Offset);
216     Offset += 64;
217   }
218 }
219 
220 bool DwarfExpression::addMachineRegExpression(const TargetRegisterInfo &TRI,
221                                               DIExpressionCursor &ExprCursor,
222                                               unsigned MachineReg,
223                                               unsigned FragmentOffsetInBits) {
224   auto Fragment = ExprCursor.getFragmentInfo();
225   if (!addMachineReg(TRI, MachineReg, Fragment ? Fragment->SizeInBits : ~1U)) {
226     LocationKind = Unknown;
227     return false;
228   }
229 
230   bool HasComplexExpression = false;
231   auto Op = ExprCursor.peek();
232   if (Op && Op->getOp() != dwarf::DW_OP_LLVM_fragment)
233     HasComplexExpression = true;
234 
235   // If the register can only be described by a complex expression (i.e.,
236   // multiple subregisters) it doesn't safely compose with another complex
237   // expression. For example, it is not possible to apply a DW_OP_deref
238   // operation to multiple DW_OP_pieces.
239   if (HasComplexExpression && DwarfRegs.size() > 1) {
240     DwarfRegs.clear();
241     LocationKind = Unknown;
242     return false;
243   }
244 
245   // Handle simple register locations. If we are supposed to emit
246   // a call site parameter expression and if that expression is just a register
247   // location, emit it with addBReg and offset 0, because we should emit a DWARF
248   // expression representing a value, rather than a location.
249   if (!isMemoryLocation() && !HasComplexExpression && (!isParameterValue() ||
250                                                        isEntryValue())) {
251     for (auto &Reg : DwarfRegs) {
252       if (Reg.DwarfRegNo >= 0)
253         addReg(Reg.DwarfRegNo, Reg.Comment);
254       addOpPiece(Reg.Size);
255     }
256 
257     if (isEntryValue() && !isParameterValue() && DwarfVersion >= 4)
258       emitOp(dwarf::DW_OP_stack_value);
259 
260     DwarfRegs.clear();
261     return true;
262   }
263 
264   // Don't emit locations that cannot be expressed without DW_OP_stack_value.
265   if (DwarfVersion < 4)
266     if (any_of(ExprCursor, [](DIExpression::ExprOperand Op) -> bool {
267           return Op.getOp() == dwarf::DW_OP_stack_value;
268         })) {
269       DwarfRegs.clear();
270       LocationKind = Unknown;
271       return false;
272     }
273 
274   assert(DwarfRegs.size() == 1);
275   auto Reg = DwarfRegs[0];
276   bool FBReg = isFrameRegister(TRI, MachineReg);
277   int SignedOffset = 0;
278   assert(Reg.Size == 0 && "subregister has same size as superregister");
279 
280   // Pattern-match combinations for which more efficient representations exist.
281   // [Reg, DW_OP_plus_uconst, Offset] --> [DW_OP_breg, Offset].
282   if (Op && (Op->getOp() == dwarf::DW_OP_plus_uconst)) {
283     uint64_t Offset = Op->getArg(0);
284     uint64_t IntMax = static_cast<uint64_t>(std::numeric_limits<int>::max());
285     if (Offset <= IntMax) {
286       SignedOffset = Offset;
287       ExprCursor.take();
288     }
289   }
290 
291   // [Reg, DW_OP_constu, Offset, DW_OP_plus]  --> [DW_OP_breg, Offset]
292   // [Reg, DW_OP_constu, Offset, DW_OP_minus] --> [DW_OP_breg,-Offset]
293   // If Reg is a subregister we need to mask it out before subtracting.
294   if (Op && Op->getOp() == dwarf::DW_OP_constu) {
295     uint64_t Offset = Op->getArg(0);
296     uint64_t IntMax = static_cast<uint64_t>(std::numeric_limits<int>::max());
297     auto N = ExprCursor.peekNext();
298     if (N && N->getOp() == dwarf::DW_OP_plus && Offset <= IntMax) {
299       SignedOffset = Offset;
300       ExprCursor.consume(2);
301     } else if (N && N->getOp() == dwarf::DW_OP_minus &&
302                !SubRegisterSizeInBits && Offset <= IntMax + 1) {
303       SignedOffset = -static_cast<int64_t>(Offset);
304       ExprCursor.consume(2);
305     }
306   }
307 
308   if (FBReg)
309     addFBReg(SignedOffset);
310   else
311     addBReg(Reg.DwarfRegNo, SignedOffset);
312   DwarfRegs.clear();
313   return true;
314 }
315 
/// Consume the leading DW_OP_entry_value operation from \p ExprCursor and
/// emit it: the opcode chosen by CU.getDwarf5OrGNULocationAtom, followed by
/// the operation's first argument as an unsigned operand.
///
/// Must not be called on a memory location.
void DwarfExpression::addEntryValueExpression(DIExpressionCursor &ExprCursor) {
  auto Op = ExprCursor.take();
  assert(Op && Op->getOp() == dwarf::DW_OP_entry_value);
  assert(!isMemoryLocation() &&
         "We don't support entry values of memory locations yet");

  emitOp(CU.getDwarf5OrGNULocationAtom(dwarf::DW_OP_entry_value));
  emitUnsigned(Op->getArg(0));
}
325 
326 /// Assuming a well-formed expression, match "DW_OP_deref* DW_OP_LLVM_fragment?".
327 static bool isMemoryLocation(DIExpressionCursor ExprCursor) {
328   while (ExprCursor) {
329     auto Op = ExprCursor.take();
330     switch (Op->getOp()) {
331     case dwarf::DW_OP_deref:
332     case dwarf::DW_OP_LLVM_fragment:
333       break;
334     default:
335       return false;
336     }
337   }
338   return true;
339 }
340 
/// Emit the remaining operations of \p ExprCursor into this expression.
///
/// Each operation is consumed from the cursor and translated by the dispatch
/// below. A DW_OP_LLVM_fragment ends the walk after its piece has been
/// emitted; an opcode without a case reaches llvm_unreachable.
///
/// \param ExprCursor cursor over the operations still to be emitted.
/// \param FragmentOffsetInBits not read by this function.
void DwarfExpression::addExpression(DIExpressionCursor &&ExprCursor,
                                    unsigned FragmentOffsetInBits) {
  // If we need to mask out a subregister, do it now, unless the next
  // operation would emit an OpPiece anyway.
  auto N = ExprCursor.peek();
  if (SubRegisterSizeInBits && N && (N->getOp() != dwarf::DW_OP_LLVM_fragment))
    maskSubRegister();

  // Holds a DW_OP_LLVM_convert that is waiting for its partner when lowering
  // conversions for DWARF versions older than 5 (see the convert case).
  Optional<DIExpression::ExprOperand> PrevConvertOp = None;

  while (ExprCursor) {
    auto Op = ExprCursor.take();
    uint64_t OpNum = Op->getOp();

    // The DW_OP_reg<N> and DW_OP_breg<N> opcode ranges are handled before the
    // switch because each covers 32 consecutive opcodes.
    if (OpNum >= dwarf::DW_OP_reg0 && OpNum <= dwarf::DW_OP_reg31) {
      emitOp(OpNum);
      continue;
    } else if (OpNum >= dwarf::DW_OP_breg0 && OpNum <= dwarf::DW_OP_breg31) {
      addBReg(OpNum - dwarf::DW_OP_breg0, Op->getArg(0));
      continue;
    }

    switch (OpNum) {
    case dwarf::DW_OP_LLVM_fragment: {
      unsigned SizeInBits = Op->getArg(1);
      unsigned FragmentOffset = Op->getArg(0);
      // The fragment offset must have already been adjusted by emitting an
      // empty DW_OP_piece / DW_OP_bit_piece before we emitted the base
      // location.
      assert(OffsetInBits >= FragmentOffset && "fragment offset not added?");

      // If addMachineReg already emitted DW_OP_piece operations to represent
      // a super-register by splicing together sub-registers, subtract the size
      // of the pieces that was already emitted.
      SizeInBits -= OffsetInBits - FragmentOffset;

      // If addMachineReg requested a DW_OP_bit_piece to stencil out a
      // sub-register that is smaller than the current fragment's size, use it.
      if (SubRegisterSizeInBits)
        SizeInBits = std::min<unsigned>(SizeInBits, SubRegisterSizeInBits);

      // Emit a DW_OP_stack_value for implicit location descriptions.
      if (isImplicitLocation())
        addStackValue();

      // Emit the DW_OP_piece.
      addOpPiece(SizeInBits, SubRegisterOffsetInBits);
      // The pending sub-register has been described by the piece; clear it.
      setSubRegisterPiece(0, 0);
      // Reset the location description kind.
      LocationKind = Unknown;
      return;
    }
    case dwarf::DW_OP_plus_uconst:
      assert(!isRegisterLocation());
      emitOp(dwarf::DW_OP_plus_uconst);
      emitUnsigned(Op->getArg(0));
      break;
    // Operations without operands are passed through unchanged.
    case dwarf::DW_OP_plus:
    case dwarf::DW_OP_minus:
    case dwarf::DW_OP_mul:
    case dwarf::DW_OP_div:
    case dwarf::DW_OP_mod:
    case dwarf::DW_OP_or:
    case dwarf::DW_OP_and:
    case dwarf::DW_OP_xor:
    case dwarf::DW_OP_shl:
    case dwarf::DW_OP_shr:
    case dwarf::DW_OP_shra:
    case dwarf::DW_OP_lit0:
    case dwarf::DW_OP_not:
    case dwarf::DW_OP_dup:
      emitOp(OpNum);
      break;
    case dwarf::DW_OP_deref:
      assert(!isRegisterLocation());
      // The file-local isMemoryLocation(cursor) helper checks whether only
      // derefs and a fragment remain after this operation.
      if (!isMemoryLocation() && ::isMemoryLocation(ExprCursor))
        // Turning this into a memory location description makes the deref
        // implicit.
        LocationKind = Memory;
      else
        emitOp(dwarf::DW_OP_deref);
      break;
    case dwarf::DW_OP_constu:
      assert(!isRegisterLocation());
      emitConstu(Op->getArg(0));
      break;
    case dwarf::DW_OP_LLVM_convert: {
      unsigned BitSize = Op->getArg(0);
      dwarf::TypeKind Encoding = static_cast<dwarf::TypeKind>(Op->getArg(1));
      if (DwarfVersion >= 5) {
        emitOp(dwarf::DW_OP_convert);
        // Reuse the base_type if we already have one in this CU otherwise we
        // create a new one.
        unsigned I = 0, E = CU.ExprRefedBaseTypes.size();
        for (; I != E; ++I)
          if (CU.ExprRefedBaseTypes[I].BitSize == BitSize &&
              CU.ExprRefedBaseTypes[I].Encoding == Encoding)
            break;

        if (I == E)
          CU.ExprRefedBaseTypes.emplace_back(BitSize, Encoding);

        // If targeting a location-list; simply emit the index into the raw
        // byte stream as ULEB128, DwarfDebug::emitDebugLocEntry has been
        // fitted with means to extract it later.
        // If targeting a inlined DW_AT_location; insert a DIEBaseTypeRef
        // (containing the index and a resolve mechanism during emit) into the
        // DIE value list.
        emitBaseTypeRef(I);
      } else {
        // Before DWARF 5 a widening pair of converts is lowered to an explicit
        // sign or zero extension from the first convert's bit size; any other
        // convert is only remembered as the potential first half of a pair.
        if (PrevConvertOp && PrevConvertOp->getArg(0) < BitSize) {
          if (Encoding == dwarf::DW_ATE_signed)
            emitLegacySExt(PrevConvertOp->getArg(0));
          else if (Encoding == dwarf::DW_ATE_unsigned)
            emitLegacyZExt(PrevConvertOp->getArg(0));
          PrevConvertOp = None;
        } else {
          PrevConvertOp = Op;
        }
      }
      break;
    }
    case dwarf::DW_OP_stack_value:
      // Nothing is emitted here; the kind is recorded so that addStackValue()
      // runs at the fragment or at the end of the expression.
      LocationKind = Implicit;
      break;
    case dwarf::DW_OP_swap:
      assert(!isRegisterLocation());
      emitOp(dwarf::DW_OP_swap);
      break;
    case dwarf::DW_OP_xderef:
      assert(!isRegisterLocation());
      emitOp(dwarf::DW_OP_xderef);
      break;
    case dwarf::DW_OP_deref_size:
      emitOp(dwarf::DW_OP_deref_size);
      emitData1(Op->getArg(0));
      break;
    case dwarf::DW_OP_LLVM_tag_offset:
      // Stored on the expression object; no operation is emitted for it.
      TagOffset = Op->getArg(0);
      break;
    case dwarf::DW_OP_regx:
      emitOp(dwarf::DW_OP_regx);
      emitUnsigned(Op->getArg(0));
      break;
    case dwarf::DW_OP_bregx:
      emitOp(dwarf::DW_OP_bregx);
      emitUnsigned(Op->getArg(0));
      emitSigned(Op->getArg(1));
      break;
    default:
      llvm_unreachable("unhandled opcode found in expression");
    }
  }

  if (isImplicitLocation() && !isParameterValue())
    // Turn this into an implicit location description.
    addStackValue();
}
499 
500 /// add masking operations to stencil out a subregister.
501 void DwarfExpression::maskSubRegister() {
502   assert(SubRegisterSizeInBits && "no subregister was registered");
503   if (SubRegisterOffsetInBits > 0)
504     addShr(SubRegisterOffsetInBits);
505   uint64_t Mask = (1ULL << (uint64_t)SubRegisterSizeInBits) - 1ULL;
506   addAnd(Mask);
507 }
508 
509 void DwarfExpression::finalize() {
510   assert(DwarfRegs.size() == 0 && "dwarf registers not emitted");
511   // Emit any outstanding DW_OP_piece operations to mask out subregisters.
512   if (SubRegisterSizeInBits == 0)
513     return;
514   // Don't emit a DW_OP_piece for a subregister at offset 0.
515   if (SubRegisterOffsetInBits == 0)
516     return;
517   addOpPiece(SubRegisterSizeInBits, SubRegisterOffsetInBits);
518 }
519 
520 void DwarfExpression::addFragmentOffset(const DIExpression *Expr) {
521   if (!Expr || !Expr->isFragment())
522     return;
523 
524   uint64_t FragmentOffset = Expr->getFragmentInfo()->OffsetInBits;
525   assert(FragmentOffset >= OffsetInBits &&
526          "overlapping or duplicate fragments");
527   if (FragmentOffset > OffsetInBits)
528     addOpPiece(FragmentOffset - OffsetInBits);
529   OffsetInBits = FragmentOffset;
530 }
531 
/// Emit an explicit sign extension of the value X on top of the stack, where
/// X is \p FromBits wide. addExpression uses this when lowering
/// DW_OP_LLVM_convert for DWARF versions older than 5.
void DwarfExpression::emitLegacySExt(unsigned FromBits) {
  // (((X >> (FromBits - 1)) * (~0)) << FromBits) | X
  // Keep a copy of X for the final OR.
  emitOp(dwarf::DW_OP_dup);
  // X >> (FromBits - 1): isolate the sign bit.
  emitOp(dwarf::DW_OP_constu);
  emitUnsigned(FromBits - 1);
  emitOp(dwarf::DW_OP_shr);
  // Multiply by ~0 (emitted as "not 0").
  emitOp(dwarf::DW_OP_lit0);
  emitOp(dwarf::DW_OP_not);
  emitOp(dwarf::DW_OP_mul);
  // Shift the product left by FromBits, above the original value's bits.
  emitOp(dwarf::DW_OP_constu);
  emitUnsigned(FromBits);
  emitOp(dwarf::DW_OP_shl);
  // Combine with the copy of X.
  emitOp(dwarf::DW_OP_or);
}
546 
547 void DwarfExpression::emitLegacyZExt(unsigned FromBits) {
548   // (X & (1 << FromBits - 1))
549   emitOp(dwarf::DW_OP_constu);
550   emitUnsigned((1ULL << FromBits) - 1);
551   emitOp(dwarf::DW_OP_and);
552 }
553