1 //===-- RuntimeDyld.cpp - Run-time dynamic linker for MC-JIT ----*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // Implementation of the MC-JIT runtime dynamic linker.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "llvm/ExecutionEngine/RuntimeDyld.h"
15 #include "RuntimeDyldCheckerImpl.h"
16 #include "RuntimeDyldCOFF.h"
17 #include "RuntimeDyldELF.h"
18 #include "RuntimeDyldImpl.h"
19 #include "RuntimeDyldMachO.h"
20 #include "llvm/Object/ELFObjectFile.h"
21 #include "llvm/Object/COFF.h"
22 #include "llvm/Support/ManagedStatic.h"
23 #include "llvm/Support/MathExtras.h"
24 #include "llvm/Support/MutexGuard.h"
25 
26 using namespace llvm;
27 using namespace llvm::object;
28 
29 #define DEBUG_TYPE "dyld"
30 
31 namespace {
32 
33 enum RuntimeDyldErrorCode {
34   GenericRTDyldError = 1
35 };
36 
37 // FIXME: This class is only here to support the transition to llvm::Error. It
38 // will be removed once this transition is complete. Clients should prefer to
39 // deal with the Error value directly, rather than converting to error_code.
40 class RuntimeDyldErrorCategory : public std::error_category {
41 public:
42   const char *name() const noexcept override { return "runtimedyld"; }
43 
44   std::string message(int Condition) const override {
45     switch (static_cast<RuntimeDyldErrorCode>(Condition)) {
46       case GenericRTDyldError: return "Generic RuntimeDyld error";
47     }
48     llvm_unreachable("Unrecognized RuntimeDyldErrorCode");
49   }
50 };
51 
52 static ManagedStatic<RuntimeDyldErrorCategory> RTDyldErrorCategory;
53 
54 }
55 
56 char RuntimeDyldError::ID = 0;
57 
58 void RuntimeDyldError::log(raw_ostream &OS) const {
59   OS << ErrMsg << "\n";
60 }
61 
62 std::error_code RuntimeDyldError::convertToErrorCode() const {
63   return std::error_code(GenericRTDyldError, *RTDyldErrorCategory);
64 }
65 
66 // Empty out-of-line virtual destructor as the key function.
67 RuntimeDyldImpl::~RuntimeDyldImpl() {}
68 
69 // Pin LoadedObjectInfo's vtables to this file.
70 void RuntimeDyld::LoadedObjectInfo::anchor() {}
71 
72 namespace llvm {
73 
74 void RuntimeDyldImpl::registerEHFrames() {}
75 
76 void RuntimeDyldImpl::deregisterEHFrames() {}
77 
78 #ifndef NDEBUG
79 static void dumpSectionMemory(const SectionEntry &S, StringRef State) {
80   dbgs() << "----- Contents of section " << S.getName() << " " << State
81          << " -----";
82 
83   if (S.getAddress() == nullptr) {
84     dbgs() << "\n          <section not emitted>\n";
85     return;
86   }
87 
88   const unsigned ColsPerRow = 16;
89 
90   uint8_t *DataAddr = S.getAddress();
91   uint64_t LoadAddr = S.getLoadAddress();
92 
93   unsigned StartPadding = LoadAddr & (ColsPerRow - 1);
94   unsigned BytesRemaining = S.getSize();
95 
96   if (StartPadding) {
97     dbgs() << "\n" << format("0x%016" PRIx64,
98                              LoadAddr & ~(uint64_t)(ColsPerRow - 1)) << ":";
99     while (StartPadding--)
100       dbgs() << "   ";
101   }
102 
103   while (BytesRemaining > 0) {
104     if ((LoadAddr & (ColsPerRow - 1)) == 0)
105       dbgs() << "\n" << format("0x%016" PRIx64, LoadAddr) << ":";
106 
107     dbgs() << " " << format("%02x", *DataAddr);
108 
109     ++DataAddr;
110     ++LoadAddr;
111     --BytesRemaining;
112   }
113 
114   dbgs() << "\n";
115 }
116 #endif
117 
118 // Resolve the relocations for all symbols we currently know about.
119 void RuntimeDyldImpl::resolveRelocations() {
120   MutexGuard locked(lock);
121 
122   // Print out the sections prior to relocation.
123   DEBUG(
124     for (int i = 0, e = Sections.size(); i != e; ++i)
125       dumpSectionMemory(Sections[i], "before relocations");
126   );
127 
128   // First, resolve relocations associated with external symbols.
129   resolveExternalSymbols();
130 
131   // Iterate over all outstanding relocations
132   for (auto it = Relocations.begin(), e = Relocations.end(); it != e; ++it) {
133     // The Section here (Sections[i]) refers to the section in which the
134     // symbol for the relocation is located.  The SectionID in the relocation
135     // entry provides the section to which the relocation will be applied.
136     int Idx = it->first;
137     uint64_t Addr = Sections[Idx].getLoadAddress();
138     DEBUG(dbgs() << "Resolving relocations Section #" << Idx << "\t"
139                  << format("%p", (uintptr_t)Addr) << "\n");
140     resolveRelocationList(it->second, Addr);
141   }
142   Relocations.clear();
143 
144   // Print out sections after relocation.
145   DEBUG(
146     for (int i = 0, e = Sections.size(); i != e; ++i)
147       dumpSectionMemory(Sections[i], "after relocations");
148   );
149 
150 }
151 
152 void RuntimeDyldImpl::mapSectionAddress(const void *LocalAddress,
153                                         uint64_t TargetAddress) {
154   MutexGuard locked(lock);
155   for (unsigned i = 0, e = Sections.size(); i != e; ++i) {
156     if (Sections[i].getAddress() == LocalAddress) {
157       reassignSectionAddress(i, TargetAddress);
158       return;
159     }
160   }
161   llvm_unreachable("Attempting to remap address of unknown section!");
162 }
163 
164 static Error getOffset(const SymbolRef &Sym, SectionRef Sec,
165                        uint64_t &Result) {
166   Expected<uint64_t> AddressOrErr = Sym.getAddress();
167   if (!AddressOrErr)
168     return AddressOrErr.takeError();
169   Result = *AddressOrErr - Sec.getAddress();
170   return Error::success();
171 }
172 
173 Expected<RuntimeDyldImpl::ObjSectionToIDMap>
174 RuntimeDyldImpl::loadObjectImpl(const object::ObjectFile &Obj) {
175   MutexGuard locked(lock);
176 
177   // Save information about our target
178   Arch = (Triple::ArchType)Obj.getArch();
179   IsTargetLittleEndian = Obj.isLittleEndian();
180   setMipsABI(Obj);
181 
182   // Compute the memory size required to load all sections to be loaded
183   // and pass this information to the memory manager
184   if (MemMgr.needsToReserveAllocationSpace()) {
185     uint64_t CodeSize = 0, RODataSize = 0, RWDataSize = 0;
186     uint32_t CodeAlign = 1, RODataAlign = 1, RWDataAlign = 1;
187     if (auto Err = computeTotalAllocSize(Obj,
188                                          CodeSize, CodeAlign,
189                                          RODataSize, RODataAlign,
190                                          RWDataSize, RWDataAlign))
191       return std::move(Err);
192     MemMgr.reserveAllocationSpace(CodeSize, CodeAlign, RODataSize, RODataAlign,
193                                   RWDataSize, RWDataAlign);
194   }
195 
196   // Used sections from the object file
197   ObjSectionToIDMap LocalSections;
198 
199   // Common symbols requiring allocation, with their sizes and alignments
200   CommonSymbolList CommonSymbols;
201 
202   // Parse symbols
203   DEBUG(dbgs() << "Parse symbols:\n");
204   for (symbol_iterator I = Obj.symbol_begin(), E = Obj.symbol_end(); I != E;
205        ++I) {
206     uint32_t Flags = I->getFlags();
207 
208     // Skip undefined symbols.
209     if (Flags & SymbolRef::SF_Undefined)
210       continue;
211 
212     if (Flags & SymbolRef::SF_Common)
213       CommonSymbols.push_back(*I);
214     else {
215 
216       // Get the symbol type.
217       object::SymbolRef::Type SymType;
218       if (auto SymTypeOrErr = I->getType())
219         SymType =  *SymTypeOrErr;
220       else
221         return SymTypeOrErr.takeError();
222 
223       // Get symbol name.
224       StringRef Name;
225       if (auto NameOrErr = I->getName())
226         Name = *NameOrErr;
227       else
228         return NameOrErr.takeError();
229 
230       // Compute JIT symbol flags.
231       JITSymbolFlags JITSymFlags = JITSymbolFlags::fromObjectSymbol(*I);
232 
233       // If this is a weak definition, check to see if there's a strong one.
234       // If there is, skip this symbol (we won't be providing it: the strong
235       // definition will). If there's no strong definition, make this definition
236       // strong.
237       if (JITSymFlags.isWeak()) {
238         // First check whether there's already a definition in this instance.
239         // FIXME: Override existing weak definitions with strong ones.
240         if (GlobalSymbolTable.count(Name))
241           continue;
242         // Then check the symbol resolver to see if there's a definition
243         // elsewhere in this logical dylib.
244         if (auto Sym = Resolver.findSymbolInLogicalDylib(Name))
245           if (Sym.getFlags().isStrongDefinition())
246             continue;
247         // else
248         JITSymFlags &= ~JITSymbolFlags::Weak;
249       }
250 
251       if (Flags & SymbolRef::SF_Absolute &&
252           SymType != object::SymbolRef::ST_File) {
253         uint64_t Addr = 0;
254         if (auto AddrOrErr = I->getAddress())
255           Addr = *AddrOrErr;
256         else
257           return AddrOrErr.takeError();
258 
259         unsigned SectionID = AbsoluteSymbolSection;
260 
261         DEBUG(dbgs() << "\tType: " << SymType << " (absolute) Name: " << Name
262                      << " SID: " << SectionID << " Offset: "
263                      << format("%p", (uintptr_t)Addr)
264                      << " flags: " << Flags << "\n");
265         GlobalSymbolTable[Name] =
266           SymbolTableEntry(SectionID, Addr, JITSymFlags);
267       } else if (SymType == object::SymbolRef::ST_Function ||
268                  SymType == object::SymbolRef::ST_Data ||
269                  SymType == object::SymbolRef::ST_Unknown ||
270                  SymType == object::SymbolRef::ST_Other) {
271 
272         section_iterator SI = Obj.section_end();
273         if (auto SIOrErr = I->getSection())
274           SI = *SIOrErr;
275         else
276           return SIOrErr.takeError();
277 
278         if (SI == Obj.section_end())
279           continue;
280 
281         // Get symbol offset.
282         uint64_t SectOffset;
283         if (auto Err = getOffset(*I, *SI, SectOffset))
284           return std::move(Err);
285 
286         bool IsCode = SI->isText();
287         unsigned SectionID;
288         if (auto SectionIDOrErr = findOrEmitSection(Obj, *SI, IsCode,
289                                                     LocalSections))
290           SectionID = *SectionIDOrErr;
291         else
292           return SectionIDOrErr.takeError();
293 
294         DEBUG(dbgs() << "\tType: " << SymType << " Name: " << Name
295                      << " SID: " << SectionID << " Offset: "
296                      << format("%p", (uintptr_t)SectOffset)
297                      << " flags: " << Flags << "\n");
298         GlobalSymbolTable[Name] =
299           SymbolTableEntry(SectionID, SectOffset, JITSymFlags);
300       }
301     }
302   }
303 
304   // Allocate common symbols
305   if (auto Err = emitCommonSymbols(Obj, CommonSymbols))
306     return std::move(Err);
307 
308   // Parse and process relocations
309   DEBUG(dbgs() << "Parse relocations:\n");
310   for (section_iterator SI = Obj.section_begin(), SE = Obj.section_end();
311        SI != SE; ++SI) {
312     StubMap Stubs;
313     section_iterator RelocatedSection = SI->getRelocatedSection();
314 
315     if (RelocatedSection == SE)
316       continue;
317 
318     relocation_iterator I = SI->relocation_begin();
319     relocation_iterator E = SI->relocation_end();
320 
321     if (I == E && !ProcessAllSections)
322       continue;
323 
324     bool IsCode = RelocatedSection->isText();
325     unsigned SectionID = 0;
326     if (auto SectionIDOrErr = findOrEmitSection(Obj, *RelocatedSection, IsCode,
327                                                 LocalSections))
328       SectionID = *SectionIDOrErr;
329     else
330       return SectionIDOrErr.takeError();
331 
332     DEBUG(dbgs() << "\tSectionID: " << SectionID << "\n");
333 
334     for (; I != E;)
335       if (auto IOrErr = processRelocationRef(SectionID, I, Obj, LocalSections, Stubs))
336         I = *IOrErr;
337       else
338         return IOrErr.takeError();
339 
340     // If there is an attached checker, notify it about the stubs for this
341     // section so that they can be verified.
342     if (Checker)
343       Checker->registerStubMap(Obj.getFileName(), SectionID, Stubs);
344   }
345 
346   // Give the subclasses a chance to tie-up any loose ends.
347   if (auto Err = finalizeLoad(Obj, LocalSections))
348     return std::move(Err);
349 
350 //   for (auto E : LocalSections)
351 //     llvm::dbgs() << "Added: " << E.first.getRawDataRefImpl() << " -> " << E.second << "\n";
352 
353   return LocalSections;
354 }
355 
356 // A helper method for computeTotalAllocSize.
357 // Computes the memory size required to allocate sections with the given sizes,
358 // assuming that all sections are allocated with the given alignment
359 static uint64_t
360 computeAllocationSizeForSections(std::vector<uint64_t> &SectionSizes,
361                                  uint64_t Alignment) {
362   uint64_t TotalSize = 0;
363   for (size_t Idx = 0, Cnt = SectionSizes.size(); Idx < Cnt; Idx++) {
364     uint64_t AlignedSize =
365         (SectionSizes[Idx] + Alignment - 1) / Alignment * Alignment;
366     TotalSize += AlignedSize;
367   }
368   return TotalSize;
369 }
370 
371 static bool isRequiredForExecution(const SectionRef Section) {
372   const ObjectFile *Obj = Section.getObject();
373   if (isa<object::ELFObjectFileBase>(Obj))
374     return ELFSectionRef(Section).getFlags() & ELF::SHF_ALLOC;
375   if (auto *COFFObj = dyn_cast<object::COFFObjectFile>(Obj)) {
376     const coff_section *CoffSection = COFFObj->getCOFFSection(Section);
377     // Avoid loading zero-sized COFF sections.
378     // In PE files, VirtualSize gives the section size, and SizeOfRawData
379     // may be zero for sections with content. In Obj files, SizeOfRawData
380     // gives the section size, and VirtualSize is always zero. Hence
381     // the need to check for both cases below.
382     bool HasContent =
383         (CoffSection->VirtualSize > 0) || (CoffSection->SizeOfRawData > 0);
384     bool IsDiscardable =
385         CoffSection->Characteristics &
386         (COFF::IMAGE_SCN_MEM_DISCARDABLE | COFF::IMAGE_SCN_LNK_INFO);
387     return HasContent && !IsDiscardable;
388   }
389 
390   assert(isa<MachOObjectFile>(Obj));
391   return true;
392 }
393 
394 static bool isReadOnlyData(const SectionRef Section) {
395   const ObjectFile *Obj = Section.getObject();
396   if (isa<object::ELFObjectFileBase>(Obj))
397     return !(ELFSectionRef(Section).getFlags() &
398              (ELF::SHF_WRITE | ELF::SHF_EXECINSTR));
399   if (auto *COFFObj = dyn_cast<object::COFFObjectFile>(Obj))
400     return ((COFFObj->getCOFFSection(Section)->Characteristics &
401              (COFF::IMAGE_SCN_CNT_INITIALIZED_DATA
402              | COFF::IMAGE_SCN_MEM_READ
403              | COFF::IMAGE_SCN_MEM_WRITE))
404              ==
405              (COFF::IMAGE_SCN_CNT_INITIALIZED_DATA
406              | COFF::IMAGE_SCN_MEM_READ));
407 
408   assert(isa<MachOObjectFile>(Obj));
409   return false;
410 }
411 
412 static bool isZeroInit(const SectionRef Section) {
413   const ObjectFile *Obj = Section.getObject();
414   if (isa<object::ELFObjectFileBase>(Obj))
415     return ELFSectionRef(Section).getType() == ELF::SHT_NOBITS;
416   if (auto *COFFObj = dyn_cast<object::COFFObjectFile>(Obj))
417     return COFFObj->getCOFFSection(Section)->Characteristics &
418             COFF::IMAGE_SCN_CNT_UNINITIALIZED_DATA;
419 
420   auto *MachO = cast<MachOObjectFile>(Obj);
421   unsigned SectionType = MachO->getSectionType(Section);
422   return SectionType == MachO::S_ZEROFILL ||
423          SectionType == MachO::S_GB_ZEROFILL;
424 }
425 
426 // Compute an upper bound of the memory size that is required to load all
427 // sections
428 Error RuntimeDyldImpl::computeTotalAllocSize(const ObjectFile &Obj,
429                                              uint64_t &CodeSize,
430                                              uint32_t &CodeAlign,
431                                              uint64_t &RODataSize,
432                                              uint32_t &RODataAlign,
433                                              uint64_t &RWDataSize,
434                                              uint32_t &RWDataAlign) {
435   // Compute the size of all sections required for execution
436   std::vector<uint64_t> CodeSectionSizes;
437   std::vector<uint64_t> ROSectionSizes;
438   std::vector<uint64_t> RWSectionSizes;
439 
440   // Collect sizes of all sections to be loaded;
441   // also determine the max alignment of all sections
442   for (section_iterator SI = Obj.section_begin(), SE = Obj.section_end();
443        SI != SE; ++SI) {
444     const SectionRef &Section = *SI;
445 
446     bool IsRequired = isRequiredForExecution(Section) || ProcessAllSections;
447 
448     // Consider only the sections that are required to be loaded for execution
449     if (IsRequired) {
450       uint64_t DataSize = Section.getSize();
451       uint64_t Alignment64 = Section.getAlignment();
452       unsigned Alignment = (unsigned)Alignment64 & 0xffffffffL;
453       bool IsCode = Section.isText();
454       bool IsReadOnly = isReadOnlyData(Section);
455 
456       StringRef Name;
457       if (auto EC = Section.getName(Name))
458         return errorCodeToError(EC);
459 
460       uint64_t StubBufSize = computeSectionStubBufSize(Obj, Section);
461       uint64_t SectionSize = DataSize + StubBufSize;
462 
463       // The .eh_frame section (at least on Linux) needs an extra four bytes
464       // padded
465       // with zeroes added at the end.  For MachO objects, this section has a
466       // slightly different name, so this won't have any effect for MachO
467       // objects.
468       if (Name == ".eh_frame")
469         SectionSize += 4;
470 
471       if (!SectionSize)
472         SectionSize = 1;
473 
474       if (IsCode) {
475         CodeAlign = std::max(CodeAlign, Alignment);
476         CodeSectionSizes.push_back(SectionSize);
477       } else if (IsReadOnly) {
478         RODataAlign = std::max(RODataAlign, Alignment);
479         ROSectionSizes.push_back(SectionSize);
480       } else {
481         RWDataAlign = std::max(RWDataAlign, Alignment);
482         RWSectionSizes.push_back(SectionSize);
483       }
484     }
485   }
486 
487   // Compute Global Offset Table size. If it is not zero we
488   // also update alignment, which is equal to a size of a
489   // single GOT entry.
490   if (unsigned GotSize = computeGOTSize(Obj)) {
491     RWSectionSizes.push_back(GotSize);
492     RWDataAlign = std::max<uint32_t>(RWDataAlign, getGOTEntrySize());
493   }
494 
495   // Compute the size of all common symbols
496   uint64_t CommonSize = 0;
497   uint32_t CommonAlign = 1;
498   for (symbol_iterator I = Obj.symbol_begin(), E = Obj.symbol_end(); I != E;
499        ++I) {
500     uint32_t Flags = I->getFlags();
501     if (Flags & SymbolRef::SF_Common) {
502       // Add the common symbols to a list.  We'll allocate them all below.
503       uint64_t Size = I->getCommonSize();
504       uint32_t Align = I->getAlignment();
505       // If this is the first common symbol, use its alignment as the alignment
506       // for the common symbols section.
507       if (CommonSize == 0)
508         CommonAlign = Align;
509       CommonSize = alignTo(CommonSize, Align) + Size;
510     }
511   }
512   if (CommonSize != 0) {
513     RWSectionSizes.push_back(CommonSize);
514     RWDataAlign = std::max(RWDataAlign, CommonAlign);
515   }
516 
517   // Compute the required allocation space for each different type of sections
518   // (code, read-only data, read-write data) assuming that all sections are
519   // allocated with the max alignment. Note that we cannot compute with the
520   // individual alignments of the sections, because then the required size
521   // depends on the order, in which the sections are allocated.
522   CodeSize = computeAllocationSizeForSections(CodeSectionSizes, CodeAlign);
523   RODataSize = computeAllocationSizeForSections(ROSectionSizes, RODataAlign);
524   RWDataSize = computeAllocationSizeForSections(RWSectionSizes, RWDataAlign);
525 
526   return Error::success();
527 }
528 
529 // compute GOT size
530 unsigned RuntimeDyldImpl::computeGOTSize(const ObjectFile &Obj) {
531   size_t GotEntrySize = getGOTEntrySize();
532   if (!GotEntrySize)
533     return 0;
534 
535   size_t GotSize = 0;
536   for (section_iterator SI = Obj.section_begin(), SE = Obj.section_end();
537        SI != SE; ++SI) {
538 
539     for (const RelocationRef &Reloc : SI->relocations())
540       if (relocationNeedsGot(Reloc))
541         GotSize += GotEntrySize;
542   }
543 
544   return GotSize;
545 }
546 
547 // compute stub buffer size for the given section
548 unsigned RuntimeDyldImpl::computeSectionStubBufSize(const ObjectFile &Obj,
549                                                     const SectionRef &Section) {
550   unsigned StubSize = getMaxStubSize();
551   if (StubSize == 0) {
552     return 0;
553   }
554   // FIXME: this is an inefficient way to handle this. We should computed the
555   // necessary section allocation size in loadObject by walking all the sections
556   // once.
557   unsigned StubBufSize = 0;
558   for (section_iterator SI = Obj.section_begin(), SE = Obj.section_end();
559        SI != SE; ++SI) {
560     section_iterator RelSecI = SI->getRelocatedSection();
561     if (!(RelSecI == Section))
562       continue;
563 
564     for (const RelocationRef &Reloc : SI->relocations())
565       if (relocationNeedsStub(Reloc))
566         StubBufSize += StubSize;
567   }
568 
569   // Get section data size and alignment
570   uint64_t DataSize = Section.getSize();
571   uint64_t Alignment64 = Section.getAlignment();
572 
573   // Add stubbuf size alignment
574   unsigned Alignment = (unsigned)Alignment64 & 0xffffffffL;
575   unsigned StubAlignment = getStubAlignment();
576   unsigned EndAlignment = (DataSize | Alignment) & -(DataSize | Alignment);
577   if (StubAlignment > EndAlignment)
578     StubBufSize += StubAlignment - EndAlignment;
579   return StubBufSize;
580 }
581 
582 uint64_t RuntimeDyldImpl::readBytesUnaligned(uint8_t *Src,
583                                              unsigned Size) const {
584   uint64_t Result = 0;
585   if (IsTargetLittleEndian) {
586     Src += Size - 1;
587     while (Size--)
588       Result = (Result << 8) | *Src--;
589   } else
590     while (Size--)
591       Result = (Result << 8) | *Src++;
592 
593   return Result;
594 }
595 
596 void RuntimeDyldImpl::writeBytesUnaligned(uint64_t Value, uint8_t *Dst,
597                                           unsigned Size) const {
598   if (IsTargetLittleEndian) {
599     while (Size--) {
600       *Dst++ = Value & 0xFF;
601       Value >>= 8;
602     }
603   } else {
604     Dst += Size - 1;
605     while (Size--) {
606       *Dst-- = Value & 0xFF;
607       Value >>= 8;
608     }
609   }
610 }
611 
612 Error RuntimeDyldImpl::emitCommonSymbols(const ObjectFile &Obj,
613                                          CommonSymbolList &CommonSymbols) {
614   if (CommonSymbols.empty())
615     return Error::success();
616 
617   uint64_t CommonSize = 0;
618   uint32_t CommonAlign = CommonSymbols.begin()->getAlignment();
619   CommonSymbolList SymbolsToAllocate;
620 
621   DEBUG(dbgs() << "Processing common symbols...\n");
622 
623   for (const auto &Sym : CommonSymbols) {
624     StringRef Name;
625     if (auto NameOrErr = Sym.getName())
626       Name = *NameOrErr;
627     else
628       return NameOrErr.takeError();
629 
630     // Skip common symbols already elsewhere.
631     if (GlobalSymbolTable.count(Name)) {
632       DEBUG(dbgs() << "\tSkipping already emitted common symbol '" << Name
633                    << "'\n");
634       continue;
635     }
636 
637     if (auto Sym = Resolver.findSymbolInLogicalDylib(Name)) {
638       if (!Sym.getFlags().isCommon()) {
639         DEBUG(dbgs() << "\tSkipping common symbol '" << Name
640                      << "' in favor of stronger definition.\n");
641         continue;
642       }
643     }
644     uint32_t Align = Sym.getAlignment();
645     uint64_t Size = Sym.getCommonSize();
646 
647     CommonSize = alignTo(CommonSize, Align) + Size;
648 
649     SymbolsToAllocate.push_back(Sym);
650   }
651 
652   // Allocate memory for the section
653   unsigned SectionID = Sections.size();
654   uint8_t *Addr = MemMgr.allocateDataSection(CommonSize, CommonAlign, SectionID,
655                                              "<common symbols>", false);
656   if (!Addr)
657     report_fatal_error("Unable to allocate memory for common symbols!");
658   uint64_t Offset = 0;
659   Sections.push_back(
660       SectionEntry("<common symbols>", Addr, CommonSize, CommonSize, 0));
661   memset(Addr, 0, CommonSize);
662 
663   DEBUG(dbgs() << "emitCommonSection SectionID: " << SectionID << " new addr: "
664                << format("%p", Addr) << " DataSize: " << CommonSize << "\n");
665 
666   // Assign the address of each symbol
667   for (auto &Sym : SymbolsToAllocate) {
668     uint32_t Align = Sym.getAlignment();
669     uint64_t Size = Sym.getCommonSize();
670     StringRef Name;
671     if (auto NameOrErr = Sym.getName())
672       Name = *NameOrErr;
673     else
674       return NameOrErr.takeError();
675     if (Align) {
676       // This symbol has an alignment requirement.
677       uint64_t AlignOffset = OffsetToAlignment((uint64_t)Addr, Align);
678       Addr += AlignOffset;
679       Offset += AlignOffset;
680     }
681     JITSymbolFlags JITSymFlags = JITSymbolFlags::fromObjectSymbol(Sym);
682     DEBUG(dbgs() << "Allocating common symbol " << Name << " address "
683                  << format("%p", Addr) << "\n");
684     GlobalSymbolTable[Name] =
685       SymbolTableEntry(SectionID, Offset, JITSymFlags);
686     Offset += Size;
687     Addr += Size;
688   }
689 
690   if (Checker)
691     Checker->registerSection(Obj.getFileName(), SectionID);
692 
693   return Error::success();
694 }
695 
696 Expected<unsigned>
697 RuntimeDyldImpl::emitSection(const ObjectFile &Obj,
698                              const SectionRef &Section,
699                              bool IsCode) {
700   StringRef data;
701   uint64_t Alignment64 = Section.getAlignment();
702 
703   unsigned Alignment = (unsigned)Alignment64 & 0xffffffffL;
704   unsigned PaddingSize = 0;
705   unsigned StubBufSize = 0;
706   bool IsRequired = isRequiredForExecution(Section) || ProcessAllSections;
707   bool IsVirtual = Section.isVirtual();
708   bool IsZeroInit = isZeroInit(Section);
709   bool IsReadOnly = isReadOnlyData(Section);
710   uint64_t DataSize = Section.getSize();
711 
712   StringRef Name;
713   if (auto EC = Section.getName(Name))
714     return errorCodeToError(EC);
715 
716   StubBufSize = computeSectionStubBufSize(Obj, Section);
717 
718   // The .eh_frame section (at least on Linux) needs an extra four bytes padded
719   // with zeroes added at the end.  For MachO objects, this section has a
720   // slightly different name, so this won't have any effect for MachO objects.
721   if (Name == ".eh_frame")
722     PaddingSize = 4;
723 
724   uintptr_t Allocate;
725   unsigned SectionID = Sections.size();
726   uint8_t *Addr;
727   const char *pData = nullptr;
728 
729   // If this section contains any bits (i.e. isn't a virtual or bss section),
730   // grab a reference to them.
731   if (!IsVirtual && !IsZeroInit) {
732     // In either case, set the location of the unrelocated section in memory,
733     // since we still process relocations for it even if we're not applying them.
734     if (auto EC = Section.getContents(data))
735       return errorCodeToError(EC);
736     pData = data.data();
737   }
738 
739   // Code section alignment needs to be at least as high as stub alignment or
740   // padding calculations may by incorrect when the section is remapped to a
741   // higher alignment.
742   if (IsCode)
743     Alignment = std::max(Alignment, getStubAlignment());
744 
745   // Some sections, such as debug info, don't need to be loaded for execution.
746   // Leave those where they are.
747   if (IsRequired) {
748     Allocate = DataSize + PaddingSize + StubBufSize;
749     if (!Allocate)
750       Allocate = 1;
751     Addr = IsCode ? MemMgr.allocateCodeSection(Allocate, Alignment, SectionID,
752                                                Name)
753                   : MemMgr.allocateDataSection(Allocate, Alignment, SectionID,
754                                                Name, IsReadOnly);
755     if (!Addr)
756       report_fatal_error("Unable to allocate section memory!");
757 
758     // Zero-initialize or copy the data from the image
759     if (IsZeroInit || IsVirtual)
760       memset(Addr, 0, DataSize);
761     else
762       memcpy(Addr, pData, DataSize);
763 
764     // Fill in any extra bytes we allocated for padding
765     if (PaddingSize != 0) {
766       memset(Addr + DataSize, 0, PaddingSize);
767       // Update the DataSize variable so that the stub offset is set correctly.
768       DataSize += PaddingSize;
769     }
770 
771     DEBUG(dbgs() << "emitSection SectionID: " << SectionID << " Name: " << Name
772                  << " obj addr: " << format("%p", pData)
773                  << " new addr: " << format("%p", Addr)
774                  << " DataSize: " << DataSize << " StubBufSize: " << StubBufSize
775                  << " Allocate: " << Allocate << "\n");
776   } else {
777     // Even if we didn't load the section, we need to record an entry for it
778     // to handle later processing (and by 'handle' I mean don't do anything
779     // with these sections).
780     Allocate = 0;
781     Addr = nullptr;
782     DEBUG(dbgs() << "emitSection SectionID: " << SectionID << " Name: " << Name
783                  << " obj addr: " << format("%p", data.data()) << " new addr: 0"
784                  << " DataSize: " << DataSize << " StubBufSize: " << StubBufSize
785                  << " Allocate: " << Allocate << "\n");
786   }
787 
788   Sections.push_back(
789       SectionEntry(Name, Addr, DataSize, Allocate, (uintptr_t)pData));
790 
791   if (Checker)
792     Checker->registerSection(Obj.getFileName(), SectionID);
793 
794   return SectionID;
795 }
796 
797 Expected<unsigned>
798 RuntimeDyldImpl::findOrEmitSection(const ObjectFile &Obj,
799                                    const SectionRef &Section,
800                                    bool IsCode,
801                                    ObjSectionToIDMap &LocalSections) {
802 
803   unsigned SectionID = 0;
804   ObjSectionToIDMap::iterator i = LocalSections.find(Section);
805   if (i != LocalSections.end())
806     SectionID = i->second;
807   else {
808     if (auto SectionIDOrErr = emitSection(Obj, Section, IsCode))
809       SectionID = *SectionIDOrErr;
810     else
811       return SectionIDOrErr.takeError();
812     LocalSections[Section] = SectionID;
813   }
814   return SectionID;
815 }
816 
817 void RuntimeDyldImpl::addRelocationForSection(const RelocationEntry &RE,
818                                               unsigned SectionID) {
819   Relocations[SectionID].push_back(RE);
820 }
821 
822 void RuntimeDyldImpl::addRelocationForSymbol(const RelocationEntry &RE,
823                                              StringRef SymbolName) {
824   // Relocation by symbol.  If the symbol is found in the global symbol table,
825   // create an appropriate section relocation.  Otherwise, add it to
826   // ExternalSymbolRelocations.
827   RTDyldSymbolTable::const_iterator Loc = GlobalSymbolTable.find(SymbolName);
828   if (Loc == GlobalSymbolTable.end()) {
829     ExternalSymbolRelocations[SymbolName].push_back(RE);
830   } else {
831     // Copy the RE since we want to modify its addend.
832     RelocationEntry RECopy = RE;
833     const auto &SymInfo = Loc->second;
834     RECopy.Addend += SymInfo.getOffset();
835     Relocations[SymInfo.getSectionID()].push_back(RECopy);
836   }
837 }
838 
839 uint8_t *RuntimeDyldImpl::createStubFunction(uint8_t *Addr,
840                                              unsigned AbiVariant) {
841   if (Arch == Triple::aarch64 || Arch == Triple::aarch64_be) {
842     // This stub has to be able to access the full address space,
843     // since symbol lookup won't necessarily find a handy, in-range,
844     // PLT stub for functions which could be anywhere.
845     // Stub can use ip0 (== x16) to calculate address
846     writeBytesUnaligned(0xd2e00010, Addr,    4); // movz ip0, #:abs_g3:<addr>
847     writeBytesUnaligned(0xf2c00010, Addr+4,  4); // movk ip0, #:abs_g2_nc:<addr>
848     writeBytesUnaligned(0xf2a00010, Addr+8,  4); // movk ip0, #:abs_g1_nc:<addr>
849     writeBytesUnaligned(0xf2800010, Addr+12, 4); // movk ip0, #:abs_g0_nc:<addr>
850     writeBytesUnaligned(0xd61f0200, Addr+16, 4); // br ip0
851 
852     return Addr;
853   } else if (Arch == Triple::arm || Arch == Triple::armeb) {
854     // TODO: There is only ARM far stub now. We should add the Thumb stub,
855     // and stubs for branches Thumb - ARM and ARM - Thumb.
856     writeBytesUnaligned(0xe51ff004, Addr, 4); // ldr pc,<label>
857     return Addr + 4;
858   } else if (IsMipsO32ABI) {
859     // 0:   3c190000        lui     t9,%hi(addr).
860     // 4:   27390000        addiu   t9,t9,%lo(addr).
861     // 8:   03200008        jr      t9.
862     // c:   00000000        nop.
863     const unsigned LuiT9Instr = 0x3c190000, AdduiT9Instr = 0x27390000;
864     const unsigned NopInstr = 0x0;
865     unsigned JrT9Instr = 0x03200008;
866     if ((AbiVariant & ELF::EF_MIPS_ARCH) == ELF::EF_MIPS_ARCH_32R6)
867         JrT9Instr = 0x03200009;
868 
869     writeBytesUnaligned(LuiT9Instr, Addr, 4);
870     writeBytesUnaligned(AdduiT9Instr, Addr+4, 4);
871     writeBytesUnaligned(JrT9Instr, Addr+8, 4);
872     writeBytesUnaligned(NopInstr, Addr+12, 4);
873     return Addr;
874   } else if (Arch == Triple::ppc64 || Arch == Triple::ppc64le) {
875     // Depending on which version of the ELF ABI is in use, we need to
876     // generate one of two variants of the stub.  They both start with
877     // the same sequence to load the target address into r12.
878     writeInt32BE(Addr,    0x3D800000); // lis   r12, highest(addr)
879     writeInt32BE(Addr+4,  0x618C0000); // ori   r12, higher(addr)
880     writeInt32BE(Addr+8,  0x798C07C6); // sldi  r12, r12, 32
881     writeInt32BE(Addr+12, 0x658C0000); // oris  r12, r12, h(addr)
882     writeInt32BE(Addr+16, 0x618C0000); // ori   r12, r12, l(addr)
883     if (AbiVariant == 2) {
884       // PowerPC64 stub ELFv2 ABI: The address points to the function itself.
885       // The address is already in r12 as required by the ABI.  Branch to it.
886       writeInt32BE(Addr+20, 0xF8410018); // std   r2,  24(r1)
887       writeInt32BE(Addr+24, 0x7D8903A6); // mtctr r12
888       writeInt32BE(Addr+28, 0x4E800420); // bctr
889     } else {
890       // PowerPC64 stub ELFv1 ABI: The address points to a function descriptor.
891       // Load the function address on r11 and sets it to control register. Also
892       // loads the function TOC in r2 and environment pointer to r11.
893       writeInt32BE(Addr+20, 0xF8410028); // std   r2,  40(r1)
894       writeInt32BE(Addr+24, 0xE96C0000); // ld    r11, 0(r12)
895       writeInt32BE(Addr+28, 0xE84C0008); // ld    r2,  0(r12)
896       writeInt32BE(Addr+32, 0x7D6903A6); // mtctr r11
897       writeInt32BE(Addr+36, 0xE96C0010); // ld    r11, 16(r2)
898       writeInt32BE(Addr+40, 0x4E800420); // bctr
899     }
900     return Addr;
901   } else if (Arch == Triple::systemz) {
902     writeInt16BE(Addr,    0xC418);     // lgrl %r1,.+8
903     writeInt16BE(Addr+2,  0x0000);
904     writeInt16BE(Addr+4,  0x0004);
905     writeInt16BE(Addr+6,  0x07F1);     // brc 15,%r1
906     // 8-byte address stored at Addr + 8
907     return Addr;
908   } else if (Arch == Triple::x86_64) {
909     *Addr      = 0xFF; // jmp
910     *(Addr+1)  = 0x25; // rip
911     // 32-bit PC-relative address of the GOT entry will be stored at Addr+2
912   } else if (Arch == Triple::x86) {
913     *Addr      = 0xE9; // 32-bit pc-relative jump.
914   }
915   return Addr;
916 }
917 
918 // Assign an address to a symbol name and resolve all the relocations
919 // associated with it.
920 void RuntimeDyldImpl::reassignSectionAddress(unsigned SectionID,
921                                              uint64_t Addr) {
922   // The address to use for relocation resolution is not
923   // the address of the local section buffer. We must be doing
924   // a remote execution environment of some sort. Relocations can't
925   // be applied until all the sections have been moved.  The client must
926   // trigger this with a call to MCJIT::finalize() or
927   // RuntimeDyld::resolveRelocations().
928   //
929   // Addr is a uint64_t because we can't assume the pointer width
930   // of the target is the same as that of the host. Just use a generic
931   // "big enough" type.
932   DEBUG(dbgs() << "Reassigning address for section " << SectionID << " ("
933                << Sections[SectionID].getName() << "): "
934                << format("0x%016" PRIx64, Sections[SectionID].getLoadAddress())
935                << " -> " << format("0x%016" PRIx64, Addr) << "\n");
936   Sections[SectionID].setLoadAddress(Addr);
937 }
938 
939 void RuntimeDyldImpl::resolveRelocationList(const RelocationList &Relocs,
940                                             uint64_t Value) {
941   for (unsigned i = 0, e = Relocs.size(); i != e; ++i) {
942     const RelocationEntry &RE = Relocs[i];
943     // Ignore relocations for sections that were not loaded
944     if (Sections[RE.SectionID].getAddress() == nullptr)
945       continue;
946     resolveRelocation(RE, Value);
947   }
948 }
949 
950 void RuntimeDyldImpl::resolveExternalSymbols() {
951   while (!ExternalSymbolRelocations.empty()) {
952     StringMap<RelocationList>::iterator i = ExternalSymbolRelocations.begin();
953 
954     StringRef Name = i->first();
955     if (Name.size() == 0) {
956       // This is an absolute symbol, use an address of zero.
957       DEBUG(dbgs() << "Resolving absolute relocations."
958                    << "\n");
959       RelocationList &Relocs = i->second;
960       resolveRelocationList(Relocs, 0);
961     } else {
962       uint64_t Addr = 0;
963       RTDyldSymbolTable::const_iterator Loc = GlobalSymbolTable.find(Name);
964       if (Loc == GlobalSymbolTable.end()) {
965         // This is an external symbol, try to get its address from the symbol
966         // resolver.
967         // First search for the symbol in this logical dylib.
968         Addr = Resolver.findSymbolInLogicalDylib(Name.data()).getAddress();
969         // If that fails, try searching for an external symbol.
970         if (!Addr)
971           Addr = Resolver.findSymbol(Name.data()).getAddress();
972         // The call to getSymbolAddress may have caused additional modules to
973         // be loaded, which may have added new entries to the
974         // ExternalSymbolRelocations map.  Consquently, we need to update our
975         // iterator.  This is also why retrieval of the relocation list
976         // associated with this symbol is deferred until below this point.
977         // New entries may have been added to the relocation list.
978         i = ExternalSymbolRelocations.find(Name);
979       } else {
980         // We found the symbol in our global table.  It was probably in a
981         // Module that we loaded previously.
982         const auto &SymInfo = Loc->second;
983         Addr = getSectionLoadAddress(SymInfo.getSectionID()) +
984                SymInfo.getOffset();
985       }
986 
987       // FIXME: Implement error handling that doesn't kill the host program!
988       if (!Addr)
989         report_fatal_error("Program used external function '" + Name +
990                            "' which could not be resolved!");
991 
992       // If Resolver returned UINT64_MAX, the client wants to handle this symbol
993       // manually and we shouldn't resolve its relocations.
994       if (Addr != UINT64_MAX) {
995         DEBUG(dbgs() << "Resolving relocations Name: " << Name << "\t"
996                      << format("0x%lx", Addr) << "\n");
997         // This list may have been updated when we called getSymbolAddress, so
998         // don't change this code to get the list earlier.
999         RelocationList &Relocs = i->second;
1000         resolveRelocationList(Relocs, Addr);
1001       }
1002     }
1003 
1004     ExternalSymbolRelocations.erase(i);
1005   }
1006 }
1007 
1008 //===----------------------------------------------------------------------===//
1009 // RuntimeDyld class implementation
1010 
1011 uint64_t RuntimeDyld::LoadedObjectInfo::getSectionLoadAddress(
1012                                           const object::SectionRef &Sec) const {
1013 
1014   auto I = ObjSecToIDMap.find(Sec);
1015   if (I != ObjSecToIDMap.end())
1016     return RTDyld.Sections[I->second].getLoadAddress();
1017 
1018   return 0;
1019 }
1020 
1021 void RuntimeDyld::MemoryManager::anchor() {}
1022 void JITSymbolResolver::anchor() {}
1023 
1024 RuntimeDyld::RuntimeDyld(RuntimeDyld::MemoryManager &MemMgr,
1025                          JITSymbolResolver &Resolver)
1026     : MemMgr(MemMgr), Resolver(Resolver) {
1027   // FIXME: There's a potential issue lurking here if a single instance of
1028   // RuntimeDyld is used to load multiple objects.  The current implementation
1029   // associates a single memory manager with a RuntimeDyld instance.  Even
1030   // though the public class spawns a new 'impl' instance for each load,
1031   // they share a single memory manager.  This can become a problem when page
1032   // permissions are applied.
1033   Dyld = nullptr;
1034   ProcessAllSections = false;
1035   Checker = nullptr;
1036 }
1037 
1038 RuntimeDyld::~RuntimeDyld() {}
1039 
1040 static std::unique_ptr<RuntimeDyldCOFF>
1041 createRuntimeDyldCOFF(Triple::ArchType Arch, RuntimeDyld::MemoryManager &MM,
1042                       JITSymbolResolver &Resolver, bool ProcessAllSections,
1043                       RuntimeDyldCheckerImpl *Checker) {
1044   std::unique_ptr<RuntimeDyldCOFF> Dyld =
1045     RuntimeDyldCOFF::create(Arch, MM, Resolver);
1046   Dyld->setProcessAllSections(ProcessAllSections);
1047   Dyld->setRuntimeDyldChecker(Checker);
1048   return Dyld;
1049 }
1050 
1051 static std::unique_ptr<RuntimeDyldELF>
1052 createRuntimeDyldELF(Triple::ArchType Arch, RuntimeDyld::MemoryManager &MM,
1053                      JITSymbolResolver &Resolver, bool ProcessAllSections,
1054                      RuntimeDyldCheckerImpl *Checker) {
1055   std::unique_ptr<RuntimeDyldELF> Dyld =
1056       RuntimeDyldELF::create(Arch, MM, Resolver);
1057   Dyld->setProcessAllSections(ProcessAllSections);
1058   Dyld->setRuntimeDyldChecker(Checker);
1059   return Dyld;
1060 }
1061 
1062 static std::unique_ptr<RuntimeDyldMachO>
1063 createRuntimeDyldMachO(Triple::ArchType Arch, RuntimeDyld::MemoryManager &MM,
1064                        JITSymbolResolver &Resolver,
1065                        bool ProcessAllSections,
1066                        RuntimeDyldCheckerImpl *Checker) {
1067   std::unique_ptr<RuntimeDyldMachO> Dyld =
1068     RuntimeDyldMachO::create(Arch, MM, Resolver);
1069   Dyld->setProcessAllSections(ProcessAllSections);
1070   Dyld->setRuntimeDyldChecker(Checker);
1071   return Dyld;
1072 }
1073 
1074 std::unique_ptr<RuntimeDyld::LoadedObjectInfo>
1075 RuntimeDyld::loadObject(const ObjectFile &Obj) {
1076   if (!Dyld) {
1077     if (Obj.isELF())
1078       Dyld =
1079           createRuntimeDyldELF(static_cast<Triple::ArchType>(Obj.getArch()),
1080                                MemMgr, Resolver, ProcessAllSections, Checker);
1081     else if (Obj.isMachO())
1082       Dyld = createRuntimeDyldMachO(
1083                static_cast<Triple::ArchType>(Obj.getArch()), MemMgr, Resolver,
1084                ProcessAllSections, Checker);
1085     else if (Obj.isCOFF())
1086       Dyld = createRuntimeDyldCOFF(
1087                static_cast<Triple::ArchType>(Obj.getArch()), MemMgr, Resolver,
1088                ProcessAllSections, Checker);
1089     else
1090       report_fatal_error("Incompatible object format!");
1091   }
1092 
1093   if (!Dyld->isCompatibleFile(Obj))
1094     report_fatal_error("Incompatible object format!");
1095 
1096   auto LoadedObjInfo = Dyld->loadObject(Obj);
1097   MemMgr.notifyObjectLoaded(*this, Obj);
1098   return LoadedObjInfo;
1099 }
1100 
1101 void *RuntimeDyld::getSymbolLocalAddress(StringRef Name) const {
1102   if (!Dyld)
1103     return nullptr;
1104   return Dyld->getSymbolLocalAddress(Name);
1105 }
1106 
1107 JITEvaluatedSymbol RuntimeDyld::getSymbol(StringRef Name) const {
1108   if (!Dyld)
1109     return nullptr;
1110   return Dyld->getSymbol(Name);
1111 }
1112 
1113 void RuntimeDyld::resolveRelocations() { Dyld->resolveRelocations(); }
1114 
1115 void RuntimeDyld::reassignSectionAddress(unsigned SectionID, uint64_t Addr) {
1116   Dyld->reassignSectionAddress(SectionID, Addr);
1117 }
1118 
1119 void RuntimeDyld::mapSectionAddress(const void *LocalAddress,
1120                                     uint64_t TargetAddress) {
1121   Dyld->mapSectionAddress(LocalAddress, TargetAddress);
1122 }
1123 
1124 bool RuntimeDyld::hasError() { return Dyld->hasError(); }
1125 
1126 StringRef RuntimeDyld::getErrorString() { return Dyld->getErrorString(); }
1127 
1128 void RuntimeDyld::finalizeWithMemoryManagerLocking() {
1129   bool MemoryFinalizationLocked = MemMgr.FinalizationLocked;
1130   MemMgr.FinalizationLocked = true;
1131   resolveRelocations();
1132   registerEHFrames();
1133   if (!MemoryFinalizationLocked) {
1134     MemMgr.finalizeMemory();
1135     MemMgr.FinalizationLocked = false;
1136   }
1137 }
1138 
1139 void RuntimeDyld::registerEHFrames() {
1140   if (Dyld)
1141     Dyld->registerEHFrames();
1142 }
1143 
1144 void RuntimeDyld::deregisterEHFrames() {
1145   if (Dyld)
1146     Dyld->deregisterEHFrames();
1147 }
1148 
1149 } // end namespace llvm
1150