1 //===- InputSection.cpp ---------------------------------------------------===//
2 //
3 //                             The LLVM Linker
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 
10 #include "InputSection.h"
11 #include "Config.h"
12 #include "Error.h"
13 #include "InputFiles.h"
14 #include "OutputSections.h"
15 #include "Target.h"
16 
17 #include "llvm/Support/Endian.h"
18 
19 using namespace llvm;
20 using namespace llvm::ELF;
21 using namespace llvm::object;
22 using namespace llvm::support::endian;
23 
24 using namespace lld;
25 using namespace lld::elf;
26 
27 template <class ELFT>
28 InputSectionBase<ELFT>::InputSectionBase(elf::ObjectFile<ELFT> *File,
29                                          const Elf_Shdr *Header,
30                                          Kind SectionKind)
31     : Header(Header), File(File), SectionKind(SectionKind), Repl(this) {
32   // The garbage collector sets sections' Live bits.
33   // If GC is disabled, all sections are considered live by default.
34   Live = !Config->GcSections;
35 
36   // The ELF spec states that a value of 0 means the section has
37   // no alignment constraits.
38   Align = std::max<uintX_t>(Header->sh_addralign, 1);
39 }
40 
41 template <class ELFT> size_t InputSectionBase<ELFT>::getSize() const {
42   if (auto *D = dyn_cast<InputSection<ELFT>>(this))
43     if (D->getThunksSize() > 0)
44       return D->getThunkOff() + D->getThunksSize();
45   return Header->sh_size;
46 }
47 
48 template <class ELFT> StringRef InputSectionBase<ELFT>::getSectionName() const {
49   return check(File->getObj().getSectionName(this->Header));
50 }
51 
52 template <class ELFT>
53 ArrayRef<uint8_t> InputSectionBase<ELFT>::getSectionData() const {
54   return check(this->File->getObj().getSectionContents(this->Header));
55 }
56 
57 template <class ELFT>
58 typename ELFT::uint InputSectionBase<ELFT>::getOffset(uintX_t Offset) {
59   switch (SectionKind) {
60   case Regular:
61     return cast<InputSection<ELFT>>(this)->OutSecOff + Offset;
62   case EHFrame:
63     return cast<EHInputSection<ELFT>>(this)->getOffset(Offset);
64   case Merge:
65     return cast<MergeInputSection<ELFT>>(this)->getOffset(Offset);
66   case MipsReginfo:
67     // MIPS .reginfo sections are consumed by the linker,
68     // so it should never be copied to output.
69     llvm_unreachable("MIPS .reginfo reached writeTo().");
70   }
71   llvm_unreachable("invalid section kind");
72 }
73 
74 template <class ELFT>
75 typename ELFT::uint
76 InputSectionBase<ELFT>::getOffset(const DefinedRegular<ELFT> &Sym) {
77   return getOffset(Sym.Value);
78 }
79 
80 // Returns a section that Rel relocation is pointing to.
81 template <class ELFT>
82 InputSectionBase<ELFT> *
83 InputSectionBase<ELFT>::getRelocTarget(const Elf_Rel &Rel) const {
84   // Global symbol
85   uint32_t SymIndex = Rel.getSymbol(Config->Mips64EL);
86   SymbolBody &B = File->getSymbolBody(SymIndex).repl();
87   if (auto *D = dyn_cast<DefinedRegular<ELFT>>(&B))
88     if (D->Section)
89       return D->Section->Repl;
90   return nullptr;
91 }
92 
93 template <class ELFT>
94 InputSectionBase<ELFT> *
95 InputSectionBase<ELFT>::getRelocTarget(const Elf_Rela &Rel) const {
96   return getRelocTarget(reinterpret_cast<const Elf_Rel &>(Rel));
97 }
98 
// Constructs a regular input section for section header Header of file F.
// All state is set up by the InputSectionBase constructor, which is told that
// this section is of kind Regular.
template <class ELFT>
InputSection<ELFT>::InputSection(elf::ObjectFile<ELFT> *F,
                                 const Elf_Shdr *Header)
    : InputSectionBase<ELFT>(F, Header, Base::Regular) {}
103 
104 template <class ELFT>
105 bool InputSection<ELFT>::classof(const InputSectionBase<ELFT> *S) {
106   return S->SectionKind == Base::Regular;
107 }
108 
109 template <class ELFT>
110 InputSectionBase<ELFT> *InputSection<ELFT>::getRelocatedSection() {
111   assert(this->Header->sh_type == SHT_RELA || this->Header->sh_type == SHT_REL);
112   ArrayRef<InputSectionBase<ELFT> *> Sections = this->File->getSections();
113   return Sections[this->Header->sh_info];
114 }
115 
116 template <class ELFT> void InputSection<ELFT>::addThunk(SymbolBody &Body) {
117   Body.ThunkIndex = Thunks.size();
118   Thunks.push_back(&Body);
119 }
120 
121 template <class ELFT> uint64_t InputSection<ELFT>::getThunkOff() const {
122   return this->Header->sh_size;
123 }
124 
125 template <class ELFT> uint64_t InputSection<ELFT>::getThunksSize() const {
126   return Thunks.size() * Target->ThunkSize;
127 }
128 
129 // This is used for -r. We can't use memcpy to copy relocations because we need
130 // to update symbol table offset and section index for each relocation. So we
131 // copy relocations one by one.
132 template <class ELFT>
133 template <class RelTy>
134 void InputSection<ELFT>::copyRelocations(uint8_t *Buf, ArrayRef<RelTy> Rels) {
135   InputSectionBase<ELFT> *RelocatedSection = getRelocatedSection();
136 
137   for (const RelTy &Rel : Rels) {
138     uint32_t SymIndex = Rel.getSymbol(Config->Mips64EL);
139     uint32_t Type = Rel.getType(Config->Mips64EL);
140     SymbolBody &Body = this->File->getSymbolBody(SymIndex).repl();
141 
142     RelTy *P = reinterpret_cast<RelTy *>(Buf);
143     Buf += sizeof(RelTy);
144 
145     P->r_offset = RelocatedSection->getOffset(Rel.r_offset);
146     P->setSymbolAndType(Body.DynsymIndex, Type, Config->Mips64EL);
147   }
148 }
149 
// Returns Page(Expr), the page address of Expr, which the AArch64 relocation
// model defines as Expr with its low 12 bits cleared (Expr & ~0xFFF). The
// 4 KiB granule is fixed by that definition and does not depend on the page
// size the platform actually uses.
static uint64_t getAArch64Page(uint64_t Expr) {
  const uint64_t InPageBits = 0xFFF;
  return Expr - (Expr & InPageBits);
}
156 
157 template <class ELFT>
158 static typename ELFT::uint
159 getSymVA(uint32_t Type, typename ELFT::uint A, typename ELFT::uint P,
160          const SymbolBody &Body, uint8_t *BufLoc,
161          const elf::ObjectFile<ELFT> &File, RelExpr Expr) {
162   switch (Expr) {
163   case R_TLSLD:
164     return Out<ELFT>::Got->getTlsIndexVA() + A;
165   case R_TLSLD_PC:
166     return Out<ELFT>::Got->getTlsIndexVA() + A - P;
167   case R_THUNK:
168     return Body.getThunkVA<ELFT>();
169   case R_PPC_TOC:
170     return getPPC64TocBase() + A;
171   case R_TLSGD:
172     return Out<ELFT>::Got->getGlobalDynAddr(Body) + A;
173   case R_TLSGD_PC:
174     return Out<ELFT>::Got->getGlobalDynAddr(Body) + A - P;
175   case R_PLT:
176     return Body.getPltVA<ELFT>() + A;
177   case R_PLT_PC:
178   case R_PPC_PLT_OPD:
179     return Body.getPltVA<ELFT>() + A - P;
180   case R_SIZE:
181     return Body.getSize<ELFT>() + A;
182   case R_GOT:
183   case R_RELAX_TLS_GD_TO_IE:
184     return Body.getGotVA<ELFT>() + A;
185   case R_GOT_PAGE_PC:
186     return getAArch64Page(Body.getGotVA<ELFT>() + A) - getAArch64Page(P);
187   case R_GOT_PC:
188   case R_RELAX_TLS_GD_TO_IE_PC:
189     return Body.getGotVA<ELFT>() + A - P;
190   case R_ABS:
191   case R_RELAX_TLS_GD_TO_LE:
192   case R_RELAX_TLS_IE_TO_LE:
193   case R_RELAX_TLS_LD_TO_LE:
194     return Body.getVA<ELFT>(A);
195   case R_MIPS_GP0:
196     // We need to adjust SymVA value in case of R_MIPS_GPREL16/32
197     // relocations because they use the following expression to calculate
198     // the relocation's result for local symbol: S + A + GP0 - G.
199     return Body.getVA<ELFT>(A) + File.getMipsGp0();
200   case R_MIPS_GOT_LOCAL:
201     // If relocation against MIPS local symbol requires GOT entry, this entry
202     // should be initialized by 'page address'. This address is high 16-bits
203     // of sum the symbol's value and the addend.
204     return Out<ELFT>::Got->getMipsLocalPageAddr(Body.getVA<ELFT>(A));
205   case R_MIPS_GOT:
206     // For non-local symbols GOT entries should contain their full
207     // addresses. But if such symbol cannot be preempted, we do not
208     // have to put them into the "global" part of GOT and use dynamic
209     // linker to determine their actual addresses. That is why we
210     // create GOT entries for them in the "local" part of GOT.
211     return Out<ELFT>::Got->getMipsLocalEntryAddr(Body.getVA<ELFT>(A));
212   case R_PPC_OPD: {
213     uint64_t SymVA = Body.getVA<ELFT>(A);
214     // If we have an undefined weak symbol, we might get here with a symbol
215     // address of zero. That could overflow, but the code must be unreachable,
216     // so don't bother doing anything at all.
217     if (!SymVA)
218       return 0;
219     if (Out<ELF64BE>::Opd) {
220       // If this is a local call, and we currently have the address of a
221       // function-descriptor, get the underlying code address instead.
222       uint64_t OpdStart = Out<ELF64BE>::Opd->getVA();
223       uint64_t OpdEnd = OpdStart + Out<ELF64BE>::Opd->getSize();
224       bool InOpd = OpdStart <= SymVA && SymVA < OpdEnd;
225       if (InOpd)
226         SymVA = read64be(&Out<ELF64BE>::OpdBuf[SymVA - OpdStart]);
227     }
228     return SymVA - P;
229   }
230   case R_PC:
231     return Body.getVA<ELFT>(A) - P;
232   case R_PAGE_PC:
233     return getAArch64Page(Body.getVA<ELFT>(A)) - getAArch64Page(P);
234   }
235   llvm_unreachable("Invalid expression");
236 }
237 
238 template <class ELFT>
239 void InputSectionBase<ELFT>::relocate(uint8_t *Buf, uint8_t *BufEnd) {
240   const unsigned Bits = sizeof(uintX_t) * 8;
241   for (const Relocation &Rel : Relocations) {
242     uintX_t Offset = Rel.Offset;
243     uint8_t *BufLoc = Buf + Offset;
244     uint32_t Type = Rel.Type;
245     uintX_t A = Rel.Addend;
246 
247     uintX_t AddrLoc = OutSec->getVA() + Offset;
248     RelExpr Expr = Rel.Expr;
249     uint64_t SymVA = SignExtend64<Bits>(
250         getSymVA<ELFT>(Type, A, AddrLoc, *Rel.Sym, BufLoc, *File, Expr));
251 
252     if (Expr == R_RELAX_TLS_IE_TO_LE) {
253       Target->relaxTlsIeToLe(BufLoc, Type, SymVA);
254       continue;
255     }
256     if (Expr == R_RELAX_TLS_LD_TO_LE) {
257       Target->relaxTlsLdToLe(BufLoc, Type, SymVA);
258       continue;
259     }
260     if (Expr == R_RELAX_TLS_GD_TO_LE) {
261       Target->relaxTlsGdToLe(BufLoc, Type, SymVA);
262       continue;
263     }
264     if (Expr == R_RELAX_TLS_GD_TO_IE_PC || Expr == R_RELAX_TLS_GD_TO_IE) {
265       Target->relaxTlsGdToIe(BufLoc, Type, SymVA);
266       continue;
267     }
268 
269     if (Expr == R_PPC_PLT_OPD) {
270       uint32_t Nop = 0x60000000;
271       if (BufLoc + 8 <= BufEnd && read32be(BufLoc + 4) == Nop)
272         write32be(BufLoc + 4, 0xe8410028); // ld %r2, 40(%r1)
273     }
274 
275     Target->relocateOne(BufLoc, Type, SymVA);
276   }
277 }
278 
279 template <class ELFT> void InputSection<ELFT>::writeTo(uint8_t *Buf) {
280   if (this->Header->sh_type == SHT_NOBITS)
281     return;
282   ELFFile<ELFT> &EObj = this->File->getObj();
283 
284   // If -r is given, then an InputSection may be a relocation section.
285   if (this->Header->sh_type == SHT_RELA) {
286     copyRelocations(Buf + OutSecOff, EObj.relas(this->Header));
287     return;
288   }
289   if (this->Header->sh_type == SHT_REL) {
290     copyRelocations(Buf + OutSecOff, EObj.rels(this->Header));
291     return;
292   }
293 
294   // Copy section contents from source object file to output file.
295   ArrayRef<uint8_t> Data = this->getSectionData();
296   memcpy(Buf + OutSecOff, Data.data(), Data.size());
297 
298   // Iterate over all relocation sections that apply to this section.
299   uint8_t *BufEnd = Buf + OutSecOff + Data.size();
300   this->relocate(Buf, BufEnd);
301 
302   // The section might have a data/code generated by the linker and need
303   // to be written after the section. Usually these are thunks - small piece
304   // of code used to jump between "incompatible" functions like PIC and non-PIC
305   // or if the jump target too far and its address does not fit to the short
306   // jump istruction.
307   if (!Thunks.empty()) {
308     Buf += OutSecOff + getThunkOff();
309     for (const SymbolBody *S : Thunks) {
310       Target->writeThunk(Buf, S->getVA<ELFT>());
311       Buf += Target->ThunkSize;
312     }
313   }
314 }
315 
316 template <class ELFT>
317 void InputSection<ELFT>::replace(InputSection<ELFT> *Other) {
318   this->Align = std::max(this->Align, Other->Align);
319   Other->Repl = this->Repl;
320   Other->Live = false;
321 }
322 
// Constructs the common base of the section kinds that use getRangeAndSize()
// (EHInputSection and MergeInputSection). All arguments are forwarded
// unchanged to the InputSectionBase constructor.
template <class ELFT>
SplitInputSection<ELFT>::SplitInputSection(
    elf::ObjectFile<ELFT> *File, const Elf_Shdr *Header,
    typename InputSectionBase<ELFT>::Kind SectionKind)
    : InputSectionBase<ELFT>(File, Header, SectionKind) {}
328 
// Constructs an .eh_frame input section for section header Header of file F.
// The section is registered with kind EHFrame and is unconditionally live,
// overriding the default chosen by the InputSectionBase constructor.
template <class ELFT>
EHInputSection<ELFT>::EHInputSection(elf::ObjectFile<ELFT> *F,
                                     const Elf_Shdr *Header)
    : SplitInputSection<ELFT>(F, Header, InputSectionBase<ELFT>::EHFrame) {
  // Mark .eh_frame sections as live by default because there are
  // usually no relocations that point to .eh_frames. Otherwise,
  // the garbage collector would drop all .eh_frame sections.
  this->Live = true;
}
338 
339 template <class ELFT>
340 bool EHInputSection<ELFT>::classof(const InputSectionBase<ELFT> *S) {
341   return S->SectionKind == InputSectionBase<ELFT>::EHFrame;
342 }
343 
344 template <class ELFT>
345 typename ELFT::uint EHInputSection<ELFT>::getOffset(uintX_t Offset) {
346   // The file crtbeginT.o has relocations pointing to the start of an empty
347   // .eh_frame that is known to be the first in the link. It does that to
348   // identify the start of the output .eh_frame. Handle this special case.
349   if (this->getSectionHdr()->sh_size == 0)
350     return Offset;
351   std::pair<uintX_t, uintX_t> *I = this->getRangeAndSize(Offset).first;
352   uintX_t Base = I->second;
353   if (Base == uintX_t(-1))
354     return -1; // Not in the output
355 
356   uintX_t Addend = Offset - I->first;
357   return Base + Addend;
358 }
359 
// Constructs a mergeable input section for section header Header of file F.
// All state is set up by the SplitInputSection constructor, which is told
// that this section is of kind Merge.
template <class ELFT>
MergeInputSection<ELFT>::MergeInputSection(elf::ObjectFile<ELFT> *F,
                                           const Elf_Shdr *Header)
    : SplitInputSection<ELFT>(F, Header, InputSectionBase<ELFT>::Merge) {}
364 
365 template <class ELFT>
366 bool MergeInputSection<ELFT>::classof(const InputSectionBase<ELFT> *S) {
367   return S->SectionKind == InputSectionBase<ELFT>::Merge;
368 }
369 
370 template <class ELFT>
371 std::pair<std::pair<typename ELFT::uint, typename ELFT::uint> *,
372           typename ELFT::uint>
373 SplitInputSection<ELFT>::getRangeAndSize(uintX_t Offset) {
374   ArrayRef<uint8_t> D = this->getSectionData();
375   StringRef Data((const char *)D.data(), D.size());
376   uintX_t Size = Data.size();
377   if (Offset >= Size)
378     fatal("entry is past the end of the section");
379 
380   // Find the element this offset points to.
381   auto I = std::upper_bound(
382       Offsets.begin(), Offsets.end(), Offset,
383       [](const uintX_t &A, const std::pair<uintX_t, uintX_t> &B) {
384         return A < B.first;
385       });
386   uintX_t End = I == Offsets.end() ? Data.size() : I->first;
387   --I;
388   return std::make_pair(&*I, End);
389 }
390 
391 template <class ELFT>
392 typename ELFT::uint MergeInputSection<ELFT>::getOffset(uintX_t Offset) {
393   std::pair<std::pair<uintX_t, uintX_t> *, uintX_t> T =
394       this->getRangeAndSize(Offset);
395   std::pair<uintX_t, uintX_t> *I = T.first;
396   uintX_t End = T.second;
397   uintX_t Start = I->first;
398 
399   // Compute the Addend and if the Base is cached, return.
400   uintX_t Addend = Offset - Start;
401   uintX_t &Base = I->second;
402   if (Base != uintX_t(-1))
403     return Base + Addend;
404 
405   // Map the base to the offset in the output section and cache it.
406   ArrayRef<uint8_t> D = this->getSectionData();
407   StringRef Data((const char *)D.data(), D.size());
408   StringRef Entry = Data.substr(Start, End - Start);
409   Base =
410       static_cast<MergeOutputSection<ELFT> *>(this->OutSec)->getOffset(Entry);
411   return Base + Addend;
412 }
413 
414 template <class ELFT>
415 MipsReginfoInputSection<ELFT>::MipsReginfoInputSection(elf::ObjectFile<ELFT> *F,
416                                                        const Elf_Shdr *Hdr)
417     : InputSectionBase<ELFT>(F, Hdr, InputSectionBase<ELFT>::MipsReginfo) {
418   // Initialize this->Reginfo.
419   ArrayRef<uint8_t> D = this->getSectionData();
420   if (D.size() != sizeof(Elf_Mips_RegInfo<ELFT>))
421     fatal("invalid size of .reginfo section");
422   Reginfo = reinterpret_cast<const Elf_Mips_RegInfo<ELFT> *>(D.data());
423 }
424 
425 template <class ELFT>
426 bool MipsReginfoInputSection<ELFT>::classof(const InputSectionBase<ELFT> *S) {
427   return S->SectionKind == InputSectionBase<ELFT>::MipsReginfo;
428 }
429 
// Explicit instantiations. The member functions above are defined in this
// file rather than in the header, so each section class is instantiated here
// for all four ELF flavours (32/64-bit, little/big-endian).
template class elf::InputSectionBase<ELF32LE>;
template class elf::InputSectionBase<ELF32BE>;
template class elf::InputSectionBase<ELF64LE>;
template class elf::InputSectionBase<ELF64BE>;

template class elf::InputSection<ELF32LE>;
template class elf::InputSection<ELF32BE>;
template class elf::InputSection<ELF64LE>;
template class elf::InputSection<ELF64BE>;

template class elf::EHInputSection<ELF32LE>;
template class elf::EHInputSection<ELF32BE>;
template class elf::EHInputSection<ELF64LE>;
template class elf::EHInputSection<ELF64BE>;

template class elf::MergeInputSection<ELF32LE>;
template class elf::MergeInputSection<ELF32BE>;
template class elf::MergeInputSection<ELF64LE>;
template class elf::MergeInputSection<ELF64BE>;

template class elf::MipsReginfoInputSection<ELF32LE>;
template class elf::MipsReginfoInputSection<ELF32BE>;
template class elf::MipsReginfoInputSection<ELF64LE>;
template class elf::MipsReginfoInputSection<ELF64BE>;
454