1 //===- Writer.cpp ---------------------------------------------------------===// 2 // 3 // The LLVM Linker 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 10 #include "Writer.h" 11 #include "Config.h" 12 #include "LinkerScript.h" 13 #include "OutputSections.h" 14 #include "Relocations.h" 15 #include "SymbolTable.h" 16 #include "Target.h" 17 18 #include "llvm/ADT/StringMap.h" 19 #include "llvm/ADT/StringSwitch.h" 20 #include "llvm/Support/FileOutputBuffer.h" 21 #include "llvm/Support/StringSaver.h" 22 #include "llvm/Support/raw_ostream.h" 23 24 using namespace llvm; 25 using namespace llvm::ELF; 26 using namespace llvm::object; 27 28 using namespace lld; 29 using namespace lld::elf; 30 31 namespace { 32 // The writer writes a SymbolTable result to a file. 33 template <class ELFT> class Writer { 34 public: 35 typedef typename ELFT::uint uintX_t; 36 typedef typename ELFT::Shdr Elf_Shdr; 37 typedef typename ELFT::Ehdr Elf_Ehdr; 38 typedef typename ELFT::Phdr Elf_Phdr; 39 typedef typename ELFT::Sym Elf_Sym; 40 typedef typename ELFT::SymRange Elf_Sym_Range; 41 typedef typename ELFT::Rela Elf_Rela; 42 Writer(SymbolTable<ELFT> &S) : Symtab(S) {} 43 void run(); 44 45 private: 46 // This describes a program header entry. 47 // Each contains type, access flags and range of output sections that will be 48 // placed in it. 49 struct Phdr { 50 Phdr(unsigned Type, unsigned Flags) { 51 H.p_type = Type; 52 H.p_flags = Flags; 53 } 54 Elf_Phdr H = {}; 55 OutputSectionBase<ELFT> *First = nullptr; 56 OutputSectionBase<ELFT> *Last = nullptr; 57 }; 58 59 void copyLocalSymbols(); 60 void addReservedSymbols(); 61 void createSections(); 62 void addPredefinedSections(); 63 bool needsGot(); 64 65 void createPhdrs(); 66 void assignAddresses(); 67 void assignFileOffsets(); 68 void setPhdrs(); 69 void fixHeaders(); 70 void fixSectionAlignments(); 71 void fixAbsoluteSymbols(); 72 void openFile(); 73 void writeHeader(); 74 void writeSections(); 75 void writeBuildId(); 76 bool isDiscarded(InputSectionBase<ELFT> *IS) const; 77 StringRef getOutputSectionName(InputSectionBase<ELFT> *S) const; 78 bool needsInterpSection() const { 79 return !Symtab.getSharedFiles().empty() && !Config->DynamicLinker.empty(); 80 } 81 bool isOutputDynamic() const { 82 return !Symtab.getSharedFiles().empty() || Config->Pic; 83 } 84 85 void addCommonSymbols(std::vector<DefinedCommon *> &Syms); 86 87 std::unique_ptr<llvm::FileOutputBuffer> Buffer; 88 89 BumpPtrAllocator Alloc; 90 std::vector<OutputSectionBase<ELFT> *> OutputSections; 91 std::vector<std::unique_ptr<OutputSectionBase<ELFT>>> OwningSections; 92 93 void addRelIpltSymbols(); 94 void addStartEndSymbols(); 95 void addStartStopSymbols(OutputSectionBase<ELFT> *Sec); 96 97 SymbolTable<ELFT> &Symtab; 98 std::vector<Phdr> Phdrs; 99 100 uintX_t FileSize; 101 uintX_t SectionHeaderOff; 102 }; 103 } // anonymous namespace 104 105 template <class ELFT> void elf::writeResult(SymbolTable<ELFT> *Symtab) { 106 typedef typename ELFT::uint uintX_t; 107 typedef typename ELFT::Ehdr Elf_Ehdr; 108 109 // Create singleton output sections. 110 OutputSection<ELFT> Bss(".bss", SHT_NOBITS, SHF_ALLOC | SHF_WRITE); 111 DynamicSection<ELFT> Dynamic; 112 EhOutputSection<ELFT> EhFrame; 113 GotSection<ELFT> Got; 114 InterpSection<ELFT> Interp; 115 PltSection<ELFT> Plt; 116 RelocationSection<ELFT> RelaDyn(Config->Rela ? ".rela.dyn" : ".rel.dyn", 117 Config->ZCombreloc); 118 StringTableSection<ELFT> DynStrTab(".dynstr", true); 119 StringTableSection<ELFT> ShStrTab(".shstrtab", false); 120 SymbolTableSection<ELFT> DynSymTab(DynStrTab); 121 VersionTableSection<ELFT> VerSym; 122 VersionNeedSection<ELFT> VerNeed; 123 124 OutputSectionBase<ELFT> ElfHeader("", 0, SHF_ALLOC); 125 ElfHeader.setSize(sizeof(Elf_Ehdr)); 126 OutputSectionBase<ELFT> ProgramHeaders("", 0, SHF_ALLOC); 127 ProgramHeaders.updateAlign(sizeof(uintX_t)); 128 129 // Instantiate optional output sections if they are needed. 130 std::unique_ptr<BuildIdSection<ELFT>> BuildId; 131 std::unique_ptr<EhFrameHeader<ELFT>> EhFrameHdr; 132 std::unique_ptr<GnuHashTableSection<ELFT>> GnuHashTab; 133 std::unique_ptr<GotPltSection<ELFT>> GotPlt; 134 std::unique_ptr<HashTableSection<ELFT>> HashTab; 135 std::unique_ptr<RelocationSection<ELFT>> RelaPlt; 136 std::unique_ptr<StringTableSection<ELFT>> StrTab; 137 std::unique_ptr<SymbolTableSection<ELFT>> SymTabSec; 138 std::unique_ptr<OutputSection<ELFT>> MipsRldMap; 139 140 if (Config->BuildId == BuildIdKind::Fnv1) 141 BuildId.reset(new BuildIdFnv1<ELFT>); 142 else if (Config->BuildId == BuildIdKind::Md5) 143 BuildId.reset(new BuildIdMd5<ELFT>); 144 else if (Config->BuildId == BuildIdKind::Sha1) 145 BuildId.reset(new BuildIdSha1<ELFT>); 146 else if (Config->BuildId == BuildIdKind::Hexstring) 147 BuildId.reset(new BuildIdHexstring<ELFT>); 148 149 if (Config->EhFrameHdr) 150 EhFrameHdr.reset(new EhFrameHeader<ELFT>); 151 152 if (Config->GnuHash) 153 GnuHashTab.reset(new GnuHashTableSection<ELFT>); 154 if (Config->SysvHash) 155 HashTab.reset(new HashTableSection<ELFT>); 156 StringRef S = Config->Rela ? ".rela.plt" : ".rel.plt"; 157 GotPlt.reset(new GotPltSection<ELFT>); 158 RelaPlt.reset(new RelocationSection<ELFT>(S, false /*Sort*/)); 159 if (!Config->StripAll) { 160 StrTab.reset(new StringTableSection<ELFT>(".strtab", false)); 161 SymTabSec.reset(new SymbolTableSection<ELFT>(*StrTab)); 162 } 163 if (Config->EMachine == EM_MIPS && !Config->Shared) { 164 // This is a MIPS specific section to hold a space within the data segment 165 // of executable file which is pointed to by the DT_MIPS_RLD_MAP entry. 166 // See "Dynamic section" in Chapter 5 in the following document: 167 // ftp://www.linux-mips.org/pub/linux/mips/doc/ABI/mipsabi.pdf 168 MipsRldMap.reset(new OutputSection<ELFT>(".rld_map", SHT_PROGBITS, 169 SHF_ALLOC | SHF_WRITE)); 170 MipsRldMap->setSize(sizeof(uintX_t)); 171 MipsRldMap->updateAlign(sizeof(uintX_t)); 172 } 173 174 Out<ELFT>::Bss = &Bss; 175 Out<ELFT>::BuildId = BuildId.get(); 176 Out<ELFT>::DynStrTab = &DynStrTab; 177 Out<ELFT>::DynSymTab = &DynSymTab; 178 Out<ELFT>::Dynamic = &Dynamic; 179 Out<ELFT>::EhFrame = &EhFrame; 180 Out<ELFT>::EhFrameHdr = EhFrameHdr.get(); 181 Out<ELFT>::GnuHashTab = GnuHashTab.get(); 182 Out<ELFT>::Got = &Got; 183 Out<ELFT>::GotPlt = GotPlt.get(); 184 Out<ELFT>::HashTab = HashTab.get(); 185 Out<ELFT>::Interp = &Interp; 186 Out<ELFT>::Plt = &Plt; 187 Out<ELFT>::RelaDyn = &RelaDyn; 188 Out<ELFT>::RelaPlt = RelaPlt.get(); 189 Out<ELFT>::ShStrTab = &ShStrTab; 190 Out<ELFT>::StrTab = StrTab.get(); 191 Out<ELFT>::SymTab = SymTabSec.get(); 192 Out<ELFT>::VerSym = &VerSym; 193 Out<ELFT>::VerNeed = &VerNeed; 194 Out<ELFT>::MipsRldMap = MipsRldMap.get(); 195 Out<ELFT>::Opd = nullptr; 196 Out<ELFT>::OpdBuf = nullptr; 197 Out<ELFT>::TlsPhdr = nullptr; 198 Out<ELFT>::ElfHeader = &ElfHeader; 199 Out<ELFT>::ProgramHeaders = &ProgramHeaders; 200 201 Writer<ELFT>(*Symtab).run(); 202 } 203 204 // The main function of the writer. 205 template <class ELFT> void Writer<ELFT>::run() { 206 if (!Config->DiscardAll) 207 copyLocalSymbols(); 208 addReservedSymbols(); 209 createSections(); 210 if (HasError) 211 return; 212 213 if (Config->Relocatable) { 214 assignFileOffsets(); 215 } else { 216 createPhdrs(); 217 fixHeaders(); 218 if (ScriptConfig->DoLayout) { 219 Script<ELFT>::X->assignAddresses(OutputSections); 220 } else { 221 fixSectionAlignments(); 222 assignAddresses(); 223 } 224 assignFileOffsets(); 225 setPhdrs(); 226 fixAbsoluteSymbols(); 227 } 228 229 openFile(); 230 if (HasError) 231 return; 232 writeHeader(); 233 writeSections(); 234 writeBuildId(); 235 if (HasError) 236 return; 237 check(Buffer->commit()); 238 } 239 240 namespace { 241 template <bool Is64Bits> struct SectionKey { 242 typedef typename std::conditional<Is64Bits, uint64_t, uint32_t>::type uintX_t; 243 StringRef Name; 244 uint32_t Type; 245 uintX_t Flags; 246 uintX_t Alignment; 247 }; 248 } 249 namespace llvm { 250 template <bool Is64Bits> struct DenseMapInfo<SectionKey<Is64Bits>> { 251 static SectionKey<Is64Bits> getEmptyKey() { 252 return SectionKey<Is64Bits>{DenseMapInfo<StringRef>::getEmptyKey(), 0, 0, 253 0}; 254 } 255 static SectionKey<Is64Bits> getTombstoneKey() { 256 return SectionKey<Is64Bits>{DenseMapInfo<StringRef>::getTombstoneKey(), 0, 257 0, 0}; 258 } 259 static unsigned getHashValue(const SectionKey<Is64Bits> &Val) { 260 return hash_combine(Val.Name, Val.Type, Val.Flags, Val.Alignment); 261 } 262 static bool isEqual(const SectionKey<Is64Bits> &LHS, 263 const SectionKey<Is64Bits> &RHS) { 264 return DenseMapInfo<StringRef>::isEqual(LHS.Name, RHS.Name) && 265 LHS.Type == RHS.Type && LHS.Flags == RHS.Flags && 266 LHS.Alignment == RHS.Alignment; 267 } 268 }; 269 } 270 271 template <class ELFT> 272 static void reportUndefined(SymbolTable<ELFT> &Symtab, SymbolBody *Sym) { 273 if (!Config->NoUndefined) { 274 if (Config->Relocatable) 275 return; 276 if (Config->Shared && !Config->ZDefs) 277 if (Sym->symbol()->Visibility == STV_DEFAULT) 278 return; 279 } 280 281 std::string Msg = "undefined symbol: " + Sym->getName().str(); 282 if (InputFile *File = Sym->getSourceFile<ELFT>()) 283 Msg += " in " + getFilename(File); 284 if (Config->NoinhibitExec) 285 warning(Msg); 286 else 287 error(Msg); 288 } 289 290 template <class ELFT> 291 static bool shouldKeepInSymtab(InputSectionBase<ELFT> *Sec, StringRef SymName, 292 const SymbolBody &B) { 293 if (B.isFile()) 294 return false; 295 296 // We keep sections in symtab for relocatable output. 297 if (B.isSection()) 298 return Config->Relocatable; 299 300 // If sym references a section in a discarded group, don't keep it. 301 if (Sec == &InputSection<ELFT>::Discarded) 302 return false; 303 304 if (Config->DiscardNone) 305 return true; 306 307 // In ELF assembly .L symbols are normally discarded by the assembler. 308 // If the assembler fails to do so, the linker discards them if 309 // * --discard-locals is used. 310 // * The symbol is in a SHF_MERGE section, which is normally the reason for 311 // the assembler keeping the .L symbol. 312 if (!SymName.startswith(".L") && !SymName.empty()) 313 return true; 314 315 if (Config->DiscardLocals) 316 return false; 317 318 return !(Sec->getSectionHdr()->sh_flags & SHF_MERGE); 319 } 320 321 template <class ELFT> static bool includeInSymtab(const SymbolBody &B) { 322 if (!B.isLocal() && !B.symbol()->IsUsedInRegularObj) 323 return false; 324 325 if (auto *D = dyn_cast<DefinedRegular<ELFT>>(&B)) { 326 // Always include absolute symbols. 327 if (!D->Section) 328 return true; 329 // Exclude symbols pointing to garbage-collected sections. 330 if (!D->Section->Live) 331 return false; 332 if (auto *S = dyn_cast<MergeInputSection<ELFT>>(D->Section)) 333 if (!S->getSectionPiece(D->Value)->Live) 334 return false; 335 } 336 return true; 337 } 338 339 // Local symbols are not in the linker's symbol table. This function scans 340 // each object file's symbol table to copy local symbols to the output. 341 template <class ELFT> void Writer<ELFT>::copyLocalSymbols() { 342 if (!Out<ELFT>::SymTab) 343 return; 344 for (const std::unique_ptr<elf::ObjectFile<ELFT>> &F : 345 Symtab.getObjectFiles()) { 346 const char *StrTab = F->getStringTable().data(); 347 for (SymbolBody *B : F->getLocalSymbols()) { 348 auto *DR = dyn_cast<DefinedRegular<ELFT>>(B); 349 // No reason to keep local undefined symbol in symtab. 350 if (!DR) 351 continue; 352 if (!includeInSymtab<ELFT>(*B)) 353 continue; 354 StringRef SymName(StrTab + B->getNameOffset()); 355 InputSectionBase<ELFT> *Sec = DR->Section; 356 if (!shouldKeepInSymtab<ELFT>(Sec, SymName, *B)) 357 continue; 358 ++Out<ELFT>::SymTab->NumLocals; 359 if (Config->Relocatable) 360 B->DynsymIndex = Out<ELFT>::SymTab->NumLocals; 361 F->KeptLocalSyms.push_back( 362 std::make_pair(DR, Out<ELFT>::SymTab->StrTabSec.addString(SymName))); 363 } 364 } 365 } 366 367 // PPC64 has a number of special SHT_PROGBITS+SHF_ALLOC+SHF_WRITE sections that 368 // we would like to make sure appear is a specific order to maximize their 369 // coverage by a single signed 16-bit offset from the TOC base pointer. 370 // Conversely, the special .tocbss section should be first among all SHT_NOBITS 371 // sections. This will put it next to the loaded special PPC64 sections (and, 372 // thus, within reach of the TOC base pointer). 373 static int getPPC64SectionRank(StringRef SectionName) { 374 return StringSwitch<int>(SectionName) 375 .Case(".tocbss", 0) 376 .Case(".branch_lt", 2) 377 .Case(".toc", 3) 378 .Case(".toc1", 4) 379 .Case(".opd", 5) 380 .Default(1); 381 } 382 383 template <class ELFT> static bool isRelroSection(OutputSectionBase<ELFT> *Sec) { 384 if (!Config->ZRelro) 385 return false; 386 typename ELFT::uint Flags = Sec->getFlags(); 387 if (!(Flags & SHF_ALLOC) || !(Flags & SHF_WRITE)) 388 return false; 389 if (Flags & SHF_TLS) 390 return true; 391 uint32_t Type = Sec->getType(); 392 if (Type == SHT_INIT_ARRAY || Type == SHT_FINI_ARRAY || 393 Type == SHT_PREINIT_ARRAY) 394 return true; 395 if (Sec == Out<ELFT>::GotPlt) 396 return Config->ZNow; 397 if (Sec == Out<ELFT>::Dynamic || Sec == Out<ELFT>::Got) 398 return true; 399 StringRef S = Sec->getName(); 400 return S == ".data.rel.ro" || S == ".ctors" || S == ".dtors" || S == ".jcr" || 401 S == ".eh_frame"; 402 } 403 404 // Output section ordering is determined by this function. 405 template <class ELFT> 406 static bool compareSections(OutputSectionBase<ELFT> *A, 407 OutputSectionBase<ELFT> *B) { 408 typedef typename ELFT::uint uintX_t; 409 410 int Comp = Script<ELFT>::X->compareSections(A->getName(), B->getName()); 411 if (Comp != 0) 412 return Comp < 0; 413 414 uintX_t AFlags = A->getFlags(); 415 uintX_t BFlags = B->getFlags(); 416 417 // Allocatable sections go first to reduce the total PT_LOAD size and 418 // so debug info doesn't change addresses in actual code. 419 bool AIsAlloc = AFlags & SHF_ALLOC; 420 bool BIsAlloc = BFlags & SHF_ALLOC; 421 if (AIsAlloc != BIsAlloc) 422 return AIsAlloc; 423 424 // We don't have any special requirements for the relative order of 425 // two non allocatable sections. 426 if (!AIsAlloc) 427 return false; 428 429 // We want the read only sections first so that they go in the PT_LOAD 430 // covering the program headers at the start of the file. 431 bool AIsWritable = AFlags & SHF_WRITE; 432 bool BIsWritable = BFlags & SHF_WRITE; 433 if (AIsWritable != BIsWritable) 434 return BIsWritable; 435 436 // For a corresponding reason, put non exec sections first (the program 437 // header PT_LOAD is not executable). 438 bool AIsExec = AFlags & SHF_EXECINSTR; 439 bool BIsExec = BFlags & SHF_EXECINSTR; 440 if (AIsExec != BIsExec) 441 return BIsExec; 442 443 // If we got here we know that both A and B are in the same PT_LOAD. 444 445 // The TLS initialization block needs to be a single contiguous block in a R/W 446 // PT_LOAD, so stick TLS sections directly before R/W sections. The TLS NOBITS 447 // sections are placed here as they don't take up virtual address space in the 448 // PT_LOAD. 449 bool AIsTls = AFlags & SHF_TLS; 450 bool BIsTls = BFlags & SHF_TLS; 451 if (AIsTls != BIsTls) 452 return AIsTls; 453 454 // The next requirement we have is to put nobits sections last. The 455 // reason is that the only thing the dynamic linker will see about 456 // them is a p_memsz that is larger than p_filesz. Seeing that it 457 // zeros the end of the PT_LOAD, so that has to correspond to the 458 // nobits sections. 459 bool AIsNoBits = A->getType() == SHT_NOBITS; 460 bool BIsNoBits = B->getType() == SHT_NOBITS; 461 if (AIsNoBits != BIsNoBits) 462 return BIsNoBits; 463 464 // We place RelRo section before plain r/w ones. 465 bool AIsRelRo = isRelroSection(A); 466 bool BIsRelRo = isRelroSection(B); 467 if (AIsRelRo != BIsRelRo) 468 return AIsRelRo; 469 470 // Some architectures have additional ordering restrictions for sections 471 // within the same PT_LOAD. 472 if (Config->EMachine == EM_PPC64) 473 return getPPC64SectionRank(A->getName()) < 474 getPPC64SectionRank(B->getName()); 475 476 return false; 477 } 478 479 // Until this function is called, common symbols do not belong to any section. 480 // This function adds them to end of BSS section. 481 template <class ELFT> 482 void Writer<ELFT>::addCommonSymbols(std::vector<DefinedCommon *> &Syms) { 483 if (Syms.empty()) 484 return; 485 486 // Sort the common symbols by alignment as an heuristic to pack them better. 487 std::stable_sort(Syms.begin(), Syms.end(), 488 [](const DefinedCommon *A, const DefinedCommon *B) { 489 return A->Alignment > B->Alignment; 490 }); 491 492 uintX_t Off = Out<ELFT>::Bss->getSize(); 493 for (DefinedCommon *C : Syms) { 494 Off = alignTo(Off, C->Alignment); 495 Out<ELFT>::Bss->updateAlign(C->Alignment); 496 C->OffsetInBss = Off; 497 Off += C->Size; 498 } 499 500 Out<ELFT>::Bss->setSize(Off); 501 } 502 503 template <class ELFT> 504 StringRef Writer<ELFT>::getOutputSectionName(InputSectionBase<ELFT> *S) const { 505 StringRef Dest = Script<ELFT>::X->getOutputSection(S); 506 if (!Dest.empty()) 507 return Dest; 508 509 StringRef Name = S->getSectionName(); 510 for (StringRef V : {".text.", ".rodata.", ".data.rel.ro.", ".data.", ".bss.", 511 ".init_array.", ".fini_array.", ".ctors.", ".dtors.", 512 ".tbss.", ".gcc_except_table.", ".tdata."}) 513 if (Name.startswith(V)) 514 return V.drop_back(); 515 return Name; 516 } 517 518 template <class ELFT> 519 void reportDiscarded(InputSectionBase<ELFT> *IS, 520 const std::unique_ptr<elf::ObjectFile<ELFT>> &File) { 521 if (!Config->PrintGcSections || !IS || IS->Live) 522 return; 523 llvm::errs() << "removing unused section from '" << IS->getSectionName() 524 << "' in file '" << File->getName() << "'\n"; 525 } 526 527 template <class ELFT> 528 bool Writer<ELFT>::isDiscarded(InputSectionBase<ELFT> *S) const { 529 return !S || S == &InputSection<ELFT>::Discarded || !S->Live || 530 Script<ELFT>::X->isDiscarded(S); 531 } 532 533 template <class ELFT> 534 static Symbol *addOptionalSynthetic(SymbolTable<ELFT> &Table, StringRef Name, 535 OutputSectionBase<ELFT> *Sec, 536 typename ELFT::uint Val) { 537 SymbolBody *S = Table.find(Name); 538 if (!S) 539 return nullptr; 540 if (!S->isUndefined() && !S->isShared()) 541 return S->symbol(); 542 return Table.addSynthetic(Name, Sec, Val); 543 } 544 545 // The beginning and the ending of .rel[a].plt section are marked 546 // with __rel[a]_iplt_{start,end} symbols if it is a statically linked 547 // executable. The runtime needs these symbols in order to resolve 548 // all IRELATIVE relocs on startup. For dynamic executables, we don't 549 // need these symbols, since IRELATIVE relocs are resolved through GOT 550 // and PLT. For details, see http://www.airs.com/blog/archives/403. 551 template <class ELFT> void Writer<ELFT>::addRelIpltSymbols() { 552 if (isOutputDynamic() || !Out<ELFT>::RelaPlt) 553 return; 554 StringRef S = Config->Rela ? "__rela_iplt_start" : "__rel_iplt_start"; 555 addOptionalSynthetic(Symtab, S, Out<ELFT>::RelaPlt, 0); 556 557 S = Config->Rela ? "__rela_iplt_end" : "__rel_iplt_end"; 558 addOptionalSynthetic(Symtab, S, Out<ELFT>::RelaPlt, 559 DefinedSynthetic<ELFT>::SectionEnd); 560 } 561 562 // This class knows how to create an output section for a given 563 // input section. Output section type is determined by various 564 // factors, including input section's sh_flags, sh_type and 565 // linker scripts. 566 namespace { 567 template <class ELFT> class OutputSectionFactory { 568 typedef typename ELFT::Shdr Elf_Shdr; 569 typedef typename ELFT::uint uintX_t; 570 571 public: 572 std::pair<OutputSectionBase<ELFT> *, bool> create(InputSectionBase<ELFT> *C, 573 StringRef OutsecName); 574 575 OutputSectionBase<ELFT> *lookup(StringRef Name, uint32_t Type, 576 uintX_t Flags) { 577 return Map.lookup({Name, Type, Flags, 0}); 578 } 579 580 private: 581 SectionKey<ELFT::Is64Bits> createKey(InputSectionBase<ELFT> *C, 582 StringRef OutsecName); 583 584 SmallDenseMap<SectionKey<ELFT::Is64Bits>, OutputSectionBase<ELFT> *> Map; 585 }; 586 } 587 588 template <class ELFT> 589 std::pair<OutputSectionBase<ELFT> *, bool> 590 OutputSectionFactory<ELFT>::create(InputSectionBase<ELFT> *C, 591 StringRef OutsecName) { 592 SectionKey<ELFT::Is64Bits> Key = createKey(C, OutsecName); 593 OutputSectionBase<ELFT> *&Sec = Map[Key]; 594 if (Sec) 595 return {Sec, false}; 596 597 switch (C->SectionKind) { 598 case InputSectionBase<ELFT>::Regular: 599 Sec = new OutputSection<ELFT>(Key.Name, Key.Type, Key.Flags); 600 break; 601 case InputSectionBase<ELFT>::EHFrame: 602 return {Out<ELFT>::EhFrame, false}; 603 case InputSectionBase<ELFT>::Merge: 604 Sec = new MergeOutputSection<ELFT>(Key.Name, Key.Type, Key.Flags, 605 Key.Alignment); 606 break; 607 case InputSectionBase<ELFT>::MipsReginfo: 608 Sec = new MipsReginfoOutputSection<ELFT>(); 609 break; 610 case InputSectionBase<ELFT>::MipsOptions: 611 Sec = new MipsOptionsOutputSection<ELFT>(); 612 break; 613 } 614 return {Sec, true}; 615 } 616 617 template <class ELFT> 618 SectionKey<ELFT::Is64Bits> 619 OutputSectionFactory<ELFT>::createKey(InputSectionBase<ELFT> *C, 620 StringRef OutsecName) { 621 const Elf_Shdr *H = C->getSectionHdr(); 622 uintX_t Flags = H->sh_flags & ~SHF_GROUP; 623 624 // For SHF_MERGE we create different output sections for each alignment. 625 // This makes each output section simple and keeps a single level mapping from 626 // input to output. 627 uintX_t Alignment = 0; 628 if (isa<MergeInputSection<ELFT>>(C)) 629 Alignment = std::max(H->sh_addralign, H->sh_entsize); 630 631 uint32_t Type = H->sh_type; 632 return SectionKey<ELFT::Is64Bits>{OutsecName, Type, Flags, Alignment}; 633 } 634 635 // The linker is expected to define some symbols depending on 636 // the linking result. This function defines such symbols. 637 template <class ELFT> void Writer<ELFT>::addReservedSymbols() { 638 if (Config->EMachine == EM_MIPS) { 639 // Define _gp for MIPS. st_value of _gp symbol will be updated by Writer 640 // so that it points to an absolute address which is relative to GOT. 641 // See "Global Data Symbols" in Chapter 6 in the following document: 642 // ftp://www.linux-mips.org/pub/linux/mips/doc/ABI/mipsabi.pdf 643 Symtab.addSynthetic("_gp", Out<ELFT>::Got, MipsGPOffset); 644 645 // On MIPS O32 ABI, _gp_disp is a magic symbol designates offset between 646 // start of function and 'gp' pointer into GOT. 647 Symbol *Sym = 648 addOptionalSynthetic(Symtab, "_gp_disp", Out<ELFT>::Got, MipsGPOffset); 649 if (Sym) 650 ElfSym<ELFT>::MipsGpDisp = Sym->body(); 651 652 // The __gnu_local_gp is a magic symbol equal to the current value of 'gp' 653 // pointer. This symbol is used in the code generated by .cpload pseudo-op 654 // in case of using -mno-shared option. 655 // https://sourceware.org/ml/binutils/2004-12/msg00094.html 656 addOptionalSynthetic(Symtab, "__gnu_local_gp", Out<ELFT>::Got, 657 MipsGPOffset); 658 } 659 660 // In the assembly for 32 bit x86 the _GLOBAL_OFFSET_TABLE_ symbol 661 // is magical and is used to produce a R_386_GOTPC relocation. 662 // The R_386_GOTPC relocation value doesn't actually depend on the 663 // symbol value, so it could use an index of STN_UNDEF which, according 664 // to the spec, means the symbol value is 0. 665 // Unfortunately both gas and MC keep the _GLOBAL_OFFSET_TABLE_ symbol in 666 // the object file. 667 // The situation is even stranger on x86_64 where the assembly doesn't 668 // need the magical symbol, but gas still puts _GLOBAL_OFFSET_TABLE_ as 669 // an undefined symbol in the .o files. 670 // Given that the symbol is effectively unused, we just create a dummy 671 // hidden one to avoid the undefined symbol error. 672 if (!Config->Relocatable) 673 Symtab.addIgnored("_GLOBAL_OFFSET_TABLE_"); 674 675 // __tls_get_addr is defined by the dynamic linker for dynamic ELFs. For 676 // static linking the linker is required to optimize away any references to 677 // __tls_get_addr, so it's not defined anywhere. Create a hidden definition 678 // to avoid the undefined symbol error. 679 if (!isOutputDynamic()) 680 Symtab.addIgnored("__tls_get_addr"); 681 682 auto Define = [this](StringRef S, DefinedRegular<ELFT> *&Sym1, 683 DefinedRegular<ELFT> *&Sym2) { 684 Sym1 = Symtab.addIgnored(S, STV_DEFAULT); 685 686 // The name without the underscore is not a reserved name, 687 // so it is defined only when there is a reference against it. 688 assert(S.startswith("_")); 689 S = S.substr(1); 690 if (SymbolBody *B = Symtab.find(S)) 691 if (B->isUndefined()) 692 Sym2 = Symtab.addAbsolute(S, STV_DEFAULT); 693 }; 694 695 Define("_end", ElfSym<ELFT>::End, ElfSym<ELFT>::End2); 696 Define("_etext", ElfSym<ELFT>::Etext, ElfSym<ELFT>::Etext2); 697 Define("_edata", ElfSym<ELFT>::Edata, ElfSym<ELFT>::Edata2); 698 } 699 700 // Sort input sections by section name suffixes for 701 // __attribute__((init_priority(N))). 702 template <class ELFT> static void sortInitFini(OutputSectionBase<ELFT> *S) { 703 if (S) 704 reinterpret_cast<OutputSection<ELFT> *>(S)->sortInitFini(); 705 } 706 707 // Sort input sections by the special rule for .ctors and .dtors. 708 template <class ELFT> static void sortCtorsDtors(OutputSectionBase<ELFT> *S) { 709 if (S) 710 reinterpret_cast<OutputSection<ELFT> *>(S)->sortCtorsDtors(); 711 } 712 713 // Create output section objects and add them to OutputSections. 714 template <class ELFT> void Writer<ELFT>::createSections() { 715 // Add .interp first because some loaders want to see that section 716 // on the first page of the executable file when loaded into memory. 717 if (needsInterpSection()) 718 OutputSections.push_back(Out<ELFT>::Interp); 719 720 // A core file does not usually contain unmodified segments except 721 // the first page of the executable. Add the build ID section now 722 // so that the section is included in the first page. 723 if (Out<ELFT>::BuildId) 724 OutputSections.push_back(Out<ELFT>::BuildId); 725 726 // Create output sections for input object file sections. 727 std::vector<OutputSectionBase<ELFT> *> RegularSections; 728 OutputSectionFactory<ELFT> Factory; 729 for (const std::unique_ptr<elf::ObjectFile<ELFT>> &F : 730 Symtab.getObjectFiles()) { 731 for (InputSectionBase<ELFT> *C : F->getSections()) { 732 if (isDiscarded(C)) { 733 reportDiscarded(C, F); 734 continue; 735 } 736 OutputSectionBase<ELFT> *Sec; 737 bool IsNew; 738 std::tie(Sec, IsNew) = Factory.create(C, getOutputSectionName(C)); 739 if (IsNew) { 740 OwningSections.emplace_back(Sec); 741 OutputSections.push_back(Sec); 742 RegularSections.push_back(Sec); 743 } 744 Sec->addSection(C); 745 } 746 } 747 748 // If we have a .opd section (used under PPC64 for function descriptors), 749 // store a pointer to it here so that we can use it later when processing 750 // relocations. 751 Out<ELFT>::Opd = Factory.lookup(".opd", SHT_PROGBITS, SHF_WRITE | SHF_ALLOC); 752 753 Out<ELFT>::Dynamic->PreInitArraySec = Factory.lookup( 754 ".preinit_array", SHT_PREINIT_ARRAY, SHF_WRITE | SHF_ALLOC); 755 Out<ELFT>::Dynamic->InitArraySec = 756 Factory.lookup(".init_array", SHT_INIT_ARRAY, SHF_WRITE | SHF_ALLOC); 757 Out<ELFT>::Dynamic->FiniArraySec = 758 Factory.lookup(".fini_array", SHT_FINI_ARRAY, SHF_WRITE | SHF_ALLOC); 759 760 // Sort section contents for __attribute__((init_priority(N)). 761 sortInitFini(Out<ELFT>::Dynamic->InitArraySec); 762 sortInitFini(Out<ELFT>::Dynamic->FiniArraySec); 763 sortCtorsDtors(Factory.lookup(".ctors", SHT_PROGBITS, SHF_WRITE | SHF_ALLOC)); 764 sortCtorsDtors(Factory.lookup(".dtors", SHT_PROGBITS, SHF_WRITE | SHF_ALLOC)); 765 766 // The linker needs to define SECNAME_start, SECNAME_end and SECNAME_stop 767 // symbols for sections, so that the runtime can get the start and end 768 // addresses of each section by section name. Add such symbols. 769 if (!Config->Relocatable) { 770 addStartEndSymbols(); 771 for (OutputSectionBase<ELFT> *Sec : RegularSections) 772 addStartStopSymbols(Sec); 773 } 774 775 // Add _DYNAMIC symbol. Unlike GNU gold, our _DYNAMIC symbol has no type. 776 // It should be okay as no one seems to care about the type. 777 // Even the author of gold doesn't remember why gold behaves that way. 778 // https://sourceware.org/ml/binutils/2002-03/msg00360.html 779 if (isOutputDynamic()) 780 Symtab.addSynthetic("_DYNAMIC", Out<ELFT>::Dynamic, 0); 781 782 // Define __rel[a]_iplt_{start,end} symbols if needed. 783 addRelIpltSymbols(); 784 785 if (!Out<ELFT>::EhFrame->empty()) { 786 OutputSections.push_back(Out<ELFT>::EhFrame); 787 Out<ELFT>::EhFrame->finalize(); 788 } 789 790 // Scan relocations. This must be done after every symbol is declared so that 791 // we can correctly decide if a dynamic relocation is needed. 792 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 793 Sec->forEachInputSection([&](InputSectionBase<ELFT> *S) { 794 if (auto *IS = dyn_cast<InputSection<ELFT>>(S)) { 795 // Set OutSecOff so that scanRelocations can use it. 796 uintX_t Off = alignTo(Sec->getSize(), S->Align); 797 IS->OutSecOff = Off; 798 799 scanRelocations(*IS); 800 801 // Now that scan relocs possibly changed the size, update the offset. 802 Sec->setSize(Off + S->getSize()); 803 } else if (auto *EH = dyn_cast<EhInputSection<ELFT>>(S)) { 804 if (EH->RelocSection) 805 scanRelocations(*EH, *EH->RelocSection); 806 } 807 }); 808 } 809 810 // Now that we have defined all possible symbols including linker- 811 // synthesized ones. Visit all symbols to give the finishing touches. 812 std::vector<DefinedCommon *> CommonSymbols; 813 for (Symbol *S : Symtab.getSymbols()) { 814 SymbolBody *Body = S->body(); 815 816 // Set "used" bit for --as-needed. 817 if (S->IsUsedInRegularObj && !S->isWeak()) 818 if (auto *SS = dyn_cast<SharedSymbol<ELFT>>(Body)) 819 SS->File->IsUsed = true; 820 821 // We only report undefined symbols in regular objects. This means that we 822 // will accept an undefined reference in bitcode if it can be optimized out. 823 if (S->IsUsedInRegularObj && Body->isUndefined() && !S->isWeak()) 824 reportUndefined<ELFT>(Symtab, Body); 825 826 if (auto *C = dyn_cast<DefinedCommon>(Body)) 827 CommonSymbols.push_back(C); 828 829 if (!includeInSymtab<ELFT>(*Body)) 830 continue; 831 if (Out<ELFT>::SymTab) 832 Out<ELFT>::SymTab->addSymbol(Body); 833 834 if (isOutputDynamic() && S->includeInDynsym()) { 835 Out<ELFT>::DynSymTab->addSymbol(Body); 836 if (auto *SS = dyn_cast<SharedSymbol<ELFT>>(Body)) 837 Out<ELFT>::VerNeed->addSymbol(SS); 838 } 839 } 840 841 // Do not proceed if there was an undefined symbol. 842 if (HasError) 843 return; 844 845 addCommonSymbols(CommonSymbols); 846 847 // So far we have added sections from input object files. 848 // This function adds linker-created Out<ELFT>::* sections. 849 addPredefinedSections(); 850 851 std::stable_sort(OutputSections.begin(), OutputSections.end(), 852 compareSections<ELFT>); 853 854 unsigned I = 1; 855 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 856 Sec->SectionIndex = I++; 857 Sec->setSHName(Out<ELFT>::ShStrTab->addString(Sec->getName())); 858 } 859 860 // Finalizers fix each section's size. 861 // .dynsym is finalized early since that may fill up .gnu.hash. 862 if (isOutputDynamic()) 863 Out<ELFT>::DynSymTab->finalize(); 864 865 // Fill other section headers. The dynamic table is finalized 866 // at the end because some tags like RELSZ depend on result 867 // of finalizing other sections. The dynamic string table is 868 // finalized once the .dynamic finalizer has added a few last 869 // strings. See DynamicSection::finalize() 870 for (OutputSectionBase<ELFT> *Sec : OutputSections) 871 if (Sec != Out<ELFT>::DynStrTab && Sec != Out<ELFT>::Dynamic) 872 Sec->finalize(); 873 874 if (isOutputDynamic()) 875 Out<ELFT>::Dynamic->finalize(); 876 } 877 878 template <class ELFT> bool Writer<ELFT>::needsGot() { 879 if (!Out<ELFT>::Got->empty()) 880 return true; 881 882 // We add the .got section to the result for dynamic MIPS target because 883 // its address and properties are mentioned in the .dynamic section. 884 if (Config->EMachine == EM_MIPS) 885 return true; 886 887 // If we have a relocation that is relative to GOT (such as GOTOFFREL), 888 // we need to emit a GOT even if it's empty. 889 return Out<ELFT>::Got->HasGotOffRel; 890 } 891 892 // This function add Out<ELFT>::* sections to OutputSections. 893 template <class ELFT> void Writer<ELFT>::addPredefinedSections() { 894 auto Add = [&](OutputSectionBase<ELFT> *C) { 895 if (C) 896 OutputSections.push_back(C); 897 }; 898 899 // This order is not the same as the final output order 900 // because we sort the sections using their attributes below. 901 Add(Out<ELFT>::SymTab); 902 Add(Out<ELFT>::ShStrTab); 903 Add(Out<ELFT>::StrTab); 904 if (isOutputDynamic()) { 905 Add(Out<ELFT>::DynSymTab); 906 if (Out<ELFT>::VerNeed->getNeedNum() != 0) { 907 Add(Out<ELFT>::VerSym); 908 Add(Out<ELFT>::VerNeed); 909 } 910 Add(Out<ELFT>::GnuHashTab); 911 Add(Out<ELFT>::HashTab); 912 Add(Out<ELFT>::Dynamic); 913 Add(Out<ELFT>::DynStrTab); 914 if (Out<ELFT>::RelaDyn->hasRelocs()) 915 Add(Out<ELFT>::RelaDyn); 916 Add(Out<ELFT>::MipsRldMap); 917 } 918 919 // We always need to add rel[a].plt to output if it has entries. 920 // Even during static linking it can contain R_[*]_IRELATIVE relocations. 921 if (Out<ELFT>::RelaPlt && Out<ELFT>::RelaPlt->hasRelocs()) { 922 Add(Out<ELFT>::RelaPlt); 923 Out<ELFT>::RelaPlt->Static = !isOutputDynamic(); 924 } 925 926 if (needsGot()) 927 Add(Out<ELFT>::Got); 928 if (Out<ELFT>::GotPlt && !Out<ELFT>::GotPlt->empty()) 929 Add(Out<ELFT>::GotPlt); 930 if (!Out<ELFT>::Plt->empty()) 931 Add(Out<ELFT>::Plt); 932 if (!Out<ELFT>::EhFrame->empty()) 933 Add(Out<ELFT>::EhFrameHdr); 934 if (Out<ELFT>::Bss->getSize() > 0) 935 Add(Out<ELFT>::Bss); 936 } 937 938 // The linker is expected to define SECNAME_start and SECNAME_end 939 // symbols for a few sections. This function defines them. 940 template <class ELFT> void Writer<ELFT>::addStartEndSymbols() { 941 auto Define = [&](StringRef Start, StringRef End, 942 OutputSectionBase<ELFT> *OS) { 943 if (OS) { 944 this->Symtab.addSynthetic(Start, OS, 0); 945 this->Symtab.addSynthetic(End, OS, DefinedSynthetic<ELFT>::SectionEnd); 946 } else { 947 addOptionalSynthetic(this->Symtab, Start, 948 (OutputSectionBase<ELFT> *)nullptr, 0); 949 addOptionalSynthetic(this->Symtab, End, 950 (OutputSectionBase<ELFT> *)nullptr, 0); 951 } 952 }; 953 954 Define("__preinit_array_start", "__preinit_array_end", 955 Out<ELFT>::Dynamic->PreInitArraySec); 956 Define("__init_array_start", "__init_array_end", 957 Out<ELFT>::Dynamic->InitArraySec); 958 Define("__fini_array_start", "__fini_array_end", 959 Out<ELFT>::Dynamic->FiniArraySec); 960 } 961 962 // If a section name is valid as a C identifier (which is rare because of 963 // the leading '.'), linkers are expected to define __start_<secname> and 964 // __stop_<secname> symbols. They are at beginning and end of the section, 965 // respectively. This is not requested by the ELF standard, but GNU ld and 966 // gold provide the feature, and used by many programs. 967 template <class ELFT> 968 void Writer<ELFT>::addStartStopSymbols(OutputSectionBase<ELFT> *Sec) { 969 StringRef S = Sec->getName(); 970 if (!isValidCIdentifier(S)) 971 return; 972 StringSaver Saver(Alloc); 973 StringRef Start = Saver.save("__start_" + S); 974 StringRef Stop = Saver.save("__stop_" + S); 975 if (SymbolBody *B = Symtab.find(Start)) 976 if (B->isUndefined()) 977 Symtab.addSynthetic(Start, Sec, 0); 978 if (SymbolBody *B = Symtab.find(Stop)) 979 if (B->isUndefined()) 980 Symtab.addSynthetic(Stop, Sec, DefinedSynthetic<ELFT>::SectionEnd); 981 } 982 983 template <class ELFT> static bool needsPtLoad(OutputSectionBase<ELFT> *Sec) { 984 if (!(Sec->getFlags() & SHF_ALLOC)) 985 return false; 986 987 // Don't allocate VA space for TLS NOBITS sections. The PT_TLS PHDR is 988 // responsible for allocating space for them, not the PT_LOAD that 989 // contains the TLS initialization image. 990 if (Sec->getFlags() & SHF_TLS && Sec->getType() == SHT_NOBITS) 991 return false; 992 return true; 993 } 994 995 static uint32_t toPhdrFlags(uint64_t Flags) { 996 uint32_t Ret = PF_R; 997 if (Flags & SHF_WRITE) 998 Ret |= PF_W; 999 if (Flags & SHF_EXECINSTR) 1000 Ret |= PF_X; 1001 return Ret; 1002 } 1003 1004 // Decide which program headers to create and which sections to include in each 1005 // one. 1006 template <class ELFT> void Writer<ELFT>::createPhdrs() { 1007 auto AddHdr = [this](unsigned Type, unsigned Flags) { 1008 return &*Phdrs.emplace(Phdrs.end(), Type, Flags); 1009 }; 1010 1011 auto AddSec = [](Phdr &Hdr, OutputSectionBase<ELFT> *Sec) { 1012 Hdr.Last = Sec; 1013 if (!Hdr.First) 1014 Hdr.First = Sec; 1015 Hdr.H.p_align = std::max<uintX_t>(Hdr.H.p_align, Sec->getAlign()); 1016 }; 1017 1018 // The first phdr entry is PT_PHDR which describes the program header itself. 1019 Phdr &Hdr = *AddHdr(PT_PHDR, PF_R); 1020 AddSec(Hdr, Out<ELFT>::ProgramHeaders); 1021 1022 // PT_INTERP must be the second entry if exists. 1023 if (needsInterpSection()) { 1024 Phdr &Hdr = *AddHdr(PT_INTERP, toPhdrFlags(Out<ELFT>::Interp->getFlags())); 1025 AddSec(Hdr, Out<ELFT>::Interp); 1026 } 1027 1028 // Add the first PT_LOAD segment for regular output sections. 1029 uintX_t Flags = PF_R; 1030 Phdr *Load = AddHdr(PT_LOAD, Flags); 1031 AddSec(*Load, Out<ELFT>::ElfHeader); 1032 AddSec(*Load, Out<ELFT>::ProgramHeaders); 1033 1034 Phdr TlsHdr(PT_TLS, PF_R); 1035 Phdr RelRo(PT_GNU_RELRO, PF_R); 1036 Phdr Note(PT_NOTE, PF_R); 1037 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 1038 if (!(Sec->getFlags() & SHF_ALLOC)) 1039 break; 1040 1041 // If we meet TLS section then we create TLS header 1042 // and put all TLS sections inside for futher use when 1043 // assign addresses. 1044 if (Sec->getFlags() & SHF_TLS) 1045 AddSec(TlsHdr, Sec); 1046 1047 if (!needsPtLoad<ELFT>(Sec)) 1048 continue; 1049 1050 // If flags changed then we want new load segment. 1051 uintX_t NewFlags = toPhdrFlags(Sec->getFlags()); 1052 if (Flags != NewFlags) { 1053 Load = AddHdr(PT_LOAD, NewFlags); 1054 Flags = NewFlags; 1055 } 1056 1057 AddSec(*Load, Sec); 1058 1059 if (isRelroSection(Sec)) 1060 AddSec(RelRo, Sec); 1061 if (Sec->getType() == SHT_NOTE) 1062 AddSec(Note, Sec); 1063 } 1064 1065 // Add the TLS segment unless it's empty. 1066 if (TlsHdr.First) 1067 Phdrs.push_back(std::move(TlsHdr)); 1068 1069 // Add an entry for .dynamic. 1070 if (isOutputDynamic()) { 1071 Phdr &H = *AddHdr(PT_DYNAMIC, toPhdrFlags(Out<ELFT>::Dynamic->getFlags())); 1072 AddSec(H, Out<ELFT>::Dynamic); 1073 } 1074 1075 // PT_GNU_RELRO includes all sections that should be marked as 1076 // read-only by dynamic linker after proccessing relocations. 1077 if (RelRo.First) 1078 Phdrs.push_back(std::move(RelRo)); 1079 1080 // PT_GNU_EH_FRAME is a special section pointing on .eh_frame_hdr. 1081 if (!Out<ELFT>::EhFrame->empty() && Out<ELFT>::EhFrameHdr) { 1082 Phdr &Hdr = *AddHdr(PT_GNU_EH_FRAME, 1083 toPhdrFlags(Out<ELFT>::EhFrameHdr->getFlags())); 1084 AddSec(Hdr, Out<ELFT>::EhFrameHdr); 1085 } 1086 1087 // PT_GNU_STACK is a special section to tell the loader to make the 1088 // pages for the stack non-executable. 1089 if (!Config->ZExecStack) 1090 AddHdr(PT_GNU_STACK, PF_R | PF_W); 1091 1092 if (Note.First) 1093 Phdrs.push_back(std::move(Note)); 1094 1095 Out<ELFT>::ProgramHeaders->setSize(sizeof(Elf_Phdr) * Phdrs.size()); 1096 } 1097 1098 // The first section of each PT_LOAD and the first section after PT_GNU_RELRO 1099 // have to be page aligned so that the dynamic linker can set the permissions. 1100 template <class ELFT> void Writer<ELFT>::fixSectionAlignments() { 1101 for (const Phdr &P : Phdrs) 1102 if (P.H.p_type == PT_LOAD) 1103 P.First->PageAlign = true; 1104 1105 for (const Phdr &P : Phdrs) { 1106 if (P.H.p_type != PT_GNU_RELRO) 1107 continue; 1108 // Find the first section after PT_GNU_RELRO. If it is in a PT_LOAD we 1109 // have to align it to a page. 1110 auto End = OutputSections.end(); 1111 auto I = std::find(OutputSections.begin(), End, P.Last); 1112 if (I == End || (I + 1) == End) 1113 continue; 1114 OutputSectionBase<ELFT> *Sec = *(I + 1); 1115 if (needsPtLoad(Sec)) 1116 Sec->PageAlign = true; 1117 } 1118 } 1119 1120 // We should set file offsets and VAs for elf header and program headers 1121 // sections. These are special, we do not include them into output sections 1122 // list, but have them to simplify the code. 1123 template <class ELFT> void Writer<ELFT>::fixHeaders() { 1124 uintX_t BaseVA = ScriptConfig->DoLayout ? 0 : Target->getVAStart(); 1125 Out<ELFT>::ElfHeader->setVA(BaseVA); 1126 Out<ELFT>::ElfHeader->setFileOffset(0); 1127 uintX_t Off = Out<ELFT>::ElfHeader->getSize(); 1128 Out<ELFT>::ProgramHeaders->setVA(Off + BaseVA); 1129 Out<ELFT>::ProgramHeaders->setFileOffset(Off); 1130 } 1131 1132 // Assign VAs (addresses at run-time) to output sections. 1133 template <class ELFT> void Writer<ELFT>::assignAddresses() { 1134 uintX_t VA = Target->getVAStart() + Out<ELFT>::ElfHeader->getSize() + 1135 Out<ELFT>::ProgramHeaders->getSize(); 1136 1137 uintX_t ThreadBssOffset = 0; 1138 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 1139 uintX_t Align = Sec->getAlign(); 1140 if (Sec->PageAlign) 1141 Align = std::max<uintX_t>(Align, Target->PageSize); 1142 1143 // We only assign VAs to allocated sections. 1144 if (needsPtLoad<ELFT>(Sec)) { 1145 VA = alignTo(VA, Align); 1146 Sec->setVA(VA); 1147 VA += Sec->getSize(); 1148 } else if (Sec->getFlags() & SHF_TLS && Sec->getType() == SHT_NOBITS) { 1149 uintX_t TVA = VA + ThreadBssOffset; 1150 TVA = alignTo(TVA, Align); 1151 Sec->setVA(TVA); 1152 ThreadBssOffset = TVA - VA + Sec->getSize(); 1153 } 1154 } 1155 } 1156 1157 // Adjusts the file alignment for a given output section and returns 1158 // its new file offset. The file offset must be the same with its 1159 // virtual address (modulo the page size) so that the loader can load 1160 // executables without any address adjustment. 1161 template <class ELFT, class uintX_t> 1162 static uintX_t getFileAlignment(uintX_t Off, OutputSectionBase<ELFT> *Sec) { 1163 uintX_t Align = Sec->getAlign(); 1164 if (Sec->PageAlign) 1165 Align = std::max<uintX_t>(Align, Target->PageSize); 1166 Off = alignTo(Off, Align); 1167 1168 // Relocatable output does not have program headers 1169 // and does not need any other offset adjusting. 1170 if (Config->Relocatable || !(Sec->getFlags() & SHF_ALLOC)) 1171 return Off; 1172 return alignTo(Off, Target->PageSize, Sec->getVA()); 1173 } 1174 1175 // Assign file offsets to output sections. 1176 template <class ELFT> void Writer<ELFT>::assignFileOffsets() { 1177 uintX_t Off = 1178 Out<ELFT>::ElfHeader->getSize() + Out<ELFT>::ProgramHeaders->getSize(); 1179 1180 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 1181 if (Sec->getType() == SHT_NOBITS) { 1182 Sec->setFileOffset(Off); 1183 continue; 1184 } 1185 1186 Off = getFileAlignment<ELFT>(Off, Sec); 1187 Sec->setFileOffset(Off); 1188 Off += Sec->getSize(); 1189 } 1190 SectionHeaderOff = alignTo(Off, sizeof(uintX_t)); 1191 FileSize = SectionHeaderOff + (OutputSections.size() + 1) * sizeof(Elf_Shdr); 1192 } 1193 1194 // Finalize the program headers. We call this function after we assign 1195 // file offsets and VAs to all sections. 1196 template <class ELFT> void Writer<ELFT>::setPhdrs() { 1197 for (Phdr &P : Phdrs) { 1198 Elf_Phdr &H = P.H; 1199 OutputSectionBase<ELFT> *First = P.First; 1200 OutputSectionBase<ELFT> *Last = P.Last; 1201 if (First) { 1202 H.p_filesz = Last->getFileOff() - First->getFileOff(); 1203 if (Last->getType() != SHT_NOBITS) 1204 H.p_filesz += Last->getSize(); 1205 H.p_memsz = Last->getVA() + Last->getSize() - First->getVA(); 1206 H.p_offset = First->getFileOff(); 1207 H.p_vaddr = First->getVA(); 1208 } 1209 if (H.p_type == PT_LOAD) 1210 H.p_align = Target->PageSize; 1211 else if (H.p_type == PT_GNU_RELRO) 1212 H.p_align = 1; 1213 H.p_paddr = H.p_vaddr; 1214 1215 // The TLS pointer goes after PT_TLS. At least glibc will align it, 1216 // so round up the size to make sure the offsets are correct. 1217 if (H.p_type == PT_TLS) { 1218 Out<ELFT>::TlsPhdr = &H; 1219 H.p_memsz = alignTo(H.p_memsz, H.p_align); 1220 } 1221 } 1222 } 1223 1224 static uint32_t getMipsEFlags(bool Is64Bits) { 1225 // FIXME: In fact ELF flags depends on ELF flags of input object files 1226 // and selected emulation. For now just use hard coded values. 1227 if (Is64Bits) 1228 return EF_MIPS_CPIC | EF_MIPS_PIC | EF_MIPS_ARCH_64R2; 1229 1230 uint32_t V = EF_MIPS_CPIC | EF_MIPS_ABI_O32 | EF_MIPS_ARCH_32R2; 1231 if (Config->Shared) 1232 V |= EF_MIPS_PIC; 1233 return V; 1234 } 1235 1236 template <class ELFT> static typename ELFT::uint getEntryAddr() { 1237 if (Symbol *S = Config->EntrySym) 1238 return S->body()->getVA<ELFT>(); 1239 if (Config->EntryAddr != uint64_t(-1)) 1240 return Config->EntryAddr; 1241 return 0; 1242 } 1243 1244 template <class ELFT> static uint8_t getELFEncoding() { 1245 if (ELFT::TargetEndianness == llvm::support::little) 1246 return ELFDATA2LSB; 1247 return ELFDATA2MSB; 1248 } 1249 1250 static uint16_t getELFType() { 1251 if (Config->Pic) 1252 return ET_DYN; 1253 if (Config->Relocatable) 1254 return ET_REL; 1255 return ET_EXEC; 1256 } 1257 1258 // This function is called after we have assigned address and size 1259 // to each section. This function fixes some predefined absolute 1260 // symbol values that depend on section address and size. 1261 template <class ELFT> void Writer<ELFT>::fixAbsoluteSymbols() { 1262 auto Set = [](DefinedRegular<ELFT> *&S1, DefinedRegular<ELFT> *&S2, 1263 uintX_t V) { 1264 if (S1) 1265 S1->Value = V; 1266 if (S2) 1267 S2->Value = V; 1268 }; 1269 1270 // _etext is the first location after the last read-only loadable segment. 1271 // _edata is the first location after the last read-write loadable segment. 1272 // _end is the first location after the uninitialized data region. 1273 for (Phdr &P : Phdrs) { 1274 Elf_Phdr &H = P.H; 1275 if (H.p_type != PT_LOAD) 1276 continue; 1277 Set(ElfSym<ELFT>::End, ElfSym<ELFT>::End2, H.p_vaddr + H.p_memsz); 1278 1279 uintX_t Val = H.p_vaddr + H.p_filesz; 1280 if (H.p_flags & PF_W) 1281 Set(ElfSym<ELFT>::Edata, ElfSym<ELFT>::Edata2, Val); 1282 else 1283 Set(ElfSym<ELFT>::Etext, ElfSym<ELFT>::Etext2, Val); 1284 } 1285 } 1286 1287 template <class ELFT> void Writer<ELFT>::writeHeader() { 1288 uint8_t *Buf = Buffer->getBufferStart(); 1289 memcpy(Buf, "\177ELF", 4); 1290 1291 auto &FirstObj = cast<ELFFileBase<ELFT>>(*Config->FirstElf); 1292 1293 // Write the ELF header. 1294 auto *EHdr = reinterpret_cast<Elf_Ehdr *>(Buf); 1295 EHdr->e_ident[EI_CLASS] = ELFT::Is64Bits ? ELFCLASS64 : ELFCLASS32; 1296 EHdr->e_ident[EI_DATA] = getELFEncoding<ELFT>(); 1297 EHdr->e_ident[EI_VERSION] = EV_CURRENT; 1298 EHdr->e_ident[EI_OSABI] = FirstObj.getOSABI(); 1299 EHdr->e_type = getELFType(); 1300 EHdr->e_machine = FirstObj.getEMachine(); 1301 EHdr->e_version = EV_CURRENT; 1302 EHdr->e_entry = getEntryAddr<ELFT>(); 1303 EHdr->e_shoff = SectionHeaderOff; 1304 EHdr->e_ehsize = sizeof(Elf_Ehdr); 1305 EHdr->e_phnum = Phdrs.size(); 1306 EHdr->e_shentsize = sizeof(Elf_Shdr); 1307 EHdr->e_shnum = OutputSections.size() + 1; 1308 EHdr->e_shstrndx = Out<ELFT>::ShStrTab->SectionIndex; 1309 1310 if (Config->EMachine == EM_MIPS) 1311 EHdr->e_flags = getMipsEFlags(ELFT::Is64Bits); 1312 1313 if (!Config->Relocatable) { 1314 EHdr->e_phoff = sizeof(Elf_Ehdr); 1315 EHdr->e_phentsize = sizeof(Elf_Phdr); 1316 } 1317 1318 // Write the program header table. 1319 auto *HBuf = reinterpret_cast<Elf_Phdr *>(Buf + EHdr->e_phoff); 1320 for (Phdr &P : Phdrs) 1321 *HBuf++ = P.H; 1322 1323 // Write the section header table. Note that the first table entry is null. 1324 auto *SHdrs = reinterpret_cast<Elf_Shdr *>(Buf + EHdr->e_shoff); 1325 for (OutputSectionBase<ELFT> *Sec : OutputSections) 1326 Sec->writeHeaderTo(++SHdrs); 1327 } 1328 1329 template <class ELFT> void Writer<ELFT>::openFile() { 1330 ErrorOr<std::unique_ptr<FileOutputBuffer>> BufferOrErr = 1331 FileOutputBuffer::create(Config->OutputFile, FileSize, 1332 FileOutputBuffer::F_executable); 1333 if (BufferOrErr) 1334 Buffer = std::move(*BufferOrErr); 1335 else 1336 error(BufferOrErr, "failed to open " + Config->OutputFile); 1337 } 1338 1339 // Write section contents to a mmap'ed file. 1340 template <class ELFT> void Writer<ELFT>::writeSections() { 1341 uint8_t *Buf = Buffer->getBufferStart(); 1342 1343 // PPC64 needs to process relocations in the .opd section before processing 1344 // relocations in code-containing sections. 1345 if (OutputSectionBase<ELFT> *Sec = Out<ELFT>::Opd) { 1346 Out<ELFT>::OpdBuf = Buf + Sec->getFileOff(); 1347 Sec->writeTo(Buf + Sec->getFileOff()); 1348 } 1349 1350 for (OutputSectionBase<ELFT> *Sec : OutputSections) 1351 if (Sec != Out<ELFT>::Opd) 1352 Sec->writeTo(Buf + Sec->getFileOff()); 1353 } 1354 1355 template <class ELFT> void Writer<ELFT>::writeBuildId() { 1356 BuildIdSection<ELFT> *S = Out<ELFT>::BuildId; 1357 if (!S) 1358 return; 1359 1360 // Compute a hash of all sections except .debug_* sections. 1361 // We skip debug sections because they tend to be very large 1362 // and their contents are very likely to be the same as long as 1363 // other sections are the same. 1364 uint8_t *Start = Buffer->getBufferStart(); 1365 uint8_t *Last = Start; 1366 std::vector<ArrayRef<uint8_t>> Regions; 1367 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 1368 uint8_t *End = Start + Sec->getFileOff(); 1369 if (!Sec->getName().startswith(".debug_")) 1370 Regions.push_back({Last, End}); 1371 Last = End; 1372 } 1373 Regions.push_back({Last, Start + FileSize}); 1374 S->writeBuildId(Regions); 1375 } 1376 1377 template void elf::writeResult<ELF32LE>(SymbolTable<ELF32LE> *Symtab); 1378 template void elf::writeResult<ELF32BE>(SymbolTable<ELF32BE> *Symtab); 1379 template void elf::writeResult<ELF64LE>(SymbolTable<ELF64LE> *Symtab); 1380 template void elf::writeResult<ELF64BE>(SymbolTable<ELF64BE> *Symtab); 1381