1 //===- Writer.cpp ---------------------------------------------------------===// 2 // 3 // The LLVM Linker 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 10 #include "Writer.h" 11 #include "Config.h" 12 #include "LinkerScript.h" 13 #include "OutputSections.h" 14 #include "Relocations.h" 15 #include "SymbolTable.h" 16 #include "Target.h" 17 18 #include "llvm/ADT/StringMap.h" 19 #include "llvm/ADT/StringSwitch.h" 20 #include "llvm/Support/FileOutputBuffer.h" 21 #include "llvm/Support/StringSaver.h" 22 #include "llvm/Support/raw_ostream.h" 23 24 using namespace llvm; 25 using namespace llvm::ELF; 26 using namespace llvm::object; 27 28 using namespace lld; 29 using namespace lld::elf; 30 31 namespace { 32 // The writer writes a SymbolTable result to a file. 33 template <class ELFT> class Writer { 34 public: 35 typedef typename ELFT::uint uintX_t; 36 typedef typename ELFT::Shdr Elf_Shdr; 37 typedef typename ELFT::Ehdr Elf_Ehdr; 38 typedef typename ELFT::Phdr Elf_Phdr; 39 typedef typename ELFT::Sym Elf_Sym; 40 typedef typename ELFT::SymRange Elf_Sym_Range; 41 typedef typename ELFT::Rela Elf_Rela; 42 Writer(SymbolTable<ELFT> &S) : Symtab(S) {} 43 void run(); 44 45 private: 46 // This describes a program header entry. 47 // Each contains type, access flags and range of output sections that will be 48 // placed in it. 49 struct Phdr { 50 Phdr(unsigned Type, unsigned Flags) { 51 H.p_type = Type; 52 H.p_flags = Flags; 53 } 54 Elf_Phdr H = {}; 55 OutputSectionBase<ELFT> *First = nullptr; 56 OutputSectionBase<ELFT> *Last = nullptr; 57 }; 58 59 void copyLocalSymbols(); 60 void addReservedSymbols(); 61 void createSections(); 62 void addPredefinedSections(); 63 bool needsGot(); 64 65 void createPhdrs(); 66 void assignAddresses(); 67 void assignFileOffsets(); 68 void setPhdrs(); 69 void fixHeaders(); 70 void fixSectionAlignments(); 71 void fixAbsoluteSymbols(); 72 void openFile(); 73 void writeHeader(); 74 void writeSections(); 75 void writeBuildId(); 76 bool isDiscarded(InputSectionBase<ELFT> *IS) const; 77 StringRef getOutputSectionName(InputSectionBase<ELFT> *S) const; 78 bool needsInterpSection() const { 79 return !Symtab.getSharedFiles().empty() && !Config->DynamicLinker.empty(); 80 } 81 bool isOutputDynamic() const { 82 return !Symtab.getSharedFiles().empty() || Config->Pic; 83 } 84 85 void addCommonSymbols(std::vector<DefinedCommon *> &Syms); 86 87 std::unique_ptr<llvm::FileOutputBuffer> Buffer; 88 89 BumpPtrAllocator Alloc; 90 std::vector<OutputSectionBase<ELFT> *> OutputSections; 91 std::vector<std::unique_ptr<OutputSectionBase<ELFT>>> OwningSections; 92 93 void addRelIpltSymbols(); 94 void addStartEndSymbols(); 95 void addStartStopSymbols(OutputSectionBase<ELFT> *Sec); 96 97 SymbolTable<ELFT> &Symtab; 98 std::vector<Phdr> Phdrs; 99 100 uintX_t FileSize; 101 uintX_t SectionHeaderOff; 102 }; 103 } // anonymous namespace 104 105 template <class ELFT> void elf::writeResult(SymbolTable<ELFT> *Symtab) { 106 typedef typename ELFT::uint uintX_t; 107 typedef typename ELFT::Ehdr Elf_Ehdr; 108 109 // Create singleton output sections. 110 OutputSection<ELFT> Bss(".bss", SHT_NOBITS, SHF_ALLOC | SHF_WRITE); 111 DynamicSection<ELFT> Dynamic; 112 EhOutputSection<ELFT> EhFrame; 113 GotSection<ELFT> Got; 114 InterpSection<ELFT> Interp; 115 PltSection<ELFT> Plt; 116 RelocationSection<ELFT> RelaDyn(Config->Rela ? ".rela.dyn" : ".rel.dyn", 117 Config->ZCombreloc); 118 StringTableSection<ELFT> DynStrTab(".dynstr", true); 119 StringTableSection<ELFT> ShStrTab(".shstrtab", false); 120 SymbolTableSection<ELFT> DynSymTab(DynStrTab); 121 VersionTableSection<ELFT> VerSym; 122 VersionNeedSection<ELFT> VerNeed; 123 124 OutputSectionBase<ELFT> ElfHeader("", 0, SHF_ALLOC); 125 ElfHeader.setSize(sizeof(Elf_Ehdr)); 126 OutputSectionBase<ELFT> ProgramHeaders("", 0, SHF_ALLOC); 127 ProgramHeaders.updateAlign(sizeof(uintX_t)); 128 129 // Instantiate optional output sections if they are needed. 130 std::unique_ptr<BuildIdSection<ELFT>> BuildId; 131 std::unique_ptr<EhFrameHeader<ELFT>> EhFrameHdr; 132 std::unique_ptr<GnuHashTableSection<ELFT>> GnuHashTab; 133 std::unique_ptr<GotPltSection<ELFT>> GotPlt; 134 std::unique_ptr<HashTableSection<ELFT>> HashTab; 135 std::unique_ptr<RelocationSection<ELFT>> RelaPlt; 136 std::unique_ptr<StringTableSection<ELFT>> StrTab; 137 std::unique_ptr<SymbolTableSection<ELFT>> SymTabSec; 138 std::unique_ptr<OutputSection<ELFT>> MipsRldMap; 139 140 if (Config->BuildId == BuildIdKind::Fnv1) 141 BuildId.reset(new BuildIdFnv1<ELFT>); 142 else if (Config->BuildId == BuildIdKind::Md5) 143 BuildId.reset(new BuildIdMd5<ELFT>); 144 else if (Config->BuildId == BuildIdKind::Sha1) 145 BuildId.reset(new BuildIdSha1<ELFT>); 146 else if (Config->BuildId == BuildIdKind::Hexstring) 147 BuildId.reset(new BuildIdHexstring<ELFT>); 148 149 if (Config->EhFrameHdr) 150 EhFrameHdr.reset(new EhFrameHeader<ELFT>); 151 152 if (Config->GnuHash) 153 GnuHashTab.reset(new GnuHashTableSection<ELFT>); 154 if (Config->SysvHash) 155 HashTab.reset(new HashTableSection<ELFT>); 156 StringRef S = Config->Rela ? ".rela.plt" : ".rel.plt"; 157 GotPlt.reset(new GotPltSection<ELFT>); 158 RelaPlt.reset(new RelocationSection<ELFT>(S, false /*Sort*/)); 159 if (!Config->StripAll) { 160 StrTab.reset(new StringTableSection<ELFT>(".strtab", false)); 161 SymTabSec.reset(new SymbolTableSection<ELFT>(*StrTab)); 162 } 163 if (Config->EMachine == EM_MIPS && !Config->Shared) { 164 // This is a MIPS specific section to hold a space within the data segment 165 // of executable file which is pointed to by the DT_MIPS_RLD_MAP entry. 166 // See "Dynamic section" in Chapter 5 in the following document: 167 // ftp://www.linux-mips.org/pub/linux/mips/doc/ABI/mipsabi.pdf 168 MipsRldMap.reset(new OutputSection<ELFT>(".rld_map", SHT_PROGBITS, 169 SHF_ALLOC | SHF_WRITE)); 170 MipsRldMap->setSize(sizeof(uintX_t)); 171 MipsRldMap->updateAlign(sizeof(uintX_t)); 172 } 173 174 Out<ELFT>::Bss = &Bss; 175 Out<ELFT>::BuildId = BuildId.get(); 176 Out<ELFT>::DynStrTab = &DynStrTab; 177 Out<ELFT>::DynSymTab = &DynSymTab; 178 Out<ELFT>::Dynamic = &Dynamic; 179 Out<ELFT>::EhFrame = &EhFrame; 180 Out<ELFT>::EhFrameHdr = EhFrameHdr.get(); 181 Out<ELFT>::GnuHashTab = GnuHashTab.get(); 182 Out<ELFT>::Got = &Got; 183 Out<ELFT>::GotPlt = GotPlt.get(); 184 Out<ELFT>::HashTab = HashTab.get(); 185 Out<ELFT>::Interp = &Interp; 186 Out<ELFT>::Plt = &Plt; 187 Out<ELFT>::RelaDyn = &RelaDyn; 188 Out<ELFT>::RelaPlt = RelaPlt.get(); 189 Out<ELFT>::ShStrTab = &ShStrTab; 190 Out<ELFT>::StrTab = StrTab.get(); 191 Out<ELFT>::SymTab = SymTabSec.get(); 192 Out<ELFT>::VerSym = &VerSym; 193 Out<ELFT>::VerNeed = &VerNeed; 194 Out<ELFT>::MipsRldMap = MipsRldMap.get(); 195 Out<ELFT>::Opd = nullptr; 196 Out<ELFT>::OpdBuf = nullptr; 197 Out<ELFT>::TlsPhdr = nullptr; 198 Out<ELFT>::ElfHeader = &ElfHeader; 199 Out<ELFT>::ProgramHeaders = &ProgramHeaders; 200 201 Writer<ELFT>(*Symtab).run(); 202 } 203 204 // The main function of the writer. 205 template <class ELFT> void Writer<ELFT>::run() { 206 if (!Config->DiscardAll) 207 copyLocalSymbols(); 208 addReservedSymbols(); 209 createSections(); 210 if (HasError) 211 return; 212 213 if (Config->Relocatable) { 214 assignFileOffsets(); 215 } else { 216 createPhdrs(); 217 fixHeaders(); 218 if (ScriptConfig->DoLayout) { 219 Script<ELFT>::X->assignAddresses(OutputSections); 220 } else { 221 fixSectionAlignments(); 222 assignAddresses(); 223 } 224 assignFileOffsets(); 225 setPhdrs(); 226 fixAbsoluteSymbols(); 227 } 228 229 openFile(); 230 if (HasError) 231 return; 232 writeHeader(); 233 writeSections(); 234 writeBuildId(); 235 if (HasError) 236 return; 237 check(Buffer->commit()); 238 } 239 240 namespace { 241 template <bool Is64Bits> struct SectionKey { 242 typedef typename std::conditional<Is64Bits, uint64_t, uint32_t>::type uintX_t; 243 StringRef Name; 244 uint32_t Type; 245 uintX_t Flags; 246 uintX_t Alignment; 247 }; 248 } 249 namespace llvm { 250 template <bool Is64Bits> struct DenseMapInfo<SectionKey<Is64Bits>> { 251 static SectionKey<Is64Bits> getEmptyKey() { 252 return SectionKey<Is64Bits>{DenseMapInfo<StringRef>::getEmptyKey(), 0, 0, 253 0}; 254 } 255 static SectionKey<Is64Bits> getTombstoneKey() { 256 return SectionKey<Is64Bits>{DenseMapInfo<StringRef>::getTombstoneKey(), 0, 257 0, 0}; 258 } 259 static unsigned getHashValue(const SectionKey<Is64Bits> &Val) { 260 return hash_combine(Val.Name, Val.Type, Val.Flags, Val.Alignment); 261 } 262 static bool isEqual(const SectionKey<Is64Bits> &LHS, 263 const SectionKey<Is64Bits> &RHS) { 264 return DenseMapInfo<StringRef>::isEqual(LHS.Name, RHS.Name) && 265 LHS.Type == RHS.Type && LHS.Flags == RHS.Flags && 266 LHS.Alignment == RHS.Alignment; 267 } 268 }; 269 } 270 271 template <class ELFT> 272 static void reportUndefined(SymbolTable<ELFT> &Symtab, SymbolBody *Sym) { 273 if (!Config->NoUndefined) { 274 if (Config->Relocatable) 275 return; 276 if (Config->Shared && !Config->ZDefs) 277 if (Sym->symbol()->Visibility == STV_DEFAULT) 278 return; 279 } 280 281 std::string Msg = "undefined symbol: " + Sym->getName().str(); 282 if (InputFile *File = Sym->getSourceFile<ELFT>()) 283 Msg += " in " + getFilename(File); 284 if (Config->NoinhibitExec) 285 warning(Msg); 286 else 287 error(Msg); 288 } 289 290 template <class ELFT> 291 static bool shouldKeepInSymtab(InputSectionBase<ELFT> *Sec, StringRef SymName, 292 const SymbolBody &B) { 293 if (B.isFile()) 294 return false; 295 296 // We keep sections in symtab for relocatable output. 297 if (B.isSection()) 298 return Config->Relocatable; 299 300 // If sym references a section in a discarded group, don't keep it. 301 if (Sec == &InputSection<ELFT>::Discarded) 302 return false; 303 304 if (Config->DiscardNone) 305 return true; 306 307 // In ELF assembly .L symbols are normally discarded by the assembler. 308 // If the assembler fails to do so, the linker discards them if 309 // * --discard-locals is used. 310 // * The symbol is in a SHF_MERGE section, which is normally the reason for 311 // the assembler keeping the .L symbol. 312 if (!SymName.startswith(".L") && !SymName.empty()) 313 return true; 314 315 if (Config->DiscardLocals) 316 return false; 317 318 return !(Sec->getSectionHdr()->sh_flags & SHF_MERGE); 319 } 320 321 template <class ELFT> static bool includeInSymtab(const SymbolBody &B) { 322 if (!B.isLocal() && !B.symbol()->IsUsedInRegularObj) 323 return false; 324 325 if (auto *D = dyn_cast<DefinedRegular<ELFT>>(&B)) { 326 // Always include absolute symbols. 327 if (!D->Section) 328 return true; 329 // Exclude symbols pointing to garbage-collected sections. 330 if (!D->Section->Live) 331 return false; 332 if (auto *S = dyn_cast<MergeInputSection<ELFT>>(D->Section)) 333 if (!S->getSectionPiece(D->Value)->Live) 334 return false; 335 } 336 return true; 337 } 338 339 // Local symbols are not in the linker's symbol table. This function scans 340 // each object file's symbol table to copy local symbols to the output. 341 template <class ELFT> void Writer<ELFT>::copyLocalSymbols() { 342 if (!Out<ELFT>::SymTab) 343 return; 344 for (const std::unique_ptr<elf::ObjectFile<ELFT>> &F : 345 Symtab.getObjectFiles()) { 346 const char *StrTab = F->getStringTable().data(); 347 for (SymbolBody *B : F->getLocalSymbols()) { 348 auto *DR = dyn_cast<DefinedRegular<ELFT>>(B); 349 // No reason to keep local undefined symbol in symtab. 350 if (!DR) 351 continue; 352 if (!includeInSymtab<ELFT>(*B)) 353 continue; 354 StringRef SymName(StrTab + B->getNameOffset()); 355 InputSectionBase<ELFT> *Sec = DR->Section; 356 if (!shouldKeepInSymtab<ELFT>(Sec, SymName, *B)) 357 continue; 358 ++Out<ELFT>::SymTab->NumLocals; 359 if (Config->Relocatable) 360 B->DynsymIndex = Out<ELFT>::SymTab->NumLocals; 361 F->KeptLocalSyms.push_back( 362 std::make_pair(DR, Out<ELFT>::SymTab->StrTabSec.addString(SymName))); 363 } 364 } 365 } 366 367 // PPC64 has a number of special SHT_PROGBITS+SHF_ALLOC+SHF_WRITE sections that 368 // we would like to make sure appear is a specific order to maximize their 369 // coverage by a single signed 16-bit offset from the TOC base pointer. 370 // Conversely, the special .tocbss section should be first among all SHT_NOBITS 371 // sections. This will put it next to the loaded special PPC64 sections (and, 372 // thus, within reach of the TOC base pointer). 373 static int getPPC64SectionRank(StringRef SectionName) { 374 return StringSwitch<int>(SectionName) 375 .Case(".tocbss", 0) 376 .Case(".branch_lt", 2) 377 .Case(".toc", 3) 378 .Case(".toc1", 4) 379 .Case(".opd", 5) 380 .Default(1); 381 } 382 383 template <class ELFT> static bool isRelroSection(OutputSectionBase<ELFT> *Sec) { 384 if (!Config->ZRelro) 385 return false; 386 typename ELFT::uint Flags = Sec->getFlags(); 387 if (!(Flags & SHF_ALLOC) || !(Flags & SHF_WRITE)) 388 return false; 389 if (Flags & SHF_TLS) 390 return true; 391 uint32_t Type = Sec->getType(); 392 if (Type == SHT_INIT_ARRAY || Type == SHT_FINI_ARRAY || 393 Type == SHT_PREINIT_ARRAY) 394 return true; 395 if (Sec == Out<ELFT>::GotPlt) 396 return Config->ZNow; 397 if (Sec == Out<ELFT>::Dynamic || Sec == Out<ELFT>::Got) 398 return true; 399 StringRef S = Sec->getName(); 400 return S == ".data.rel.ro" || S == ".ctors" || S == ".dtors" || S == ".jcr" || 401 S == ".eh_frame"; 402 } 403 404 // Output section ordering is determined by this function. 405 template <class ELFT> 406 static bool compareSections(OutputSectionBase<ELFT> *A, 407 OutputSectionBase<ELFT> *B) { 408 typedef typename ELFT::uint uintX_t; 409 410 int Comp = Script<ELFT>::X->compareSections(A->getName(), B->getName()); 411 if (Comp != 0) 412 return Comp < 0; 413 414 uintX_t AFlags = A->getFlags(); 415 uintX_t BFlags = B->getFlags(); 416 417 // Allocatable sections go first to reduce the total PT_LOAD size and 418 // so debug info doesn't change addresses in actual code. 419 bool AIsAlloc = AFlags & SHF_ALLOC; 420 bool BIsAlloc = BFlags & SHF_ALLOC; 421 if (AIsAlloc != BIsAlloc) 422 return AIsAlloc; 423 424 // We don't have any special requirements for the relative order of 425 // two non allocatable sections. 426 if (!AIsAlloc) 427 return false; 428 429 // We want the read only sections first so that they go in the PT_LOAD 430 // covering the program headers at the start of the file. 431 bool AIsWritable = AFlags & SHF_WRITE; 432 bool BIsWritable = BFlags & SHF_WRITE; 433 if (AIsWritable != BIsWritable) 434 return BIsWritable; 435 436 // For a corresponding reason, put non exec sections first (the program 437 // header PT_LOAD is not executable). 438 bool AIsExec = AFlags & SHF_EXECINSTR; 439 bool BIsExec = BFlags & SHF_EXECINSTR; 440 if (AIsExec != BIsExec) 441 return BIsExec; 442 443 // If we got here we know that both A and B are in the same PT_LOAD. 444 445 // The TLS initialization block needs to be a single contiguous block in a R/W 446 // PT_LOAD, so stick TLS sections directly before R/W sections. The TLS NOBITS 447 // sections are placed here as they don't take up virtual address space in the 448 // PT_LOAD. 449 bool AIsTls = AFlags & SHF_TLS; 450 bool BIsTls = BFlags & SHF_TLS; 451 if (AIsTls != BIsTls) 452 return AIsTls; 453 454 // The next requirement we have is to put nobits sections last. The 455 // reason is that the only thing the dynamic linker will see about 456 // them is a p_memsz that is larger than p_filesz. Seeing that it 457 // zeros the end of the PT_LOAD, so that has to correspond to the 458 // nobits sections. 459 bool AIsNoBits = A->getType() == SHT_NOBITS; 460 bool BIsNoBits = B->getType() == SHT_NOBITS; 461 if (AIsNoBits != BIsNoBits) 462 return BIsNoBits; 463 464 // We place RelRo section before plain r/w ones. 465 bool AIsRelRo = isRelroSection(A); 466 bool BIsRelRo = isRelroSection(B); 467 if (AIsRelRo != BIsRelRo) 468 return AIsRelRo; 469 470 // Some architectures have additional ordering restrictions for sections 471 // within the same PT_LOAD. 472 if (Config->EMachine == EM_PPC64) 473 return getPPC64SectionRank(A->getName()) < 474 getPPC64SectionRank(B->getName()); 475 476 return false; 477 } 478 479 // Until this function is called, common symbols do not belong to any section. 480 // This function adds them to end of BSS section. 481 template <class ELFT> 482 void Writer<ELFT>::addCommonSymbols(std::vector<DefinedCommon *> &Syms) { 483 if (Syms.empty()) 484 return; 485 486 // Sort the common symbols by alignment as an heuristic to pack them better. 487 std::stable_sort(Syms.begin(), Syms.end(), 488 [](const DefinedCommon *A, const DefinedCommon *B) { 489 return A->Alignment > B->Alignment; 490 }); 491 492 uintX_t Off = Out<ELFT>::Bss->getSize(); 493 for (DefinedCommon *C : Syms) { 494 Off = alignTo(Off, C->Alignment); 495 Out<ELFT>::Bss->updateAlign(C->Alignment); 496 C->OffsetInBss = Off; 497 Off += C->Size; 498 } 499 500 Out<ELFT>::Bss->setSize(Off); 501 } 502 503 template <class ELFT> 504 StringRef Writer<ELFT>::getOutputSectionName(InputSectionBase<ELFT> *S) const { 505 StringRef Dest = Script<ELFT>::X->getOutputSection(S); 506 if (!Dest.empty()) 507 return Dest; 508 509 StringRef Name = S->getSectionName(); 510 for (StringRef V : {".text.", ".rodata.", ".data.rel.ro.", ".data.", ".bss.", 511 ".init_array.", ".fini_array.", ".ctors.", ".dtors.", 512 ".tbss.", ".gcc_except_table.", ".tdata."}) 513 if (Name.startswith(V)) 514 return V.drop_back(); 515 return Name; 516 } 517 518 template <class ELFT> 519 void reportDiscarded(InputSectionBase<ELFT> *IS, 520 const std::unique_ptr<elf::ObjectFile<ELFT>> &File) { 521 if (!Config->PrintGcSections || !IS || IS->Live) 522 return; 523 llvm::errs() << "removing unused section from '" << IS->getSectionName() 524 << "' in file '" << File->getName() << "'\n"; 525 } 526 527 template <class ELFT> 528 bool Writer<ELFT>::isDiscarded(InputSectionBase<ELFT> *S) const { 529 return !S || S == &InputSection<ELFT>::Discarded || !S->Live || 530 Script<ELFT>::X->isDiscarded(S); 531 } 532 533 template <class ELFT> 534 static Symbol *addOptionalSynthetic(SymbolTable<ELFT> &Table, StringRef Name, 535 OutputSectionBase<ELFT> *Sec, 536 typename ELFT::uint Val) { 537 SymbolBody *S = Table.find(Name); 538 if (!S) 539 return nullptr; 540 if (!S->isUndefined() && !S->isShared()) 541 return S->symbol(); 542 return Table.addSynthetic(Name, Sec, Val); 543 } 544 545 // The beginning and the ending of .rel[a].plt section are marked 546 // with __rel[a]_iplt_{start,end} symbols if it is a statically linked 547 // executable. The runtime needs these symbols in order to resolve 548 // all IRELATIVE relocs on startup. For dynamic executables, we don't 549 // need these symbols, since IRELATIVE relocs are resolved through GOT 550 // and PLT. For details, see http://www.airs.com/blog/archives/403. 551 template <class ELFT> void Writer<ELFT>::addRelIpltSymbols() { 552 if (isOutputDynamic() || !Out<ELFT>::RelaPlt) 553 return; 554 StringRef S = Config->Rela ? "__rela_iplt_start" : "__rel_iplt_start"; 555 addOptionalSynthetic(Symtab, S, Out<ELFT>::RelaPlt, 0); 556 557 S = Config->Rela ? "__rela_iplt_end" : "__rel_iplt_end"; 558 addOptionalSynthetic(Symtab, S, Out<ELFT>::RelaPlt, 559 DefinedSynthetic<ELFT>::SectionEnd); 560 } 561 562 // This class knows how to create an output section for a given 563 // input section. Output section type is determined by various 564 // factors, including input section's sh_flags, sh_type and 565 // linker scripts. 566 namespace { 567 template <class ELFT> class OutputSectionFactory { 568 typedef typename ELFT::Shdr Elf_Shdr; 569 typedef typename ELFT::uint uintX_t; 570 571 public: 572 std::pair<OutputSectionBase<ELFT> *, bool> create(InputSectionBase<ELFT> *C, 573 StringRef OutsecName); 574 575 OutputSectionBase<ELFT> *lookup(StringRef Name, uint32_t Type, 576 uintX_t Flags) { 577 return Map.lookup({Name, Type, Flags, 0}); 578 } 579 580 private: 581 SectionKey<ELFT::Is64Bits> createKey(InputSectionBase<ELFT> *C, 582 StringRef OutsecName); 583 584 SmallDenseMap<SectionKey<ELFT::Is64Bits>, OutputSectionBase<ELFT> *> Map; 585 }; 586 } 587 588 template <class ELFT> 589 std::pair<OutputSectionBase<ELFT> *, bool> 590 OutputSectionFactory<ELFT>::create(InputSectionBase<ELFT> *C, 591 StringRef OutsecName) { 592 SectionKey<ELFT::Is64Bits> Key = createKey(C, OutsecName); 593 OutputSectionBase<ELFT> *&Sec = Map[Key]; 594 if (Sec) 595 return {Sec, false}; 596 597 switch (C->SectionKind) { 598 case InputSectionBase<ELFT>::Regular: 599 Sec = new OutputSection<ELFT>(Key.Name, Key.Type, Key.Flags); 600 break; 601 case InputSectionBase<ELFT>::EHFrame: 602 return {Out<ELFT>::EhFrame, false}; 603 case InputSectionBase<ELFT>::Merge: 604 Sec = new MergeOutputSection<ELFT>(Key.Name, Key.Type, Key.Flags, 605 Key.Alignment); 606 break; 607 case InputSectionBase<ELFT>::MipsReginfo: 608 Sec = new MipsReginfoOutputSection<ELFT>(); 609 break; 610 case InputSectionBase<ELFT>::MipsOptions: 611 Sec = new MipsOptionsOutputSection<ELFT>(); 612 break; 613 } 614 return {Sec, true}; 615 } 616 617 template <class ELFT> 618 SectionKey<ELFT::Is64Bits> 619 OutputSectionFactory<ELFT>::createKey(InputSectionBase<ELFT> *C, 620 StringRef OutsecName) { 621 const Elf_Shdr *H = C->getSectionHdr(); 622 uintX_t Flags = H->sh_flags & ~SHF_GROUP; 623 624 // For SHF_MERGE we create different output sections for each alignment. 625 // This makes each output section simple and keeps a single level mapping from 626 // input to output. 627 uintX_t Alignment = 0; 628 if (isa<MergeInputSection<ELFT>>(C)) 629 Alignment = std::max(H->sh_addralign, H->sh_entsize); 630 631 uint32_t Type = H->sh_type; 632 return SectionKey<ELFT::Is64Bits>{OutsecName, Type, Flags, Alignment}; 633 } 634 635 // The linker is expected to define some symbols depending on 636 // the linking result. This function defines such symbols. 637 template <class ELFT> void Writer<ELFT>::addReservedSymbols() { 638 if (Config->EMachine == EM_MIPS) { 639 // Define _gp for MIPS. st_value of _gp symbol will be updated by Writer 640 // so that it points to an absolute address which is relative to GOT. 641 // See "Global Data Symbols" in Chapter 6 in the following document: 642 // ftp://www.linux-mips.org/pub/linux/mips/doc/ABI/mipsabi.pdf 643 Symtab.addSynthetic("_gp", Out<ELFT>::Got, MipsGPOffset); 644 645 // On MIPS O32 ABI, _gp_disp is a magic symbol designates offset between 646 // start of function and 'gp' pointer into GOT. 647 Symbol *Sym = 648 addOptionalSynthetic(Symtab, "_gp_disp", Out<ELFT>::Got, MipsGPOffset); 649 if (Sym) 650 ElfSym<ELFT>::MipsGpDisp = Sym->body(); 651 652 // The __gnu_local_gp is a magic symbol equal to the current value of 'gp' 653 // pointer. This symbol is used in the code generated by .cpload pseudo-op 654 // in case of using -mno-shared option. 655 // https://sourceware.org/ml/binutils/2004-12/msg00094.html 656 addOptionalSynthetic(Symtab, "__gnu_local_gp", Out<ELFT>::Got, 657 MipsGPOffset); 658 } 659 660 // In the assembly for 32 bit x86 the _GLOBAL_OFFSET_TABLE_ symbol 661 // is magical and is used to produce a R_386_GOTPC relocation. 662 // The R_386_GOTPC relocation value doesn't actually depend on the 663 // symbol value, so it could use an index of STN_UNDEF which, according 664 // to the spec, means the symbol value is 0. 665 // Unfortunately both gas and MC keep the _GLOBAL_OFFSET_TABLE_ symbol in 666 // the object file. 667 // The situation is even stranger on x86_64 where the assembly doesn't 668 // need the magical symbol, but gas still puts _GLOBAL_OFFSET_TABLE_ as 669 // an undefined symbol in the .o files. 670 // Given that the symbol is effectively unused, we just create a dummy 671 // hidden one to avoid the undefined symbol error. 672 if (!Config->Relocatable) 673 Symtab.addIgnored("_GLOBAL_OFFSET_TABLE_"); 674 675 // __tls_get_addr is defined by the dynamic linker for dynamic ELFs. For 676 // static linking the linker is required to optimize away any references to 677 // __tls_get_addr, so it's not defined anywhere. Create a hidden definition 678 // to avoid the undefined symbol error. 679 if (!isOutputDynamic()) 680 Symtab.addIgnored("__tls_get_addr"); 681 682 auto Define = [this](StringRef S, DefinedRegular<ELFT> *&Sym1, 683 DefinedRegular<ELFT> *&Sym2) { 684 Sym1 = Symtab.addIgnored(S, STV_DEFAULT); 685 686 // The name without the underscore is not a reserved name, 687 // so it is defined only when there is a reference against it. 688 assert(S.startswith("_")); 689 S = S.substr(1); 690 if (SymbolBody *B = Symtab.find(S)) 691 if (B->isUndefined()) 692 Sym2 = Symtab.addAbsolute(S, STV_DEFAULT); 693 }; 694 695 Define("_end", ElfSym<ELFT>::End, ElfSym<ELFT>::End2); 696 Define("_etext", ElfSym<ELFT>::Etext, ElfSym<ELFT>::Etext2); 697 Define("_edata", ElfSym<ELFT>::Edata, ElfSym<ELFT>::Edata2); 698 } 699 700 // Sort input sections by section name suffixes for 701 // __attribute__((init_priority(N))). 702 template <class ELFT> static void sortInitFini(OutputSectionBase<ELFT> *S) { 703 if (S) 704 reinterpret_cast<OutputSection<ELFT> *>(S)->sortInitFini(); 705 } 706 707 // Sort input sections by the special rule for .ctors and .dtors. 708 template <class ELFT> static void sortCtorsDtors(OutputSectionBase<ELFT> *S) { 709 if (S) 710 reinterpret_cast<OutputSection<ELFT> *>(S)->sortCtorsDtors(); 711 } 712 713 // Create output section objects and add them to OutputSections. 714 template <class ELFT> void Writer<ELFT>::createSections() { 715 // Add .interp first because some loaders want to see that section 716 // on the first page of the executable file when loaded into memory. 717 if (needsInterpSection()) 718 OutputSections.push_back(Out<ELFT>::Interp); 719 720 // A core file does not usually contain unmodified segments except 721 // the first page of the executable. Add the build ID section now 722 // so that the section is included in the first page. 723 if (Out<ELFT>::BuildId) 724 OutputSections.push_back(Out<ELFT>::BuildId); 725 726 // Create output sections for input object file sections. 727 std::vector<OutputSectionBase<ELFT> *> RegularSections; 728 OutputSectionFactory<ELFT> Factory; 729 for (const std::unique_ptr<elf::ObjectFile<ELFT>> &F : 730 Symtab.getObjectFiles()) { 731 for (InputSectionBase<ELFT> *C : F->getSections()) { 732 if (isDiscarded(C)) { 733 reportDiscarded(C, F); 734 continue; 735 } 736 OutputSectionBase<ELFT> *Sec; 737 bool IsNew; 738 std::tie(Sec, IsNew) = Factory.create(C, getOutputSectionName(C)); 739 if (IsNew) { 740 OwningSections.emplace_back(Sec); 741 OutputSections.push_back(Sec); 742 RegularSections.push_back(Sec); 743 } 744 Sec->addSection(C); 745 } 746 } 747 748 // If we have a .opd section (used under PPC64 for function descriptors), 749 // store a pointer to it here so that we can use it later when processing 750 // relocations. 751 Out<ELFT>::Opd = Factory.lookup(".opd", SHT_PROGBITS, SHF_WRITE | SHF_ALLOC); 752 753 Out<ELFT>::Dynamic->PreInitArraySec = Factory.lookup( 754 ".preinit_array", SHT_PREINIT_ARRAY, SHF_WRITE | SHF_ALLOC); 755 Out<ELFT>::Dynamic->InitArraySec = 756 Factory.lookup(".init_array", SHT_INIT_ARRAY, SHF_WRITE | SHF_ALLOC); 757 Out<ELFT>::Dynamic->FiniArraySec = 758 Factory.lookup(".fini_array", SHT_FINI_ARRAY, SHF_WRITE | SHF_ALLOC); 759 760 // Sort section contents for __attribute__((init_priority(N)). 761 sortInitFini(Out<ELFT>::Dynamic->InitArraySec); 762 sortInitFini(Out<ELFT>::Dynamic->FiniArraySec); 763 sortCtorsDtors(Factory.lookup(".ctors", SHT_PROGBITS, SHF_WRITE | SHF_ALLOC)); 764 sortCtorsDtors(Factory.lookup(".dtors", SHT_PROGBITS, SHF_WRITE | SHF_ALLOC)); 765 766 // The linker needs to define SECNAME_start, SECNAME_end and SECNAME_stop 767 // symbols for sections, so that the runtime can get the start and end 768 // addresses of each section by section name. Add such symbols. 769 if (!Config->Relocatable) { 770 addStartEndSymbols(); 771 for (OutputSectionBase<ELFT> *Sec : RegularSections) 772 addStartStopSymbols(Sec); 773 } 774 775 // Add _DYNAMIC symbol. Unlike GNU gold, our _DYNAMIC symbol has no type. 776 // It should be okay as no one seems to care about the type. 777 // Even the author of gold doesn't remember why gold behaves that way. 778 // https://sourceware.org/ml/binutils/2002-03/msg00360.html 779 if (isOutputDynamic()) 780 Symtab.addSynthetic("_DYNAMIC", Out<ELFT>::Dynamic, 0); 781 782 // Define __rel[a]_iplt_{start,end} symbols if needed. 783 addRelIpltSymbols(); 784 785 if (!Out<ELFT>::EhFrame->empty()) { 786 OutputSections.push_back(Out<ELFT>::EhFrame); 787 Out<ELFT>::EhFrame->finalize(); 788 } 789 790 // Scan relocations. This must be done after every symbol is declared so that 791 // we can correctly decide if a dynamic relocation is needed. 792 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 793 Sec->forEachInputSection([&](InputSectionBase<ELFT> *S) { 794 if (auto *IS = dyn_cast<InputSection<ELFT>>(S)) { 795 // Set OutSecOff so that scanRelocations can use it. 796 uintX_t Off = alignTo(Sec->getSize(), S->Align); 797 IS->OutSecOff = Off; 798 799 scanRelocations(*IS); 800 801 // Now that scan relocs possibly changed the size, update the offset. 802 Sec->setSize(Off + S->getSize()); 803 } else if (auto *EH = dyn_cast<EhInputSection<ELFT>>(S)) { 804 if (EH->RelocSection) 805 scanRelocations(*EH, *EH->RelocSection); 806 } 807 }); 808 } 809 810 // Now that we have defined all possible symbols including linker- 811 // synthesized ones. Visit all symbols to give the finishing touches. 812 std::vector<DefinedCommon *> CommonSymbols; 813 for (Symbol *S : Symtab.getSymbols()) { 814 SymbolBody *Body = S->body(); 815 816 // We only report undefined symbols in regular objects. This means that we 817 // will accept an undefined reference in bitcode if it can be optimized out. 818 if (S->IsUsedInRegularObj && Body->isUndefined() && !S->isWeak()) 819 reportUndefined<ELFT>(Symtab, Body); 820 821 if (auto *C = dyn_cast<DefinedCommon>(Body)) 822 CommonSymbols.push_back(C); 823 824 if (!includeInSymtab<ELFT>(*Body)) 825 continue; 826 if (Out<ELFT>::SymTab) 827 Out<ELFT>::SymTab->addSymbol(Body); 828 829 if (isOutputDynamic() && S->includeInDynsym()) { 830 Out<ELFT>::DynSymTab->addSymbol(Body); 831 if (auto *SS = dyn_cast<SharedSymbol<ELFT>>(Body)) 832 if (SS->File->isNeeded()) 833 Out<ELFT>::VerNeed->addSymbol(SS); 834 } 835 } 836 837 // Do not proceed if there was an undefined symbol. 838 if (HasError) 839 return; 840 841 addCommonSymbols(CommonSymbols); 842 843 // So far we have added sections from input object files. 844 // This function adds linker-created Out<ELFT>::* sections. 845 addPredefinedSections(); 846 847 std::stable_sort(OutputSections.begin(), OutputSections.end(), 848 compareSections<ELFT>); 849 850 unsigned I = 1; 851 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 852 Sec->SectionIndex = I++; 853 Sec->setSHName(Out<ELFT>::ShStrTab->addString(Sec->getName())); 854 } 855 856 // Finalizers fix each section's size. 857 // .dynsym is finalized early since that may fill up .gnu.hash. 858 if (isOutputDynamic()) 859 Out<ELFT>::DynSymTab->finalize(); 860 861 // Fill other section headers. The dynamic table is finalized 862 // at the end because some tags like RELSZ depend on result 863 // of finalizing other sections. The dynamic string table is 864 // finalized once the .dynamic finalizer has added a few last 865 // strings. See DynamicSection::finalize() 866 for (OutputSectionBase<ELFT> *Sec : OutputSections) 867 if (Sec != Out<ELFT>::DynStrTab && Sec != Out<ELFT>::Dynamic) 868 Sec->finalize(); 869 870 if (isOutputDynamic()) 871 Out<ELFT>::Dynamic->finalize(); 872 873 // Now that all output offsets are fixed. Finalize mergeable sections 874 // to fix their maps from input offsets to output offsets. 875 for (OutputSectionBase<ELFT> *Sec : OutputSections) 876 Sec->finalizePieces(); 877 } 878 879 template <class ELFT> bool Writer<ELFT>::needsGot() { 880 if (!Out<ELFT>::Got->empty()) 881 return true; 882 883 // We add the .got section to the result for dynamic MIPS target because 884 // its address and properties are mentioned in the .dynamic section. 885 if (Config->EMachine == EM_MIPS) 886 return true; 887 888 // If we have a relocation that is relative to GOT (such as GOTOFFREL), 889 // we need to emit a GOT even if it's empty. 890 return Out<ELFT>::Got->HasGotOffRel; 891 } 892 893 // This function add Out<ELFT>::* sections to OutputSections. 894 template <class ELFT> void Writer<ELFT>::addPredefinedSections() { 895 auto Add = [&](OutputSectionBase<ELFT> *C) { 896 if (C) 897 OutputSections.push_back(C); 898 }; 899 900 // This order is not the same as the final output order 901 // because we sort the sections using their attributes below. 902 Add(Out<ELFT>::SymTab); 903 Add(Out<ELFT>::ShStrTab); 904 Add(Out<ELFT>::StrTab); 905 if (isOutputDynamic()) { 906 Add(Out<ELFT>::DynSymTab); 907 if (Out<ELFT>::VerNeed->getNeedNum() != 0) { 908 Add(Out<ELFT>::VerSym); 909 Add(Out<ELFT>::VerNeed); 910 } 911 Add(Out<ELFT>::GnuHashTab); 912 Add(Out<ELFT>::HashTab); 913 Add(Out<ELFT>::Dynamic); 914 Add(Out<ELFT>::DynStrTab); 915 if (Out<ELFT>::RelaDyn->hasRelocs()) 916 Add(Out<ELFT>::RelaDyn); 917 Add(Out<ELFT>::MipsRldMap); 918 } 919 920 // We always need to add rel[a].plt to output if it has entries. 921 // Even during static linking it can contain R_[*]_IRELATIVE relocations. 922 if (Out<ELFT>::RelaPlt && Out<ELFT>::RelaPlt->hasRelocs()) { 923 Add(Out<ELFT>::RelaPlt); 924 Out<ELFT>::RelaPlt->Static = !isOutputDynamic(); 925 } 926 927 if (needsGot()) 928 Add(Out<ELFT>::Got); 929 if (Out<ELFT>::GotPlt && !Out<ELFT>::GotPlt->empty()) 930 Add(Out<ELFT>::GotPlt); 931 if (!Out<ELFT>::Plt->empty()) 932 Add(Out<ELFT>::Plt); 933 if (!Out<ELFT>::EhFrame->empty()) 934 Add(Out<ELFT>::EhFrameHdr); 935 if (Out<ELFT>::Bss->getSize() > 0) 936 Add(Out<ELFT>::Bss); 937 } 938 939 // The linker is expected to define SECNAME_start and SECNAME_end 940 // symbols for a few sections. This function defines them. 941 template <class ELFT> void Writer<ELFT>::addStartEndSymbols() { 942 auto Define = [&](StringRef Start, StringRef End, 943 OutputSectionBase<ELFT> *OS) { 944 if (OS) { 945 this->Symtab.addSynthetic(Start, OS, 0); 946 this->Symtab.addSynthetic(End, OS, DefinedSynthetic<ELFT>::SectionEnd); 947 } else { 948 addOptionalSynthetic(this->Symtab, Start, 949 (OutputSectionBase<ELFT> *)nullptr, 0); 950 addOptionalSynthetic(this->Symtab, End, 951 (OutputSectionBase<ELFT> *)nullptr, 0); 952 } 953 }; 954 955 Define("__preinit_array_start", "__preinit_array_end", 956 Out<ELFT>::Dynamic->PreInitArraySec); 957 Define("__init_array_start", "__init_array_end", 958 Out<ELFT>::Dynamic->InitArraySec); 959 Define("__fini_array_start", "__fini_array_end", 960 Out<ELFT>::Dynamic->FiniArraySec); 961 } 962 963 // If a section name is valid as a C identifier (which is rare because of 964 // the leading '.'), linkers are expected to define __start_<secname> and 965 // __stop_<secname> symbols. They are at beginning and end of the section, 966 // respectively. This is not requested by the ELF standard, but GNU ld and 967 // gold provide the feature, and used by many programs. 968 template <class ELFT> 969 void Writer<ELFT>::addStartStopSymbols(OutputSectionBase<ELFT> *Sec) { 970 StringRef S = Sec->getName(); 971 if (!isValidCIdentifier(S)) 972 return; 973 StringSaver Saver(Alloc); 974 StringRef Start = Saver.save("__start_" + S); 975 StringRef Stop = Saver.save("__stop_" + S); 976 if (SymbolBody *B = Symtab.find(Start)) 977 if (B->isUndefined()) 978 Symtab.addSynthetic(Start, Sec, 0); 979 if (SymbolBody *B = Symtab.find(Stop)) 980 if (B->isUndefined()) 981 Symtab.addSynthetic(Stop, Sec, DefinedSynthetic<ELFT>::SectionEnd); 982 } 983 984 template <class ELFT> static bool needsPtLoad(OutputSectionBase<ELFT> *Sec) { 985 if (!(Sec->getFlags() & SHF_ALLOC)) 986 return false; 987 988 // Don't allocate VA space for TLS NOBITS sections. The PT_TLS PHDR is 989 // responsible for allocating space for them, not the PT_LOAD that 990 // contains the TLS initialization image. 991 if (Sec->getFlags() & SHF_TLS && Sec->getType() == SHT_NOBITS) 992 return false; 993 return true; 994 } 995 996 static uint32_t toPhdrFlags(uint64_t Flags) { 997 uint32_t Ret = PF_R; 998 if (Flags & SHF_WRITE) 999 Ret |= PF_W; 1000 if (Flags & SHF_EXECINSTR) 1001 Ret |= PF_X; 1002 return Ret; 1003 } 1004 1005 // Decide which program headers to create and which sections to include in each 1006 // one. 1007 template <class ELFT> void Writer<ELFT>::createPhdrs() { 1008 auto AddHdr = [this](unsigned Type, unsigned Flags) { 1009 return &*Phdrs.emplace(Phdrs.end(), Type, Flags); 1010 }; 1011 1012 auto AddSec = [](Phdr &Hdr, OutputSectionBase<ELFT> *Sec) { 1013 Hdr.Last = Sec; 1014 if (!Hdr.First) 1015 Hdr.First = Sec; 1016 Hdr.H.p_align = std::max<uintX_t>(Hdr.H.p_align, Sec->getAlign()); 1017 }; 1018 1019 // The first phdr entry is PT_PHDR which describes the program header itself. 1020 Phdr &Hdr = *AddHdr(PT_PHDR, PF_R); 1021 AddSec(Hdr, Out<ELFT>::ProgramHeaders); 1022 1023 // PT_INTERP must be the second entry if exists. 1024 if (needsInterpSection()) { 1025 Phdr &Hdr = *AddHdr(PT_INTERP, toPhdrFlags(Out<ELFT>::Interp->getFlags())); 1026 AddSec(Hdr, Out<ELFT>::Interp); 1027 } 1028 1029 // Add the first PT_LOAD segment for regular output sections. 1030 uintX_t Flags = PF_R; 1031 Phdr *Load = AddHdr(PT_LOAD, Flags); 1032 AddSec(*Load, Out<ELFT>::ElfHeader); 1033 AddSec(*Load, Out<ELFT>::ProgramHeaders); 1034 1035 Phdr TlsHdr(PT_TLS, PF_R); 1036 Phdr RelRo(PT_GNU_RELRO, PF_R); 1037 Phdr Note(PT_NOTE, PF_R); 1038 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 1039 if (!(Sec->getFlags() & SHF_ALLOC)) 1040 break; 1041 1042 // If we meet TLS section then we create TLS header 1043 // and put all TLS sections inside for futher use when 1044 // assign addresses. 1045 if (Sec->getFlags() & SHF_TLS) 1046 AddSec(TlsHdr, Sec); 1047 1048 if (!needsPtLoad<ELFT>(Sec)) 1049 continue; 1050 1051 // If flags changed then we want new load segment. 1052 uintX_t NewFlags = toPhdrFlags(Sec->getFlags()); 1053 if (Flags != NewFlags) { 1054 Load = AddHdr(PT_LOAD, NewFlags); 1055 Flags = NewFlags; 1056 } 1057 1058 AddSec(*Load, Sec); 1059 1060 if (isRelroSection(Sec)) 1061 AddSec(RelRo, Sec); 1062 if (Sec->getType() == SHT_NOTE) 1063 AddSec(Note, Sec); 1064 } 1065 1066 // Add the TLS segment unless it's empty. 1067 if (TlsHdr.First) 1068 Phdrs.push_back(std::move(TlsHdr)); 1069 1070 // Add an entry for .dynamic. 1071 if (isOutputDynamic()) { 1072 Phdr &H = *AddHdr(PT_DYNAMIC, toPhdrFlags(Out<ELFT>::Dynamic->getFlags())); 1073 AddSec(H, Out<ELFT>::Dynamic); 1074 } 1075 1076 // PT_GNU_RELRO includes all sections that should be marked as 1077 // read-only by dynamic linker after proccessing relocations. 1078 if (RelRo.First) 1079 Phdrs.push_back(std::move(RelRo)); 1080 1081 // PT_GNU_EH_FRAME is a special section pointing on .eh_frame_hdr. 1082 if (!Out<ELFT>::EhFrame->empty() && Out<ELFT>::EhFrameHdr) { 1083 Phdr &Hdr = *AddHdr(PT_GNU_EH_FRAME, 1084 toPhdrFlags(Out<ELFT>::EhFrameHdr->getFlags())); 1085 AddSec(Hdr, Out<ELFT>::EhFrameHdr); 1086 } 1087 1088 // PT_GNU_STACK is a special section to tell the loader to make the 1089 // pages for the stack non-executable. 1090 if (!Config->ZExecStack) 1091 AddHdr(PT_GNU_STACK, PF_R | PF_W); 1092 1093 if (Note.First) 1094 Phdrs.push_back(std::move(Note)); 1095 1096 Out<ELFT>::ProgramHeaders->setSize(sizeof(Elf_Phdr) * Phdrs.size()); 1097 } 1098 1099 // The first section of each PT_LOAD and the first section after PT_GNU_RELRO 1100 // have to be page aligned so that the dynamic linker can set the permissions. 1101 template <class ELFT> void Writer<ELFT>::fixSectionAlignments() { 1102 for (const Phdr &P : Phdrs) 1103 if (P.H.p_type == PT_LOAD) 1104 P.First->PageAlign = true; 1105 1106 for (const Phdr &P : Phdrs) { 1107 if (P.H.p_type != PT_GNU_RELRO) 1108 continue; 1109 // Find the first section after PT_GNU_RELRO. If it is in a PT_LOAD we 1110 // have to align it to a page. 1111 auto End = OutputSections.end(); 1112 auto I = std::find(OutputSections.begin(), End, P.Last); 1113 if (I == End || (I + 1) == End) 1114 continue; 1115 OutputSectionBase<ELFT> *Sec = *(I + 1); 1116 if (needsPtLoad(Sec)) 1117 Sec->PageAlign = true; 1118 } 1119 } 1120 1121 // We should set file offsets and VAs for elf header and program headers 1122 // sections. These are special, we do not include them into output sections 1123 // list, but have them to simplify the code. 1124 template <class ELFT> void Writer<ELFT>::fixHeaders() { 1125 uintX_t BaseVA = ScriptConfig->DoLayout ? 0 : Target->getVAStart(); 1126 Out<ELFT>::ElfHeader->setVA(BaseVA); 1127 Out<ELFT>::ElfHeader->setFileOffset(0); 1128 uintX_t Off = Out<ELFT>::ElfHeader->getSize(); 1129 Out<ELFT>::ProgramHeaders->setVA(Off + BaseVA); 1130 Out<ELFT>::ProgramHeaders->setFileOffset(Off); 1131 } 1132 1133 // Assign VAs (addresses at run-time) to output sections. 1134 template <class ELFT> void Writer<ELFT>::assignAddresses() { 1135 uintX_t VA = Target->getVAStart() + Out<ELFT>::ElfHeader->getSize() + 1136 Out<ELFT>::ProgramHeaders->getSize(); 1137 1138 uintX_t ThreadBssOffset = 0; 1139 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 1140 uintX_t Align = Sec->getAlign(); 1141 if (Sec->PageAlign) 1142 Align = std::max<uintX_t>(Align, Target->PageSize); 1143 1144 // We only assign VAs to allocated sections. 1145 if (needsPtLoad<ELFT>(Sec)) { 1146 VA = alignTo(VA, Align); 1147 Sec->setVA(VA); 1148 VA += Sec->getSize(); 1149 } else if (Sec->getFlags() & SHF_TLS && Sec->getType() == SHT_NOBITS) { 1150 uintX_t TVA = VA + ThreadBssOffset; 1151 TVA = alignTo(TVA, Align); 1152 Sec->setVA(TVA); 1153 ThreadBssOffset = TVA - VA + Sec->getSize(); 1154 } 1155 } 1156 } 1157 1158 // Adjusts the file alignment for a given output section and returns 1159 // its new file offset. The file offset must be the same with its 1160 // virtual address (modulo the page size) so that the loader can load 1161 // executables without any address adjustment. 1162 template <class ELFT, class uintX_t> 1163 static uintX_t getFileAlignment(uintX_t Off, OutputSectionBase<ELFT> *Sec) { 1164 uintX_t Align = Sec->getAlign(); 1165 if (Sec->PageAlign) 1166 Align = std::max<uintX_t>(Align, Target->PageSize); 1167 Off = alignTo(Off, Align); 1168 1169 // Relocatable output does not have program headers 1170 // and does not need any other offset adjusting. 1171 if (Config->Relocatable || !(Sec->getFlags() & SHF_ALLOC)) 1172 return Off; 1173 return alignTo(Off, Target->PageSize, Sec->getVA()); 1174 } 1175 1176 // Assign file offsets to output sections. 1177 template <class ELFT> void Writer<ELFT>::assignFileOffsets() { 1178 uintX_t Off = 1179 Out<ELFT>::ElfHeader->getSize() + Out<ELFT>::ProgramHeaders->getSize(); 1180 1181 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 1182 if (Sec->getType() == SHT_NOBITS) { 1183 Sec->setFileOffset(Off); 1184 continue; 1185 } 1186 1187 Off = getFileAlignment<ELFT>(Off, Sec); 1188 Sec->setFileOffset(Off); 1189 Off += Sec->getSize(); 1190 } 1191 SectionHeaderOff = alignTo(Off, sizeof(uintX_t)); 1192 FileSize = SectionHeaderOff + (OutputSections.size() + 1) * sizeof(Elf_Shdr); 1193 } 1194 1195 // Finalize the program headers. We call this function after we assign 1196 // file offsets and VAs to all sections. 1197 template <class ELFT> void Writer<ELFT>::setPhdrs() { 1198 for (Phdr &P : Phdrs) { 1199 Elf_Phdr &H = P.H; 1200 OutputSectionBase<ELFT> *First = P.First; 1201 OutputSectionBase<ELFT> *Last = P.Last; 1202 if (First) { 1203 H.p_filesz = Last->getFileOff() - First->getFileOff(); 1204 if (Last->getType() != SHT_NOBITS) 1205 H.p_filesz += Last->getSize(); 1206 H.p_memsz = Last->getVA() + Last->getSize() - First->getVA(); 1207 H.p_offset = First->getFileOff(); 1208 H.p_vaddr = First->getVA(); 1209 } 1210 if (H.p_type == PT_LOAD) 1211 H.p_align = Target->PageSize; 1212 else if (H.p_type == PT_GNU_RELRO) 1213 H.p_align = 1; 1214 H.p_paddr = H.p_vaddr; 1215 1216 // The TLS pointer goes after PT_TLS. At least glibc will align it, 1217 // so round up the size to make sure the offsets are correct. 1218 if (H.p_type == PT_TLS) { 1219 Out<ELFT>::TlsPhdr = &H; 1220 H.p_memsz = alignTo(H.p_memsz, H.p_align); 1221 } 1222 } 1223 } 1224 1225 static uint32_t getMipsEFlags(bool Is64Bits) { 1226 // FIXME: In fact ELF flags depends on ELF flags of input object files 1227 // and selected emulation. For now just use hard coded values. 1228 if (Is64Bits) 1229 return EF_MIPS_CPIC | EF_MIPS_PIC | EF_MIPS_ARCH_64R2; 1230 1231 uint32_t V = EF_MIPS_CPIC | EF_MIPS_ABI_O32 | EF_MIPS_ARCH_32R2; 1232 if (Config->Shared) 1233 V |= EF_MIPS_PIC; 1234 return V; 1235 } 1236 1237 template <class ELFT> static typename ELFT::uint getEntryAddr() { 1238 if (Symbol *S = Config->EntrySym) 1239 return S->body()->getVA<ELFT>(); 1240 if (Config->EntryAddr != uint64_t(-1)) 1241 return Config->EntryAddr; 1242 return 0; 1243 } 1244 1245 template <class ELFT> static uint8_t getELFEncoding() { 1246 if (ELFT::TargetEndianness == llvm::support::little) 1247 return ELFDATA2LSB; 1248 return ELFDATA2MSB; 1249 } 1250 1251 static uint16_t getELFType() { 1252 if (Config->Pic) 1253 return ET_DYN; 1254 if (Config->Relocatable) 1255 return ET_REL; 1256 return ET_EXEC; 1257 } 1258 1259 // This function is called after we have assigned address and size 1260 // to each section. This function fixes some predefined absolute 1261 // symbol values that depend on section address and size. 1262 template <class ELFT> void Writer<ELFT>::fixAbsoluteSymbols() { 1263 auto Set = [](DefinedRegular<ELFT> *&S1, DefinedRegular<ELFT> *&S2, 1264 uintX_t V) { 1265 if (S1) 1266 S1->Value = V; 1267 if (S2) 1268 S2->Value = V; 1269 }; 1270 1271 // _etext is the first location after the last read-only loadable segment. 1272 // _edata is the first location after the last read-write loadable segment. 1273 // _end is the first location after the uninitialized data region. 1274 for (Phdr &P : Phdrs) { 1275 Elf_Phdr &H = P.H; 1276 if (H.p_type != PT_LOAD) 1277 continue; 1278 Set(ElfSym<ELFT>::End, ElfSym<ELFT>::End2, H.p_vaddr + H.p_memsz); 1279 1280 uintX_t Val = H.p_vaddr + H.p_filesz; 1281 if (H.p_flags & PF_W) 1282 Set(ElfSym<ELFT>::Edata, ElfSym<ELFT>::Edata2, Val); 1283 else 1284 Set(ElfSym<ELFT>::Etext, ElfSym<ELFT>::Etext2, Val); 1285 } 1286 } 1287 1288 template <class ELFT> void Writer<ELFT>::writeHeader() { 1289 uint8_t *Buf = Buffer->getBufferStart(); 1290 memcpy(Buf, "\177ELF", 4); 1291 1292 auto &FirstObj = cast<ELFFileBase<ELFT>>(*Config->FirstElf); 1293 1294 // Write the ELF header. 1295 auto *EHdr = reinterpret_cast<Elf_Ehdr *>(Buf); 1296 EHdr->e_ident[EI_CLASS] = ELFT::Is64Bits ? ELFCLASS64 : ELFCLASS32; 1297 EHdr->e_ident[EI_DATA] = getELFEncoding<ELFT>(); 1298 EHdr->e_ident[EI_VERSION] = EV_CURRENT; 1299 EHdr->e_ident[EI_OSABI] = FirstObj.getOSABI(); 1300 EHdr->e_type = getELFType(); 1301 EHdr->e_machine = FirstObj.getEMachine(); 1302 EHdr->e_version = EV_CURRENT; 1303 EHdr->e_entry = getEntryAddr<ELFT>(); 1304 EHdr->e_shoff = SectionHeaderOff; 1305 EHdr->e_ehsize = sizeof(Elf_Ehdr); 1306 EHdr->e_phnum = Phdrs.size(); 1307 EHdr->e_shentsize = sizeof(Elf_Shdr); 1308 EHdr->e_shnum = OutputSections.size() + 1; 1309 EHdr->e_shstrndx = Out<ELFT>::ShStrTab->SectionIndex; 1310 1311 if (Config->EMachine == EM_MIPS) 1312 EHdr->e_flags = getMipsEFlags(ELFT::Is64Bits); 1313 1314 if (!Config->Relocatable) { 1315 EHdr->e_phoff = sizeof(Elf_Ehdr); 1316 EHdr->e_phentsize = sizeof(Elf_Phdr); 1317 } 1318 1319 // Write the program header table. 1320 auto *HBuf = reinterpret_cast<Elf_Phdr *>(Buf + EHdr->e_phoff); 1321 for (Phdr &P : Phdrs) 1322 *HBuf++ = P.H; 1323 1324 // Write the section header table. Note that the first table entry is null. 1325 auto *SHdrs = reinterpret_cast<Elf_Shdr *>(Buf + EHdr->e_shoff); 1326 for (OutputSectionBase<ELFT> *Sec : OutputSections) 1327 Sec->writeHeaderTo(++SHdrs); 1328 } 1329 1330 template <class ELFT> void Writer<ELFT>::openFile() { 1331 ErrorOr<std::unique_ptr<FileOutputBuffer>> BufferOrErr = 1332 FileOutputBuffer::create(Config->OutputFile, FileSize, 1333 FileOutputBuffer::F_executable); 1334 if (BufferOrErr) 1335 Buffer = std::move(*BufferOrErr); 1336 else 1337 error(BufferOrErr, "failed to open " + Config->OutputFile); 1338 } 1339 1340 // Write section contents to a mmap'ed file. 1341 template <class ELFT> void Writer<ELFT>::writeSections() { 1342 uint8_t *Buf = Buffer->getBufferStart(); 1343 1344 // PPC64 needs to process relocations in the .opd section before processing 1345 // relocations in code-containing sections. 1346 if (OutputSectionBase<ELFT> *Sec = Out<ELFT>::Opd) { 1347 Out<ELFT>::OpdBuf = Buf + Sec->getFileOff(); 1348 Sec->writeTo(Buf + Sec->getFileOff()); 1349 } 1350 1351 for (OutputSectionBase<ELFT> *Sec : OutputSections) 1352 if (Sec != Out<ELFT>::Opd) 1353 Sec->writeTo(Buf + Sec->getFileOff()); 1354 } 1355 1356 template <class ELFT> void Writer<ELFT>::writeBuildId() { 1357 BuildIdSection<ELFT> *S = Out<ELFT>::BuildId; 1358 if (!S) 1359 return; 1360 1361 // Compute a hash of all sections except .debug_* sections. 1362 // We skip debug sections because they tend to be very large 1363 // and their contents are very likely to be the same as long as 1364 // other sections are the same. 1365 uint8_t *Start = Buffer->getBufferStart(); 1366 uint8_t *Last = Start; 1367 std::vector<ArrayRef<uint8_t>> Regions; 1368 for (OutputSectionBase<ELFT> *Sec : OutputSections) { 1369 uint8_t *End = Start + Sec->getFileOff(); 1370 if (!Sec->getName().startswith(".debug_")) 1371 Regions.push_back({Last, End}); 1372 Last = End; 1373 } 1374 Regions.push_back({Last, Start + FileSize}); 1375 S->writeBuildId(Regions); 1376 } 1377 1378 template void elf::writeResult<ELF32LE>(SymbolTable<ELF32LE> *Symtab); 1379 template void elf::writeResult<ELF32BE>(SymbolTable<ELF32BE> *Symtab); 1380 template void elf::writeResult<ELF64LE>(SymbolTable<ELF64LE> *Symtab); 1381 template void elf::writeResult<ELF64BE>(SymbolTable<ELF64BE> *Symtab); 1382