1f7c5fbb1SRui Ueyama //===- LinkerScript.cpp ---------------------------------------------------===// 2f7c5fbb1SRui Ueyama // 3f7c5fbb1SRui Ueyama // The LLVM Linker 4f7c5fbb1SRui Ueyama // 5f7c5fbb1SRui Ueyama // This file is distributed under the University of Illinois Open Source 6f7c5fbb1SRui Ueyama // License. See LICENSE.TXT for details. 7f7c5fbb1SRui Ueyama // 8f7c5fbb1SRui Ueyama //===----------------------------------------------------------------------===// 9f7c5fbb1SRui Ueyama // 10f7c5fbb1SRui Ueyama // This file contains the parser/evaluator of the linker script. 11629e0aa5SRui Ueyama // It parses a linker script and write the result to Config or ScriptConfig 12629e0aa5SRui Ueyama // objects. 13629e0aa5SRui Ueyama // 14629e0aa5SRui Ueyama // If SECTIONS command is used, a ScriptConfig contains an AST 15629e0aa5SRui Ueyama // of the command which will later be consumed by createSections() and 16629e0aa5SRui Ueyama // assignAddresses(). 17f7c5fbb1SRui Ueyama // 18f7c5fbb1SRui Ueyama //===----------------------------------------------------------------------===// 19f7c5fbb1SRui Ueyama 20717677afSRui Ueyama #include "LinkerScript.h" 21f7c5fbb1SRui Ueyama #include "Config.h" 22f7c5fbb1SRui Ueyama #include "Driver.h" 231ebc8ed7SRui Ueyama #include "InputSection.h" 24652852c5SGeorge Rimar #include "OutputSections.h" 25e77b5bf6SAdhemerval Zanella #include "ScriptParser.h" 2693c9af42SRui Ueyama #include "Strings.h" 27eda81a1bSEugene Leviant #include "Symbols.h" 28f7c5fbb1SRui Ueyama #include "SymbolTable.h" 29467c4d55SEugene Leviant #include "Target.h" 30bbe38602SEugene Leviant #include "Writer.h" 31960504b9SRui Ueyama #include "llvm/ADT/StringSwitch.h" 32652852c5SGeorge Rimar #include "llvm/Support/ELF.h" 33f7c5fbb1SRui Ueyama #include "llvm/Support/FileSystem.h" 34f7c5fbb1SRui Ueyama #include "llvm/Support/MemoryBuffer.h" 35f03f3cc1SRui Ueyama #include "llvm/Support/Path.h" 36a47ee68dSRui Ueyama #include "llvm/Support/StringSaver.h" 37f7c5fbb1SRui Ueyama 38f7c5fbb1SRui Ueyama using namespace llvm; 39652852c5SGeorge Rimar using namespace llvm::ELF; 401ebc8ed7SRui Ueyama using namespace llvm::object; 41f7c5fbb1SRui Ueyama using namespace lld; 42e0df00b9SRafael Espindola using namespace lld::elf; 43f7c5fbb1SRui Ueyama 44884e786dSGeorge Rimar LinkerScriptBase *elf::ScriptBase; 4507320e40SRui Ueyama ScriptConfiguration *elf::ScriptConfig; 46717677afSRui Ueyama 476c55f0e3SGeorge Rimar template <class ELFT> static void addRegular(SymbolAssignment *Cmd) { 481602421cSRui Ueyama Symbol *Sym = Symtab<ELFT>::X->addRegular(Cmd->Name, STB_GLOBAL, STV_DEFAULT); 491602421cSRui Ueyama Sym->Visibility = Cmd->Hidden ? STV_HIDDEN : STV_DEFAULT; 501602421cSRui Ueyama Cmd->Sym = Sym->body(); 5120d03194SEugene Leviant 5220d03194SEugene Leviant // If we have no SECTIONS then we don't have '.' and don't call 5320d03194SEugene Leviant // assignAddresses(). We calculate symbol value immediately in this case. 5420d03194SEugene Leviant if (!ScriptConfig->HasSections) 5520d03194SEugene Leviant cast<DefinedRegular<ELFT>>(Cmd->Sym)->Value = Cmd->Expression(0); 56ceabe80eSEugene Leviant } 57ceabe80eSEugene Leviant 580c70d3ccSRui Ueyama template <class ELFT> static void addSynthetic(SymbolAssignment *Cmd) { 59e1937bb5SGeorge Rimar Symbol *Sym = Symtab<ELFT>::X->addSynthetic( 60e1937bb5SGeorge Rimar Cmd->Name, nullptr, 0, Cmd->Hidden ? STV_HIDDEN : STV_DEFAULT); 611602421cSRui Ueyama Cmd->Sym = Sym->body(); 62ceabe80eSEugene Leviant } 63ceabe80eSEugene Leviant 64db741e72SEugene Leviant template <class ELFT> static void addSymbol(SymbolAssignment *Cmd) { 65db741e72SEugene Leviant if (Cmd->IsAbsolute) 66db741e72SEugene Leviant addRegular<ELFT>(Cmd); 67db741e72SEugene Leviant else 68db741e72SEugene Leviant addSynthetic<ELFT>(Cmd); 69db741e72SEugene Leviant } 701602421cSRui Ueyama // If a symbol was in PROVIDE(), we need to define it only when 711602421cSRui Ueyama // it is an undefined symbol. 721602421cSRui Ueyama template <class ELFT> static bool shouldDefine(SymbolAssignment *Cmd) { 731602421cSRui Ueyama if (Cmd->Name == ".") 74ceabe80eSEugene Leviant return false; 751602421cSRui Ueyama if (!Cmd->Provide) 76ceabe80eSEugene Leviant return true; 771602421cSRui Ueyama SymbolBody *B = Symtab<ELFT>::X->find(Cmd->Name); 781602421cSRui Ueyama return B && B->isUndefined(); 79ceabe80eSEugene Leviant } 80ceabe80eSEugene Leviant 81076fe157SGeorge Rimar bool SymbolAssignment::classof(const BaseCommand *C) { 82076fe157SGeorge Rimar return C->Kind == AssignmentKind; 83076fe157SGeorge Rimar } 84076fe157SGeorge Rimar 85076fe157SGeorge Rimar bool OutputSectionCommand::classof(const BaseCommand *C) { 86076fe157SGeorge Rimar return C->Kind == OutputSectionKind; 87076fe157SGeorge Rimar } 88076fe157SGeorge Rimar 89eea3114fSGeorge Rimar bool InputSectionDescription::classof(const BaseCommand *C) { 90eea3114fSGeorge Rimar return C->Kind == InputSectionKind; 91eea3114fSGeorge Rimar } 92eea3114fSGeorge Rimar 93eefa758eSGeorge Rimar bool AssertCommand::classof(const BaseCommand *C) { 94eefa758eSGeorge Rimar return C->Kind == AssertKind; 95eefa758eSGeorge Rimar } 96eefa758eSGeorge Rimar 9736a153cdSRui Ueyama template <class ELFT> static bool isDiscarded(InputSectionBase<ELFT> *S) { 98eea3114fSGeorge Rimar return !S || !S->Live; 99717677afSRui Ueyama } 100717677afSRui Ueyama 101f34d0e08SRui Ueyama template <class ELFT> LinkerScript<ELFT>::LinkerScript() {} 102f34d0e08SRui Ueyama template <class ELFT> LinkerScript<ELFT>::~LinkerScript() {} 103f34d0e08SRui Ueyama 10407320e40SRui Ueyama template <class ELFT> 10507320e40SRui Ueyama bool LinkerScript<ELFT>::shouldKeep(InputSectionBase<ELFT> *S) { 106c91930a1SGeorge Rimar for (Regex *Re : Opt.KeptSections) 107042a3f20SRafael Espindola if (Re->match(S->Name)) 108eea3114fSGeorge Rimar return true; 109eea3114fSGeorge Rimar return false; 110eea3114fSGeorge Rimar } 111eea3114fSGeorge Rimar 112395281cfSGeorge Rimar static bool fileMatches(const llvm::Regex &FileRe, 113395281cfSGeorge Rimar const llvm::Regex &ExcludedFileRe, StringRef Filename) { 114395281cfSGeorge Rimar return const_cast<Regex &>(FileRe).match(Filename) && 115395281cfSGeorge Rimar !const_cast<Regex &>(ExcludedFileRe).match(Filename); 1160659800eSGeorge Rimar } 1170659800eSGeorge Rimar 118575208caSGeorge Rimar static bool comparePriority(InputSectionData *A, InputSectionData *B) { 119575208caSGeorge Rimar return getPriority(A->Name) < getPriority(B->Name); 120575208caSGeorge Rimar } 121575208caSGeorge Rimar 122c0028d3dSRafael Espindola static bool compareName(InputSectionData *A, InputSectionData *B) { 123042a3f20SRafael Espindola return A->Name < B->Name; 1240702c4e8SGeorge Rimar } 125742c3836SRui Ueyama 126c0028d3dSRafael Espindola static bool compareAlignment(InputSectionData *A, InputSectionData *B) { 127742c3836SRui Ueyama // ">" is not a mistake. Larger alignments are placed before smaller 128742c3836SRui Ueyama // alignments in order to reduce the amount of padding necessary. 129742c3836SRui Ueyama // This is compatible with GNU. 130742c3836SRui Ueyama return A->Alignment > B->Alignment; 131742c3836SRui Ueyama } 132742c3836SRui Ueyama 133c0028d3dSRafael Espindola static std::function<bool(InputSectionData *, InputSectionData *)> 134be394db3SGeorge Rimar getComparator(SortSectionPolicy K) { 135be394db3SGeorge Rimar switch (K) { 136be394db3SGeorge Rimar case SortSectionPolicy::Alignment: 137c0028d3dSRafael Espindola return compareAlignment; 138be394db3SGeorge Rimar case SortSectionPolicy::Name: 139be394db3SGeorge Rimar return compareName; 140be394db3SGeorge Rimar case SortSectionPolicy::Priority: 141be394db3SGeorge Rimar return comparePriority; 142be394db3SGeorge Rimar default: 143be394db3SGeorge Rimar llvm_unreachable("unknown sort policy"); 144be394db3SGeorge Rimar } 145742c3836SRui Ueyama } 1460702c4e8SGeorge Rimar 1478f66df92SGeorge Rimar static bool checkConstraint(uint64_t Flags, ConstraintKind Kind) { 1488f66df92SGeorge Rimar bool RO = (Kind == ConstraintKind::ReadOnly); 1498f66df92SGeorge Rimar bool RW = (Kind == ConstraintKind::ReadWrite); 1508f66df92SGeorge Rimar bool Writable = Flags & SHF_WRITE; 151adcdb664SRui Ueyama return !(RO && Writable) && !(RW && !Writable); 1528f66df92SGeorge Rimar } 1538f66df92SGeorge Rimar 15448c3f1ceSRui Ueyama template <class ELFT> 155e71a3f8aSRafael Espindola static bool matchConstraints(ArrayRef<InputSectionBase<ELFT> *> Sections, 15606ae6836SGeorge Rimar ConstraintKind Kind) { 1578f66df92SGeorge Rimar if (Kind == ConstraintKind::NoConstraint) 1588f66df92SGeorge Rimar return true; 159d3190795SRafael Espindola return llvm::all_of(Sections, [=](InputSectionData *Sec2) { 160d3190795SRafael Espindola auto *Sec = static_cast<InputSectionBase<ELFT> *>(Sec2); 1618f66df92SGeorge Rimar return checkConstraint(Sec->getSectionHdr()->sh_flags, Kind); 16206ae6836SGeorge Rimar }); 16306ae6836SGeorge Rimar } 16406ae6836SGeorge Rimar 165d3190795SRafael Espindola // Compute and remember which sections the InputSectionDescription matches. 166be94e1b6SRafael Espindola template <class ELFT> 167e71a3f8aSRafael Espindola void LinkerScript<ELFT>::computeInputSections(InputSectionDescription *I) { 168395281cfSGeorge Rimar for (const std::pair<llvm::Regex, llvm::Regex> &V : I->SectionsVec) { 169395281cfSGeorge Rimar for (ObjectFile<ELFT> *F : Symtab<ELFT>::X->getObjectFiles()) { 170395281cfSGeorge Rimar if (fileMatches(I->FileRe, V.first, sys::path::filename(F->getName()))) { 171395281cfSGeorge Rimar Regex &Re = const_cast<Regex &>(V.second); 172be94e1b6SRafael Espindola for (InputSectionBase<ELFT> *S : F->getSections()) 173395281cfSGeorge Rimar if (!isDiscarded(S) && !S->OutSec && Re.match(S->Name)) 174d3190795SRafael Espindola I->Sections.push_back(S); 175be94e1b6SRafael Espindola 176395281cfSGeorge Rimar if (Re.match("COMMON")) 177d3190795SRafael Espindola I->Sections.push_back(CommonInputSection<ELFT>::X); 178395281cfSGeorge Rimar } 179395281cfSGeorge Rimar } 180395281cfSGeorge Rimar } 181d3190795SRafael Espindola 182*b2a0abdfSRui Ueyama if (I->SortInner != SortSectionPolicy::Default) 183d3190795SRafael Espindola std::stable_sort(I->Sections.begin(), I->Sections.end(), 184d3190795SRafael Espindola getComparator(I->SortInner)); 185*b2a0abdfSRui Ueyama if (I->SortOuter != SortSectionPolicy::Default) 186d3190795SRafael Espindola std::stable_sort(I->Sections.begin(), I->Sections.end(), 187d3190795SRafael Espindola getComparator(I->SortOuter)); 188d3190795SRafael Espindola 189d3190795SRafael Espindola // We do not add duplicate input sections, so mark them with a dummy output 190d3190795SRafael Espindola // section for now. 191d3190795SRafael Espindola for (InputSectionData *S : I->Sections) { 192d3190795SRafael Espindola auto *S2 = static_cast<InputSectionBase<ELFT> *>(S); 193d3190795SRafael Espindola S2->OutSec = (OutputSectionBase<ELFT> *)-1; 194d3190795SRafael Espindola } 195be94e1b6SRafael Espindola } 196be94e1b6SRafael Espindola 197be94e1b6SRafael Espindola template <class ELFT> 198be94e1b6SRafael Espindola void LinkerScript<ELFT>::discard(ArrayRef<InputSectionBase<ELFT> *> V) { 199be94e1b6SRafael Espindola for (InputSectionBase<ELFT> *S : V) { 200be94e1b6SRafael Espindola S->Live = false; 201be94e1b6SRafael Espindola reportDiscarded(S); 202be94e1b6SRafael Espindola } 203be94e1b6SRafael Espindola } 204be94e1b6SRafael Espindola 20506ae6836SGeorge Rimar template <class ELFT> 2060b9ce6a4SRui Ueyama std::vector<InputSectionBase<ELFT> *> 20706ae6836SGeorge Rimar LinkerScript<ELFT>::createInputSectionList(OutputSectionCommand &OutCmd) { 2080b9ce6a4SRui Ueyama std::vector<InputSectionBase<ELFT> *> Ret; 209e7f912cdSRui Ueyama 21006ae6836SGeorge Rimar for (const std::unique_ptr<BaseCommand> &Base : OutCmd.Commands) { 2117c3ff2ebSRafael Espindola auto *Cmd = dyn_cast<InputSectionDescription>(Base.get()); 2127c3ff2ebSRafael Espindola if (!Cmd) 2130b9ce6a4SRui Ueyama continue; 214e71a3f8aSRafael Espindola computeInputSections(Cmd); 215d3190795SRafael Espindola for (InputSectionData *S : Cmd->Sections) 216d3190795SRafael Espindola Ret.push_back(static_cast<InputSectionBase<ELFT> *>(S)); 2170b9ce6a4SRui Ueyama } 218e71a3f8aSRafael Espindola 2190b9ce6a4SRui Ueyama return Ret; 2200b9ce6a4SRui Ueyama } 2210b9ce6a4SRui Ueyama 222e5d3ca50SPetr Hosek template <class ELFT> 22310897f18SRafael Espindola static SectionKey<ELFT::Is64Bits> createKey(InputSectionBase<ELFT> *C, 22410897f18SRafael Espindola StringRef OutsecName) { 22510897f18SRafael Espindola // When using linker script the merge rules are different. 22610897f18SRafael Espindola // Unfortunately, linker scripts are name based. This means that expressions 22710897f18SRafael Espindola // like *(.foo*) can refer to multiple input sections that would normally be 22810897f18SRafael Espindola // placed in different output sections. We cannot put them in different 22910897f18SRafael Espindola // output sections or we would produce wrong results for 23010897f18SRafael Espindola // start = .; *(.foo.*) end = .; *(.bar) 23110897f18SRafael Espindola // and a mapping of .foo1 and .bar1 to one section and .foo2 and .bar2 to 23210897f18SRafael Espindola // another. The problem is that there is no way to layout those output 23310897f18SRafael Espindola // sections such that the .foo sections are the only thing between the 23410897f18SRafael Espindola // start and end symbols. 23510897f18SRafael Espindola 23610897f18SRafael Espindola // An extra annoyance is that we cannot simply disable merging of the contents 23710897f18SRafael Espindola // of SHF_MERGE sections, but our implementation requires one output section 23810897f18SRafael Espindola // per "kind" (string or not, which size/aligment). 23910897f18SRafael Espindola // Fortunately, creating symbols in the middle of a merge section is not 24010897f18SRafael Espindola // supported by bfd or gold, so we can just create multiple section in that 24110897f18SRafael Espindola // case. 24210897f18SRafael Espindola const typename ELFT::Shdr *H = C->getSectionHdr(); 24310897f18SRafael Espindola typedef typename ELFT::uint uintX_t; 24410897f18SRafael Espindola uintX_t Flags = H->sh_flags & (SHF_MERGE | SHF_STRINGS); 24510897f18SRafael Espindola 24610897f18SRafael Espindola uintX_t Alignment = 0; 24710897f18SRafael Espindola if (isa<MergeInputSection<ELFT>>(C)) 24810897f18SRafael Espindola Alignment = std::max(H->sh_addralign, H->sh_entsize); 24910897f18SRafael Espindola 25010897f18SRafael Espindola return SectionKey<ELFT::Is64Bits>{OutsecName, /*Type*/ 0, Flags, Alignment}; 25110897f18SRafael Espindola } 25210897f18SRafael Espindola 25310897f18SRafael Espindola template <class ELFT> 25420d03194SEugene Leviant void LinkerScript<ELFT>::addSection(OutputSectionFactory<ELFT> &Factory, 25520d03194SEugene Leviant InputSectionBase<ELFT> *Sec, 25620d03194SEugene Leviant StringRef Name) { 25728c1597aSRafael Espindola OutputSectionBase<ELFT> *OutSec; 25828c1597aSRafael Espindola bool IsNew; 25910897f18SRafael Espindola std::tie(OutSec, IsNew) = Factory.create(createKey(Sec, Name), Sec); 26028c1597aSRafael Espindola if (IsNew) 26128c1597aSRafael Espindola OutputSections->push_back(OutSec); 26220d03194SEugene Leviant OutSec->addSection(Sec); 26320d03194SEugene Leviant } 26420d03194SEugene Leviant 26520d03194SEugene Leviant template <class ELFT> 26620d03194SEugene Leviant void LinkerScript<ELFT>::processCommands(OutputSectionFactory<ELFT> &Factory) { 26728c1597aSRafael Espindola 2687c3ff2ebSRafael Espindola for (unsigned I = 0; I < Opt.Commands.size(); ++I) { 2697c3ff2ebSRafael Espindola auto Iter = Opt.Commands.begin() + I; 2707c3ff2ebSRafael Espindola const std::unique_ptr<BaseCommand> &Base1 = *Iter; 2712ab5f73dSRui Ueyama if (auto *Cmd = dyn_cast<SymbolAssignment>(Base1.get())) { 2722ab5f73dSRui Ueyama if (shouldDefine<ELFT>(Cmd)) 2732ab5f73dSRui Ueyama addRegular<ELFT>(Cmd); 2742ab5f73dSRui Ueyama continue; 2752ab5f73dSRui Ueyama } 27620d03194SEugene Leviant if (auto *Cmd = dyn_cast<AssertCommand>(Base1.get())) { 27720d03194SEugene Leviant // If we don't have SECTIONS then output sections have already been 27820d03194SEugene Leviant // created by Writer<EFLT>. The LinkerScript<ELFT>::assignAddresses 27920d03194SEugene Leviant // will not be called, so ASSERT should be evaluated now. 28020d03194SEugene Leviant if (!Opt.HasSections) 28120d03194SEugene Leviant Cmd->Expression(0); 28220d03194SEugene Leviant continue; 28320d03194SEugene Leviant } 2842ab5f73dSRui Ueyama 285ceabe80eSEugene Leviant if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base1.get())) { 2867bd37870SRafael Espindola std::vector<InputSectionBase<ELFT> *> V = createInputSectionList(*Cmd); 2877bd37870SRafael Espindola 28848c3f1ceSRui Ueyama if (Cmd->Name == "/DISCARD/") { 2897bd37870SRafael Espindola discard(V); 29048c3f1ceSRui Ueyama continue; 29148c3f1ceSRui Ueyama } 2920b9ce6a4SRui Ueyama 2937c3ff2ebSRafael Espindola if (!matchConstraints<ELFT>(V, Cmd->Constraint)) { 2947c3ff2ebSRafael Espindola for (InputSectionBase<ELFT> *S : V) 2957c3ff2ebSRafael Espindola S->OutSec = nullptr; 2967c3ff2ebSRafael Espindola Opt.Commands.erase(Iter); 2977c3ff2ebSRafael Espindola continue; 2987c3ff2ebSRafael Espindola } 2997c3ff2ebSRafael Espindola 3007c3ff2ebSRafael Espindola for (const std::unique_ptr<BaseCommand> &Base : Cmd->Commands) 3017c3ff2ebSRafael Espindola if (auto *OutCmd = dyn_cast<SymbolAssignment>(Base.get())) 3027c3ff2ebSRafael Espindola if (shouldDefine<ELFT>(OutCmd)) 3037c3ff2ebSRafael Espindola addSymbol<ELFT>(OutCmd); 3047c3ff2ebSRafael Espindola 30597403d15SEugene Leviant if (V.empty()) 3060b9ce6a4SRui Ueyama continue; 3070b9ce6a4SRui Ueyama 308a14b13d8SGeorge Rimar for (InputSectionBase<ELFT> *Sec : V) { 30920d03194SEugene Leviant addSection(Factory, Sec, Cmd->Name); 31020d03194SEugene Leviant if (uint32_t Subalign = Cmd->SubalignExpr ? Cmd->SubalignExpr(0) : 0) 311db24d9c3SGeorge Rimar Sec->Alignment = Subalign; 31220d03194SEugene Leviant } 313eea3114fSGeorge Rimar } 31448c3f1ceSRui Ueyama } 315db24d9c3SGeorge Rimar } 316e63d81bdSEugene Leviant 31720d03194SEugene Leviant template <class ELFT> 31820d03194SEugene Leviant void LinkerScript<ELFT>::createSections(OutputSectionFactory<ELFT> &Factory) { 31920d03194SEugene Leviant processCommands(Factory); 3200b9ce6a4SRui Ueyama // Add orphan sections. 32120d03194SEugene Leviant for (ObjectFile<ELFT> *F : Symtab<ELFT>::X->getObjectFiles()) 32220d03194SEugene Leviant for (InputSectionBase<ELFT> *S : F->getSections()) 32320d03194SEugene Leviant if (!isDiscarded(S) && !S->OutSec) 32420d03194SEugene Leviant addSection(Factory, S, getOutputSectionName(S)); 325e63d81bdSEugene Leviant } 326e63d81bdSEugene Leviant 327db741e72SEugene Leviant // Sets value of a section-defined symbol. Two kinds of 328db741e72SEugene Leviant // symbols are processed: synthetic symbols, whose value 329db741e72SEugene Leviant // is an offset from beginning of section and regular 330db741e72SEugene Leviant // symbols whose value is absolute. 331db741e72SEugene Leviant template <class ELFT> 332db741e72SEugene Leviant static void assignSectionSymbol(SymbolAssignment *Cmd, 333db741e72SEugene Leviant OutputSectionBase<ELFT> *Sec, 334db741e72SEugene Leviant typename ELFT::uint Off) { 335db741e72SEugene Leviant if (!Cmd->Sym) 336db741e72SEugene Leviant return; 337db741e72SEugene Leviant 338db741e72SEugene Leviant if (auto *Body = dyn_cast<DefinedSynthetic<ELFT>>(Cmd->Sym)) { 339db741e72SEugene Leviant Body->Section = Sec; 340db741e72SEugene Leviant Body->Value = Cmd->Expression(Sec->getVA() + Off) - Sec->getVA(); 341db741e72SEugene Leviant return; 342db741e72SEugene Leviant } 343db741e72SEugene Leviant auto *Body = cast<DefinedRegular<ELFT>>(Cmd->Sym); 344db741e72SEugene Leviant Body->Value = Cmd->Expression(Sec->getVA() + Off); 345db741e72SEugene Leviant } 346db741e72SEugene Leviant 347d3190795SRafael Espindola template <class ELFT> void LinkerScript<ELFT>::output(InputSection<ELFT> *S) { 348d3190795SRafael Espindola if (!AlreadyOutputIS.insert(S).second) 349ceabe80eSEugene Leviant return; 350d3190795SRafael Espindola bool IsTbss = 351d3190795SRafael Espindola (CurOutSec->getFlags() & SHF_TLS) && CurOutSec->getType() == SHT_NOBITS; 352d3190795SRafael Espindola 353d3190795SRafael Espindola uintX_t Pos = IsTbss ? Dot + ThreadBssOffset : Dot; 354d3190795SRafael Espindola Pos = alignTo(Pos, S->Alignment); 355d3190795SRafael Espindola S->OutSecOff = Pos - CurOutSec->getVA(); 356d3190795SRafael Espindola Pos += S->getSize(); 357d3190795SRafael Espindola 358d3190795SRafael Espindola // Update output section size after adding each section. This is so that 359d3190795SRafael Espindola // SIZEOF works correctly in the case below: 360d3190795SRafael Espindola // .foo { *(.aaa) a = SIZEOF(.foo); *(.bbb) } 361d3190795SRafael Espindola CurOutSec->setSize(Pos - CurOutSec->getVA()); 362d3190795SRafael Espindola 363d3190795SRafael Espindola if (!IsTbss) 364d3190795SRafael Espindola Dot = Pos; 3652de509c3SRui Ueyama } 366ceabe80eSEugene Leviant 367d3190795SRafael Espindola template <class ELFT> void LinkerScript<ELFT>::flush() { 368d3190795SRafael Espindola if (auto *OutSec = dyn_cast_or_null<OutputSection<ELFT>>(CurOutSec)) { 369d3190795SRafael Espindola for (InputSection<ELFT> *I : OutSec->Sections) 370d3190795SRafael Espindola output(I); 371d3190795SRafael Espindola AlreadyOutputOS.insert(CurOutSec); 372d3190795SRafael Espindola } 373d3190795SRafael Espindola } 37497403d15SEugene Leviant 375d3190795SRafael Espindola template <class ELFT> 376d3190795SRafael Espindola void LinkerScript<ELFT>::switchTo(OutputSectionBase<ELFT> *Sec) { 377d3190795SRafael Espindola if (CurOutSec == Sec) 378d3190795SRafael Espindola return; 379d3190795SRafael Espindola if (AlreadyOutputOS.count(Sec)) 380d3190795SRafael Espindola return; 381d3190795SRafael Espindola 382d3190795SRafael Espindola flush(); 383d3190795SRafael Espindola CurOutSec = Sec; 384d3190795SRafael Espindola 385d3190795SRafael Espindola Dot = alignTo(Dot, CurOutSec->getAlignment()); 386d3190795SRafael Espindola CurOutSec->setVA(Dot); 387d3190795SRafael Espindola } 388d3190795SRafael Espindola 389d3190795SRafael Espindola template <class ELFT> void LinkerScript<ELFT>::process(BaseCommand &Base) { 390d3190795SRafael Espindola if (auto *AssignCmd = dyn_cast<SymbolAssignment>(&Base)) { 39197403d15SEugene Leviant if (AssignCmd->Name == ".") { 39297403d15SEugene Leviant // Update to location counter means update to section size. 393d3190795SRafael Espindola Dot = AssignCmd->Expression(Dot); 394d3190795SRafael Espindola CurOutSec->setSize(Dot - CurOutSec->getVA()); 395d3190795SRafael Espindola return; 39697403d15SEugene Leviant } 397d3190795SRafael Espindola assignSectionSymbol<ELFT>(AssignCmd, CurOutSec, Dot - CurOutSec->getVA()); 398d3190795SRafael Espindola return; 39997403d15SEugene Leviant } 400d3190795SRafael Espindola auto &ICmd = cast<InputSectionDescription>(Base); 401d3190795SRafael Espindola for (InputSectionData *ID : ICmd.Sections) { 402d3190795SRafael Espindola auto *IB = static_cast<InputSectionBase<ELFT> *>(ID); 403d3190795SRafael Espindola switchTo(IB->OutSec); 404d3190795SRafael Espindola if (auto *I = dyn_cast<InputSection<ELFT>>(IB)) 405d3190795SRafael Espindola output(I); 406d3190795SRafael Espindola else if (AlreadyOutputOS.insert(CurOutSec).second) 407d3190795SRafael Espindola Dot += CurOutSec->getSize(); 408ceabe80eSEugene Leviant } 409ceabe80eSEugene Leviant } 410ceabe80eSEugene Leviant 4118f66df92SGeorge Rimar template <class ELFT> 412a14b13d8SGeorge Rimar static std::vector<OutputSectionBase<ELFT> *> 413a14b13d8SGeorge Rimar findSections(OutputSectionCommand &Cmd, 414d3190795SRafael Espindola const std::vector<OutputSectionBase<ELFT> *> &Sections) { 415a14b13d8SGeorge Rimar std::vector<OutputSectionBase<ELFT> *> Ret; 416a14b13d8SGeorge Rimar for (OutputSectionBase<ELFT> *Sec : Sections) 4177c3ff2ebSRafael Espindola if (Sec->getName() == Cmd.Name) 418a14b13d8SGeorge Rimar Ret.push_back(Sec); 419a14b13d8SGeorge Rimar return Ret; 4208f66df92SGeorge Rimar } 4218f66df92SGeorge Rimar 422d3190795SRafael Espindola template <class ELFT> 423d3190795SRafael Espindola void LinkerScript<ELFT>::assignOffsets(OutputSectionCommand *Cmd) { 424d3190795SRafael Espindola std::vector<OutputSectionBase<ELFT> *> Sections = 425d3190795SRafael Espindola findSections(*Cmd, *OutputSections); 426d3190795SRafael Espindola if (Sections.empty()) 427d3190795SRafael Espindola return; 428d3190795SRafael Espindola switchTo(Sections[0]); 429d3190795SRafael Espindola 430d3190795SRafael Espindola // Find the last section output location. We will output orphan sections 431d3190795SRafael Espindola // there so that end symbols point to the correct location. 432d3190795SRafael Espindola auto E = std::find_if(Cmd->Commands.rbegin(), Cmd->Commands.rend(), 433d3190795SRafael Espindola [](const std::unique_ptr<BaseCommand> &Cmd) { 434d3190795SRafael Espindola return !isa<SymbolAssignment>(*Cmd); 435d3190795SRafael Espindola }) 436d3190795SRafael Espindola .base(); 437d3190795SRafael Espindola for (auto I = Cmd->Commands.begin(); I != E; ++I) 438d3190795SRafael Espindola process(**I); 439d3190795SRafael Espindola flush(); 440d3190795SRafael Espindola for (OutputSectionBase<ELFT> *Base : Sections) { 441d3190795SRafael Espindola if (!AlreadyOutputOS.insert(Base).second) 442d3190795SRafael Espindola continue; 443d3190795SRafael Espindola switchTo(Base); 444d3190795SRafael Espindola Dot += CurOutSec->getSize(); 445d3190795SRafael Espindola } 446d3190795SRafael Espindola for (auto I = E, E = Cmd->Commands.end(); I != E; ++I) 447d3190795SRafael Espindola process(**I); 448d3190795SRafael Espindola } 449d3190795SRafael Espindola 450a4b41dcaSRafael Espindola template <class ELFT> void LinkerScript<ELFT>::assignAddresses() { 451652852c5SGeorge Rimar // Orphan sections are sections present in the input files which 4527c18c28cSRui Ueyama // are not explicitly placed into the output file by the linker script. 4537c18c28cSRui Ueyama // We place orphan sections at end of file. 4547c18c28cSRui Ueyama // Other linkers places them using some heuristics as described in 455652852c5SGeorge Rimar // https://sourceware.org/binutils/docs/ld/Orphan-Sections.html#Orphan-Sections. 456e5cc668eSRui Ueyama for (OutputSectionBase<ELFT> *Sec : *OutputSections) { 457652852c5SGeorge Rimar StringRef Name = Sec->getName(); 458c3e2a4b0SRui Ueyama if (getSectionIndex(Name) == INT_MAX) 459076fe157SGeorge Rimar Opt.Commands.push_back(llvm::make_unique<OutputSectionCommand>(Name)); 460652852c5SGeorge Rimar } 461652852c5SGeorge Rimar 4627c18c28cSRui Ueyama // Assign addresses as instructed by linker script SECTIONS sub-commands. 4634f7500bfSRui Ueyama Dot = getHeaderSize(); 464467c4d55SEugene Leviant uintX_t MinVA = std::numeric_limits<uintX_t>::max(); 465652852c5SGeorge Rimar 466076fe157SGeorge Rimar for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands) { 467076fe157SGeorge Rimar if (auto *Cmd = dyn_cast<SymbolAssignment>(Base.get())) { 4688d083e6aSRui Ueyama if (Cmd->Name == ".") { 4698d083e6aSRui Ueyama Dot = Cmd->Expression(Dot); 4708d083e6aSRui Ueyama } else if (Cmd->Sym) { 4718d083e6aSRui Ueyama cast<DefinedRegular<ELFT>>(Cmd->Sym)->Value = Cmd->Expression(Dot); 4728d083e6aSRui Ueyama } 47305ef4cffSRui Ueyama continue; 474652852c5SGeorge Rimar } 475652852c5SGeorge Rimar 476eefa758eSGeorge Rimar if (auto *Cmd = dyn_cast<AssertCommand>(Base.get())) { 477eefa758eSGeorge Rimar Cmd->Expression(Dot); 478eefa758eSGeorge Rimar continue; 479eefa758eSGeorge Rimar } 480eefa758eSGeorge Rimar 481076fe157SGeorge Rimar auto *Cmd = cast<OutputSectionCommand>(Base.get()); 482652852c5SGeorge Rimar 48358e5c4dcSGeorge Rimar if (Cmd->AddrExpr) 48458e5c4dcSGeorge Rimar Dot = Cmd->AddrExpr(Dot); 48558e5c4dcSGeorge Rimar 486467c4d55SEugene Leviant MinVA = std::min(MinVA, Dot); 487d3190795SRafael Espindola assignOffsets(Cmd); 488a14b13d8SGeorge Rimar } 489467c4d55SEugene Leviant 490d3190795SRafael Espindola for (OutputSectionBase<ELFT> *Sec : *OutputSections) 491d3190795SRafael Espindola if (!(Sec->getFlags() & SHF_ALLOC)) 492d3190795SRafael Espindola Sec->setVA(0); 4934ec013acSRafael Espindola uintX_t HeaderSize = 4944ec013acSRafael Espindola Out<ELFT>::ElfHeader->getSize() + Out<ELFT>::ProgramHeaders->getSize(); 4954ec013acSRafael Espindola if (HeaderSize > MinVA) 4964ec013acSRafael Espindola fatal("Not enough space for ELF and program headers"); 4974ec013acSRafael Espindola 49864c32d6fSRafael Espindola // ELF and Program headers need to be right before the first section in 499b91e7118SGeorge Rimar // memory. Set their addresses accordingly. 5004ec013acSRafael Espindola MinVA = alignDown(MinVA - HeaderSize, Target->PageSize); 501467c4d55SEugene Leviant Out<ELFT>::ElfHeader->setVA(MinVA); 502467c4d55SEugene Leviant Out<ELFT>::ProgramHeaders->setVA(Out<ELFT>::ElfHeader->getSize() + MinVA); 503fb8978fcSDima Stepanov } 504652852c5SGeorge Rimar 505464daadcSRui Ueyama // Creates program headers as instructed by PHDRS linker script command. 50607320e40SRui Ueyama template <class ELFT> 507a4b41dcaSRafael Espindola std::vector<PhdrEntry<ELFT>> LinkerScript<ELFT>::createPhdrs() { 508edebbdf1SRui Ueyama std::vector<PhdrEntry<ELFT>> Ret; 509bbe38602SEugene Leviant 510464daadcSRui Ueyama // Process PHDRS and FILEHDR keywords because they are not 511464daadcSRui Ueyama // real output sections and cannot be added in the following loop. 512bbe38602SEugene Leviant for (const PhdrsCommand &Cmd : Opt.PhdrsCommands) { 513edebbdf1SRui Ueyama Ret.emplace_back(Cmd.Type, Cmd.Flags == UINT_MAX ? PF_R : Cmd.Flags); 514edebbdf1SRui Ueyama PhdrEntry<ELFT> &Phdr = Ret.back(); 515bbe38602SEugene Leviant 516bbe38602SEugene Leviant if (Cmd.HasFilehdr) 517adca245fSRui Ueyama Phdr.add(Out<ELFT>::ElfHeader); 518bbe38602SEugene Leviant if (Cmd.HasPhdrs) 519adca245fSRui Ueyama Phdr.add(Out<ELFT>::ProgramHeaders); 52056b21c86SEugene Leviant 52156b21c86SEugene Leviant if (Cmd.LMAExpr) { 52256b21c86SEugene Leviant Phdr.H.p_paddr = Cmd.LMAExpr(0); 52356b21c86SEugene Leviant Phdr.HasLMA = true; 52456b21c86SEugene Leviant } 525bbe38602SEugene Leviant } 526bbe38602SEugene Leviant 527464daadcSRui Ueyama // Add output sections to program headers. 528edebbdf1SRui Ueyama PhdrEntry<ELFT> *Load = nullptr; 529edebbdf1SRui Ueyama uintX_t Flags = PF_R; 530464daadcSRui Ueyama for (OutputSectionBase<ELFT> *Sec : *OutputSections) { 531bbe38602SEugene Leviant if (!(Sec->getFlags() & SHF_ALLOC)) 532bbe38602SEugene Leviant break; 533bbe38602SEugene Leviant 534edebbdf1SRui Ueyama std::vector<size_t> PhdrIds = getPhdrIndices(Sec->getName()); 535bbe38602SEugene Leviant if (!PhdrIds.empty()) { 536bbe38602SEugene Leviant // Assign headers specified by linker script 537bbe38602SEugene Leviant for (size_t Id : PhdrIds) { 538edebbdf1SRui Ueyama Ret[Id].add(Sec); 539865bf863SEugene Leviant if (Opt.PhdrsCommands[Id].Flags == UINT_MAX) 5400b113671SRafael Espindola Ret[Id].H.p_flags |= Sec->getPhdrFlags(); 541bbe38602SEugene Leviant } 542bbe38602SEugene Leviant } else { 543bbe38602SEugene Leviant // If we have no load segment or flags've changed then we want new load 544bbe38602SEugene Leviant // segment. 5450b113671SRafael Espindola uintX_t NewFlags = Sec->getPhdrFlags(); 546bbe38602SEugene Leviant if (Load == nullptr || Flags != NewFlags) { 547edebbdf1SRui Ueyama Load = &*Ret.emplace(Ret.end(), PT_LOAD, NewFlags); 548bbe38602SEugene Leviant Flags = NewFlags; 549bbe38602SEugene Leviant } 55018f084ffSRui Ueyama Load->add(Sec); 551bbe38602SEugene Leviant } 552bbe38602SEugene Leviant } 553edebbdf1SRui Ueyama return Ret; 554bbe38602SEugene Leviant } 555bbe38602SEugene Leviant 556f9bc3bd2SEugene Leviant template <class ELFT> bool LinkerScript<ELFT>::ignoreInterpSection() { 557f9bc3bd2SEugene Leviant // Ignore .interp section in case we have PHDRS specification 558f9bc3bd2SEugene Leviant // and PT_INTERP isn't listed. 559f9bc3bd2SEugene Leviant return !Opt.PhdrsCommands.empty() && 560f9bc3bd2SEugene Leviant llvm::find_if(Opt.PhdrsCommands, [](const PhdrsCommand &Cmd) { 561f9bc3bd2SEugene Leviant return Cmd.Type == PT_INTERP; 562f9bc3bd2SEugene Leviant }) == Opt.PhdrsCommands.end(); 563f9bc3bd2SEugene Leviant } 564f9bc3bd2SEugene Leviant 565bbe38602SEugene Leviant template <class ELFT> 56607320e40SRui Ueyama ArrayRef<uint8_t> LinkerScript<ELFT>::getFiller(StringRef Name) { 567f6c3ccefSGeorge Rimar for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands) 568f6c3ccefSGeorge Rimar if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get())) 569f6c3ccefSGeorge Rimar if (Cmd->Name == Name) 570f6c3ccefSGeorge Rimar return Cmd->Filler; 571e2ee72b5SGeorge Rimar return {}; 572e2ee72b5SGeorge Rimar } 573e2ee72b5SGeorge Rimar 574206fffa1SGeorge Rimar template <class ELFT> Expr LinkerScript<ELFT>::getLma(StringRef Name) { 5758ceadb38SGeorge Rimar for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands) 5768ceadb38SGeorge Rimar if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get())) 5778ceadb38SGeorge Rimar if (Cmd->LmaExpr && Cmd->Name == Name) 5788ceadb38SGeorge Rimar return Cmd->LmaExpr; 5798ceadb38SGeorge Rimar return {}; 5808ceadb38SGeorge Rimar } 5818ceadb38SGeorge Rimar 582c3e2a4b0SRui Ueyama // Returns the index of the given section name in linker script 583c3e2a4b0SRui Ueyama // SECTIONS commands. Sections are laid out as the same order as they 584c3e2a4b0SRui Ueyama // were in the script. If a given name did not appear in the script, 585c3e2a4b0SRui Ueyama // it returns INT_MAX, so that it will be laid out at end of file. 586076fe157SGeorge Rimar template <class ELFT> int LinkerScript<ELFT>::getSectionIndex(StringRef Name) { 587f510fa6bSRui Ueyama int I = 0; 588f510fa6bSRui Ueyama for (std::unique_ptr<BaseCommand> &Base : Opt.Commands) { 589076fe157SGeorge Rimar if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get())) 590076fe157SGeorge Rimar if (Cmd->Name == Name) 591f510fa6bSRui Ueyama return I; 592f510fa6bSRui Ueyama ++I; 593f510fa6bSRui Ueyama } 594f510fa6bSRui Ueyama return INT_MAX; 59571b26e94SGeorge Rimar } 59671b26e94SGeorge Rimar 59771b26e94SGeorge Rimar // A compartor to sort output sections. Returns -1 or 1 if 59871b26e94SGeorge Rimar // A or B are mentioned in linker script. Otherwise, returns 0. 59907320e40SRui Ueyama template <class ELFT> 60007320e40SRui Ueyama int LinkerScript<ELFT>::compareSections(StringRef A, StringRef B) { 601c3e2a4b0SRui Ueyama int I = getSectionIndex(A); 602c3e2a4b0SRui Ueyama int J = getSectionIndex(B); 603c3e2a4b0SRui Ueyama if (I == INT_MAX && J == INT_MAX) 604717677afSRui Ueyama return 0; 605717677afSRui Ueyama return I < J ? -1 : 1; 606717677afSRui Ueyama } 607717677afSRui Ueyama 608bbe38602SEugene Leviant template <class ELFT> bool LinkerScript<ELFT>::hasPhdrsCommands() { 609bbe38602SEugene Leviant return !Opt.PhdrsCommands.empty(); 610bbe38602SEugene Leviant } 611bbe38602SEugene Leviant 6129e69450eSGeorge Rimar template <class ELFT> 613884e786dSGeorge Rimar uint64_t LinkerScript<ELFT>::getOutputSectionAddress(StringRef Name) { 61496659df0SGeorge Rimar for (OutputSectionBase<ELFT> *Sec : *OutputSections) 61596659df0SGeorge Rimar if (Sec->getName() == Name) 61696659df0SGeorge Rimar return Sec->getVA(); 61796659df0SGeorge Rimar error("undefined section " + Name); 61896659df0SGeorge Rimar return 0; 61996659df0SGeorge Rimar } 62096659df0SGeorge Rimar 62196659df0SGeorge Rimar template <class ELFT> 622884e786dSGeorge Rimar uint64_t LinkerScript<ELFT>::getOutputSectionSize(StringRef Name) { 6239e69450eSGeorge Rimar for (OutputSectionBase<ELFT> *Sec : *OutputSections) 6249e69450eSGeorge Rimar if (Sec->getName() == Name) 6259e69450eSGeorge Rimar return Sec->getSize(); 6269e69450eSGeorge Rimar error("undefined section " + Name); 6279e69450eSGeorge Rimar return 0; 6289e69450eSGeorge Rimar } 6299e69450eSGeorge Rimar 63036fac7f0SEugene Leviant template <class ELFT> 63136fac7f0SEugene Leviant uint64_t LinkerScript<ELFT>::getOutputSectionAlign(StringRef Name) { 63236fac7f0SEugene Leviant for (OutputSectionBase<ELFT> *Sec : *OutputSections) 63336fac7f0SEugene Leviant if (Sec->getName() == Name) 63436fac7f0SEugene Leviant return Sec->getAlignment(); 63536fac7f0SEugene Leviant error("undefined section " + Name); 63636fac7f0SEugene Leviant return 0; 63736fac7f0SEugene Leviant } 63836fac7f0SEugene Leviant 639884e786dSGeorge Rimar template <class ELFT> uint64_t LinkerScript<ELFT>::getHeaderSize() { 640e32a3598SGeorge Rimar return Out<ELFT>::ElfHeader->getSize() + Out<ELFT>::ProgramHeaders->getSize(); 641e32a3598SGeorge Rimar } 642e32a3598SGeorge Rimar 643884e786dSGeorge Rimar template <class ELFT> uint64_t LinkerScript<ELFT>::getSymbolValue(StringRef S) { 644884e786dSGeorge Rimar if (SymbolBody *B = Symtab<ELFT>::X->find(S)) 645884e786dSGeorge Rimar return B->getVA<ELFT>(); 646884e786dSGeorge Rimar error("symbol not found: " + S); 647884e786dSGeorge Rimar return 0; 648884e786dSGeorge Rimar } 649884e786dSGeorge Rimar 650bbe38602SEugene Leviant // Returns indices of ELF headers containing specific section, identified 651bbe38602SEugene Leviant // by Name. Each index is a zero based number of ELF header listed within 652bbe38602SEugene Leviant // PHDRS {} script block. 653bbe38602SEugene Leviant template <class ELFT> 654edebbdf1SRui Ueyama std::vector<size_t> LinkerScript<ELFT>::getPhdrIndices(StringRef SectionName) { 655076fe157SGeorge Rimar for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands) { 656076fe157SGeorge Rimar auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get()); 657edebbdf1SRui Ueyama if (!Cmd || Cmd->Name != SectionName) 65831d842f5SGeorge Rimar continue; 65931d842f5SGeorge Rimar 66029c5a2a9SRui Ueyama std::vector<size_t> Ret; 66129c5a2a9SRui Ueyama for (StringRef PhdrName : Cmd->Phdrs) 66229c5a2a9SRui Ueyama Ret.push_back(getPhdrIndex(PhdrName)); 66329c5a2a9SRui Ueyama return Ret; 664bbe38602SEugene Leviant } 66531d842f5SGeorge Rimar return {}; 66631d842f5SGeorge Rimar } 667bbe38602SEugene Leviant 66829c5a2a9SRui Ueyama template <class ELFT> 66929c5a2a9SRui Ueyama size_t LinkerScript<ELFT>::getPhdrIndex(StringRef PhdrName) { 67029c5a2a9SRui Ueyama size_t I = 0; 67129c5a2a9SRui Ueyama for (PhdrsCommand &Cmd : Opt.PhdrsCommands) { 67229c5a2a9SRui Ueyama if (Cmd.Name == PhdrName) 67329c5a2a9SRui Ueyama return I; 67429c5a2a9SRui Ueyama ++I; 67529c5a2a9SRui Ueyama } 67629c5a2a9SRui Ueyama error("section header '" + PhdrName + "' is not listed in PHDRS"); 67729c5a2a9SRui Ueyama return 0; 67829c5a2a9SRui Ueyama } 67929c5a2a9SRui Ueyama 68007320e40SRui Ueyama class elf::ScriptParser : public ScriptParserBase { 681c3794e58SGeorge Rimar typedef void (ScriptParser::*Handler)(); 682c3794e58SGeorge Rimar 683f7c5fbb1SRui Ueyama public: 68407320e40SRui Ueyama ScriptParser(StringRef S, bool B) : ScriptParserBase(S), IsUnderSysroot(B) {} 685f23b2320SGeorge Rimar 68620b6598cSGeorge Rimar void readLinkerScript(); 68720b6598cSGeorge Rimar void readVersionScript(); 688f7c5fbb1SRui Ueyama 689f7c5fbb1SRui Ueyama private: 69052a1509eSRui Ueyama void addFile(StringRef Path); 69152a1509eSRui Ueyama 692f7c5fbb1SRui Ueyama void readAsNeeded(); 69390c5099eSDenis Protivensky void readEntry(); 69483f406cfSGeorge Rimar void readExtern(); 695f7c5fbb1SRui Ueyama void readGroup(); 69631aa1f83SRui Ueyama void readInclude(); 697ee59282bSRui Ueyama void readOutput(); 6989159ce93SDavide Italiano void readOutputArch(); 699f7c5fbb1SRui Ueyama void readOutputFormat(); 700bbe38602SEugene Leviant void readPhdrs(); 70168a39a65SDavide Italiano void readSearchDir(); 7028e3b38abSDenis Protivensky void readSections(); 70395769b4aSRui Ueyama void readVersion(); 70495769b4aSRui Ueyama void readVersionScriptCommand(); 7058e3b38abSDenis Protivensky 706113cdec9SRui Ueyama SymbolAssignment *readAssignment(StringRef Name); 707ff1f29e0SGeorge Rimar std::vector<uint8_t> readFill(); 70810416564SRui Ueyama OutputSectionCommand *readOutputSectionDescription(StringRef OutSec); 709ff1f29e0SGeorge Rimar std::vector<uint8_t> readOutputSectionFiller(StringRef Tok); 710bbe38602SEugene Leviant std::vector<StringRef> readOutputSectionPhdrs(); 711a2496cbeSGeorge Rimar InputSectionDescription *readInputSectionDescription(StringRef Tok); 712c91930a1SGeorge Rimar Regex readFilePatterns(); 713395281cfSGeorge Rimar void readSectionExcludes(InputSectionDescription *Cmd); 714a2496cbeSGeorge Rimar InputSectionDescription *readInputSectionRules(StringRef FilePattern); 715bbe38602SEugene Leviant unsigned readPhdrType(); 716be394db3SGeorge Rimar SortSectionPolicy readSortKind(); 717a35e39caSPetr Hosek SymbolAssignment *readProvideHidden(bool Provide, bool Hidden); 718db741e72SEugene Leviant SymbolAssignment *readProvideOrAssignment(StringRef Tok, bool MakeAbsolute); 71903fc010eSGeorge Rimar void readSort(); 720eefa758eSGeorge Rimar Expr readAssert(); 721708019c4SRui Ueyama 722708019c4SRui Ueyama Expr readExpr(); 723708019c4SRui Ueyama Expr readExpr1(Expr Lhs, int MinPrec); 724708019c4SRui Ueyama Expr readPrimary(); 725708019c4SRui Ueyama Expr readTernary(Expr Cond); 7266ad7dfccSRui Ueyama Expr readParenExpr(); 727f7c5fbb1SRui Ueyama 72820b6598cSGeorge Rimar // For parsing version script. 72920b6598cSGeorge Rimar void readExtern(std::vector<SymbolVersion> *Globals); 73095769b4aSRui Ueyama void readVersionDeclaration(StringRef VerStr); 73120b6598cSGeorge Rimar void readGlobal(StringRef VerStr); 73220b6598cSGeorge Rimar void readLocal(); 73320b6598cSGeorge Rimar 73407320e40SRui Ueyama ScriptConfiguration &Opt = *ScriptConfig; 73507320e40SRui Ueyama StringSaver Saver = {ScriptConfig->Alloc}; 73616b0cc9eSSimon Atanasyan bool IsUnderSysroot; 737f7c5fbb1SRui Ueyama }; 738f7c5fbb1SRui Ueyama 73920b6598cSGeorge Rimar void ScriptParser::readVersionScript() { 74095769b4aSRui Ueyama readVersionScriptCommand(); 74120b6598cSGeorge Rimar if (!atEOF()) 74295769b4aSRui Ueyama setError("EOF expected, but got " + next()); 74395769b4aSRui Ueyama } 74495769b4aSRui Ueyama 74595769b4aSRui Ueyama void ScriptParser::readVersionScriptCommand() { 74695769b4aSRui Ueyama if (skip("{")) { 74795769b4aSRui Ueyama readVersionDeclaration(""); 74820b6598cSGeorge Rimar return; 74920b6598cSGeorge Rimar } 75020b6598cSGeorge Rimar 75195769b4aSRui Ueyama while (!atEOF() && !Error && peek() != "}") { 75220b6598cSGeorge Rimar StringRef VerStr = next(); 75320b6598cSGeorge Rimar if (VerStr == "{") { 75495769b4aSRui Ueyama setError("anonymous version definition is used in " 75595769b4aSRui Ueyama "combination with other version definitions"); 75620b6598cSGeorge Rimar return; 75720b6598cSGeorge Rimar } 75820b6598cSGeorge Rimar expect("{"); 75995769b4aSRui Ueyama readVersionDeclaration(VerStr); 76020b6598cSGeorge Rimar } 76120b6598cSGeorge Rimar } 76220b6598cSGeorge Rimar 76395769b4aSRui Ueyama void ScriptParser::readVersion() { 76495769b4aSRui Ueyama expect("{"); 76595769b4aSRui Ueyama readVersionScriptCommand(); 76695769b4aSRui Ueyama expect("}"); 76795769b4aSRui Ueyama } 76895769b4aSRui Ueyama 76920b6598cSGeorge Rimar void ScriptParser::readLinkerScript() { 770f7c5fbb1SRui Ueyama while (!atEOF()) { 771f7c5fbb1SRui Ueyama StringRef Tok = next(); 772a27eeccaSRui Ueyama if (Tok == ";") 773a27eeccaSRui Ueyama continue; 774a27eeccaSRui Ueyama 77520d03194SEugene Leviant if (Tok == "ASSERT") { 77620d03194SEugene Leviant Opt.Commands.emplace_back(new AssertCommand(readAssert())); 77720d03194SEugene Leviant } else if (Tok == "ENTRY") { 778a27eeccaSRui Ueyama readEntry(); 779a27eeccaSRui Ueyama } else if (Tok == "EXTERN") { 780a27eeccaSRui Ueyama readExtern(); 781a27eeccaSRui Ueyama } else if (Tok == "GROUP" || Tok == "INPUT") { 782a27eeccaSRui Ueyama readGroup(); 783a27eeccaSRui Ueyama } else if (Tok == "INCLUDE") { 784a27eeccaSRui Ueyama readInclude(); 785a27eeccaSRui Ueyama } else if (Tok == "OUTPUT") { 786a27eeccaSRui Ueyama readOutput(); 787a27eeccaSRui Ueyama } else if (Tok == "OUTPUT_ARCH") { 788a27eeccaSRui Ueyama readOutputArch(); 789a27eeccaSRui Ueyama } else if (Tok == "OUTPUT_FORMAT") { 790a27eeccaSRui Ueyama readOutputFormat(); 791a27eeccaSRui Ueyama } else if (Tok == "PHDRS") { 792a27eeccaSRui Ueyama readPhdrs(); 793a27eeccaSRui Ueyama } else if (Tok == "SEARCH_DIR") { 794a27eeccaSRui Ueyama readSearchDir(); 795a27eeccaSRui Ueyama } else if (Tok == "SECTIONS") { 796a27eeccaSRui Ueyama readSections(); 797a27eeccaSRui Ueyama } else if (Tok == "VERSION") { 798a27eeccaSRui Ueyama readVersion(); 799db741e72SEugene Leviant } else if (SymbolAssignment *Cmd = readProvideOrAssignment(Tok, true)) { 8000df80befSPetr Hosek Opt.Commands.emplace_back(Cmd); 801e5d3ca50SPetr Hosek } else { 8025761042dSGeorge Rimar setError("unknown directive: " + Tok); 803f7c5fbb1SRui Ueyama } 804f7c5fbb1SRui Ueyama } 805e5d3ca50SPetr Hosek } 806f7c5fbb1SRui Ueyama 807717677afSRui Ueyama void ScriptParser::addFile(StringRef S) { 80816b0cc9eSSimon Atanasyan if (IsUnderSysroot && S.startswith("/")) { 80916b0cc9eSSimon Atanasyan SmallString<128> Path; 81016b0cc9eSSimon Atanasyan (Config->Sysroot + S).toStringRef(Path); 81116b0cc9eSSimon Atanasyan if (sys::fs::exists(Path)) { 81216b0cc9eSSimon Atanasyan Driver->addFile(Saver.save(Path.str())); 81316b0cc9eSSimon Atanasyan return; 81416b0cc9eSSimon Atanasyan } 81516b0cc9eSSimon Atanasyan } 81616b0cc9eSSimon Atanasyan 817f03f3cc1SRui Ueyama if (sys::path::is_absolute(S)) { 81852a1509eSRui Ueyama Driver->addFile(S); 81952a1509eSRui Ueyama } else if (S.startswith("=")) { 82052a1509eSRui Ueyama if (Config->Sysroot.empty()) 82152a1509eSRui Ueyama Driver->addFile(S.substr(1)); 82252a1509eSRui Ueyama else 82352a1509eSRui Ueyama Driver->addFile(Saver.save(Config->Sysroot + "/" + S.substr(1))); 82452a1509eSRui Ueyama } else if (S.startswith("-l")) { 82521eecb4fSRui Ueyama Driver->addLibrary(S.substr(2)); 826a1b8fc3bSSimon Atanasyan } else if (sys::fs::exists(S)) { 827a1b8fc3bSSimon Atanasyan Driver->addFile(S); 82852a1509eSRui Ueyama } else { 82952a1509eSRui Ueyama std::string Path = findFromSearchPaths(S); 83052a1509eSRui Ueyama if (Path.empty()) 831777f9630SGeorge Rimar setError("unable to find " + S); 832025d59b1SRui Ueyama else 83352a1509eSRui Ueyama Driver->addFile(Saver.save(Path)); 83452a1509eSRui Ueyama } 83552a1509eSRui Ueyama } 83652a1509eSRui Ueyama 837717677afSRui Ueyama void ScriptParser::readAsNeeded() { 838f7c5fbb1SRui Ueyama expect("("); 83935da9b6eSRui Ueyama bool Orig = Config->AsNeeded; 84035da9b6eSRui Ueyama Config->AsNeeded = true; 841a2acc931SRui Ueyama while (!Error && !skip(")")) 842cd574a5eSGeorge Rimar addFile(unquote(next())); 84335da9b6eSRui Ueyama Config->AsNeeded = Orig; 844f7c5fbb1SRui Ueyama } 845f7c5fbb1SRui Ueyama 846717677afSRui Ueyama void ScriptParser::readEntry() { 84790c5099eSDenis Protivensky // -e <symbol> takes predecence over ENTRY(<symbol>). 84890c5099eSDenis Protivensky expect("("); 84990c5099eSDenis Protivensky StringRef Tok = next(); 85090c5099eSDenis Protivensky if (Config->Entry.empty()) 85190c5099eSDenis Protivensky Config->Entry = Tok; 85290c5099eSDenis Protivensky expect(")"); 85390c5099eSDenis Protivensky } 85490c5099eSDenis Protivensky 855717677afSRui Ueyama void ScriptParser::readExtern() { 85683f406cfSGeorge Rimar expect("("); 857a2acc931SRui Ueyama while (!Error && !skip(")")) 858a2acc931SRui Ueyama Config->Undefined.push_back(next()); 85983f406cfSGeorge Rimar } 86083f406cfSGeorge Rimar 861717677afSRui Ueyama void ScriptParser::readGroup() { 862f7c5fbb1SRui Ueyama expect("("); 863a2acc931SRui Ueyama while (!Error && !skip(")")) { 864f7c5fbb1SRui Ueyama StringRef Tok = next(); 865a2acc931SRui Ueyama if (Tok == "AS_NEEDED") 866f7c5fbb1SRui Ueyama readAsNeeded(); 867a2acc931SRui Ueyama else 868cd574a5eSGeorge Rimar addFile(unquote(Tok)); 869f7c5fbb1SRui Ueyama } 870f7c5fbb1SRui Ueyama } 871f7c5fbb1SRui Ueyama 872717677afSRui Ueyama void ScriptParser::readInclude() { 87331aa1f83SRui Ueyama StringRef Tok = next(); 874cd574a5eSGeorge Rimar auto MBOrErr = MemoryBuffer::getFile(unquote(Tok)); 875025d59b1SRui Ueyama if (!MBOrErr) { 8765761042dSGeorge Rimar setError("cannot open " + Tok); 877025d59b1SRui Ueyama return; 878025d59b1SRui Ueyama } 87931aa1f83SRui Ueyama std::unique_ptr<MemoryBuffer> &MB = *MBOrErr; 880a47ee68dSRui Ueyama StringRef S = Saver.save(MB->getMemBufferRef().getBuffer()); 881a47ee68dSRui Ueyama std::vector<StringRef> V = tokenize(S); 88231aa1f83SRui Ueyama Tokens.insert(Tokens.begin() + Pos, V.begin(), V.end()); 88331aa1f83SRui Ueyama } 88431aa1f83SRui Ueyama 885717677afSRui Ueyama void ScriptParser::readOutput() { 886ee59282bSRui Ueyama // -o <file> takes predecence over OUTPUT(<file>). 887ee59282bSRui Ueyama expect("("); 888ee59282bSRui Ueyama StringRef Tok = next(); 889ee59282bSRui Ueyama if (Config->OutputFile.empty()) 890cd574a5eSGeorge Rimar Config->OutputFile = unquote(Tok); 891ee59282bSRui Ueyama expect(")"); 892ee59282bSRui Ueyama } 893ee59282bSRui Ueyama 894717677afSRui Ueyama void ScriptParser::readOutputArch() { 8959159ce93SDavide Italiano // Error checking only for now. 8969159ce93SDavide Italiano expect("("); 8979159ce93SDavide Italiano next(); 8989159ce93SDavide Italiano expect(")"); 8999159ce93SDavide Italiano } 9009159ce93SDavide Italiano 901717677afSRui Ueyama void ScriptParser::readOutputFormat() { 902f7c5fbb1SRui Ueyama // Error checking only for now. 903f7c5fbb1SRui Ueyama expect("("); 904f7c5fbb1SRui Ueyama next(); 9056836c618SDavide Italiano StringRef Tok = next(); 9066836c618SDavide Italiano if (Tok == ")") 9076836c618SDavide Italiano return; 908025d59b1SRui Ueyama if (Tok != ",") { 9095761042dSGeorge Rimar setError("unexpected token: " + Tok); 910025d59b1SRui Ueyama return; 911025d59b1SRui Ueyama } 9126836c618SDavide Italiano next(); 9136836c618SDavide Italiano expect(","); 9146836c618SDavide Italiano next(); 915f7c5fbb1SRui Ueyama expect(")"); 916f7c5fbb1SRui Ueyama } 917f7c5fbb1SRui Ueyama 918bbe38602SEugene Leviant void ScriptParser::readPhdrs() { 919bbe38602SEugene Leviant expect("{"); 920bbe38602SEugene Leviant while (!Error && !skip("}")) { 921bbe38602SEugene Leviant StringRef Tok = next(); 92256b21c86SEugene Leviant Opt.PhdrsCommands.push_back( 92356b21c86SEugene Leviant {Tok, PT_NULL, false, false, UINT_MAX, nullptr}); 924bbe38602SEugene Leviant PhdrsCommand &PhdrCmd = Opt.PhdrsCommands.back(); 925bbe38602SEugene Leviant 926bbe38602SEugene Leviant PhdrCmd.Type = readPhdrType(); 927bbe38602SEugene Leviant do { 928bbe38602SEugene Leviant Tok = next(); 929bbe38602SEugene Leviant if (Tok == ";") 930bbe38602SEugene Leviant break; 931bbe38602SEugene Leviant if (Tok == "FILEHDR") 932bbe38602SEugene Leviant PhdrCmd.HasFilehdr = true; 933bbe38602SEugene Leviant else if (Tok == "PHDRS") 934bbe38602SEugene Leviant PhdrCmd.HasPhdrs = true; 93556b21c86SEugene Leviant else if (Tok == "AT") 93656b21c86SEugene Leviant PhdrCmd.LMAExpr = readParenExpr(); 937865bf863SEugene Leviant else if (Tok == "FLAGS") { 938865bf863SEugene Leviant expect("("); 939eb685cd7SRafael Espindola // Passing 0 for the value of dot is a bit of a hack. It means that 940eb685cd7SRafael Espindola // we accept expressions like ".|1". 941eb685cd7SRafael Espindola PhdrCmd.Flags = readExpr()(0); 942865bf863SEugene Leviant expect(")"); 943865bf863SEugene Leviant } else 944bbe38602SEugene Leviant setError("unexpected header attribute: " + Tok); 945bbe38602SEugene Leviant } while (!Error); 946bbe38602SEugene Leviant } 947bbe38602SEugene Leviant } 948bbe38602SEugene Leviant 949717677afSRui Ueyama void ScriptParser::readSearchDir() { 95068a39a65SDavide Italiano expect("("); 95186c5fb82SRui Ueyama StringRef Tok = next(); 9526c7ad13fSRui Ueyama if (!Config->Nostdlib) 953cd574a5eSGeorge Rimar Config->SearchPaths.push_back(unquote(Tok)); 95468a39a65SDavide Italiano expect(")"); 95568a39a65SDavide Italiano } 95668a39a65SDavide Italiano 957717677afSRui Ueyama void ScriptParser::readSections() { 958e05336ffSEugene Leviant Opt.HasSections = true; 9598e3b38abSDenis Protivensky expect("{"); 960652852c5SGeorge Rimar while (!Error && !skip("}")) { 961113cdec9SRui Ueyama StringRef Tok = next(); 962db741e72SEugene Leviant BaseCommand *Cmd = readProvideOrAssignment(Tok, true); 963ceabe80eSEugene Leviant if (!Cmd) { 964ceabe80eSEugene Leviant if (Tok == "ASSERT") 965eefa758eSGeorge Rimar Cmd = new AssertCommand(readAssert()); 966ceabe80eSEugene Leviant else 96710416564SRui Ueyama Cmd = readOutputSectionDescription(Tok); 9688e3b38abSDenis Protivensky } 96910416564SRui Ueyama Opt.Commands.emplace_back(Cmd); 970652852c5SGeorge Rimar } 971708019c4SRui Ueyama } 9728e3b38abSDenis Protivensky 973708019c4SRui Ueyama static int precedence(StringRef Op) { 974708019c4SRui Ueyama return StringSwitch<int>(Op) 975708019c4SRui Ueyama .Case("*", 4) 976708019c4SRui Ueyama .Case("/", 4) 977708019c4SRui Ueyama .Case("+", 3) 978708019c4SRui Ueyama .Case("-", 3) 979708019c4SRui Ueyama .Case("<", 2) 980708019c4SRui Ueyama .Case(">", 2) 981708019c4SRui Ueyama .Case(">=", 2) 982708019c4SRui Ueyama .Case("<=", 2) 983708019c4SRui Ueyama .Case("==", 2) 984708019c4SRui Ueyama .Case("!=", 2) 985708019c4SRui Ueyama .Case("&", 1) 986cc3dd629SRafael Espindola .Case("|", 1) 987708019c4SRui Ueyama .Default(-1); 988708019c4SRui Ueyama } 989708019c4SRui Ueyama 990c91930a1SGeorge Rimar Regex ScriptParser::readFilePatterns() { 99110416564SRui Ueyama std::vector<StringRef> V; 99210416564SRui Ueyama while (!Error && !skip(")")) 99310416564SRui Ueyama V.push_back(next()); 994c91930a1SGeorge Rimar return compileGlobPatterns(V); 9950702c4e8SGeorge Rimar } 9960702c4e8SGeorge Rimar 997be394db3SGeorge Rimar SortSectionPolicy ScriptParser::readSortKind() { 998742c3836SRui Ueyama if (skip("SORT") || skip("SORT_BY_NAME")) 999be394db3SGeorge Rimar return SortSectionPolicy::Name; 1000742c3836SRui Ueyama if (skip("SORT_BY_ALIGNMENT")) 1001be394db3SGeorge Rimar return SortSectionPolicy::Alignment; 1002575208caSGeorge Rimar if (skip("SORT_BY_INIT_PRIORITY")) 1003be394db3SGeorge Rimar return SortSectionPolicy::Priority; 1004be394db3SGeorge Rimar if (skip("SORT_NONE")) 1005be394db3SGeorge Rimar return SortSectionPolicy::None; 1006*b2a0abdfSRui Ueyama return SortSectionPolicy::Default; 1007be394db3SGeorge Rimar } 1008be394db3SGeorge Rimar 1009be394db3SGeorge Rimar static void selectSortKind(InputSectionDescription *Cmd) { 1010*b2a0abdfSRui Ueyama if (Cmd->SortOuter == SortSectionPolicy::None) { 1011*b2a0abdfSRui Ueyama Cmd->SortOuter = SortSectionPolicy::Default; 1012be394db3SGeorge Rimar return; 1013be394db3SGeorge Rimar } 1014be394db3SGeorge Rimar 1015*b2a0abdfSRui Ueyama if (Cmd->SortOuter != SortSectionPolicy::Default) { 1016be394db3SGeorge Rimar // If the section sorting command in linker script is nested, the command 1017be394db3SGeorge Rimar // line option will be ignored. 1018*b2a0abdfSRui Ueyama if (Cmd->SortInner != SortSectionPolicy::Default) 1019be394db3SGeorge Rimar return; 1020be394db3SGeorge Rimar // If the section sorting command in linker script isn't nested, the 1021be394db3SGeorge Rimar // command line option will make the section sorting command to be treated 1022be394db3SGeorge Rimar // as nested sorting command. 1023be394db3SGeorge Rimar Cmd->SortInner = Config->SortSection; 1024be394db3SGeorge Rimar return; 1025be394db3SGeorge Rimar } 1026be394db3SGeorge Rimar // If sorting rule not specified, use command line option. 1027be394db3SGeorge Rimar Cmd->SortOuter = Config->SortSection; 1028742c3836SRui Ueyama } 1029742c3836SRui Ueyama 1030395281cfSGeorge Rimar // Method reads a list of sequence of excluded files and section globs given in 1031395281cfSGeorge Rimar // a following form: ((EXCLUDE_FILE(file_pattern+))? section_pattern+)+ 1032395281cfSGeorge Rimar // Example: *(.foo.1 EXCLUDE_FILE (*a.o) .foo.2 EXCLUDE_FILE (*b.o) .foo.3) 1033395281cfSGeorge Rimar void ScriptParser::readSectionExcludes(InputSectionDescription *Cmd) { 1034395281cfSGeorge Rimar llvm::Regex ExcludeFileRe; 1035395281cfSGeorge Rimar std::vector<StringRef> V; 1036395281cfSGeorge Rimar 1037395281cfSGeorge Rimar while (!Error) { 1038395281cfSGeorge Rimar if (skip(")")) { 1039395281cfSGeorge Rimar Cmd->SectionsVec.push_back( 1040395281cfSGeorge Rimar {std::move(ExcludeFileRe), compileGlobPatterns(V)}); 1041395281cfSGeorge Rimar return; 1042395281cfSGeorge Rimar } 1043395281cfSGeorge Rimar 1044395281cfSGeorge Rimar if (skip("EXCLUDE_FILE")) { 1045395281cfSGeorge Rimar if (!V.empty()) { 1046395281cfSGeorge Rimar Cmd->SectionsVec.push_back( 1047395281cfSGeorge Rimar {std::move(ExcludeFileRe), compileGlobPatterns(V)}); 1048395281cfSGeorge Rimar V.clear(); 1049395281cfSGeorge Rimar } 1050395281cfSGeorge Rimar 1051395281cfSGeorge Rimar expect("("); 1052395281cfSGeorge Rimar ExcludeFileRe = readFilePatterns(); 1053395281cfSGeorge Rimar continue; 1054395281cfSGeorge Rimar } 1055395281cfSGeorge Rimar 1056395281cfSGeorge Rimar V.push_back(next()); 1057395281cfSGeorge Rimar } 1058395281cfSGeorge Rimar } 1059395281cfSGeorge Rimar 1060a2496cbeSGeorge Rimar InputSectionDescription * 1061a2496cbeSGeorge Rimar ScriptParser::readInputSectionRules(StringRef FilePattern) { 1062c91930a1SGeorge Rimar auto *Cmd = new InputSectionDescription(FilePattern); 10630ed42b0cSDavide Italiano expect("("); 1064e7282797SDavide Italiano 1065742c3836SRui Ueyama // Read SORT(). 1066be394db3SGeorge Rimar SortSectionPolicy K1 = readSortKind(); 1067*b2a0abdfSRui Ueyama if (K1 != SortSectionPolicy::Default) { 1068742c3836SRui Ueyama Cmd->SortOuter = K1; 10690702c4e8SGeorge Rimar expect("("); 1070be394db3SGeorge Rimar SortSectionPolicy K2 = readSortKind(); 1071*b2a0abdfSRui Ueyama if (K2 != SortSectionPolicy::Default) { 1072742c3836SRui Ueyama Cmd->SortInner = K2; 1073350ece4eSGeorge Rimar expect("("); 1074395281cfSGeorge Rimar Cmd->SectionsVec.push_back({llvm::Regex(), readFilePatterns()}); 10750702c4e8SGeorge Rimar expect(")"); 1076350ece4eSGeorge Rimar } else { 1077395281cfSGeorge Rimar Cmd->SectionsVec.push_back({llvm::Regex(), readFilePatterns()}); 1078350ece4eSGeorge Rimar } 1079350ece4eSGeorge Rimar expect(")"); 1080be394db3SGeorge Rimar selectSortKind(Cmd); 108110416564SRui Ueyama return Cmd; 10820659800eSGeorge Rimar } 10830702c4e8SGeorge Rimar 1084be394db3SGeorge Rimar selectSortKind(Cmd); 1085395281cfSGeorge Rimar readSectionExcludes(Cmd); 108610416564SRui Ueyama return Cmd; 10870659800eSGeorge Rimar } 10880659800eSGeorge Rimar 1089a2496cbeSGeorge Rimar InputSectionDescription * 1090a2496cbeSGeorge Rimar ScriptParser::readInputSectionDescription(StringRef Tok) { 10910659800eSGeorge Rimar // Input section wildcard can be surrounded by KEEP. 10920659800eSGeorge Rimar // https://sourceware.org/binutils/docs/ld/Input-Section-Keep.html#Input-Section-Keep 1093a2496cbeSGeorge Rimar if (Tok == "KEEP") { 1094e7282797SDavide Italiano expect("("); 1095a2496cbeSGeorge Rimar StringRef FilePattern = next(); 1096a2496cbeSGeorge Rimar InputSectionDescription *Cmd = readInputSectionRules(FilePattern); 10970ed42b0cSDavide Italiano expect(")"); 1098395281cfSGeorge Rimar for (std::pair<llvm::Regex, llvm::Regex> &Regex : Cmd->SectionsVec) 1099395281cfSGeorge Rimar Opt.KeptSections.push_back(&Regex.second); 110010416564SRui Ueyama return Cmd; 110110416564SRui Ueyama } 1102a2496cbeSGeorge Rimar return readInputSectionRules(Tok); 11030659800eSGeorge Rimar } 11040659800eSGeorge Rimar 110503fc010eSGeorge Rimar void ScriptParser::readSort() { 110603fc010eSGeorge Rimar expect("("); 110703fc010eSGeorge Rimar expect("CONSTRUCTORS"); 110803fc010eSGeorge Rimar expect(")"); 110903fc010eSGeorge Rimar } 111003fc010eSGeorge Rimar 1111eefa758eSGeorge Rimar Expr ScriptParser::readAssert() { 1112eefa758eSGeorge Rimar expect("("); 1113eefa758eSGeorge Rimar Expr E = readExpr(); 1114eefa758eSGeorge Rimar expect(","); 1115cd574a5eSGeorge Rimar StringRef Msg = unquote(next()); 1116eefa758eSGeorge Rimar expect(")"); 1117eefa758eSGeorge Rimar return [=](uint64_t Dot) { 1118eefa758eSGeorge Rimar uint64_t V = E(Dot); 1119eefa758eSGeorge Rimar if (!V) 1120eefa758eSGeorge Rimar error(Msg); 1121eefa758eSGeorge Rimar return V; 1122eefa758eSGeorge Rimar }; 1123eefa758eSGeorge Rimar } 1124eefa758eSGeorge Rimar 112525150e8bSRui Ueyama // Reads a FILL(expr) command. We handle the FILL command as an 112625150e8bSRui Ueyama // alias for =fillexp section attribute, which is different from 112725150e8bSRui Ueyama // what GNU linkers do. 112825150e8bSRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Data.html 1129ff1f29e0SGeorge Rimar std::vector<uint8_t> ScriptParser::readFill() { 1130ff1f29e0SGeorge Rimar expect("("); 1131ff1f29e0SGeorge Rimar std::vector<uint8_t> V = readOutputSectionFiller(next()); 1132ff1f29e0SGeorge Rimar expect(")"); 1133ff1f29e0SGeorge Rimar expect(";"); 1134ff1f29e0SGeorge Rimar return V; 1135ff1f29e0SGeorge Rimar } 1136ff1f29e0SGeorge Rimar 113710416564SRui Ueyama OutputSectionCommand * 113810416564SRui Ueyama ScriptParser::readOutputSectionDescription(StringRef OutSec) { 1139076fe157SGeorge Rimar OutputSectionCommand *Cmd = new OutputSectionCommand(OutSec); 114058e5c4dcSGeorge Rimar 114158e5c4dcSGeorge Rimar // Read an address expression. 114258e5c4dcSGeorge Rimar // https://sourceware.org/binutils/docs/ld/Output-Section-Address.html#Output-Section-Address 114358e5c4dcSGeorge Rimar if (peek() != ":") 114458e5c4dcSGeorge Rimar Cmd->AddrExpr = readExpr(); 114558e5c4dcSGeorge Rimar 11468e3b38abSDenis Protivensky expect(":"); 1147246f681eSDavide Italiano 11488ceadb38SGeorge Rimar if (skip("AT")) 11496ad7dfccSRui Ueyama Cmd->LmaExpr = readParenExpr(); 1150630c6179SGeorge Rimar if (skip("ALIGN")) 11516ad7dfccSRui Ueyama Cmd->AlignExpr = readParenExpr(); 1152db24d9c3SGeorge Rimar if (skip("SUBALIGN")) 1153db24d9c3SGeorge Rimar Cmd->SubalignExpr = readParenExpr(); 1154630c6179SGeorge Rimar 1155246f681eSDavide Italiano // Parse constraints. 1156246f681eSDavide Italiano if (skip("ONLY_IF_RO")) 1157efc4066bSRui Ueyama Cmd->Constraint = ConstraintKind::ReadOnly; 1158246f681eSDavide Italiano if (skip("ONLY_IF_RW")) 1159efc4066bSRui Ueyama Cmd->Constraint = ConstraintKind::ReadWrite; 11608e3b38abSDenis Protivensky expect("{"); 11618ec77e64SRui Ueyama 1162025d59b1SRui Ueyama while (!Error && !skip("}")) { 1163ceabe80eSEugene Leviant StringRef Tok = next(); 1164db741e72SEugene Leviant if (SymbolAssignment *Assignment = readProvideOrAssignment(Tok, false)) 1165ceabe80eSEugene Leviant Cmd->Commands.emplace_back(Assignment); 1166ff1f29e0SGeorge Rimar else if (Tok == "FILL") 1167ff1f29e0SGeorge Rimar Cmd->Filler = readFill(); 1168ceabe80eSEugene Leviant else if (Tok == "SORT") 116903fc010eSGeorge Rimar readSort(); 1170a2496cbeSGeorge Rimar else if (peek() == "(") 1171a2496cbeSGeorge Rimar Cmd->Commands.emplace_back(readInputSectionDescription(Tok)); 1172ceabe80eSEugene Leviant else 1173ceabe80eSEugene Leviant setError("unknown command " + Tok); 11748e3b38abSDenis Protivensky } 1175076fe157SGeorge Rimar Cmd->Phdrs = readOutputSectionPhdrs(); 1176ff1f29e0SGeorge Rimar if (peek().startswith("=")) 1177ff1f29e0SGeorge Rimar Cmd->Filler = readOutputSectionFiller(next().drop_front()); 117810416564SRui Ueyama return Cmd; 1179f71caa2bSRui Ueyama } 11808ec77e64SRui Ueyama 11812c8f1f04SRui Ueyama // Read "=<number>" where <number> is an octal/decimal/hexadecimal number. 11822c8f1f04SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Fill.html 11832c8f1f04SRui Ueyama // 11842c8f1f04SRui Ueyama // ld.gold is not fully compatible with ld.bfd. ld.bfd handles 11852c8f1f04SRui Ueyama // hexstrings as blobs of arbitrary sizes, while ld.gold handles them 11862c8f1f04SRui Ueyama // as 32-bit big-endian values. We will do the same as ld.gold does 11872c8f1f04SRui Ueyama // because it's simpler than what ld.bfd does. 1188ff1f29e0SGeorge Rimar std::vector<uint8_t> ScriptParser::readOutputSectionFiller(StringRef Tok) { 1189965827d6SRui Ueyama uint32_t V; 1190ff1f29e0SGeorge Rimar if (Tok.getAsInteger(0, V)) { 1191965827d6SRui Ueyama setError("invalid filler expression: " + Tok); 1192f71caa2bSRui Ueyama return {}; 1193e2ee72b5SGeorge Rimar } 1194965827d6SRui Ueyama return {uint8_t(V >> 24), uint8_t(V >> 16), uint8_t(V >> 8), uint8_t(V)}; 11958e3b38abSDenis Protivensky } 11968e3b38abSDenis Protivensky 1197a35e39caSPetr Hosek SymbolAssignment *ScriptParser::readProvideHidden(bool Provide, bool Hidden) { 1198a31c91b1SEugene Leviant expect("("); 1199174e0a16SRui Ueyama SymbolAssignment *Cmd = readAssignment(next()); 1200a35e39caSPetr Hosek Cmd->Provide = Provide; 1201174e0a16SRui Ueyama Cmd->Hidden = Hidden; 1202a31c91b1SEugene Leviant expect(")"); 1203a31c91b1SEugene Leviant expect(";"); 120410416564SRui Ueyama return Cmd; 1205eda81a1bSEugene Leviant } 1206eda81a1bSEugene Leviant 1207db741e72SEugene Leviant SymbolAssignment *ScriptParser::readProvideOrAssignment(StringRef Tok, 1208db741e72SEugene Leviant bool MakeAbsolute) { 1209ceabe80eSEugene Leviant SymbolAssignment *Cmd = nullptr; 1210ceabe80eSEugene Leviant if (peek() == "=" || peek() == "+=") { 1211ceabe80eSEugene Leviant Cmd = readAssignment(Tok); 1212ceabe80eSEugene Leviant expect(";"); 1213ceabe80eSEugene Leviant } else if (Tok == "PROVIDE") { 1214a35e39caSPetr Hosek Cmd = readProvideHidden(true, false); 1215a35e39caSPetr Hosek } else if (Tok == "HIDDEN") { 1216a35e39caSPetr Hosek Cmd = readProvideHidden(false, true); 1217ceabe80eSEugene Leviant } else if (Tok == "PROVIDE_HIDDEN") { 1218a35e39caSPetr Hosek Cmd = readProvideHidden(true, true); 1219ceabe80eSEugene Leviant } 1220db741e72SEugene Leviant if (Cmd && MakeAbsolute) 1221db741e72SEugene Leviant Cmd->IsAbsolute = true; 1222ceabe80eSEugene Leviant return Cmd; 1223ceabe80eSEugene Leviant } 1224ceabe80eSEugene Leviant 122530835ea4SGeorge Rimar static uint64_t getSymbolValue(StringRef S, uint64_t Dot) { 122630835ea4SGeorge Rimar if (S == ".") 122730835ea4SGeorge Rimar return Dot; 1228884e786dSGeorge Rimar return ScriptBase->getSymbolValue(S); 1229e32a3598SGeorge Rimar } 1230e32a3598SGeorge Rimar 123130835ea4SGeorge Rimar SymbolAssignment *ScriptParser::readAssignment(StringRef Name) { 123230835ea4SGeorge Rimar StringRef Op = next(); 1233db741e72SEugene Leviant bool IsAbsolute = false; 1234db741e72SEugene Leviant Expr E; 123530835ea4SGeorge Rimar assert(Op == "=" || Op == "+="); 1236db741e72SEugene Leviant if (skip("ABSOLUTE")) { 1237db741e72SEugene Leviant E = readParenExpr(); 1238db741e72SEugene Leviant IsAbsolute = true; 1239db741e72SEugene Leviant } else { 1240db741e72SEugene Leviant E = readExpr(); 1241db741e72SEugene Leviant } 124230835ea4SGeorge Rimar if (Op == "+=") 124330835ea4SGeorge Rimar E = [=](uint64_t Dot) { return getSymbolValue(Name, Dot) + E(Dot); }; 1244db741e72SEugene Leviant return new SymbolAssignment(Name, E, IsAbsolute); 124530835ea4SGeorge Rimar } 124630835ea4SGeorge Rimar 124730835ea4SGeorge Rimar // This is an operator-precedence parser to parse a linker 124830835ea4SGeorge Rimar // script expression. 124930835ea4SGeorge Rimar Expr ScriptParser::readExpr() { return readExpr1(readPrimary(), 0); } 125030835ea4SGeorge Rimar 125136c1cd23SRui Ueyama static Expr combine(StringRef Op, Expr L, Expr R) { 125236c1cd23SRui Ueyama if (Op == "*") 125336c1cd23SRui Ueyama return [=](uint64_t Dot) { return L(Dot) * R(Dot); }; 125436c1cd23SRui Ueyama if (Op == "/") { 125536c1cd23SRui Ueyama return [=](uint64_t Dot) -> uint64_t { 125636c1cd23SRui Ueyama uint64_t RHS = R(Dot); 125736c1cd23SRui Ueyama if (RHS == 0) { 125836c1cd23SRui Ueyama error("division by zero"); 125936c1cd23SRui Ueyama return 0; 126036c1cd23SRui Ueyama } 126136c1cd23SRui Ueyama return L(Dot) / RHS; 126236c1cd23SRui Ueyama }; 126336c1cd23SRui Ueyama } 126436c1cd23SRui Ueyama if (Op == "+") 126536c1cd23SRui Ueyama return [=](uint64_t Dot) { return L(Dot) + R(Dot); }; 126636c1cd23SRui Ueyama if (Op == "-") 126736c1cd23SRui Ueyama return [=](uint64_t Dot) { return L(Dot) - R(Dot); }; 126836c1cd23SRui Ueyama if (Op == "<") 126936c1cd23SRui Ueyama return [=](uint64_t Dot) { return L(Dot) < R(Dot); }; 127036c1cd23SRui Ueyama if (Op == ">") 127136c1cd23SRui Ueyama return [=](uint64_t Dot) { return L(Dot) > R(Dot); }; 127236c1cd23SRui Ueyama if (Op == ">=") 127336c1cd23SRui Ueyama return [=](uint64_t Dot) { return L(Dot) >= R(Dot); }; 127436c1cd23SRui Ueyama if (Op == "<=") 127536c1cd23SRui Ueyama return [=](uint64_t Dot) { return L(Dot) <= R(Dot); }; 127636c1cd23SRui Ueyama if (Op == "==") 127736c1cd23SRui Ueyama return [=](uint64_t Dot) { return L(Dot) == R(Dot); }; 127836c1cd23SRui Ueyama if (Op == "!=") 127936c1cd23SRui Ueyama return [=](uint64_t Dot) { return L(Dot) != R(Dot); }; 128036c1cd23SRui Ueyama if (Op == "&") 128136c1cd23SRui Ueyama return [=](uint64_t Dot) { return L(Dot) & R(Dot); }; 1282cc3dd629SRafael Espindola if (Op == "|") 1283cc3dd629SRafael Espindola return [=](uint64_t Dot) { return L(Dot) | R(Dot); }; 128436c1cd23SRui Ueyama llvm_unreachable("invalid operator"); 128536c1cd23SRui Ueyama } 128636c1cd23SRui Ueyama 1287708019c4SRui Ueyama // This is a part of the operator-precedence parser. This function 1288708019c4SRui Ueyama // assumes that the remaining token stream starts with an operator. 1289708019c4SRui Ueyama Expr ScriptParser::readExpr1(Expr Lhs, int MinPrec) { 1290708019c4SRui Ueyama while (!atEOF() && !Error) { 1291708019c4SRui Ueyama // Read an operator and an expression. 1292708019c4SRui Ueyama StringRef Op1 = peek(); 1293708019c4SRui Ueyama if (Op1 == "?") 1294708019c4SRui Ueyama return readTernary(Lhs); 1295708019c4SRui Ueyama if (precedence(Op1) < MinPrec) 1296a31c91b1SEugene Leviant break; 1297a31c91b1SEugene Leviant next(); 1298708019c4SRui Ueyama Expr Rhs = readPrimary(); 1299708019c4SRui Ueyama 1300708019c4SRui Ueyama // Evaluate the remaining part of the expression first if the 1301708019c4SRui Ueyama // next operator has greater precedence than the previous one. 1302708019c4SRui Ueyama // For example, if we have read "+" and "3", and if the next 1303708019c4SRui Ueyama // operator is "*", then we'll evaluate 3 * ... part first. 1304708019c4SRui Ueyama while (!atEOF()) { 1305708019c4SRui Ueyama StringRef Op2 = peek(); 1306708019c4SRui Ueyama if (precedence(Op2) <= precedence(Op1)) 1307eda81a1bSEugene Leviant break; 1308708019c4SRui Ueyama Rhs = readExpr1(Rhs, precedence(Op2)); 1309eda81a1bSEugene Leviant } 1310708019c4SRui Ueyama 1311708019c4SRui Ueyama Lhs = combine(Op1, Lhs, Rhs); 1312708019c4SRui Ueyama } 1313708019c4SRui Ueyama return Lhs; 1314708019c4SRui Ueyama } 1315708019c4SRui Ueyama 1316708019c4SRui Ueyama uint64_t static getConstant(StringRef S) { 1317e2cc07bcSMichael J. Spencer if (S == "COMMONPAGESIZE") 1318708019c4SRui Ueyama return Target->PageSize; 1319e2cc07bcSMichael J. Spencer if (S == "MAXPAGESIZE") 1320e2cc07bcSMichael J. Spencer return Target->MaxPageSize; 1321708019c4SRui Ueyama error("unknown constant: " + S); 1322708019c4SRui Ueyama return 0; 1323708019c4SRui Ueyama } 1324708019c4SRui Ueyama 1325626e0b08SRui Ueyama // Parses Tok as an integer. Returns true if successful. 1326626e0b08SRui Ueyama // It recognizes hexadecimal (prefixed with "0x" or suffixed with "H") 1327626e0b08SRui Ueyama // and decimal numbers. Decimal numbers may have "K" (kilo) or 1328626e0b08SRui Ueyama // "M" (mega) prefixes. 13299f2f7ad9SGeorge Rimar static bool readInteger(StringRef Tok, uint64_t &Result) { 1330eaeafb2bSSimon Atanasyan if (Tok.startswith("-")) { 1331eaeafb2bSSimon Atanasyan if (!readInteger(Tok.substr(1), Result)) 1332eaeafb2bSSimon Atanasyan return false; 1333eaeafb2bSSimon Atanasyan Result = -Result; 1334eaeafb2bSSimon Atanasyan return true; 1335eaeafb2bSSimon Atanasyan } 13369f2f7ad9SGeorge Rimar if (Tok.startswith_lower("0x")) 13379f2f7ad9SGeorge Rimar return !Tok.substr(2).getAsInteger(16, Result); 13389f2f7ad9SGeorge Rimar if (Tok.endswith_lower("H")) 13399f2f7ad9SGeorge Rimar return !Tok.drop_back().getAsInteger(16, Result); 13409f2f7ad9SGeorge Rimar 13419f2f7ad9SGeorge Rimar int Suffix = 1; 13429f2f7ad9SGeorge Rimar if (Tok.endswith_lower("K")) { 13439f2f7ad9SGeorge Rimar Suffix = 1024; 13449f2f7ad9SGeorge Rimar Tok = Tok.drop_back(); 13459f2f7ad9SGeorge Rimar } else if (Tok.endswith_lower("M")) { 13469f2f7ad9SGeorge Rimar Suffix = 1024 * 1024; 13479f2f7ad9SGeorge Rimar Tok = Tok.drop_back(); 13489f2f7ad9SGeorge Rimar } 13499f2f7ad9SGeorge Rimar if (Tok.getAsInteger(10, Result)) 13509f2f7ad9SGeorge Rimar return false; 13519f2f7ad9SGeorge Rimar Result *= Suffix; 13529f2f7ad9SGeorge Rimar return true; 13539f2f7ad9SGeorge Rimar } 13549f2f7ad9SGeorge Rimar 1355708019c4SRui Ueyama Expr ScriptParser::readPrimary() { 13566ad7dfccSRui Ueyama if (peek() == "(") 13576ad7dfccSRui Ueyama return readParenExpr(); 1358708019c4SRui Ueyama 13596ad7dfccSRui Ueyama StringRef Tok = next(); 1360708019c4SRui Ueyama 1361eaeafb2bSSimon Atanasyan if (Tok == "~") { 1362eaeafb2bSSimon Atanasyan Expr E = readPrimary(); 1363eaeafb2bSSimon Atanasyan return [=](uint64_t Dot) { return ~E(Dot); }; 1364eaeafb2bSSimon Atanasyan } 1365eaeafb2bSSimon Atanasyan if (Tok == "-") { 1366eaeafb2bSSimon Atanasyan Expr E = readPrimary(); 1367eaeafb2bSSimon Atanasyan return [=](uint64_t Dot) { return -E(Dot); }; 1368eaeafb2bSSimon Atanasyan } 1369eaeafb2bSSimon Atanasyan 1370708019c4SRui Ueyama // Built-in functions are parsed here. 1371708019c4SRui Ueyama // https://sourceware.org/binutils/docs/ld/Builtin-Functions.html. 137296659df0SGeorge Rimar if (Tok == "ADDR") { 137396659df0SGeorge Rimar expect("("); 137496659df0SGeorge Rimar StringRef Name = next(); 137596659df0SGeorge Rimar expect(")"); 1376884e786dSGeorge Rimar return 1377884e786dSGeorge Rimar [=](uint64_t Dot) { return ScriptBase->getOutputSectionAddress(Name); }; 137896659df0SGeorge Rimar } 1379eefa758eSGeorge Rimar if (Tok == "ASSERT") 1380eefa758eSGeorge Rimar return readAssert(); 1381708019c4SRui Ueyama if (Tok == "ALIGN") { 13826ad7dfccSRui Ueyama Expr E = readParenExpr(); 1383708019c4SRui Ueyama return [=](uint64_t Dot) { return alignTo(Dot, E(Dot)); }; 1384708019c4SRui Ueyama } 1385708019c4SRui Ueyama if (Tok == "CONSTANT") { 1386708019c4SRui Ueyama expect("("); 1387708019c4SRui Ueyama StringRef Tok = next(); 1388708019c4SRui Ueyama expect(")"); 1389708019c4SRui Ueyama return [=](uint64_t Dot) { return getConstant(Tok); }; 1390708019c4SRui Ueyama } 139154c145ceSRafael Espindola if (Tok == "SEGMENT_START") { 139254c145ceSRafael Espindola expect("("); 139354c145ceSRafael Espindola next(); 139454c145ceSRafael Espindola expect(","); 139554c145ceSRafael Espindola uint64_t Val; 13963adbbc38SRafael Espindola if (next().getAsInteger(0, Val)) 13973adbbc38SRafael Espindola setError("integer expected"); 139854c145ceSRafael Espindola expect(")"); 139954c145ceSRafael Espindola return [=](uint64_t Dot) { return Val; }; 140054c145ceSRafael Espindola } 1401708019c4SRui Ueyama if (Tok == "DATA_SEGMENT_ALIGN") { 1402708019c4SRui Ueyama expect("("); 1403708019c4SRui Ueyama Expr E = readExpr(); 1404708019c4SRui Ueyama expect(","); 1405708019c4SRui Ueyama readExpr(); 1406708019c4SRui Ueyama expect(")"); 1407f7791bb9SRui Ueyama return [=](uint64_t Dot) { return alignTo(Dot, E(Dot)); }; 1408708019c4SRui Ueyama } 1409708019c4SRui Ueyama if (Tok == "DATA_SEGMENT_END") { 1410708019c4SRui Ueyama expect("("); 1411708019c4SRui Ueyama expect("."); 1412708019c4SRui Ueyama expect(")"); 1413708019c4SRui Ueyama return [](uint64_t Dot) { return Dot; }; 1414708019c4SRui Ueyama } 1415276b4e64SGeorge Rimar // GNU linkers implements more complicated logic to handle 1416276b4e64SGeorge Rimar // DATA_SEGMENT_RELRO_END. We instead ignore the arguments and just align to 1417276b4e64SGeorge Rimar // the next page boundary for simplicity. 1418276b4e64SGeorge Rimar if (Tok == "DATA_SEGMENT_RELRO_END") { 1419276b4e64SGeorge Rimar expect("("); 142097bdc722SRafael Espindola readExpr(); 1421276b4e64SGeorge Rimar expect(","); 1422276b4e64SGeorge Rimar readExpr(); 1423276b4e64SGeorge Rimar expect(")"); 1424276b4e64SGeorge Rimar return [](uint64_t Dot) { return alignTo(Dot, Target->PageSize); }; 1425276b4e64SGeorge Rimar } 14269e69450eSGeorge Rimar if (Tok == "SIZEOF") { 14279e69450eSGeorge Rimar expect("("); 14289e69450eSGeorge Rimar StringRef Name = next(); 14299e69450eSGeorge Rimar expect(")"); 1430884e786dSGeorge Rimar return [=](uint64_t Dot) { return ScriptBase->getOutputSectionSize(Name); }; 14319e69450eSGeorge Rimar } 143236fac7f0SEugene Leviant if (Tok == "ALIGNOF") { 143336fac7f0SEugene Leviant expect("("); 143436fac7f0SEugene Leviant StringRef Name = next(); 143536fac7f0SEugene Leviant expect(")"); 143636fac7f0SEugene Leviant return 143736fac7f0SEugene Leviant [=](uint64_t Dot) { return ScriptBase->getOutputSectionAlign(Name); }; 143836fac7f0SEugene Leviant } 1439e32a3598SGeorge Rimar if (Tok == "SIZEOF_HEADERS") 1440884e786dSGeorge Rimar return [=](uint64_t Dot) { return ScriptBase->getHeaderSize(); }; 1441708019c4SRui Ueyama 14429f2f7ad9SGeorge Rimar // Tok is a literal number. 14439f2f7ad9SGeorge Rimar uint64_t V; 14449f2f7ad9SGeorge Rimar if (readInteger(Tok, V)) 14459f2f7ad9SGeorge Rimar return [=](uint64_t Dot) { return V; }; 14469f2f7ad9SGeorge Rimar 14479f2f7ad9SGeorge Rimar // Tok is a symbol name. 144830835ea4SGeorge Rimar if (Tok != "." && !isValidCIdentifier(Tok)) 1449708019c4SRui Ueyama setError("malformed number: " + Tok); 145030835ea4SGeorge Rimar return [=](uint64_t Dot) { return getSymbolValue(Tok, Dot); }; 1451a9c5a528SGeorge Rimar } 1452708019c4SRui Ueyama 1453708019c4SRui Ueyama Expr ScriptParser::readTernary(Expr Cond) { 1454708019c4SRui Ueyama next(); 1455708019c4SRui Ueyama Expr L = readExpr(); 1456708019c4SRui Ueyama expect(":"); 1457708019c4SRui Ueyama Expr R = readExpr(); 1458708019c4SRui Ueyama return [=](uint64_t Dot) { return Cond(Dot) ? L(Dot) : R(Dot); }; 1459708019c4SRui Ueyama } 1460708019c4SRui Ueyama 14616ad7dfccSRui Ueyama Expr ScriptParser::readParenExpr() { 14626ad7dfccSRui Ueyama expect("("); 14636ad7dfccSRui Ueyama Expr E = readExpr(); 14646ad7dfccSRui Ueyama expect(")"); 14656ad7dfccSRui Ueyama return E; 14666ad7dfccSRui Ueyama } 14676ad7dfccSRui Ueyama 1468bbe38602SEugene Leviant std::vector<StringRef> ScriptParser::readOutputSectionPhdrs() { 1469bbe38602SEugene Leviant std::vector<StringRef> Phdrs; 1470bbe38602SEugene Leviant while (!Error && peek().startswith(":")) { 1471bbe38602SEugene Leviant StringRef Tok = next(); 1472bbe38602SEugene Leviant Tok = (Tok.size() == 1) ? next() : Tok.substr(1); 1473bbe38602SEugene Leviant if (Tok.empty()) { 1474bbe38602SEugene Leviant setError("section header name is empty"); 1475bbe38602SEugene Leviant break; 1476bbe38602SEugene Leviant } 1477bbe38602SEugene Leviant Phdrs.push_back(Tok); 1478bbe38602SEugene Leviant } 1479bbe38602SEugene Leviant return Phdrs; 1480bbe38602SEugene Leviant } 1481bbe38602SEugene Leviant 1482bbe38602SEugene Leviant unsigned ScriptParser::readPhdrType() { 1483bbe38602SEugene Leviant StringRef Tok = next(); 1484b0f6c590SRui Ueyama unsigned Ret = StringSwitch<unsigned>(Tok) 1485b0f6c590SRui Ueyama .Case("PT_NULL", PT_NULL) 1486b0f6c590SRui Ueyama .Case("PT_LOAD", PT_LOAD) 1487b0f6c590SRui Ueyama .Case("PT_DYNAMIC", PT_DYNAMIC) 1488b0f6c590SRui Ueyama .Case("PT_INTERP", PT_INTERP) 1489b0f6c590SRui Ueyama .Case("PT_NOTE", PT_NOTE) 1490b0f6c590SRui Ueyama .Case("PT_SHLIB", PT_SHLIB) 1491b0f6c590SRui Ueyama .Case("PT_PHDR", PT_PHDR) 1492b0f6c590SRui Ueyama .Case("PT_TLS", PT_TLS) 1493b0f6c590SRui Ueyama .Case("PT_GNU_EH_FRAME", PT_GNU_EH_FRAME) 1494b0f6c590SRui Ueyama .Case("PT_GNU_STACK", PT_GNU_STACK) 1495b0f6c590SRui Ueyama .Case("PT_GNU_RELRO", PT_GNU_RELRO) 1496b0f6c590SRui Ueyama .Default(-1); 1497bbe38602SEugene Leviant 1498b0f6c590SRui Ueyama if (Ret == (unsigned)-1) { 1499b0f6c590SRui Ueyama setError("invalid program header type: " + Tok); 1500b0f6c590SRui Ueyama return PT_NULL; 1501b0f6c590SRui Ueyama } 1502b0f6c590SRui Ueyama return Ret; 1503bbe38602SEugene Leviant } 1504bbe38602SEugene Leviant 150595769b4aSRui Ueyama void ScriptParser::readVersionDeclaration(StringRef VerStr) { 150620b6598cSGeorge Rimar // Identifiers start at 2 because 0 and 1 are reserved 150720b6598cSGeorge Rimar // for VER_NDX_LOCAL and VER_NDX_GLOBAL constants. 150820b6598cSGeorge Rimar size_t VersionId = Config->VersionDefinitions.size() + 2; 150920b6598cSGeorge Rimar Config->VersionDefinitions.push_back({VerStr, VersionId}); 151020b6598cSGeorge Rimar 151120b6598cSGeorge Rimar if (skip("global:") || peek() != "local:") 151220b6598cSGeorge Rimar readGlobal(VerStr); 151320b6598cSGeorge Rimar if (skip("local:")) 151420b6598cSGeorge Rimar readLocal(); 151520b6598cSGeorge Rimar expect("}"); 151620b6598cSGeorge Rimar 151720b6598cSGeorge Rimar // Each version may have a parent version. For example, "Ver2" defined as 151820b6598cSGeorge Rimar // "Ver2 { global: foo; local: *; } Ver1;" has "Ver1" as a parent. This 151920b6598cSGeorge Rimar // version hierarchy is, probably against your instinct, purely for human; the 152020b6598cSGeorge Rimar // runtime doesn't care about them at all. In LLD, we simply skip the token. 152120b6598cSGeorge Rimar if (!VerStr.empty() && peek() != ";") 152220b6598cSGeorge Rimar next(); 152320b6598cSGeorge Rimar expect(";"); 152420b6598cSGeorge Rimar } 152520b6598cSGeorge Rimar 152620b6598cSGeorge Rimar void ScriptParser::readLocal() { 152720b6598cSGeorge Rimar Config->DefaultSymbolVersion = VER_NDX_LOCAL; 152820b6598cSGeorge Rimar expect("*"); 152920b6598cSGeorge Rimar expect(";"); 153020b6598cSGeorge Rimar } 153120b6598cSGeorge Rimar 153220b6598cSGeorge Rimar void ScriptParser::readExtern(std::vector<SymbolVersion> *Globals) { 1533cd574a5eSGeorge Rimar expect("\"C++\""); 153420b6598cSGeorge Rimar expect("{"); 153520b6598cSGeorge Rimar 153620b6598cSGeorge Rimar for (;;) { 153720b6598cSGeorge Rimar if (peek() == "}" || Error) 153820b6598cSGeorge Rimar break; 1539cd574a5eSGeorge Rimar bool HasWildcard = !peek().startswith("\"") && hasWildcard(peek()); 1540cd574a5eSGeorge Rimar Globals->push_back({unquote(next()), true, HasWildcard}); 154120b6598cSGeorge Rimar expect(";"); 154220b6598cSGeorge Rimar } 154320b6598cSGeorge Rimar 154420b6598cSGeorge Rimar expect("}"); 154520b6598cSGeorge Rimar expect(";"); 154620b6598cSGeorge Rimar } 154720b6598cSGeorge Rimar 154820b6598cSGeorge Rimar void ScriptParser::readGlobal(StringRef VerStr) { 154920b6598cSGeorge Rimar std::vector<SymbolVersion> *Globals; 155020b6598cSGeorge Rimar if (VerStr.empty()) 155120b6598cSGeorge Rimar Globals = &Config->VersionScriptGlobals; 155220b6598cSGeorge Rimar else 155320b6598cSGeorge Rimar Globals = &Config->VersionDefinitions.back().Globals; 155420b6598cSGeorge Rimar 155520b6598cSGeorge Rimar for (;;) { 155620b6598cSGeorge Rimar if (skip("extern")) 155720b6598cSGeorge Rimar readExtern(Globals); 155820b6598cSGeorge Rimar 155920b6598cSGeorge Rimar StringRef Cur = peek(); 156020b6598cSGeorge Rimar if (Cur == "}" || Cur == "local:" || Error) 156120b6598cSGeorge Rimar return; 156220b6598cSGeorge Rimar next(); 1563cd574a5eSGeorge Rimar Globals->push_back({unquote(Cur), false, hasWildcard(Cur)}); 156420b6598cSGeorge Rimar expect(";"); 156520b6598cSGeorge Rimar } 156620b6598cSGeorge Rimar } 156720b6598cSGeorge Rimar 156816b0cc9eSSimon Atanasyan static bool isUnderSysroot(StringRef Path) { 156916b0cc9eSSimon Atanasyan if (Config->Sysroot == "") 157016b0cc9eSSimon Atanasyan return false; 157116b0cc9eSSimon Atanasyan for (; !Path.empty(); Path = sys::path::parent_path(Path)) 157216b0cc9eSSimon Atanasyan if (sys::fs::equivalent(Config->Sysroot, Path)) 157316b0cc9eSSimon Atanasyan return true; 157416b0cc9eSSimon Atanasyan return false; 157516b0cc9eSSimon Atanasyan } 157616b0cc9eSSimon Atanasyan 157707320e40SRui Ueyama void elf::readLinkerScript(MemoryBufferRef MB) { 157816b0cc9eSSimon Atanasyan StringRef Path = MB.getBufferIdentifier(); 157920b6598cSGeorge Rimar ScriptParser(MB.getBuffer(), isUnderSysroot(Path)).readLinkerScript(); 158020b6598cSGeorge Rimar } 158120b6598cSGeorge Rimar 158220b6598cSGeorge Rimar void elf::readVersionScript(MemoryBufferRef MB) { 158320b6598cSGeorge Rimar ScriptParser(MB.getBuffer(), false).readVersionScript(); 1584f7c5fbb1SRui Ueyama } 15851ebc8ed7SRui Ueyama 158607320e40SRui Ueyama template class elf::LinkerScript<ELF32LE>; 158707320e40SRui Ueyama template class elf::LinkerScript<ELF32BE>; 158807320e40SRui Ueyama template class elf::LinkerScript<ELF64LE>; 158907320e40SRui Ueyama template class elf::LinkerScript<ELF64BE>; 1590