1f7c5fbb1SRui Ueyama //===- LinkerScript.cpp ---------------------------------------------------===//
2f7c5fbb1SRui Ueyama //
3f7c5fbb1SRui Ueyama //                             The LLVM Linker
4f7c5fbb1SRui Ueyama //
5f7c5fbb1SRui Ueyama // This file is distributed under the University of Illinois Open Source
6f7c5fbb1SRui Ueyama // License. See LICENSE.TXT for details.
7f7c5fbb1SRui Ueyama //
8f7c5fbb1SRui Ueyama //===----------------------------------------------------------------------===//
9f7c5fbb1SRui Ueyama //
10f7c5fbb1SRui Ueyama // This file contains the parser/evaluator of the linker script.
11629e0aa5SRui Ueyama // It parses a linker script and write the result to Config or ScriptConfig
12629e0aa5SRui Ueyama // objects.
13629e0aa5SRui Ueyama //
14629e0aa5SRui Ueyama // If SECTIONS command is used, a ScriptConfig contains an AST
15629e0aa5SRui Ueyama // of the command which will later be consumed by createSections() and
16629e0aa5SRui Ueyama // assignAddresses().
17f7c5fbb1SRui Ueyama //
18f7c5fbb1SRui Ueyama //===----------------------------------------------------------------------===//
19f7c5fbb1SRui Ueyama 
20717677afSRui Ueyama #include "LinkerScript.h"
21f7c5fbb1SRui Ueyama #include "Config.h"
22f7c5fbb1SRui Ueyama #include "Driver.h"
231ebc8ed7SRui Ueyama #include "InputSection.h"
24652852c5SGeorge Rimar #include "OutputSections.h"
25e77b5bf6SAdhemerval Zanella #include "ScriptParser.h"
2693c9af42SRui Ueyama #include "Strings.h"
27eda81a1bSEugene Leviant #include "Symbols.h"
28f7c5fbb1SRui Ueyama #include "SymbolTable.h"
29467c4d55SEugene Leviant #include "Target.h"
30bbe38602SEugene Leviant #include "Writer.h"
31960504b9SRui Ueyama #include "llvm/ADT/StringSwitch.h"
32652852c5SGeorge Rimar #include "llvm/Support/ELF.h"
33f7c5fbb1SRui Ueyama #include "llvm/Support/FileSystem.h"
34f7c5fbb1SRui Ueyama #include "llvm/Support/MemoryBuffer.h"
35f03f3cc1SRui Ueyama #include "llvm/Support/Path.h"
36a47ee68dSRui Ueyama #include "llvm/Support/StringSaver.h"
37f7c5fbb1SRui Ueyama 
38f7c5fbb1SRui Ueyama using namespace llvm;
39652852c5SGeorge Rimar using namespace llvm::ELF;
401ebc8ed7SRui Ueyama using namespace llvm::object;
41f7c5fbb1SRui Ueyama using namespace lld;
42e0df00b9SRafael Espindola using namespace lld::elf;
43f7c5fbb1SRui Ueyama 
44884e786dSGeorge Rimar LinkerScriptBase *elf::ScriptBase;
4507320e40SRui Ueyama ScriptConfiguration *elf::ScriptConfig;
46717677afSRui Ueyama 
476c55f0e3SGeorge Rimar template <class ELFT> static void addRegular(SymbolAssignment *Cmd) {
481602421cSRui Ueyama   Symbol *Sym = Symtab<ELFT>::X->addRegular(Cmd->Name, STB_GLOBAL, STV_DEFAULT);
491602421cSRui Ueyama   Sym->Visibility = Cmd->Hidden ? STV_HIDDEN : STV_DEFAULT;
501602421cSRui Ueyama   Cmd->Sym = Sym->body();
5120d03194SEugene Leviant 
5220d03194SEugene Leviant   // If we have no SECTIONS then we don't have '.' and don't call
5320d03194SEugene Leviant   // assignAddresses(). We calculate symbol value immediately in this case.
5420d03194SEugene Leviant   if (!ScriptConfig->HasSections)
5520d03194SEugene Leviant     cast<DefinedRegular<ELFT>>(Cmd->Sym)->Value = Cmd->Expression(0);
56ceabe80eSEugene Leviant }
57ceabe80eSEugene Leviant 
580c70d3ccSRui Ueyama template <class ELFT> static void addSynthetic(SymbolAssignment *Cmd) {
59e1937bb5SGeorge Rimar   Symbol *Sym = Symtab<ELFT>::X->addSynthetic(
60e1937bb5SGeorge Rimar       Cmd->Name, nullptr, 0, Cmd->Hidden ? STV_HIDDEN : STV_DEFAULT);
611602421cSRui Ueyama   Cmd->Sym = Sym->body();
62ceabe80eSEugene Leviant }
63ceabe80eSEugene Leviant 
64db741e72SEugene Leviant template <class ELFT> static void addSymbol(SymbolAssignment *Cmd) {
65db741e72SEugene Leviant   if (Cmd->IsAbsolute)
66db741e72SEugene Leviant     addRegular<ELFT>(Cmd);
67db741e72SEugene Leviant   else
68db741e72SEugene Leviant     addSynthetic<ELFT>(Cmd);
69db741e72SEugene Leviant }
701602421cSRui Ueyama // If a symbol was in PROVIDE(), we need to define it only when
711602421cSRui Ueyama // it is an undefined symbol.
721602421cSRui Ueyama template <class ELFT> static bool shouldDefine(SymbolAssignment *Cmd) {
731602421cSRui Ueyama   if (Cmd->Name == ".")
74ceabe80eSEugene Leviant     return false;
751602421cSRui Ueyama   if (!Cmd->Provide)
76ceabe80eSEugene Leviant     return true;
771602421cSRui Ueyama   SymbolBody *B = Symtab<ELFT>::X->find(Cmd->Name);
781602421cSRui Ueyama   return B && B->isUndefined();
79ceabe80eSEugene Leviant }
80ceabe80eSEugene Leviant 
81076fe157SGeorge Rimar bool SymbolAssignment::classof(const BaseCommand *C) {
82076fe157SGeorge Rimar   return C->Kind == AssignmentKind;
83076fe157SGeorge Rimar }
84076fe157SGeorge Rimar 
85076fe157SGeorge Rimar bool OutputSectionCommand::classof(const BaseCommand *C) {
86076fe157SGeorge Rimar   return C->Kind == OutputSectionKind;
87076fe157SGeorge Rimar }
88076fe157SGeorge Rimar 
89eea3114fSGeorge Rimar bool InputSectionDescription::classof(const BaseCommand *C) {
90eea3114fSGeorge Rimar   return C->Kind == InputSectionKind;
91eea3114fSGeorge Rimar }
92eea3114fSGeorge Rimar 
93eefa758eSGeorge Rimar bool AssertCommand::classof(const BaseCommand *C) {
94eefa758eSGeorge Rimar   return C->Kind == AssertKind;
95eefa758eSGeorge Rimar }
96eefa758eSGeorge Rimar 
9736a153cdSRui Ueyama template <class ELFT> static bool isDiscarded(InputSectionBase<ELFT> *S) {
98eea3114fSGeorge Rimar   return !S || !S->Live;
99717677afSRui Ueyama }
100717677afSRui Ueyama 
101f34d0e08SRui Ueyama template <class ELFT> LinkerScript<ELFT>::LinkerScript() {}
102f34d0e08SRui Ueyama template <class ELFT> LinkerScript<ELFT>::~LinkerScript() {}
103f34d0e08SRui Ueyama 
10407320e40SRui Ueyama template <class ELFT>
10507320e40SRui Ueyama bool LinkerScript<ELFT>::shouldKeep(InputSectionBase<ELFT> *S) {
106c91930a1SGeorge Rimar   for (Regex *Re : Opt.KeptSections)
107042a3f20SRafael Espindola     if (Re->match(S->Name))
108eea3114fSGeorge Rimar       return true;
109eea3114fSGeorge Rimar   return false;
110eea3114fSGeorge Rimar }
111eea3114fSGeorge Rimar 
112395281cfSGeorge Rimar static bool fileMatches(const llvm::Regex &FileRe,
113395281cfSGeorge Rimar                         const llvm::Regex &ExcludedFileRe, StringRef Filename) {
114395281cfSGeorge Rimar   return const_cast<Regex &>(FileRe).match(Filename) &&
115395281cfSGeorge Rimar          !const_cast<Regex &>(ExcludedFileRe).match(Filename);
1160659800eSGeorge Rimar }
1170659800eSGeorge Rimar 
118575208caSGeorge Rimar static bool comparePriority(InputSectionData *A, InputSectionData *B) {
119575208caSGeorge Rimar   return getPriority(A->Name) < getPriority(B->Name);
120575208caSGeorge Rimar }
121575208caSGeorge Rimar 
122c0028d3dSRafael Espindola static bool compareName(InputSectionData *A, InputSectionData *B) {
123042a3f20SRafael Espindola   return A->Name < B->Name;
1240702c4e8SGeorge Rimar }
125742c3836SRui Ueyama 
126c0028d3dSRafael Espindola static bool compareAlignment(InputSectionData *A, InputSectionData *B) {
127742c3836SRui Ueyama   // ">" is not a mistake. Larger alignments are placed before smaller
128742c3836SRui Ueyama   // alignments in order to reduce the amount of padding necessary.
129742c3836SRui Ueyama   // This is compatible with GNU.
130742c3836SRui Ueyama   return A->Alignment > B->Alignment;
131742c3836SRui Ueyama }
132742c3836SRui Ueyama 
133c0028d3dSRafael Espindola static std::function<bool(InputSectionData *, InputSectionData *)>
134be394db3SGeorge Rimar getComparator(SortSectionPolicy K) {
135be394db3SGeorge Rimar   switch (K) {
136be394db3SGeorge Rimar   case SortSectionPolicy::Alignment:
137c0028d3dSRafael Espindola     return compareAlignment;
138be394db3SGeorge Rimar   case SortSectionPolicy::Name:
139be394db3SGeorge Rimar     return compareName;
140be394db3SGeorge Rimar   case SortSectionPolicy::Priority:
141be394db3SGeorge Rimar     return comparePriority;
142be394db3SGeorge Rimar   default:
143be394db3SGeorge Rimar     llvm_unreachable("unknown sort policy");
144be394db3SGeorge Rimar   }
145742c3836SRui Ueyama }
1460702c4e8SGeorge Rimar 
1478f66df92SGeorge Rimar static bool checkConstraint(uint64_t Flags, ConstraintKind Kind) {
1488f66df92SGeorge Rimar   bool RO = (Kind == ConstraintKind::ReadOnly);
1498f66df92SGeorge Rimar   bool RW = (Kind == ConstraintKind::ReadWrite);
1508f66df92SGeorge Rimar   bool Writable = Flags & SHF_WRITE;
151adcdb664SRui Ueyama   return !(RO && Writable) && !(RW && !Writable);
1528f66df92SGeorge Rimar }
1538f66df92SGeorge Rimar 
15448c3f1ceSRui Ueyama template <class ELFT>
155e71a3f8aSRafael Espindola static bool matchConstraints(ArrayRef<InputSectionBase<ELFT> *> Sections,
15606ae6836SGeorge Rimar                              ConstraintKind Kind) {
1578f66df92SGeorge Rimar   if (Kind == ConstraintKind::NoConstraint)
1588f66df92SGeorge Rimar     return true;
159d3190795SRafael Espindola   return llvm::all_of(Sections, [=](InputSectionData *Sec2) {
160d3190795SRafael Espindola     auto *Sec = static_cast<InputSectionBase<ELFT> *>(Sec2);
1618f66df92SGeorge Rimar     return checkConstraint(Sec->getSectionHdr()->sh_flags, Kind);
16206ae6836SGeorge Rimar   });
16306ae6836SGeorge Rimar }
16406ae6836SGeorge Rimar 
165d3190795SRafael Espindola // Compute and remember which sections the InputSectionDescription matches.
166be94e1b6SRafael Espindola template <class ELFT>
167e71a3f8aSRafael Espindola void LinkerScript<ELFT>::computeInputSections(InputSectionDescription *I) {
168395281cfSGeorge Rimar   for (const std::pair<llvm::Regex, llvm::Regex> &V : I->SectionsVec) {
169395281cfSGeorge Rimar     for (ObjectFile<ELFT> *F : Symtab<ELFT>::X->getObjectFiles()) {
170395281cfSGeorge Rimar       if (fileMatches(I->FileRe, V.first, sys::path::filename(F->getName()))) {
171395281cfSGeorge Rimar         Regex &Re = const_cast<Regex &>(V.second);
172be94e1b6SRafael Espindola         for (InputSectionBase<ELFT> *S : F->getSections())
173395281cfSGeorge Rimar           if (!isDiscarded(S) && !S->OutSec && Re.match(S->Name))
174d3190795SRafael Espindola             I->Sections.push_back(S);
175be94e1b6SRafael Espindola 
176395281cfSGeorge Rimar         if (Re.match("COMMON"))
177d3190795SRafael Espindola           I->Sections.push_back(CommonInputSection<ELFT>::X);
178395281cfSGeorge Rimar       }
179395281cfSGeorge Rimar     }
180395281cfSGeorge Rimar   }
181d3190795SRafael Espindola 
182*b2a0abdfSRui Ueyama   if (I->SortInner != SortSectionPolicy::Default)
183d3190795SRafael Espindola     std::stable_sort(I->Sections.begin(), I->Sections.end(),
184d3190795SRafael Espindola                      getComparator(I->SortInner));
185*b2a0abdfSRui Ueyama   if (I->SortOuter != SortSectionPolicy::Default)
186d3190795SRafael Espindola     std::stable_sort(I->Sections.begin(), I->Sections.end(),
187d3190795SRafael Espindola                      getComparator(I->SortOuter));
188d3190795SRafael Espindola 
189d3190795SRafael Espindola   // We do not add duplicate input sections, so mark them with a dummy output
190d3190795SRafael Espindola   // section for now.
191d3190795SRafael Espindola   for (InputSectionData *S : I->Sections) {
192d3190795SRafael Espindola     auto *S2 = static_cast<InputSectionBase<ELFT> *>(S);
193d3190795SRafael Espindola     S2->OutSec = (OutputSectionBase<ELFT> *)-1;
194d3190795SRafael Espindola   }
195be94e1b6SRafael Espindola }
196be94e1b6SRafael Espindola 
197be94e1b6SRafael Espindola template <class ELFT>
198be94e1b6SRafael Espindola void LinkerScript<ELFT>::discard(ArrayRef<InputSectionBase<ELFT> *> V) {
199be94e1b6SRafael Espindola   for (InputSectionBase<ELFT> *S : V) {
200be94e1b6SRafael Espindola     S->Live = false;
201be94e1b6SRafael Espindola     reportDiscarded(S);
202be94e1b6SRafael Espindola   }
203be94e1b6SRafael Espindola }
204be94e1b6SRafael Espindola 
20506ae6836SGeorge Rimar template <class ELFT>
2060b9ce6a4SRui Ueyama std::vector<InputSectionBase<ELFT> *>
20706ae6836SGeorge Rimar LinkerScript<ELFT>::createInputSectionList(OutputSectionCommand &OutCmd) {
2080b9ce6a4SRui Ueyama   std::vector<InputSectionBase<ELFT> *> Ret;
209e7f912cdSRui Ueyama 
21006ae6836SGeorge Rimar   for (const std::unique_ptr<BaseCommand> &Base : OutCmd.Commands) {
2117c3ff2ebSRafael Espindola     auto *Cmd = dyn_cast<InputSectionDescription>(Base.get());
2127c3ff2ebSRafael Espindola     if (!Cmd)
2130b9ce6a4SRui Ueyama       continue;
214e71a3f8aSRafael Espindola     computeInputSections(Cmd);
215d3190795SRafael Espindola     for (InputSectionData *S : Cmd->Sections)
216d3190795SRafael Espindola       Ret.push_back(static_cast<InputSectionBase<ELFT> *>(S));
2170b9ce6a4SRui Ueyama   }
218e71a3f8aSRafael Espindola 
2190b9ce6a4SRui Ueyama   return Ret;
2200b9ce6a4SRui Ueyama }
2210b9ce6a4SRui Ueyama 
222e5d3ca50SPetr Hosek template <class ELFT>
22310897f18SRafael Espindola static SectionKey<ELFT::Is64Bits> createKey(InputSectionBase<ELFT> *C,
22410897f18SRafael Espindola                                             StringRef OutsecName) {
22510897f18SRafael Espindola   // When using linker script the merge rules are different.
22610897f18SRafael Espindola   // Unfortunately, linker scripts are name based. This means that expressions
22710897f18SRafael Espindola   // like *(.foo*) can refer to multiple input sections that would normally be
22810897f18SRafael Espindola   // placed in different output sections. We cannot put them in different
22910897f18SRafael Espindola   // output sections or we would produce wrong results for
23010897f18SRafael Espindola   // start = .; *(.foo.*) end = .; *(.bar)
23110897f18SRafael Espindola   // and a mapping of .foo1 and .bar1 to one section and .foo2 and .bar2 to
23210897f18SRafael Espindola   // another. The problem is that there is no way to layout those output
23310897f18SRafael Espindola   // sections such that the .foo sections are the only thing between the
23410897f18SRafael Espindola   // start and end symbols.
23510897f18SRafael Espindola 
23610897f18SRafael Espindola   // An extra annoyance is that we cannot simply disable merging of the contents
23710897f18SRafael Espindola   // of SHF_MERGE sections, but our implementation requires one output section
23810897f18SRafael Espindola   // per "kind" (string or not, which size/aligment).
23910897f18SRafael Espindola   // Fortunately, creating symbols in the middle of a merge section is not
24010897f18SRafael Espindola   // supported by bfd or gold, so we can just create multiple section in that
24110897f18SRafael Espindola   // case.
24210897f18SRafael Espindola   const typename ELFT::Shdr *H = C->getSectionHdr();
24310897f18SRafael Espindola   typedef typename ELFT::uint uintX_t;
24410897f18SRafael Espindola   uintX_t Flags = H->sh_flags & (SHF_MERGE | SHF_STRINGS);
24510897f18SRafael Espindola 
24610897f18SRafael Espindola   uintX_t Alignment = 0;
24710897f18SRafael Espindola   if (isa<MergeInputSection<ELFT>>(C))
24810897f18SRafael Espindola     Alignment = std::max(H->sh_addralign, H->sh_entsize);
24910897f18SRafael Espindola 
25010897f18SRafael Espindola   return SectionKey<ELFT::Is64Bits>{OutsecName, /*Type*/ 0, Flags, Alignment};
25110897f18SRafael Espindola }
25210897f18SRafael Espindola 
25310897f18SRafael Espindola template <class ELFT>
25420d03194SEugene Leviant void LinkerScript<ELFT>::addSection(OutputSectionFactory<ELFT> &Factory,
25520d03194SEugene Leviant                                     InputSectionBase<ELFT> *Sec,
25620d03194SEugene Leviant                                     StringRef Name) {
25728c1597aSRafael Espindola   OutputSectionBase<ELFT> *OutSec;
25828c1597aSRafael Espindola   bool IsNew;
25910897f18SRafael Espindola   std::tie(OutSec, IsNew) = Factory.create(createKey(Sec, Name), Sec);
26028c1597aSRafael Espindola   if (IsNew)
26128c1597aSRafael Espindola     OutputSections->push_back(OutSec);
26220d03194SEugene Leviant   OutSec->addSection(Sec);
26320d03194SEugene Leviant }
26420d03194SEugene Leviant 
26520d03194SEugene Leviant template <class ELFT>
26620d03194SEugene Leviant void LinkerScript<ELFT>::processCommands(OutputSectionFactory<ELFT> &Factory) {
26728c1597aSRafael Espindola 
2687c3ff2ebSRafael Espindola   for (unsigned I = 0; I < Opt.Commands.size(); ++I) {
2697c3ff2ebSRafael Espindola     auto Iter = Opt.Commands.begin() + I;
2707c3ff2ebSRafael Espindola     const std::unique_ptr<BaseCommand> &Base1 = *Iter;
2712ab5f73dSRui Ueyama     if (auto *Cmd = dyn_cast<SymbolAssignment>(Base1.get())) {
2722ab5f73dSRui Ueyama       if (shouldDefine<ELFT>(Cmd))
2732ab5f73dSRui Ueyama         addRegular<ELFT>(Cmd);
2742ab5f73dSRui Ueyama       continue;
2752ab5f73dSRui Ueyama     }
27620d03194SEugene Leviant     if (auto *Cmd = dyn_cast<AssertCommand>(Base1.get())) {
27720d03194SEugene Leviant       // If we don't have SECTIONS then output sections have already been
27820d03194SEugene Leviant       // created by Writer<EFLT>. The LinkerScript<ELFT>::assignAddresses
27920d03194SEugene Leviant       // will not be called, so ASSERT should be evaluated now.
28020d03194SEugene Leviant       if (!Opt.HasSections)
28120d03194SEugene Leviant         Cmd->Expression(0);
28220d03194SEugene Leviant       continue;
28320d03194SEugene Leviant     }
2842ab5f73dSRui Ueyama 
285ceabe80eSEugene Leviant     if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base1.get())) {
2867bd37870SRafael Espindola       std::vector<InputSectionBase<ELFT> *> V = createInputSectionList(*Cmd);
2877bd37870SRafael Espindola 
28848c3f1ceSRui Ueyama       if (Cmd->Name == "/DISCARD/") {
2897bd37870SRafael Espindola         discard(V);
29048c3f1ceSRui Ueyama         continue;
29148c3f1ceSRui Ueyama       }
2920b9ce6a4SRui Ueyama 
2937c3ff2ebSRafael Espindola       if (!matchConstraints<ELFT>(V, Cmd->Constraint)) {
2947c3ff2ebSRafael Espindola         for (InputSectionBase<ELFT> *S : V)
2957c3ff2ebSRafael Espindola           S->OutSec = nullptr;
2967c3ff2ebSRafael Espindola         Opt.Commands.erase(Iter);
2977c3ff2ebSRafael Espindola         continue;
2987c3ff2ebSRafael Espindola       }
2997c3ff2ebSRafael Espindola 
3007c3ff2ebSRafael Espindola       for (const std::unique_ptr<BaseCommand> &Base : Cmd->Commands)
3017c3ff2ebSRafael Espindola         if (auto *OutCmd = dyn_cast<SymbolAssignment>(Base.get()))
3027c3ff2ebSRafael Espindola           if (shouldDefine<ELFT>(OutCmd))
3037c3ff2ebSRafael Espindola             addSymbol<ELFT>(OutCmd);
3047c3ff2ebSRafael Espindola 
30597403d15SEugene Leviant       if (V.empty())
3060b9ce6a4SRui Ueyama         continue;
3070b9ce6a4SRui Ueyama 
308a14b13d8SGeorge Rimar       for (InputSectionBase<ELFT> *Sec : V) {
30920d03194SEugene Leviant         addSection(Factory, Sec, Cmd->Name);
31020d03194SEugene Leviant         if (uint32_t Subalign = Cmd->SubalignExpr ? Cmd->SubalignExpr(0) : 0)
311db24d9c3SGeorge Rimar           Sec->Alignment = Subalign;
31220d03194SEugene Leviant       }
313eea3114fSGeorge Rimar     }
31448c3f1ceSRui Ueyama   }
315db24d9c3SGeorge Rimar }
316e63d81bdSEugene Leviant 
31720d03194SEugene Leviant template <class ELFT>
31820d03194SEugene Leviant void LinkerScript<ELFT>::createSections(OutputSectionFactory<ELFT> &Factory) {
31920d03194SEugene Leviant   processCommands(Factory);
3200b9ce6a4SRui Ueyama   // Add orphan sections.
32120d03194SEugene Leviant   for (ObjectFile<ELFT> *F : Symtab<ELFT>::X->getObjectFiles())
32220d03194SEugene Leviant     for (InputSectionBase<ELFT> *S : F->getSections())
32320d03194SEugene Leviant       if (!isDiscarded(S) && !S->OutSec)
32420d03194SEugene Leviant         addSection(Factory, S, getOutputSectionName(S));
325e63d81bdSEugene Leviant }
326e63d81bdSEugene Leviant 
327db741e72SEugene Leviant // Sets value of a section-defined symbol. Two kinds of
328db741e72SEugene Leviant // symbols are processed: synthetic symbols, whose value
329db741e72SEugene Leviant // is an offset from beginning of section and regular
330db741e72SEugene Leviant // symbols whose value is absolute.
331db741e72SEugene Leviant template <class ELFT>
332db741e72SEugene Leviant static void assignSectionSymbol(SymbolAssignment *Cmd,
333db741e72SEugene Leviant                                 OutputSectionBase<ELFT> *Sec,
334db741e72SEugene Leviant                                 typename ELFT::uint Off) {
335db741e72SEugene Leviant   if (!Cmd->Sym)
336db741e72SEugene Leviant     return;
337db741e72SEugene Leviant 
338db741e72SEugene Leviant   if (auto *Body = dyn_cast<DefinedSynthetic<ELFT>>(Cmd->Sym)) {
339db741e72SEugene Leviant     Body->Section = Sec;
340db741e72SEugene Leviant     Body->Value = Cmd->Expression(Sec->getVA() + Off) - Sec->getVA();
341db741e72SEugene Leviant     return;
342db741e72SEugene Leviant   }
343db741e72SEugene Leviant   auto *Body = cast<DefinedRegular<ELFT>>(Cmd->Sym);
344db741e72SEugene Leviant   Body->Value = Cmd->Expression(Sec->getVA() + Off);
345db741e72SEugene Leviant }
346db741e72SEugene Leviant 
347d3190795SRafael Espindola template <class ELFT> void LinkerScript<ELFT>::output(InputSection<ELFT> *S) {
348d3190795SRafael Espindola   if (!AlreadyOutputIS.insert(S).second)
349ceabe80eSEugene Leviant     return;
350d3190795SRafael Espindola   bool IsTbss =
351d3190795SRafael Espindola       (CurOutSec->getFlags() & SHF_TLS) && CurOutSec->getType() == SHT_NOBITS;
352d3190795SRafael Espindola 
353d3190795SRafael Espindola   uintX_t Pos = IsTbss ? Dot + ThreadBssOffset : Dot;
354d3190795SRafael Espindola   Pos = alignTo(Pos, S->Alignment);
355d3190795SRafael Espindola   S->OutSecOff = Pos - CurOutSec->getVA();
356d3190795SRafael Espindola   Pos += S->getSize();
357d3190795SRafael Espindola 
358d3190795SRafael Espindola   // Update output section size after adding each section. This is so that
359d3190795SRafael Espindola   // SIZEOF works correctly in the case below:
360d3190795SRafael Espindola   // .foo { *(.aaa) a = SIZEOF(.foo); *(.bbb) }
361d3190795SRafael Espindola   CurOutSec->setSize(Pos - CurOutSec->getVA());
362d3190795SRafael Espindola 
363d3190795SRafael Espindola   if (!IsTbss)
364d3190795SRafael Espindola     Dot = Pos;
3652de509c3SRui Ueyama }
366ceabe80eSEugene Leviant 
367d3190795SRafael Espindola template <class ELFT> void LinkerScript<ELFT>::flush() {
368d3190795SRafael Espindola   if (auto *OutSec = dyn_cast_or_null<OutputSection<ELFT>>(CurOutSec)) {
369d3190795SRafael Espindola     for (InputSection<ELFT> *I : OutSec->Sections)
370d3190795SRafael Espindola       output(I);
371d3190795SRafael Espindola     AlreadyOutputOS.insert(CurOutSec);
372d3190795SRafael Espindola   }
373d3190795SRafael Espindola }
37497403d15SEugene Leviant 
375d3190795SRafael Espindola template <class ELFT>
376d3190795SRafael Espindola void LinkerScript<ELFT>::switchTo(OutputSectionBase<ELFT> *Sec) {
377d3190795SRafael Espindola   if (CurOutSec == Sec)
378d3190795SRafael Espindola     return;
379d3190795SRafael Espindola   if (AlreadyOutputOS.count(Sec))
380d3190795SRafael Espindola     return;
381d3190795SRafael Espindola 
382d3190795SRafael Espindola   flush();
383d3190795SRafael Espindola   CurOutSec = Sec;
384d3190795SRafael Espindola 
385d3190795SRafael Espindola   Dot = alignTo(Dot, CurOutSec->getAlignment());
386d3190795SRafael Espindola   CurOutSec->setVA(Dot);
387d3190795SRafael Espindola }
388d3190795SRafael Espindola 
389d3190795SRafael Espindola template <class ELFT> void LinkerScript<ELFT>::process(BaseCommand &Base) {
390d3190795SRafael Espindola   if (auto *AssignCmd = dyn_cast<SymbolAssignment>(&Base)) {
39197403d15SEugene Leviant     if (AssignCmd->Name == ".") {
39297403d15SEugene Leviant       // Update to location counter means update to section size.
393d3190795SRafael Espindola       Dot = AssignCmd->Expression(Dot);
394d3190795SRafael Espindola       CurOutSec->setSize(Dot - CurOutSec->getVA());
395d3190795SRafael Espindola       return;
39697403d15SEugene Leviant     }
397d3190795SRafael Espindola     assignSectionSymbol<ELFT>(AssignCmd, CurOutSec, Dot - CurOutSec->getVA());
398d3190795SRafael Espindola     return;
39997403d15SEugene Leviant   }
400d3190795SRafael Espindola   auto &ICmd = cast<InputSectionDescription>(Base);
401d3190795SRafael Espindola   for (InputSectionData *ID : ICmd.Sections) {
402d3190795SRafael Espindola     auto *IB = static_cast<InputSectionBase<ELFT> *>(ID);
403d3190795SRafael Espindola     switchTo(IB->OutSec);
404d3190795SRafael Espindola     if (auto *I = dyn_cast<InputSection<ELFT>>(IB))
405d3190795SRafael Espindola       output(I);
406d3190795SRafael Espindola     else if (AlreadyOutputOS.insert(CurOutSec).second)
407d3190795SRafael Espindola       Dot += CurOutSec->getSize();
408ceabe80eSEugene Leviant   }
409ceabe80eSEugene Leviant }
410ceabe80eSEugene Leviant 
4118f66df92SGeorge Rimar template <class ELFT>
412a14b13d8SGeorge Rimar static std::vector<OutputSectionBase<ELFT> *>
413a14b13d8SGeorge Rimar findSections(OutputSectionCommand &Cmd,
414d3190795SRafael Espindola              const std::vector<OutputSectionBase<ELFT> *> &Sections) {
415a14b13d8SGeorge Rimar   std::vector<OutputSectionBase<ELFT> *> Ret;
416a14b13d8SGeorge Rimar   for (OutputSectionBase<ELFT> *Sec : Sections)
4177c3ff2ebSRafael Espindola     if (Sec->getName() == Cmd.Name)
418a14b13d8SGeorge Rimar       Ret.push_back(Sec);
419a14b13d8SGeorge Rimar   return Ret;
4208f66df92SGeorge Rimar }
4218f66df92SGeorge Rimar 
422d3190795SRafael Espindola template <class ELFT>
423d3190795SRafael Espindola void LinkerScript<ELFT>::assignOffsets(OutputSectionCommand *Cmd) {
424d3190795SRafael Espindola   std::vector<OutputSectionBase<ELFT> *> Sections =
425d3190795SRafael Espindola       findSections(*Cmd, *OutputSections);
426d3190795SRafael Espindola   if (Sections.empty())
427d3190795SRafael Espindola     return;
428d3190795SRafael Espindola   switchTo(Sections[0]);
429d3190795SRafael Espindola 
430d3190795SRafael Espindola   // Find the last section output location. We will output orphan sections
431d3190795SRafael Espindola   // there so that end symbols point to the correct location.
432d3190795SRafael Espindola   auto E = std::find_if(Cmd->Commands.rbegin(), Cmd->Commands.rend(),
433d3190795SRafael Espindola                         [](const std::unique_ptr<BaseCommand> &Cmd) {
434d3190795SRafael Espindola                           return !isa<SymbolAssignment>(*Cmd);
435d3190795SRafael Espindola                         })
436d3190795SRafael Espindola                .base();
437d3190795SRafael Espindola   for (auto I = Cmd->Commands.begin(); I != E; ++I)
438d3190795SRafael Espindola     process(**I);
439d3190795SRafael Espindola   flush();
440d3190795SRafael Espindola   for (OutputSectionBase<ELFT> *Base : Sections) {
441d3190795SRafael Espindola     if (!AlreadyOutputOS.insert(Base).second)
442d3190795SRafael Espindola       continue;
443d3190795SRafael Espindola     switchTo(Base);
444d3190795SRafael Espindola     Dot += CurOutSec->getSize();
445d3190795SRafael Espindola   }
446d3190795SRafael Espindola   for (auto I = E, E = Cmd->Commands.end(); I != E; ++I)
447d3190795SRafael Espindola     process(**I);
448d3190795SRafael Espindola }
449d3190795SRafael Espindola 
450a4b41dcaSRafael Espindola template <class ELFT> void LinkerScript<ELFT>::assignAddresses() {
451652852c5SGeorge Rimar   // Orphan sections are sections present in the input files which
4527c18c28cSRui Ueyama   // are not explicitly placed into the output file by the linker script.
4537c18c28cSRui Ueyama   // We place orphan sections at end of file.
4547c18c28cSRui Ueyama   // Other linkers places them using some heuristics as described in
455652852c5SGeorge Rimar   // https://sourceware.org/binutils/docs/ld/Orphan-Sections.html#Orphan-Sections.
456e5cc668eSRui Ueyama   for (OutputSectionBase<ELFT> *Sec : *OutputSections) {
457652852c5SGeorge Rimar     StringRef Name = Sec->getName();
458c3e2a4b0SRui Ueyama     if (getSectionIndex(Name) == INT_MAX)
459076fe157SGeorge Rimar       Opt.Commands.push_back(llvm::make_unique<OutputSectionCommand>(Name));
460652852c5SGeorge Rimar   }
461652852c5SGeorge Rimar 
4627c18c28cSRui Ueyama   // Assign addresses as instructed by linker script SECTIONS sub-commands.
4634f7500bfSRui Ueyama   Dot = getHeaderSize();
464467c4d55SEugene Leviant   uintX_t MinVA = std::numeric_limits<uintX_t>::max();
465652852c5SGeorge Rimar 
466076fe157SGeorge Rimar   for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands) {
467076fe157SGeorge Rimar     if (auto *Cmd = dyn_cast<SymbolAssignment>(Base.get())) {
4688d083e6aSRui Ueyama       if (Cmd->Name == ".") {
4698d083e6aSRui Ueyama         Dot = Cmd->Expression(Dot);
4708d083e6aSRui Ueyama       } else if (Cmd->Sym) {
4718d083e6aSRui Ueyama         cast<DefinedRegular<ELFT>>(Cmd->Sym)->Value = Cmd->Expression(Dot);
4728d083e6aSRui Ueyama       }
47305ef4cffSRui Ueyama       continue;
474652852c5SGeorge Rimar     }
475652852c5SGeorge Rimar 
476eefa758eSGeorge Rimar     if (auto *Cmd = dyn_cast<AssertCommand>(Base.get())) {
477eefa758eSGeorge Rimar       Cmd->Expression(Dot);
478eefa758eSGeorge Rimar       continue;
479eefa758eSGeorge Rimar     }
480eefa758eSGeorge Rimar 
481076fe157SGeorge Rimar     auto *Cmd = cast<OutputSectionCommand>(Base.get());
482652852c5SGeorge Rimar 
48358e5c4dcSGeorge Rimar     if (Cmd->AddrExpr)
48458e5c4dcSGeorge Rimar       Dot = Cmd->AddrExpr(Dot);
48558e5c4dcSGeorge Rimar 
486467c4d55SEugene Leviant     MinVA = std::min(MinVA, Dot);
487d3190795SRafael Espindola     assignOffsets(Cmd);
488a14b13d8SGeorge Rimar   }
489467c4d55SEugene Leviant 
490d3190795SRafael Espindola   for (OutputSectionBase<ELFT> *Sec : *OutputSections)
491d3190795SRafael Espindola     if (!(Sec->getFlags() & SHF_ALLOC))
492d3190795SRafael Espindola       Sec->setVA(0);
4934ec013acSRafael Espindola   uintX_t HeaderSize =
4944ec013acSRafael Espindola       Out<ELFT>::ElfHeader->getSize() + Out<ELFT>::ProgramHeaders->getSize();
4954ec013acSRafael Espindola   if (HeaderSize > MinVA)
4964ec013acSRafael Espindola     fatal("Not enough space for ELF and program headers");
4974ec013acSRafael Espindola 
49864c32d6fSRafael Espindola   // ELF and Program headers need to be right before the first section in
499b91e7118SGeorge Rimar   // memory. Set their addresses accordingly.
5004ec013acSRafael Espindola   MinVA = alignDown(MinVA - HeaderSize, Target->PageSize);
501467c4d55SEugene Leviant   Out<ELFT>::ElfHeader->setVA(MinVA);
502467c4d55SEugene Leviant   Out<ELFT>::ProgramHeaders->setVA(Out<ELFT>::ElfHeader->getSize() + MinVA);
503fb8978fcSDima Stepanov }
504652852c5SGeorge Rimar 
505464daadcSRui Ueyama // Creates program headers as instructed by PHDRS linker script command.
50607320e40SRui Ueyama template <class ELFT>
507a4b41dcaSRafael Espindola std::vector<PhdrEntry<ELFT>> LinkerScript<ELFT>::createPhdrs() {
508edebbdf1SRui Ueyama   std::vector<PhdrEntry<ELFT>> Ret;
509bbe38602SEugene Leviant 
510464daadcSRui Ueyama   // Process PHDRS and FILEHDR keywords because they are not
511464daadcSRui Ueyama   // real output sections and cannot be added in the following loop.
512bbe38602SEugene Leviant   for (const PhdrsCommand &Cmd : Opt.PhdrsCommands) {
513edebbdf1SRui Ueyama     Ret.emplace_back(Cmd.Type, Cmd.Flags == UINT_MAX ? PF_R : Cmd.Flags);
514edebbdf1SRui Ueyama     PhdrEntry<ELFT> &Phdr = Ret.back();
515bbe38602SEugene Leviant 
516bbe38602SEugene Leviant     if (Cmd.HasFilehdr)
517adca245fSRui Ueyama       Phdr.add(Out<ELFT>::ElfHeader);
518bbe38602SEugene Leviant     if (Cmd.HasPhdrs)
519adca245fSRui Ueyama       Phdr.add(Out<ELFT>::ProgramHeaders);
52056b21c86SEugene Leviant 
52156b21c86SEugene Leviant     if (Cmd.LMAExpr) {
52256b21c86SEugene Leviant       Phdr.H.p_paddr = Cmd.LMAExpr(0);
52356b21c86SEugene Leviant       Phdr.HasLMA = true;
52456b21c86SEugene Leviant     }
525bbe38602SEugene Leviant   }
526bbe38602SEugene Leviant 
527464daadcSRui Ueyama   // Add output sections to program headers.
528edebbdf1SRui Ueyama   PhdrEntry<ELFT> *Load = nullptr;
529edebbdf1SRui Ueyama   uintX_t Flags = PF_R;
530464daadcSRui Ueyama   for (OutputSectionBase<ELFT> *Sec : *OutputSections) {
531bbe38602SEugene Leviant     if (!(Sec->getFlags() & SHF_ALLOC))
532bbe38602SEugene Leviant       break;
533bbe38602SEugene Leviant 
534edebbdf1SRui Ueyama     std::vector<size_t> PhdrIds = getPhdrIndices(Sec->getName());
535bbe38602SEugene Leviant     if (!PhdrIds.empty()) {
536bbe38602SEugene Leviant       // Assign headers specified by linker script
537bbe38602SEugene Leviant       for (size_t Id : PhdrIds) {
538edebbdf1SRui Ueyama         Ret[Id].add(Sec);
539865bf863SEugene Leviant         if (Opt.PhdrsCommands[Id].Flags == UINT_MAX)
5400b113671SRafael Espindola           Ret[Id].H.p_flags |= Sec->getPhdrFlags();
541bbe38602SEugene Leviant       }
542bbe38602SEugene Leviant     } else {
543bbe38602SEugene Leviant       // If we have no load segment or flags've changed then we want new load
544bbe38602SEugene Leviant       // segment.
5450b113671SRafael Espindola       uintX_t NewFlags = Sec->getPhdrFlags();
546bbe38602SEugene Leviant       if (Load == nullptr || Flags != NewFlags) {
547edebbdf1SRui Ueyama         Load = &*Ret.emplace(Ret.end(), PT_LOAD, NewFlags);
548bbe38602SEugene Leviant         Flags = NewFlags;
549bbe38602SEugene Leviant       }
55018f084ffSRui Ueyama       Load->add(Sec);
551bbe38602SEugene Leviant     }
552bbe38602SEugene Leviant   }
553edebbdf1SRui Ueyama   return Ret;
554bbe38602SEugene Leviant }
555bbe38602SEugene Leviant 
556f9bc3bd2SEugene Leviant template <class ELFT> bool LinkerScript<ELFT>::ignoreInterpSection() {
557f9bc3bd2SEugene Leviant   // Ignore .interp section in case we have PHDRS specification
558f9bc3bd2SEugene Leviant   // and PT_INTERP isn't listed.
559f9bc3bd2SEugene Leviant   return !Opt.PhdrsCommands.empty() &&
560f9bc3bd2SEugene Leviant          llvm::find_if(Opt.PhdrsCommands, [](const PhdrsCommand &Cmd) {
561f9bc3bd2SEugene Leviant            return Cmd.Type == PT_INTERP;
562f9bc3bd2SEugene Leviant          }) == Opt.PhdrsCommands.end();
563f9bc3bd2SEugene Leviant }
564f9bc3bd2SEugene Leviant 
565bbe38602SEugene Leviant template <class ELFT>
56607320e40SRui Ueyama ArrayRef<uint8_t> LinkerScript<ELFT>::getFiller(StringRef Name) {
567f6c3ccefSGeorge Rimar   for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands)
568f6c3ccefSGeorge Rimar     if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get()))
569f6c3ccefSGeorge Rimar       if (Cmd->Name == Name)
570f6c3ccefSGeorge Rimar         return Cmd->Filler;
571e2ee72b5SGeorge Rimar   return {};
572e2ee72b5SGeorge Rimar }
573e2ee72b5SGeorge Rimar 
574206fffa1SGeorge Rimar template <class ELFT> Expr LinkerScript<ELFT>::getLma(StringRef Name) {
5758ceadb38SGeorge Rimar   for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands)
5768ceadb38SGeorge Rimar     if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get()))
5778ceadb38SGeorge Rimar       if (Cmd->LmaExpr && Cmd->Name == Name)
5788ceadb38SGeorge Rimar         return Cmd->LmaExpr;
5798ceadb38SGeorge Rimar   return {};
5808ceadb38SGeorge Rimar }
5818ceadb38SGeorge Rimar 
582c3e2a4b0SRui Ueyama // Returns the index of the given section name in linker script
583c3e2a4b0SRui Ueyama // SECTIONS commands. Sections are laid out as the same order as they
584c3e2a4b0SRui Ueyama // were in the script. If a given name did not appear in the script,
585c3e2a4b0SRui Ueyama // it returns INT_MAX, so that it will be laid out at end of file.
586076fe157SGeorge Rimar template <class ELFT> int LinkerScript<ELFT>::getSectionIndex(StringRef Name) {
587f510fa6bSRui Ueyama   int I = 0;
588f510fa6bSRui Ueyama   for (std::unique_ptr<BaseCommand> &Base : Opt.Commands) {
589076fe157SGeorge Rimar     if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get()))
590076fe157SGeorge Rimar       if (Cmd->Name == Name)
591f510fa6bSRui Ueyama         return I;
592f510fa6bSRui Ueyama     ++I;
593f510fa6bSRui Ueyama   }
594f510fa6bSRui Ueyama   return INT_MAX;
59571b26e94SGeorge Rimar }
59671b26e94SGeorge Rimar 
59771b26e94SGeorge Rimar // A compartor to sort output sections. Returns -1 or 1 if
59871b26e94SGeorge Rimar // A or B are mentioned in linker script. Otherwise, returns 0.
59907320e40SRui Ueyama template <class ELFT>
60007320e40SRui Ueyama int LinkerScript<ELFT>::compareSections(StringRef A, StringRef B) {
601c3e2a4b0SRui Ueyama   int I = getSectionIndex(A);
602c3e2a4b0SRui Ueyama   int J = getSectionIndex(B);
603c3e2a4b0SRui Ueyama   if (I == INT_MAX && J == INT_MAX)
604717677afSRui Ueyama     return 0;
605717677afSRui Ueyama   return I < J ? -1 : 1;
606717677afSRui Ueyama }
607717677afSRui Ueyama 
608bbe38602SEugene Leviant template <class ELFT> bool LinkerScript<ELFT>::hasPhdrsCommands() {
609bbe38602SEugene Leviant   return !Opt.PhdrsCommands.empty();
610bbe38602SEugene Leviant }
611bbe38602SEugene Leviant 
6129e69450eSGeorge Rimar template <class ELFT>
613884e786dSGeorge Rimar uint64_t LinkerScript<ELFT>::getOutputSectionAddress(StringRef Name) {
61496659df0SGeorge Rimar   for (OutputSectionBase<ELFT> *Sec : *OutputSections)
61596659df0SGeorge Rimar     if (Sec->getName() == Name)
61696659df0SGeorge Rimar       return Sec->getVA();
61796659df0SGeorge Rimar   error("undefined section " + Name);
61896659df0SGeorge Rimar   return 0;
61996659df0SGeorge Rimar }
62096659df0SGeorge Rimar 
62196659df0SGeorge Rimar template <class ELFT>
622884e786dSGeorge Rimar uint64_t LinkerScript<ELFT>::getOutputSectionSize(StringRef Name) {
6239e69450eSGeorge Rimar   for (OutputSectionBase<ELFT> *Sec : *OutputSections)
6249e69450eSGeorge Rimar     if (Sec->getName() == Name)
6259e69450eSGeorge Rimar       return Sec->getSize();
6269e69450eSGeorge Rimar   error("undefined section " + Name);
6279e69450eSGeorge Rimar   return 0;
6289e69450eSGeorge Rimar }
6299e69450eSGeorge Rimar 
63036fac7f0SEugene Leviant template <class ELFT>
63136fac7f0SEugene Leviant uint64_t LinkerScript<ELFT>::getOutputSectionAlign(StringRef Name) {
63236fac7f0SEugene Leviant   for (OutputSectionBase<ELFT> *Sec : *OutputSections)
63336fac7f0SEugene Leviant     if (Sec->getName() == Name)
63436fac7f0SEugene Leviant       return Sec->getAlignment();
63536fac7f0SEugene Leviant   error("undefined section " + Name);
63636fac7f0SEugene Leviant   return 0;
63736fac7f0SEugene Leviant }
63836fac7f0SEugene Leviant 
639884e786dSGeorge Rimar template <class ELFT> uint64_t LinkerScript<ELFT>::getHeaderSize() {
640e32a3598SGeorge Rimar   return Out<ELFT>::ElfHeader->getSize() + Out<ELFT>::ProgramHeaders->getSize();
641e32a3598SGeorge Rimar }
642e32a3598SGeorge Rimar 
643884e786dSGeorge Rimar template <class ELFT> uint64_t LinkerScript<ELFT>::getSymbolValue(StringRef S) {
644884e786dSGeorge Rimar   if (SymbolBody *B = Symtab<ELFT>::X->find(S))
645884e786dSGeorge Rimar     return B->getVA<ELFT>();
646884e786dSGeorge Rimar   error("symbol not found: " + S);
647884e786dSGeorge Rimar   return 0;
648884e786dSGeorge Rimar }
649884e786dSGeorge Rimar 
650bbe38602SEugene Leviant // Returns indices of ELF headers containing specific section, identified
651bbe38602SEugene Leviant // by Name. Each index is a zero based number of ELF header listed within
652bbe38602SEugene Leviant // PHDRS {} script block.
653bbe38602SEugene Leviant template <class ELFT>
654edebbdf1SRui Ueyama std::vector<size_t> LinkerScript<ELFT>::getPhdrIndices(StringRef SectionName) {
655076fe157SGeorge Rimar   for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands) {
656076fe157SGeorge Rimar     auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get());
657edebbdf1SRui Ueyama     if (!Cmd || Cmd->Name != SectionName)
65831d842f5SGeorge Rimar       continue;
65931d842f5SGeorge Rimar 
66029c5a2a9SRui Ueyama     std::vector<size_t> Ret;
66129c5a2a9SRui Ueyama     for (StringRef PhdrName : Cmd->Phdrs)
66229c5a2a9SRui Ueyama       Ret.push_back(getPhdrIndex(PhdrName));
66329c5a2a9SRui Ueyama     return Ret;
664bbe38602SEugene Leviant   }
66531d842f5SGeorge Rimar   return {};
66631d842f5SGeorge Rimar }
667bbe38602SEugene Leviant 
66829c5a2a9SRui Ueyama template <class ELFT>
66929c5a2a9SRui Ueyama size_t LinkerScript<ELFT>::getPhdrIndex(StringRef PhdrName) {
67029c5a2a9SRui Ueyama   size_t I = 0;
67129c5a2a9SRui Ueyama   for (PhdrsCommand &Cmd : Opt.PhdrsCommands) {
67229c5a2a9SRui Ueyama     if (Cmd.Name == PhdrName)
67329c5a2a9SRui Ueyama       return I;
67429c5a2a9SRui Ueyama     ++I;
67529c5a2a9SRui Ueyama   }
67629c5a2a9SRui Ueyama   error("section header '" + PhdrName + "' is not listed in PHDRS");
67729c5a2a9SRui Ueyama   return 0;
67829c5a2a9SRui Ueyama }
67929c5a2a9SRui Ueyama 
68007320e40SRui Ueyama class elf::ScriptParser : public ScriptParserBase {
681c3794e58SGeorge Rimar   typedef void (ScriptParser::*Handler)();
682c3794e58SGeorge Rimar 
683f7c5fbb1SRui Ueyama public:
68407320e40SRui Ueyama   ScriptParser(StringRef S, bool B) : ScriptParserBase(S), IsUnderSysroot(B) {}
685f23b2320SGeorge Rimar 
68620b6598cSGeorge Rimar   void readLinkerScript();
68720b6598cSGeorge Rimar   void readVersionScript();
688f7c5fbb1SRui Ueyama 
689f7c5fbb1SRui Ueyama private:
69052a1509eSRui Ueyama   void addFile(StringRef Path);
69152a1509eSRui Ueyama 
692f7c5fbb1SRui Ueyama   void readAsNeeded();
69390c5099eSDenis Protivensky   void readEntry();
69483f406cfSGeorge Rimar   void readExtern();
695f7c5fbb1SRui Ueyama   void readGroup();
69631aa1f83SRui Ueyama   void readInclude();
697ee59282bSRui Ueyama   void readOutput();
6989159ce93SDavide Italiano   void readOutputArch();
699f7c5fbb1SRui Ueyama   void readOutputFormat();
700bbe38602SEugene Leviant   void readPhdrs();
70168a39a65SDavide Italiano   void readSearchDir();
7028e3b38abSDenis Protivensky   void readSections();
70395769b4aSRui Ueyama   void readVersion();
70495769b4aSRui Ueyama   void readVersionScriptCommand();
7058e3b38abSDenis Protivensky 
706113cdec9SRui Ueyama   SymbolAssignment *readAssignment(StringRef Name);
707ff1f29e0SGeorge Rimar   std::vector<uint8_t> readFill();
70810416564SRui Ueyama   OutputSectionCommand *readOutputSectionDescription(StringRef OutSec);
709ff1f29e0SGeorge Rimar   std::vector<uint8_t> readOutputSectionFiller(StringRef Tok);
710bbe38602SEugene Leviant   std::vector<StringRef> readOutputSectionPhdrs();
711a2496cbeSGeorge Rimar   InputSectionDescription *readInputSectionDescription(StringRef Tok);
712c91930a1SGeorge Rimar   Regex readFilePatterns();
713395281cfSGeorge Rimar   void readSectionExcludes(InputSectionDescription *Cmd);
714a2496cbeSGeorge Rimar   InputSectionDescription *readInputSectionRules(StringRef FilePattern);
715bbe38602SEugene Leviant   unsigned readPhdrType();
716be394db3SGeorge Rimar   SortSectionPolicy readSortKind();
717a35e39caSPetr Hosek   SymbolAssignment *readProvideHidden(bool Provide, bool Hidden);
718db741e72SEugene Leviant   SymbolAssignment *readProvideOrAssignment(StringRef Tok, bool MakeAbsolute);
71903fc010eSGeorge Rimar   void readSort();
720eefa758eSGeorge Rimar   Expr readAssert();
721708019c4SRui Ueyama 
722708019c4SRui Ueyama   Expr readExpr();
723708019c4SRui Ueyama   Expr readExpr1(Expr Lhs, int MinPrec);
724708019c4SRui Ueyama   Expr readPrimary();
725708019c4SRui Ueyama   Expr readTernary(Expr Cond);
7266ad7dfccSRui Ueyama   Expr readParenExpr();
727f7c5fbb1SRui Ueyama 
72820b6598cSGeorge Rimar   // For parsing version script.
72920b6598cSGeorge Rimar   void readExtern(std::vector<SymbolVersion> *Globals);
73095769b4aSRui Ueyama   void readVersionDeclaration(StringRef VerStr);
73120b6598cSGeorge Rimar   void readGlobal(StringRef VerStr);
73220b6598cSGeorge Rimar   void readLocal();
73320b6598cSGeorge Rimar 
73407320e40SRui Ueyama   ScriptConfiguration &Opt = *ScriptConfig;
73507320e40SRui Ueyama   StringSaver Saver = {ScriptConfig->Alloc};
73616b0cc9eSSimon Atanasyan   bool IsUnderSysroot;
737f7c5fbb1SRui Ueyama };
738f7c5fbb1SRui Ueyama 
73920b6598cSGeorge Rimar void ScriptParser::readVersionScript() {
74095769b4aSRui Ueyama   readVersionScriptCommand();
74120b6598cSGeorge Rimar   if (!atEOF())
74295769b4aSRui Ueyama     setError("EOF expected, but got " + next());
74395769b4aSRui Ueyama }
74495769b4aSRui Ueyama 
74595769b4aSRui Ueyama void ScriptParser::readVersionScriptCommand() {
74695769b4aSRui Ueyama   if (skip("{")) {
74795769b4aSRui Ueyama     readVersionDeclaration("");
74820b6598cSGeorge Rimar     return;
74920b6598cSGeorge Rimar   }
75020b6598cSGeorge Rimar 
75195769b4aSRui Ueyama   while (!atEOF() && !Error && peek() != "}") {
75220b6598cSGeorge Rimar     StringRef VerStr = next();
75320b6598cSGeorge Rimar     if (VerStr == "{") {
75495769b4aSRui Ueyama       setError("anonymous version definition is used in "
75595769b4aSRui Ueyama                "combination with other version definitions");
75620b6598cSGeorge Rimar       return;
75720b6598cSGeorge Rimar     }
75820b6598cSGeorge Rimar     expect("{");
75995769b4aSRui Ueyama     readVersionDeclaration(VerStr);
76020b6598cSGeorge Rimar   }
76120b6598cSGeorge Rimar }
76220b6598cSGeorge Rimar 
76395769b4aSRui Ueyama void ScriptParser::readVersion() {
76495769b4aSRui Ueyama   expect("{");
76595769b4aSRui Ueyama   readVersionScriptCommand();
76695769b4aSRui Ueyama   expect("}");
76795769b4aSRui Ueyama }
76895769b4aSRui Ueyama 
76920b6598cSGeorge Rimar void ScriptParser::readLinkerScript() {
770f7c5fbb1SRui Ueyama   while (!atEOF()) {
771f7c5fbb1SRui Ueyama     StringRef Tok = next();
772a27eeccaSRui Ueyama     if (Tok == ";")
773a27eeccaSRui Ueyama       continue;
774a27eeccaSRui Ueyama 
77520d03194SEugene Leviant     if (Tok == "ASSERT") {
77620d03194SEugene Leviant       Opt.Commands.emplace_back(new AssertCommand(readAssert()));
77720d03194SEugene Leviant     } else if (Tok == "ENTRY") {
778a27eeccaSRui Ueyama       readEntry();
779a27eeccaSRui Ueyama     } else if (Tok == "EXTERN") {
780a27eeccaSRui Ueyama       readExtern();
781a27eeccaSRui Ueyama     } else if (Tok == "GROUP" || Tok == "INPUT") {
782a27eeccaSRui Ueyama       readGroup();
783a27eeccaSRui Ueyama     } else if (Tok == "INCLUDE") {
784a27eeccaSRui Ueyama       readInclude();
785a27eeccaSRui Ueyama     } else if (Tok == "OUTPUT") {
786a27eeccaSRui Ueyama       readOutput();
787a27eeccaSRui Ueyama     } else if (Tok == "OUTPUT_ARCH") {
788a27eeccaSRui Ueyama       readOutputArch();
789a27eeccaSRui Ueyama     } else if (Tok == "OUTPUT_FORMAT") {
790a27eeccaSRui Ueyama       readOutputFormat();
791a27eeccaSRui Ueyama     } else if (Tok == "PHDRS") {
792a27eeccaSRui Ueyama       readPhdrs();
793a27eeccaSRui Ueyama     } else if (Tok == "SEARCH_DIR") {
794a27eeccaSRui Ueyama       readSearchDir();
795a27eeccaSRui Ueyama     } else if (Tok == "SECTIONS") {
796a27eeccaSRui Ueyama       readSections();
797a27eeccaSRui Ueyama     } else if (Tok == "VERSION") {
798a27eeccaSRui Ueyama       readVersion();
799db741e72SEugene Leviant     } else if (SymbolAssignment *Cmd = readProvideOrAssignment(Tok, true)) {
8000df80befSPetr Hosek       Opt.Commands.emplace_back(Cmd);
801e5d3ca50SPetr Hosek     } else {
8025761042dSGeorge Rimar       setError("unknown directive: " + Tok);
803f7c5fbb1SRui Ueyama     }
804f7c5fbb1SRui Ueyama   }
805e5d3ca50SPetr Hosek }
806f7c5fbb1SRui Ueyama 
807717677afSRui Ueyama void ScriptParser::addFile(StringRef S) {
80816b0cc9eSSimon Atanasyan   if (IsUnderSysroot && S.startswith("/")) {
80916b0cc9eSSimon Atanasyan     SmallString<128> Path;
81016b0cc9eSSimon Atanasyan     (Config->Sysroot + S).toStringRef(Path);
81116b0cc9eSSimon Atanasyan     if (sys::fs::exists(Path)) {
81216b0cc9eSSimon Atanasyan       Driver->addFile(Saver.save(Path.str()));
81316b0cc9eSSimon Atanasyan       return;
81416b0cc9eSSimon Atanasyan     }
81516b0cc9eSSimon Atanasyan   }
81616b0cc9eSSimon Atanasyan 
817f03f3cc1SRui Ueyama   if (sys::path::is_absolute(S)) {
81852a1509eSRui Ueyama     Driver->addFile(S);
81952a1509eSRui Ueyama   } else if (S.startswith("=")) {
82052a1509eSRui Ueyama     if (Config->Sysroot.empty())
82152a1509eSRui Ueyama       Driver->addFile(S.substr(1));
82252a1509eSRui Ueyama     else
82352a1509eSRui Ueyama       Driver->addFile(Saver.save(Config->Sysroot + "/" + S.substr(1)));
82452a1509eSRui Ueyama   } else if (S.startswith("-l")) {
82521eecb4fSRui Ueyama     Driver->addLibrary(S.substr(2));
826a1b8fc3bSSimon Atanasyan   } else if (sys::fs::exists(S)) {
827a1b8fc3bSSimon Atanasyan     Driver->addFile(S);
82852a1509eSRui Ueyama   } else {
82952a1509eSRui Ueyama     std::string Path = findFromSearchPaths(S);
83052a1509eSRui Ueyama     if (Path.empty())
831777f9630SGeorge Rimar       setError("unable to find " + S);
832025d59b1SRui Ueyama     else
83352a1509eSRui Ueyama       Driver->addFile(Saver.save(Path));
83452a1509eSRui Ueyama   }
83552a1509eSRui Ueyama }
83652a1509eSRui Ueyama 
837717677afSRui Ueyama void ScriptParser::readAsNeeded() {
838f7c5fbb1SRui Ueyama   expect("(");
83935da9b6eSRui Ueyama   bool Orig = Config->AsNeeded;
84035da9b6eSRui Ueyama   Config->AsNeeded = true;
841a2acc931SRui Ueyama   while (!Error && !skip(")"))
842cd574a5eSGeorge Rimar     addFile(unquote(next()));
84335da9b6eSRui Ueyama   Config->AsNeeded = Orig;
844f7c5fbb1SRui Ueyama }
845f7c5fbb1SRui Ueyama 
846717677afSRui Ueyama void ScriptParser::readEntry() {
84790c5099eSDenis Protivensky   // -e <symbol> takes predecence over ENTRY(<symbol>).
84890c5099eSDenis Protivensky   expect("(");
84990c5099eSDenis Protivensky   StringRef Tok = next();
85090c5099eSDenis Protivensky   if (Config->Entry.empty())
85190c5099eSDenis Protivensky     Config->Entry = Tok;
85290c5099eSDenis Protivensky   expect(")");
85390c5099eSDenis Protivensky }
85490c5099eSDenis Protivensky 
855717677afSRui Ueyama void ScriptParser::readExtern() {
85683f406cfSGeorge Rimar   expect("(");
857a2acc931SRui Ueyama   while (!Error && !skip(")"))
858a2acc931SRui Ueyama     Config->Undefined.push_back(next());
85983f406cfSGeorge Rimar }
86083f406cfSGeorge Rimar 
861717677afSRui Ueyama void ScriptParser::readGroup() {
862f7c5fbb1SRui Ueyama   expect("(");
863a2acc931SRui Ueyama   while (!Error && !skip(")")) {
864f7c5fbb1SRui Ueyama     StringRef Tok = next();
865a2acc931SRui Ueyama     if (Tok == "AS_NEEDED")
866f7c5fbb1SRui Ueyama       readAsNeeded();
867a2acc931SRui Ueyama     else
868cd574a5eSGeorge Rimar       addFile(unquote(Tok));
869f7c5fbb1SRui Ueyama   }
870f7c5fbb1SRui Ueyama }
871f7c5fbb1SRui Ueyama 
872717677afSRui Ueyama void ScriptParser::readInclude() {
87331aa1f83SRui Ueyama   StringRef Tok = next();
874cd574a5eSGeorge Rimar   auto MBOrErr = MemoryBuffer::getFile(unquote(Tok));
875025d59b1SRui Ueyama   if (!MBOrErr) {
8765761042dSGeorge Rimar     setError("cannot open " + Tok);
877025d59b1SRui Ueyama     return;
878025d59b1SRui Ueyama   }
87931aa1f83SRui Ueyama   std::unique_ptr<MemoryBuffer> &MB = *MBOrErr;
880a47ee68dSRui Ueyama   StringRef S = Saver.save(MB->getMemBufferRef().getBuffer());
881a47ee68dSRui Ueyama   std::vector<StringRef> V = tokenize(S);
88231aa1f83SRui Ueyama   Tokens.insert(Tokens.begin() + Pos, V.begin(), V.end());
88331aa1f83SRui Ueyama }
88431aa1f83SRui Ueyama 
885717677afSRui Ueyama void ScriptParser::readOutput() {
886ee59282bSRui Ueyama   // -o <file> takes predecence over OUTPUT(<file>).
887ee59282bSRui Ueyama   expect("(");
888ee59282bSRui Ueyama   StringRef Tok = next();
889ee59282bSRui Ueyama   if (Config->OutputFile.empty())
890cd574a5eSGeorge Rimar     Config->OutputFile = unquote(Tok);
891ee59282bSRui Ueyama   expect(")");
892ee59282bSRui Ueyama }
893ee59282bSRui Ueyama 
894717677afSRui Ueyama void ScriptParser::readOutputArch() {
8959159ce93SDavide Italiano   // Error checking only for now.
8969159ce93SDavide Italiano   expect("(");
8979159ce93SDavide Italiano   next();
8989159ce93SDavide Italiano   expect(")");
8999159ce93SDavide Italiano }
9009159ce93SDavide Italiano 
901717677afSRui Ueyama void ScriptParser::readOutputFormat() {
902f7c5fbb1SRui Ueyama   // Error checking only for now.
903f7c5fbb1SRui Ueyama   expect("(");
904f7c5fbb1SRui Ueyama   next();
9056836c618SDavide Italiano   StringRef Tok = next();
9066836c618SDavide Italiano   if (Tok == ")")
9076836c618SDavide Italiano     return;
908025d59b1SRui Ueyama   if (Tok != ",") {
9095761042dSGeorge Rimar     setError("unexpected token: " + Tok);
910025d59b1SRui Ueyama     return;
911025d59b1SRui Ueyama   }
9126836c618SDavide Italiano   next();
9136836c618SDavide Italiano   expect(",");
9146836c618SDavide Italiano   next();
915f7c5fbb1SRui Ueyama   expect(")");
916f7c5fbb1SRui Ueyama }
917f7c5fbb1SRui Ueyama 
918bbe38602SEugene Leviant void ScriptParser::readPhdrs() {
919bbe38602SEugene Leviant   expect("{");
920bbe38602SEugene Leviant   while (!Error && !skip("}")) {
921bbe38602SEugene Leviant     StringRef Tok = next();
92256b21c86SEugene Leviant     Opt.PhdrsCommands.push_back(
92356b21c86SEugene Leviant         {Tok, PT_NULL, false, false, UINT_MAX, nullptr});
924bbe38602SEugene Leviant     PhdrsCommand &PhdrCmd = Opt.PhdrsCommands.back();
925bbe38602SEugene Leviant 
926bbe38602SEugene Leviant     PhdrCmd.Type = readPhdrType();
927bbe38602SEugene Leviant     do {
928bbe38602SEugene Leviant       Tok = next();
929bbe38602SEugene Leviant       if (Tok == ";")
930bbe38602SEugene Leviant         break;
931bbe38602SEugene Leviant       if (Tok == "FILEHDR")
932bbe38602SEugene Leviant         PhdrCmd.HasFilehdr = true;
933bbe38602SEugene Leviant       else if (Tok == "PHDRS")
934bbe38602SEugene Leviant         PhdrCmd.HasPhdrs = true;
93556b21c86SEugene Leviant       else if (Tok == "AT")
93656b21c86SEugene Leviant         PhdrCmd.LMAExpr = readParenExpr();
937865bf863SEugene Leviant       else if (Tok == "FLAGS") {
938865bf863SEugene Leviant         expect("(");
939eb685cd7SRafael Espindola         // Passing 0 for the value of dot is a bit of a hack. It means that
940eb685cd7SRafael Espindola         // we accept expressions like ".|1".
941eb685cd7SRafael Espindola         PhdrCmd.Flags = readExpr()(0);
942865bf863SEugene Leviant         expect(")");
943865bf863SEugene Leviant       } else
944bbe38602SEugene Leviant         setError("unexpected header attribute: " + Tok);
945bbe38602SEugene Leviant     } while (!Error);
946bbe38602SEugene Leviant   }
947bbe38602SEugene Leviant }
948bbe38602SEugene Leviant 
949717677afSRui Ueyama void ScriptParser::readSearchDir() {
95068a39a65SDavide Italiano   expect("(");
95186c5fb82SRui Ueyama   StringRef Tok = next();
9526c7ad13fSRui Ueyama   if (!Config->Nostdlib)
953cd574a5eSGeorge Rimar     Config->SearchPaths.push_back(unquote(Tok));
95468a39a65SDavide Italiano   expect(")");
95568a39a65SDavide Italiano }
95668a39a65SDavide Italiano 
957717677afSRui Ueyama void ScriptParser::readSections() {
958e05336ffSEugene Leviant   Opt.HasSections = true;
9598e3b38abSDenis Protivensky   expect("{");
960652852c5SGeorge Rimar   while (!Error && !skip("}")) {
961113cdec9SRui Ueyama     StringRef Tok = next();
962db741e72SEugene Leviant     BaseCommand *Cmd = readProvideOrAssignment(Tok, true);
963ceabe80eSEugene Leviant     if (!Cmd) {
964ceabe80eSEugene Leviant       if (Tok == "ASSERT")
965eefa758eSGeorge Rimar         Cmd = new AssertCommand(readAssert());
966ceabe80eSEugene Leviant       else
96710416564SRui Ueyama         Cmd = readOutputSectionDescription(Tok);
9688e3b38abSDenis Protivensky     }
96910416564SRui Ueyama     Opt.Commands.emplace_back(Cmd);
970652852c5SGeorge Rimar   }
971708019c4SRui Ueyama }
9728e3b38abSDenis Protivensky 
973708019c4SRui Ueyama static int precedence(StringRef Op) {
974708019c4SRui Ueyama   return StringSwitch<int>(Op)
975708019c4SRui Ueyama       .Case("*", 4)
976708019c4SRui Ueyama       .Case("/", 4)
977708019c4SRui Ueyama       .Case("+", 3)
978708019c4SRui Ueyama       .Case("-", 3)
979708019c4SRui Ueyama       .Case("<", 2)
980708019c4SRui Ueyama       .Case(">", 2)
981708019c4SRui Ueyama       .Case(">=", 2)
982708019c4SRui Ueyama       .Case("<=", 2)
983708019c4SRui Ueyama       .Case("==", 2)
984708019c4SRui Ueyama       .Case("!=", 2)
985708019c4SRui Ueyama       .Case("&", 1)
986cc3dd629SRafael Espindola       .Case("|", 1)
987708019c4SRui Ueyama       .Default(-1);
988708019c4SRui Ueyama }
989708019c4SRui Ueyama 
990c91930a1SGeorge Rimar Regex ScriptParser::readFilePatterns() {
99110416564SRui Ueyama   std::vector<StringRef> V;
99210416564SRui Ueyama   while (!Error && !skip(")"))
99310416564SRui Ueyama     V.push_back(next());
994c91930a1SGeorge Rimar   return compileGlobPatterns(V);
9950702c4e8SGeorge Rimar }
9960702c4e8SGeorge Rimar 
997be394db3SGeorge Rimar SortSectionPolicy ScriptParser::readSortKind() {
998742c3836SRui Ueyama   if (skip("SORT") || skip("SORT_BY_NAME"))
999be394db3SGeorge Rimar     return SortSectionPolicy::Name;
1000742c3836SRui Ueyama   if (skip("SORT_BY_ALIGNMENT"))
1001be394db3SGeorge Rimar     return SortSectionPolicy::Alignment;
1002575208caSGeorge Rimar   if (skip("SORT_BY_INIT_PRIORITY"))
1003be394db3SGeorge Rimar     return SortSectionPolicy::Priority;
1004be394db3SGeorge Rimar   if (skip("SORT_NONE"))
1005be394db3SGeorge Rimar     return SortSectionPolicy::None;
1006*b2a0abdfSRui Ueyama   return SortSectionPolicy::Default;
1007be394db3SGeorge Rimar }
1008be394db3SGeorge Rimar 
1009be394db3SGeorge Rimar static void selectSortKind(InputSectionDescription *Cmd) {
1010*b2a0abdfSRui Ueyama   if (Cmd->SortOuter == SortSectionPolicy::None) {
1011*b2a0abdfSRui Ueyama     Cmd->SortOuter = SortSectionPolicy::Default;
1012be394db3SGeorge Rimar     return;
1013be394db3SGeorge Rimar   }
1014be394db3SGeorge Rimar 
1015*b2a0abdfSRui Ueyama   if (Cmd->SortOuter != SortSectionPolicy::Default) {
1016be394db3SGeorge Rimar     // If the section sorting command in linker script is nested, the command
1017be394db3SGeorge Rimar     // line option will be ignored.
1018*b2a0abdfSRui Ueyama     if (Cmd->SortInner != SortSectionPolicy::Default)
1019be394db3SGeorge Rimar       return;
1020be394db3SGeorge Rimar     // If the section sorting command in linker script isn't nested, the
1021be394db3SGeorge Rimar     // command line option will make the section sorting command to be treated
1022be394db3SGeorge Rimar     // as nested sorting command.
1023be394db3SGeorge Rimar     Cmd->SortInner = Config->SortSection;
1024be394db3SGeorge Rimar     return;
1025be394db3SGeorge Rimar   }
1026be394db3SGeorge Rimar   // If sorting rule not specified, use command line option.
1027be394db3SGeorge Rimar   Cmd->SortOuter = Config->SortSection;
1028742c3836SRui Ueyama }
1029742c3836SRui Ueyama 
1030395281cfSGeorge Rimar // Method reads a list of sequence of excluded files and section globs given in
1031395281cfSGeorge Rimar // a following form: ((EXCLUDE_FILE(file_pattern+))? section_pattern+)+
1032395281cfSGeorge Rimar // Example: *(.foo.1 EXCLUDE_FILE (*a.o) .foo.2 EXCLUDE_FILE (*b.o) .foo.3)
1033395281cfSGeorge Rimar void ScriptParser::readSectionExcludes(InputSectionDescription *Cmd) {
1034395281cfSGeorge Rimar   llvm::Regex ExcludeFileRe;
1035395281cfSGeorge Rimar   std::vector<StringRef> V;
1036395281cfSGeorge Rimar 
1037395281cfSGeorge Rimar   while (!Error) {
1038395281cfSGeorge Rimar     if (skip(")")) {
1039395281cfSGeorge Rimar       Cmd->SectionsVec.push_back(
1040395281cfSGeorge Rimar           {std::move(ExcludeFileRe), compileGlobPatterns(V)});
1041395281cfSGeorge Rimar       return;
1042395281cfSGeorge Rimar     }
1043395281cfSGeorge Rimar 
1044395281cfSGeorge Rimar     if (skip("EXCLUDE_FILE")) {
1045395281cfSGeorge Rimar       if (!V.empty()) {
1046395281cfSGeorge Rimar         Cmd->SectionsVec.push_back(
1047395281cfSGeorge Rimar             {std::move(ExcludeFileRe), compileGlobPatterns(V)});
1048395281cfSGeorge Rimar         V.clear();
1049395281cfSGeorge Rimar       }
1050395281cfSGeorge Rimar 
1051395281cfSGeorge Rimar       expect("(");
1052395281cfSGeorge Rimar       ExcludeFileRe = readFilePatterns();
1053395281cfSGeorge Rimar       continue;
1054395281cfSGeorge Rimar     }
1055395281cfSGeorge Rimar 
1056395281cfSGeorge Rimar     V.push_back(next());
1057395281cfSGeorge Rimar   }
1058395281cfSGeorge Rimar }
1059395281cfSGeorge Rimar 
1060a2496cbeSGeorge Rimar InputSectionDescription *
1061a2496cbeSGeorge Rimar ScriptParser::readInputSectionRules(StringRef FilePattern) {
1062c91930a1SGeorge Rimar   auto *Cmd = new InputSectionDescription(FilePattern);
10630ed42b0cSDavide Italiano   expect("(");
1064e7282797SDavide Italiano 
1065742c3836SRui Ueyama   // Read SORT().
1066be394db3SGeorge Rimar   SortSectionPolicy K1 = readSortKind();
1067*b2a0abdfSRui Ueyama   if (K1 != SortSectionPolicy::Default) {
1068742c3836SRui Ueyama     Cmd->SortOuter = K1;
10690702c4e8SGeorge Rimar     expect("(");
1070be394db3SGeorge Rimar     SortSectionPolicy K2 = readSortKind();
1071*b2a0abdfSRui Ueyama     if (K2 != SortSectionPolicy::Default) {
1072742c3836SRui Ueyama       Cmd->SortInner = K2;
1073350ece4eSGeorge Rimar       expect("(");
1074395281cfSGeorge Rimar       Cmd->SectionsVec.push_back({llvm::Regex(), readFilePatterns()});
10750702c4e8SGeorge Rimar       expect(")");
1076350ece4eSGeorge Rimar     } else {
1077395281cfSGeorge Rimar       Cmd->SectionsVec.push_back({llvm::Regex(), readFilePatterns()});
1078350ece4eSGeorge Rimar     }
1079350ece4eSGeorge Rimar     expect(")");
1080be394db3SGeorge Rimar     selectSortKind(Cmd);
108110416564SRui Ueyama     return Cmd;
10820659800eSGeorge Rimar   }
10830702c4e8SGeorge Rimar 
1084be394db3SGeorge Rimar   selectSortKind(Cmd);
1085395281cfSGeorge Rimar   readSectionExcludes(Cmd);
108610416564SRui Ueyama   return Cmd;
10870659800eSGeorge Rimar }
10880659800eSGeorge Rimar 
1089a2496cbeSGeorge Rimar InputSectionDescription *
1090a2496cbeSGeorge Rimar ScriptParser::readInputSectionDescription(StringRef Tok) {
10910659800eSGeorge Rimar   // Input section wildcard can be surrounded by KEEP.
10920659800eSGeorge Rimar   // https://sourceware.org/binutils/docs/ld/Input-Section-Keep.html#Input-Section-Keep
1093a2496cbeSGeorge Rimar   if (Tok == "KEEP") {
1094e7282797SDavide Italiano     expect("(");
1095a2496cbeSGeorge Rimar     StringRef FilePattern = next();
1096a2496cbeSGeorge Rimar     InputSectionDescription *Cmd = readInputSectionRules(FilePattern);
10970ed42b0cSDavide Italiano     expect(")");
1098395281cfSGeorge Rimar     for (std::pair<llvm::Regex, llvm::Regex> &Regex : Cmd->SectionsVec)
1099395281cfSGeorge Rimar       Opt.KeptSections.push_back(&Regex.second);
110010416564SRui Ueyama     return Cmd;
110110416564SRui Ueyama   }
1102a2496cbeSGeorge Rimar   return readInputSectionRules(Tok);
11030659800eSGeorge Rimar }
11040659800eSGeorge Rimar 
110503fc010eSGeorge Rimar void ScriptParser::readSort() {
110603fc010eSGeorge Rimar   expect("(");
110703fc010eSGeorge Rimar   expect("CONSTRUCTORS");
110803fc010eSGeorge Rimar   expect(")");
110903fc010eSGeorge Rimar }
111003fc010eSGeorge Rimar 
1111eefa758eSGeorge Rimar Expr ScriptParser::readAssert() {
1112eefa758eSGeorge Rimar   expect("(");
1113eefa758eSGeorge Rimar   Expr E = readExpr();
1114eefa758eSGeorge Rimar   expect(",");
1115cd574a5eSGeorge Rimar   StringRef Msg = unquote(next());
1116eefa758eSGeorge Rimar   expect(")");
1117eefa758eSGeorge Rimar   return [=](uint64_t Dot) {
1118eefa758eSGeorge Rimar     uint64_t V = E(Dot);
1119eefa758eSGeorge Rimar     if (!V)
1120eefa758eSGeorge Rimar       error(Msg);
1121eefa758eSGeorge Rimar     return V;
1122eefa758eSGeorge Rimar   };
1123eefa758eSGeorge Rimar }
1124eefa758eSGeorge Rimar 
112525150e8bSRui Ueyama // Reads a FILL(expr) command. We handle the FILL command as an
112625150e8bSRui Ueyama // alias for =fillexp section attribute, which is different from
112725150e8bSRui Ueyama // what GNU linkers do.
112825150e8bSRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Data.html
1129ff1f29e0SGeorge Rimar std::vector<uint8_t> ScriptParser::readFill() {
1130ff1f29e0SGeorge Rimar   expect("(");
1131ff1f29e0SGeorge Rimar   std::vector<uint8_t> V = readOutputSectionFiller(next());
1132ff1f29e0SGeorge Rimar   expect(")");
1133ff1f29e0SGeorge Rimar   expect(";");
1134ff1f29e0SGeorge Rimar   return V;
1135ff1f29e0SGeorge Rimar }
1136ff1f29e0SGeorge Rimar 
113710416564SRui Ueyama OutputSectionCommand *
113810416564SRui Ueyama ScriptParser::readOutputSectionDescription(StringRef OutSec) {
1139076fe157SGeorge Rimar   OutputSectionCommand *Cmd = new OutputSectionCommand(OutSec);
114058e5c4dcSGeorge Rimar 
114158e5c4dcSGeorge Rimar   // Read an address expression.
114258e5c4dcSGeorge Rimar   // https://sourceware.org/binutils/docs/ld/Output-Section-Address.html#Output-Section-Address
114358e5c4dcSGeorge Rimar   if (peek() != ":")
114458e5c4dcSGeorge Rimar     Cmd->AddrExpr = readExpr();
114558e5c4dcSGeorge Rimar 
11468e3b38abSDenis Protivensky   expect(":");
1147246f681eSDavide Italiano 
11488ceadb38SGeorge Rimar   if (skip("AT"))
11496ad7dfccSRui Ueyama     Cmd->LmaExpr = readParenExpr();
1150630c6179SGeorge Rimar   if (skip("ALIGN"))
11516ad7dfccSRui Ueyama     Cmd->AlignExpr = readParenExpr();
1152db24d9c3SGeorge Rimar   if (skip("SUBALIGN"))
1153db24d9c3SGeorge Rimar     Cmd->SubalignExpr = readParenExpr();
1154630c6179SGeorge Rimar 
1155246f681eSDavide Italiano   // Parse constraints.
1156246f681eSDavide Italiano   if (skip("ONLY_IF_RO"))
1157efc4066bSRui Ueyama     Cmd->Constraint = ConstraintKind::ReadOnly;
1158246f681eSDavide Italiano   if (skip("ONLY_IF_RW"))
1159efc4066bSRui Ueyama     Cmd->Constraint = ConstraintKind::ReadWrite;
11608e3b38abSDenis Protivensky   expect("{");
11618ec77e64SRui Ueyama 
1162025d59b1SRui Ueyama   while (!Error && !skip("}")) {
1163ceabe80eSEugene Leviant     StringRef Tok = next();
1164db741e72SEugene Leviant     if (SymbolAssignment *Assignment = readProvideOrAssignment(Tok, false))
1165ceabe80eSEugene Leviant       Cmd->Commands.emplace_back(Assignment);
1166ff1f29e0SGeorge Rimar     else if (Tok == "FILL")
1167ff1f29e0SGeorge Rimar       Cmd->Filler = readFill();
1168ceabe80eSEugene Leviant     else if (Tok == "SORT")
116903fc010eSGeorge Rimar       readSort();
1170a2496cbeSGeorge Rimar     else if (peek() == "(")
1171a2496cbeSGeorge Rimar       Cmd->Commands.emplace_back(readInputSectionDescription(Tok));
1172ceabe80eSEugene Leviant     else
1173ceabe80eSEugene Leviant       setError("unknown command " + Tok);
11748e3b38abSDenis Protivensky   }
1175076fe157SGeorge Rimar   Cmd->Phdrs = readOutputSectionPhdrs();
1176ff1f29e0SGeorge Rimar   if (peek().startswith("="))
1177ff1f29e0SGeorge Rimar     Cmd->Filler = readOutputSectionFiller(next().drop_front());
117810416564SRui Ueyama   return Cmd;
1179f71caa2bSRui Ueyama }
11808ec77e64SRui Ueyama 
11812c8f1f04SRui Ueyama // Read "=<number>" where <number> is an octal/decimal/hexadecimal number.
11822c8f1f04SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Fill.html
11832c8f1f04SRui Ueyama //
11842c8f1f04SRui Ueyama // ld.gold is not fully compatible with ld.bfd. ld.bfd handles
11852c8f1f04SRui Ueyama // hexstrings as blobs of arbitrary sizes, while ld.gold handles them
11862c8f1f04SRui Ueyama // as 32-bit big-endian values. We will do the same as ld.gold does
11872c8f1f04SRui Ueyama // because it's simpler than what ld.bfd does.
1188ff1f29e0SGeorge Rimar std::vector<uint8_t> ScriptParser::readOutputSectionFiller(StringRef Tok) {
1189965827d6SRui Ueyama   uint32_t V;
1190ff1f29e0SGeorge Rimar   if (Tok.getAsInteger(0, V)) {
1191965827d6SRui Ueyama     setError("invalid filler expression: " + Tok);
1192f71caa2bSRui Ueyama     return {};
1193e2ee72b5SGeorge Rimar   }
1194965827d6SRui Ueyama   return {uint8_t(V >> 24), uint8_t(V >> 16), uint8_t(V >> 8), uint8_t(V)};
11958e3b38abSDenis Protivensky }
11968e3b38abSDenis Protivensky 
1197a35e39caSPetr Hosek SymbolAssignment *ScriptParser::readProvideHidden(bool Provide, bool Hidden) {
1198a31c91b1SEugene Leviant   expect("(");
1199174e0a16SRui Ueyama   SymbolAssignment *Cmd = readAssignment(next());
1200a35e39caSPetr Hosek   Cmd->Provide = Provide;
1201174e0a16SRui Ueyama   Cmd->Hidden = Hidden;
1202a31c91b1SEugene Leviant   expect(")");
1203a31c91b1SEugene Leviant   expect(";");
120410416564SRui Ueyama   return Cmd;
1205eda81a1bSEugene Leviant }
1206eda81a1bSEugene Leviant 
1207db741e72SEugene Leviant SymbolAssignment *ScriptParser::readProvideOrAssignment(StringRef Tok,
1208db741e72SEugene Leviant                                                         bool MakeAbsolute) {
1209ceabe80eSEugene Leviant   SymbolAssignment *Cmd = nullptr;
1210ceabe80eSEugene Leviant   if (peek() == "=" || peek() == "+=") {
1211ceabe80eSEugene Leviant     Cmd = readAssignment(Tok);
1212ceabe80eSEugene Leviant     expect(";");
1213ceabe80eSEugene Leviant   } else if (Tok == "PROVIDE") {
1214a35e39caSPetr Hosek     Cmd = readProvideHidden(true, false);
1215a35e39caSPetr Hosek   } else if (Tok == "HIDDEN") {
1216a35e39caSPetr Hosek     Cmd = readProvideHidden(false, true);
1217ceabe80eSEugene Leviant   } else if (Tok == "PROVIDE_HIDDEN") {
1218a35e39caSPetr Hosek     Cmd = readProvideHidden(true, true);
1219ceabe80eSEugene Leviant   }
1220db741e72SEugene Leviant   if (Cmd && MakeAbsolute)
1221db741e72SEugene Leviant     Cmd->IsAbsolute = true;
1222ceabe80eSEugene Leviant   return Cmd;
1223ceabe80eSEugene Leviant }
1224ceabe80eSEugene Leviant 
122530835ea4SGeorge Rimar static uint64_t getSymbolValue(StringRef S, uint64_t Dot) {
122630835ea4SGeorge Rimar   if (S == ".")
122730835ea4SGeorge Rimar     return Dot;
1228884e786dSGeorge Rimar   return ScriptBase->getSymbolValue(S);
1229e32a3598SGeorge Rimar }
1230e32a3598SGeorge Rimar 
123130835ea4SGeorge Rimar SymbolAssignment *ScriptParser::readAssignment(StringRef Name) {
123230835ea4SGeorge Rimar   StringRef Op = next();
1233db741e72SEugene Leviant   bool IsAbsolute = false;
1234db741e72SEugene Leviant   Expr E;
123530835ea4SGeorge Rimar   assert(Op == "=" || Op == "+=");
1236db741e72SEugene Leviant   if (skip("ABSOLUTE")) {
1237db741e72SEugene Leviant     E = readParenExpr();
1238db741e72SEugene Leviant     IsAbsolute = true;
1239db741e72SEugene Leviant   } else {
1240db741e72SEugene Leviant     E = readExpr();
1241db741e72SEugene Leviant   }
124230835ea4SGeorge Rimar   if (Op == "+=")
124330835ea4SGeorge Rimar     E = [=](uint64_t Dot) { return getSymbolValue(Name, Dot) + E(Dot); };
1244db741e72SEugene Leviant   return new SymbolAssignment(Name, E, IsAbsolute);
124530835ea4SGeorge Rimar }
124630835ea4SGeorge Rimar 
124730835ea4SGeorge Rimar // This is an operator-precedence parser to parse a linker
124830835ea4SGeorge Rimar // script expression.
124930835ea4SGeorge Rimar Expr ScriptParser::readExpr() { return readExpr1(readPrimary(), 0); }
125030835ea4SGeorge Rimar 
125136c1cd23SRui Ueyama static Expr combine(StringRef Op, Expr L, Expr R) {
125236c1cd23SRui Ueyama   if (Op == "*")
125336c1cd23SRui Ueyama     return [=](uint64_t Dot) { return L(Dot) * R(Dot); };
125436c1cd23SRui Ueyama   if (Op == "/") {
125536c1cd23SRui Ueyama     return [=](uint64_t Dot) -> uint64_t {
125636c1cd23SRui Ueyama       uint64_t RHS = R(Dot);
125736c1cd23SRui Ueyama       if (RHS == 0) {
125836c1cd23SRui Ueyama         error("division by zero");
125936c1cd23SRui Ueyama         return 0;
126036c1cd23SRui Ueyama       }
126136c1cd23SRui Ueyama       return L(Dot) / RHS;
126236c1cd23SRui Ueyama     };
126336c1cd23SRui Ueyama   }
126436c1cd23SRui Ueyama   if (Op == "+")
126536c1cd23SRui Ueyama     return [=](uint64_t Dot) { return L(Dot) + R(Dot); };
126636c1cd23SRui Ueyama   if (Op == "-")
126736c1cd23SRui Ueyama     return [=](uint64_t Dot) { return L(Dot) - R(Dot); };
126836c1cd23SRui Ueyama   if (Op == "<")
126936c1cd23SRui Ueyama     return [=](uint64_t Dot) { return L(Dot) < R(Dot); };
127036c1cd23SRui Ueyama   if (Op == ">")
127136c1cd23SRui Ueyama     return [=](uint64_t Dot) { return L(Dot) > R(Dot); };
127236c1cd23SRui Ueyama   if (Op == ">=")
127336c1cd23SRui Ueyama     return [=](uint64_t Dot) { return L(Dot) >= R(Dot); };
127436c1cd23SRui Ueyama   if (Op == "<=")
127536c1cd23SRui Ueyama     return [=](uint64_t Dot) { return L(Dot) <= R(Dot); };
127636c1cd23SRui Ueyama   if (Op == "==")
127736c1cd23SRui Ueyama     return [=](uint64_t Dot) { return L(Dot) == R(Dot); };
127836c1cd23SRui Ueyama   if (Op == "!=")
127936c1cd23SRui Ueyama     return [=](uint64_t Dot) { return L(Dot) != R(Dot); };
128036c1cd23SRui Ueyama   if (Op == "&")
128136c1cd23SRui Ueyama     return [=](uint64_t Dot) { return L(Dot) & R(Dot); };
1282cc3dd629SRafael Espindola   if (Op == "|")
1283cc3dd629SRafael Espindola     return [=](uint64_t Dot) { return L(Dot) | R(Dot); };
128436c1cd23SRui Ueyama   llvm_unreachable("invalid operator");
128536c1cd23SRui Ueyama }
128636c1cd23SRui Ueyama 
1287708019c4SRui Ueyama // This is a part of the operator-precedence parser. This function
1288708019c4SRui Ueyama // assumes that the remaining token stream starts with an operator.
1289708019c4SRui Ueyama Expr ScriptParser::readExpr1(Expr Lhs, int MinPrec) {
1290708019c4SRui Ueyama   while (!atEOF() && !Error) {
1291708019c4SRui Ueyama     // Read an operator and an expression.
1292708019c4SRui Ueyama     StringRef Op1 = peek();
1293708019c4SRui Ueyama     if (Op1 == "?")
1294708019c4SRui Ueyama       return readTernary(Lhs);
1295708019c4SRui Ueyama     if (precedence(Op1) < MinPrec)
1296a31c91b1SEugene Leviant       break;
1297a31c91b1SEugene Leviant     next();
1298708019c4SRui Ueyama     Expr Rhs = readPrimary();
1299708019c4SRui Ueyama 
1300708019c4SRui Ueyama     // Evaluate the remaining part of the expression first if the
1301708019c4SRui Ueyama     // next operator has greater precedence than the previous one.
1302708019c4SRui Ueyama     // For example, if we have read "+" and "3", and if the next
1303708019c4SRui Ueyama     // operator is "*", then we'll evaluate 3 * ... part first.
1304708019c4SRui Ueyama     while (!atEOF()) {
1305708019c4SRui Ueyama       StringRef Op2 = peek();
1306708019c4SRui Ueyama       if (precedence(Op2) <= precedence(Op1))
1307eda81a1bSEugene Leviant         break;
1308708019c4SRui Ueyama       Rhs = readExpr1(Rhs, precedence(Op2));
1309eda81a1bSEugene Leviant     }
1310708019c4SRui Ueyama 
1311708019c4SRui Ueyama     Lhs = combine(Op1, Lhs, Rhs);
1312708019c4SRui Ueyama   }
1313708019c4SRui Ueyama   return Lhs;
1314708019c4SRui Ueyama }
1315708019c4SRui Ueyama 
1316708019c4SRui Ueyama uint64_t static getConstant(StringRef S) {
1317e2cc07bcSMichael J. Spencer   if (S == "COMMONPAGESIZE")
1318708019c4SRui Ueyama     return Target->PageSize;
1319e2cc07bcSMichael J. Spencer   if (S == "MAXPAGESIZE")
1320e2cc07bcSMichael J. Spencer     return Target->MaxPageSize;
1321708019c4SRui Ueyama   error("unknown constant: " + S);
1322708019c4SRui Ueyama   return 0;
1323708019c4SRui Ueyama }
1324708019c4SRui Ueyama 
1325626e0b08SRui Ueyama // Parses Tok as an integer. Returns true if successful.
1326626e0b08SRui Ueyama // It recognizes hexadecimal (prefixed with "0x" or suffixed with "H")
1327626e0b08SRui Ueyama // and decimal numbers. Decimal numbers may have "K" (kilo) or
1328626e0b08SRui Ueyama // "M" (mega) prefixes.
13299f2f7ad9SGeorge Rimar static bool readInteger(StringRef Tok, uint64_t &Result) {
1330eaeafb2bSSimon Atanasyan   if (Tok.startswith("-")) {
1331eaeafb2bSSimon Atanasyan     if (!readInteger(Tok.substr(1), Result))
1332eaeafb2bSSimon Atanasyan       return false;
1333eaeafb2bSSimon Atanasyan     Result = -Result;
1334eaeafb2bSSimon Atanasyan     return true;
1335eaeafb2bSSimon Atanasyan   }
13369f2f7ad9SGeorge Rimar   if (Tok.startswith_lower("0x"))
13379f2f7ad9SGeorge Rimar     return !Tok.substr(2).getAsInteger(16, Result);
13389f2f7ad9SGeorge Rimar   if (Tok.endswith_lower("H"))
13399f2f7ad9SGeorge Rimar     return !Tok.drop_back().getAsInteger(16, Result);
13409f2f7ad9SGeorge Rimar 
13419f2f7ad9SGeorge Rimar   int Suffix = 1;
13429f2f7ad9SGeorge Rimar   if (Tok.endswith_lower("K")) {
13439f2f7ad9SGeorge Rimar     Suffix = 1024;
13449f2f7ad9SGeorge Rimar     Tok = Tok.drop_back();
13459f2f7ad9SGeorge Rimar   } else if (Tok.endswith_lower("M")) {
13469f2f7ad9SGeorge Rimar     Suffix = 1024 * 1024;
13479f2f7ad9SGeorge Rimar     Tok = Tok.drop_back();
13489f2f7ad9SGeorge Rimar   }
13499f2f7ad9SGeorge Rimar   if (Tok.getAsInteger(10, Result))
13509f2f7ad9SGeorge Rimar     return false;
13519f2f7ad9SGeorge Rimar   Result *= Suffix;
13529f2f7ad9SGeorge Rimar   return true;
13539f2f7ad9SGeorge Rimar }
13549f2f7ad9SGeorge Rimar 
1355708019c4SRui Ueyama Expr ScriptParser::readPrimary() {
13566ad7dfccSRui Ueyama   if (peek() == "(")
13576ad7dfccSRui Ueyama     return readParenExpr();
1358708019c4SRui Ueyama 
13596ad7dfccSRui Ueyama   StringRef Tok = next();
1360708019c4SRui Ueyama 
1361eaeafb2bSSimon Atanasyan   if (Tok == "~") {
1362eaeafb2bSSimon Atanasyan     Expr E = readPrimary();
1363eaeafb2bSSimon Atanasyan     return [=](uint64_t Dot) { return ~E(Dot); };
1364eaeafb2bSSimon Atanasyan   }
1365eaeafb2bSSimon Atanasyan   if (Tok == "-") {
1366eaeafb2bSSimon Atanasyan     Expr E = readPrimary();
1367eaeafb2bSSimon Atanasyan     return [=](uint64_t Dot) { return -E(Dot); };
1368eaeafb2bSSimon Atanasyan   }
1369eaeafb2bSSimon Atanasyan 
1370708019c4SRui Ueyama   // Built-in functions are parsed here.
1371708019c4SRui Ueyama   // https://sourceware.org/binutils/docs/ld/Builtin-Functions.html.
137296659df0SGeorge Rimar   if (Tok == "ADDR") {
137396659df0SGeorge Rimar     expect("(");
137496659df0SGeorge Rimar     StringRef Name = next();
137596659df0SGeorge Rimar     expect(")");
1376884e786dSGeorge Rimar     return
1377884e786dSGeorge Rimar         [=](uint64_t Dot) { return ScriptBase->getOutputSectionAddress(Name); };
137896659df0SGeorge Rimar   }
1379eefa758eSGeorge Rimar   if (Tok == "ASSERT")
1380eefa758eSGeorge Rimar     return readAssert();
1381708019c4SRui Ueyama   if (Tok == "ALIGN") {
13826ad7dfccSRui Ueyama     Expr E = readParenExpr();
1383708019c4SRui Ueyama     return [=](uint64_t Dot) { return alignTo(Dot, E(Dot)); };
1384708019c4SRui Ueyama   }
1385708019c4SRui Ueyama   if (Tok == "CONSTANT") {
1386708019c4SRui Ueyama     expect("(");
1387708019c4SRui Ueyama     StringRef Tok = next();
1388708019c4SRui Ueyama     expect(")");
1389708019c4SRui Ueyama     return [=](uint64_t Dot) { return getConstant(Tok); };
1390708019c4SRui Ueyama   }
139154c145ceSRafael Espindola   if (Tok == "SEGMENT_START") {
139254c145ceSRafael Espindola     expect("(");
139354c145ceSRafael Espindola     next();
139454c145ceSRafael Espindola     expect(",");
139554c145ceSRafael Espindola     uint64_t Val;
13963adbbc38SRafael Espindola     if (next().getAsInteger(0, Val))
13973adbbc38SRafael Espindola       setError("integer expected");
139854c145ceSRafael Espindola     expect(")");
139954c145ceSRafael Espindola     return [=](uint64_t Dot) { return Val; };
140054c145ceSRafael Espindola   }
1401708019c4SRui Ueyama   if (Tok == "DATA_SEGMENT_ALIGN") {
1402708019c4SRui Ueyama     expect("(");
1403708019c4SRui Ueyama     Expr E = readExpr();
1404708019c4SRui Ueyama     expect(",");
1405708019c4SRui Ueyama     readExpr();
1406708019c4SRui Ueyama     expect(")");
1407f7791bb9SRui Ueyama     return [=](uint64_t Dot) { return alignTo(Dot, E(Dot)); };
1408708019c4SRui Ueyama   }
1409708019c4SRui Ueyama   if (Tok == "DATA_SEGMENT_END") {
1410708019c4SRui Ueyama     expect("(");
1411708019c4SRui Ueyama     expect(".");
1412708019c4SRui Ueyama     expect(")");
1413708019c4SRui Ueyama     return [](uint64_t Dot) { return Dot; };
1414708019c4SRui Ueyama   }
1415276b4e64SGeorge Rimar   // GNU linkers implements more complicated logic to handle
1416276b4e64SGeorge Rimar   // DATA_SEGMENT_RELRO_END. We instead ignore the arguments and just align to
1417276b4e64SGeorge Rimar   // the next page boundary for simplicity.
1418276b4e64SGeorge Rimar   if (Tok == "DATA_SEGMENT_RELRO_END") {
1419276b4e64SGeorge Rimar     expect("(");
142097bdc722SRafael Espindola     readExpr();
1421276b4e64SGeorge Rimar     expect(",");
1422276b4e64SGeorge Rimar     readExpr();
1423276b4e64SGeorge Rimar     expect(")");
1424276b4e64SGeorge Rimar     return [](uint64_t Dot) { return alignTo(Dot, Target->PageSize); };
1425276b4e64SGeorge Rimar   }
14269e69450eSGeorge Rimar   if (Tok == "SIZEOF") {
14279e69450eSGeorge Rimar     expect("(");
14289e69450eSGeorge Rimar     StringRef Name = next();
14299e69450eSGeorge Rimar     expect(")");
1430884e786dSGeorge Rimar     return [=](uint64_t Dot) { return ScriptBase->getOutputSectionSize(Name); };
14319e69450eSGeorge Rimar   }
143236fac7f0SEugene Leviant   if (Tok == "ALIGNOF") {
143336fac7f0SEugene Leviant     expect("(");
143436fac7f0SEugene Leviant     StringRef Name = next();
143536fac7f0SEugene Leviant     expect(")");
143636fac7f0SEugene Leviant     return
143736fac7f0SEugene Leviant         [=](uint64_t Dot) { return ScriptBase->getOutputSectionAlign(Name); };
143836fac7f0SEugene Leviant   }
1439e32a3598SGeorge Rimar   if (Tok == "SIZEOF_HEADERS")
1440884e786dSGeorge Rimar     return [=](uint64_t Dot) { return ScriptBase->getHeaderSize(); };
1441708019c4SRui Ueyama 
14429f2f7ad9SGeorge Rimar   // Tok is a literal number.
14439f2f7ad9SGeorge Rimar   uint64_t V;
14449f2f7ad9SGeorge Rimar   if (readInteger(Tok, V))
14459f2f7ad9SGeorge Rimar     return [=](uint64_t Dot) { return V; };
14469f2f7ad9SGeorge Rimar 
14479f2f7ad9SGeorge Rimar   // Tok is a symbol name.
144830835ea4SGeorge Rimar   if (Tok != "." && !isValidCIdentifier(Tok))
1449708019c4SRui Ueyama     setError("malformed number: " + Tok);
145030835ea4SGeorge Rimar   return [=](uint64_t Dot) { return getSymbolValue(Tok, Dot); };
1451a9c5a528SGeorge Rimar }
1452708019c4SRui Ueyama 
1453708019c4SRui Ueyama Expr ScriptParser::readTernary(Expr Cond) {
1454708019c4SRui Ueyama   next();
1455708019c4SRui Ueyama   Expr L = readExpr();
1456708019c4SRui Ueyama   expect(":");
1457708019c4SRui Ueyama   Expr R = readExpr();
1458708019c4SRui Ueyama   return [=](uint64_t Dot) { return Cond(Dot) ? L(Dot) : R(Dot); };
1459708019c4SRui Ueyama }
1460708019c4SRui Ueyama 
14616ad7dfccSRui Ueyama Expr ScriptParser::readParenExpr() {
14626ad7dfccSRui Ueyama   expect("(");
14636ad7dfccSRui Ueyama   Expr E = readExpr();
14646ad7dfccSRui Ueyama   expect(")");
14656ad7dfccSRui Ueyama   return E;
14666ad7dfccSRui Ueyama }
14676ad7dfccSRui Ueyama 
1468bbe38602SEugene Leviant std::vector<StringRef> ScriptParser::readOutputSectionPhdrs() {
1469bbe38602SEugene Leviant   std::vector<StringRef> Phdrs;
1470bbe38602SEugene Leviant   while (!Error && peek().startswith(":")) {
1471bbe38602SEugene Leviant     StringRef Tok = next();
1472bbe38602SEugene Leviant     Tok = (Tok.size() == 1) ? next() : Tok.substr(1);
1473bbe38602SEugene Leviant     if (Tok.empty()) {
1474bbe38602SEugene Leviant       setError("section header name is empty");
1475bbe38602SEugene Leviant       break;
1476bbe38602SEugene Leviant     }
1477bbe38602SEugene Leviant     Phdrs.push_back(Tok);
1478bbe38602SEugene Leviant   }
1479bbe38602SEugene Leviant   return Phdrs;
1480bbe38602SEugene Leviant }
1481bbe38602SEugene Leviant 
1482bbe38602SEugene Leviant unsigned ScriptParser::readPhdrType() {
1483bbe38602SEugene Leviant   StringRef Tok = next();
1484b0f6c590SRui Ueyama   unsigned Ret = StringSwitch<unsigned>(Tok)
1485b0f6c590SRui Ueyama                      .Case("PT_NULL", PT_NULL)
1486b0f6c590SRui Ueyama                      .Case("PT_LOAD", PT_LOAD)
1487b0f6c590SRui Ueyama                      .Case("PT_DYNAMIC", PT_DYNAMIC)
1488b0f6c590SRui Ueyama                      .Case("PT_INTERP", PT_INTERP)
1489b0f6c590SRui Ueyama                      .Case("PT_NOTE", PT_NOTE)
1490b0f6c590SRui Ueyama                      .Case("PT_SHLIB", PT_SHLIB)
1491b0f6c590SRui Ueyama                      .Case("PT_PHDR", PT_PHDR)
1492b0f6c590SRui Ueyama                      .Case("PT_TLS", PT_TLS)
1493b0f6c590SRui Ueyama                      .Case("PT_GNU_EH_FRAME", PT_GNU_EH_FRAME)
1494b0f6c590SRui Ueyama                      .Case("PT_GNU_STACK", PT_GNU_STACK)
1495b0f6c590SRui Ueyama                      .Case("PT_GNU_RELRO", PT_GNU_RELRO)
1496b0f6c590SRui Ueyama                      .Default(-1);
1497bbe38602SEugene Leviant 
1498b0f6c590SRui Ueyama   if (Ret == (unsigned)-1) {
1499b0f6c590SRui Ueyama     setError("invalid program header type: " + Tok);
1500b0f6c590SRui Ueyama     return PT_NULL;
1501b0f6c590SRui Ueyama   }
1502b0f6c590SRui Ueyama   return Ret;
1503bbe38602SEugene Leviant }
1504bbe38602SEugene Leviant 
150595769b4aSRui Ueyama void ScriptParser::readVersionDeclaration(StringRef VerStr) {
150620b6598cSGeorge Rimar   // Identifiers start at 2 because 0 and 1 are reserved
150720b6598cSGeorge Rimar   // for VER_NDX_LOCAL and VER_NDX_GLOBAL constants.
150820b6598cSGeorge Rimar   size_t VersionId = Config->VersionDefinitions.size() + 2;
150920b6598cSGeorge Rimar   Config->VersionDefinitions.push_back({VerStr, VersionId});
151020b6598cSGeorge Rimar 
151120b6598cSGeorge Rimar   if (skip("global:") || peek() != "local:")
151220b6598cSGeorge Rimar     readGlobal(VerStr);
151320b6598cSGeorge Rimar   if (skip("local:"))
151420b6598cSGeorge Rimar     readLocal();
151520b6598cSGeorge Rimar   expect("}");
151620b6598cSGeorge Rimar 
151720b6598cSGeorge Rimar   // Each version may have a parent version. For example, "Ver2" defined as
151820b6598cSGeorge Rimar   // "Ver2 { global: foo; local: *; } Ver1;" has "Ver1" as a parent. This
151920b6598cSGeorge Rimar   // version hierarchy is, probably against your instinct, purely for human; the
152020b6598cSGeorge Rimar   // runtime doesn't care about them at all. In LLD, we simply skip the token.
152120b6598cSGeorge Rimar   if (!VerStr.empty() && peek() != ";")
152220b6598cSGeorge Rimar     next();
152320b6598cSGeorge Rimar   expect(";");
152420b6598cSGeorge Rimar }
152520b6598cSGeorge Rimar 
152620b6598cSGeorge Rimar void ScriptParser::readLocal() {
152720b6598cSGeorge Rimar   Config->DefaultSymbolVersion = VER_NDX_LOCAL;
152820b6598cSGeorge Rimar   expect("*");
152920b6598cSGeorge Rimar   expect(";");
153020b6598cSGeorge Rimar }
153120b6598cSGeorge Rimar 
153220b6598cSGeorge Rimar void ScriptParser::readExtern(std::vector<SymbolVersion> *Globals) {
1533cd574a5eSGeorge Rimar   expect("\"C++\"");
153420b6598cSGeorge Rimar   expect("{");
153520b6598cSGeorge Rimar 
153620b6598cSGeorge Rimar   for (;;) {
153720b6598cSGeorge Rimar     if (peek() == "}" || Error)
153820b6598cSGeorge Rimar       break;
1539cd574a5eSGeorge Rimar     bool HasWildcard = !peek().startswith("\"") && hasWildcard(peek());
1540cd574a5eSGeorge Rimar     Globals->push_back({unquote(next()), true, HasWildcard});
154120b6598cSGeorge Rimar     expect(";");
154220b6598cSGeorge Rimar   }
154320b6598cSGeorge Rimar 
154420b6598cSGeorge Rimar   expect("}");
154520b6598cSGeorge Rimar   expect(";");
154620b6598cSGeorge Rimar }
154720b6598cSGeorge Rimar 
154820b6598cSGeorge Rimar void ScriptParser::readGlobal(StringRef VerStr) {
154920b6598cSGeorge Rimar   std::vector<SymbolVersion> *Globals;
155020b6598cSGeorge Rimar   if (VerStr.empty())
155120b6598cSGeorge Rimar     Globals = &Config->VersionScriptGlobals;
155220b6598cSGeorge Rimar   else
155320b6598cSGeorge Rimar     Globals = &Config->VersionDefinitions.back().Globals;
155420b6598cSGeorge Rimar 
155520b6598cSGeorge Rimar   for (;;) {
155620b6598cSGeorge Rimar     if (skip("extern"))
155720b6598cSGeorge Rimar       readExtern(Globals);
155820b6598cSGeorge Rimar 
155920b6598cSGeorge Rimar     StringRef Cur = peek();
156020b6598cSGeorge Rimar     if (Cur == "}" || Cur == "local:" || Error)
156120b6598cSGeorge Rimar       return;
156220b6598cSGeorge Rimar     next();
1563cd574a5eSGeorge Rimar     Globals->push_back({unquote(Cur), false, hasWildcard(Cur)});
156420b6598cSGeorge Rimar     expect(";");
156520b6598cSGeorge Rimar   }
156620b6598cSGeorge Rimar }
156720b6598cSGeorge Rimar 
156816b0cc9eSSimon Atanasyan static bool isUnderSysroot(StringRef Path) {
156916b0cc9eSSimon Atanasyan   if (Config->Sysroot == "")
157016b0cc9eSSimon Atanasyan     return false;
157116b0cc9eSSimon Atanasyan   for (; !Path.empty(); Path = sys::path::parent_path(Path))
157216b0cc9eSSimon Atanasyan     if (sys::fs::equivalent(Config->Sysroot, Path))
157316b0cc9eSSimon Atanasyan       return true;
157416b0cc9eSSimon Atanasyan   return false;
157516b0cc9eSSimon Atanasyan }
157616b0cc9eSSimon Atanasyan 
157707320e40SRui Ueyama void elf::readLinkerScript(MemoryBufferRef MB) {
157816b0cc9eSSimon Atanasyan   StringRef Path = MB.getBufferIdentifier();
157920b6598cSGeorge Rimar   ScriptParser(MB.getBuffer(), isUnderSysroot(Path)).readLinkerScript();
158020b6598cSGeorge Rimar }
158120b6598cSGeorge Rimar 
158220b6598cSGeorge Rimar void elf::readVersionScript(MemoryBufferRef MB) {
158320b6598cSGeorge Rimar   ScriptParser(MB.getBuffer(), false).readVersionScript();
1584f7c5fbb1SRui Ueyama }
15851ebc8ed7SRui Ueyama 
158607320e40SRui Ueyama template class elf::LinkerScript<ELF32LE>;
158707320e40SRui Ueyama template class elf::LinkerScript<ELF32BE>;
158807320e40SRui Ueyama template class elf::LinkerScript<ELF64LE>;
158907320e40SRui Ueyama template class elf::LinkerScript<ELF64BE>;
1590