//===- ScriptParser.cpp ---------------------------------------------------===//
//
//                             The LLVM Linker
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file contains a recursive-descent parser for linker scripts.
// Parsed results are stored to Config and Script global objects.
//
//===----------------------------------------------------------------------===//
142ec34544SRui Ueyama 
152ec34544SRui Ueyama #include "ScriptParser.h"
162ec34544SRui Ueyama #include "Config.h"
172ec34544SRui Ueyama #include "Driver.h"
182ec34544SRui Ueyama #include "InputSection.h"
192ec34544SRui Ueyama #include "LinkerScript.h"
202ec34544SRui Ueyama #include "OutputSections.h"
212ec34544SRui Ueyama #include "ScriptLexer.h"
222ec34544SRui Ueyama #include "Symbols.h"
232ec34544SRui Ueyama #include "Target.h"
242017d52bSRui Ueyama #include "lld/Common/Memory.h"
252ec34544SRui Ueyama #include "llvm/ADT/SmallString.h"
262ec34544SRui Ueyama #include "llvm/ADT/StringRef.h"
270440be4aSRui Ueyama #include "llvm/ADT/StringSet.h"
282ec34544SRui Ueyama #include "llvm/ADT/StringSwitch.h"
29264b5d9eSZachary Turner #include "llvm/BinaryFormat/ELF.h"
302ec34544SRui Ueyama #include "llvm/Support/Casting.h"
312ec34544SRui Ueyama #include "llvm/Support/ErrorHandling.h"
322ec34544SRui Ueyama #include "llvm/Support/FileSystem.h"
332ec34544SRui Ueyama #include "llvm/Support/Path.h"
342ec34544SRui Ueyama #include <cassert>
352ec34544SRui Ueyama #include <limits>
362ec34544SRui Ueyama #include <vector>
372ec34544SRui Ueyama 
382ec34544SRui Ueyama using namespace llvm;
392ec34544SRui Ueyama using namespace llvm::ELF;
40b58079d4SRui Ueyama using namespace llvm::support::endian;
412ec34544SRui Ueyama using namespace lld;
422ec34544SRui Ueyama using namespace lld::elf;
432ec34544SRui Ueyama 
442ec34544SRui Ueyama static bool isUnderSysroot(StringRef Path);
452ec34544SRui Ueyama 
4696b3fe02SRui Ueyama namespace {
4796b3fe02SRui Ueyama class ScriptParser final : ScriptLexer {
482ec34544SRui Ueyama public:
492ec34544SRui Ueyama   ScriptParser(MemoryBufferRef MB)
502ec34544SRui Ueyama       : ScriptLexer(MB),
512ec34544SRui Ueyama         IsUnderSysroot(isUnderSysroot(MB.getBufferIdentifier())) {}
522ec34544SRui Ueyama 
532ec34544SRui Ueyama   void readLinkerScript();
542ec34544SRui Ueyama   void readVersionScript();
552ec34544SRui Ueyama   void readDynamicList();
568c7e8cceSPetr Hosek   void readDefsym(StringRef Name);
572ec34544SRui Ueyama 
582ec34544SRui Ueyama private:
592ec34544SRui Ueyama   void addFile(StringRef Path);
602ec34544SRui Ueyama 
612ec34544SRui Ueyama   void readAsNeeded();
622ec34544SRui Ueyama   void readEntry();
632ec34544SRui Ueyama   void readExtern();
642ec34544SRui Ueyama   void readGroup();
652ec34544SRui Ueyama   void readInclude();
662ec34544SRui Ueyama   void readMemory();
672ec34544SRui Ueyama   void readOutput();
682ec34544SRui Ueyama   void readOutputArch();
692ec34544SRui Ueyama   void readOutputFormat();
702ec34544SRui Ueyama   void readPhdrs();
715f37541cSGeorge Rimar   void readRegionAlias();
722ec34544SRui Ueyama   void readSearchDir();
732ec34544SRui Ueyama   void readSections();
742ec34544SRui Ueyama   void readVersion();
752ec34544SRui Ueyama   void readVersionScriptCommand();
762ec34544SRui Ueyama 
772ec34544SRui Ueyama   SymbolAssignment *readAssignment(StringRef Name);
78f0403c60SRui Ueyama   ByteCommand *readByteCommand(StringRef Tok);
792ec34544SRui Ueyama   uint32_t readFill();
808acbf1ccSRui Ueyama   uint32_t parseFill(StringRef Tok);
818c022ca7SRafael Espindola   void readSectionAddressType(OutputSection *Cmd);
828c022ca7SRafael Espindola   OutputSection *readOutputSectionDescription(StringRef OutSec);
832ec34544SRui Ueyama   std::vector<StringRef> readOutputSectionPhdrs();
842ec34544SRui Ueyama   InputSectionDescription *readInputSectionDescription(StringRef Tok);
852ec34544SRui Ueyama   StringMatcher readFilePatterns();
862ec34544SRui Ueyama   std::vector<SectionPattern> readInputSectionsList();
872ec34544SRui Ueyama   InputSectionDescription *readInputSectionRules(StringRef FilePattern);
882ec34544SRui Ueyama   unsigned readPhdrType();
892ec34544SRui Ueyama   SortSectionPolicy readSortKind();
902ec34544SRui Ueyama   SymbolAssignment *readProvideHidden(bool Provide, bool Hidden);
912ec34544SRui Ueyama   SymbolAssignment *readProvideOrAssignment(StringRef Tok);
922ec34544SRui Ueyama   void readSort();
9323af89ccSRui Ueyama   AssertCommand *readAssert();
9423af89ccSRui Ueyama   Expr readAssertExpr();
955fb17128SGeorge Rimar   Expr readConstant();
965fb17128SGeorge Rimar   Expr getPageSize();
972ec34544SRui Ueyama 
982ec34544SRui Ueyama   uint64_t readMemoryAssignment(StringRef, StringRef, StringRef);
992ec34544SRui Ueyama   std::pair<uint32_t, uint32_t> readMemoryAttributes();
1002ec34544SRui Ueyama 
1017b91e213SGeorge Rimar   Expr combine(StringRef Op, Expr L, Expr R);
1022ec34544SRui Ueyama   Expr readExpr();
1032ec34544SRui Ueyama   Expr readExpr1(Expr Lhs, int MinPrec);
1042ec34544SRui Ueyama   StringRef readParenLiteral();
1052ec34544SRui Ueyama   Expr readPrimary();
1062ec34544SRui Ueyama   Expr readTernary(Expr Cond);
1072ec34544SRui Ueyama   Expr readParenExpr();
1082ec34544SRui Ueyama 
1092ec34544SRui Ueyama   // For parsing version script.
1102ec34544SRui Ueyama   std::vector<SymbolVersion> readVersionExtern();
1112ec34544SRui Ueyama   void readAnonymousDeclaration();
1122ec34544SRui Ueyama   void readVersionDeclaration(StringRef VerStr);
1132ec34544SRui Ueyama 
1142ec34544SRui Ueyama   std::pair<std::vector<SymbolVersion>, std::vector<SymbolVersion>>
1152ec34544SRui Ueyama   readSymbols();
1162ec34544SRui Ueyama 
117fd06b025SRui Ueyama   // True if a script being read is in a subdirectory specified by -sysroot.
1182ec34544SRui Ueyama   bool IsUnderSysroot;
1190440be4aSRui Ueyama 
1200440be4aSRui Ueyama   // A set to detect an INCLUDE() cycle.
1210440be4aSRui Ueyama   StringSet<> Seen;
1222ec34544SRui Ueyama };
12396b3fe02SRui Ueyama } // namespace
1242ec34544SRui Ueyama 
1251e77ad14SRui Ueyama static StringRef unquote(StringRef S) {
1261e77ad14SRui Ueyama   if (S.startswith("\""))
1271e77ad14SRui Ueyama     return S.substr(1, S.size() - 2);
1281e77ad14SRui Ueyama   return S;
1291e77ad14SRui Ueyama }
1301e77ad14SRui Ueyama 
1312ec34544SRui Ueyama static bool isUnderSysroot(StringRef Path) {
1322ec34544SRui Ueyama   if (Config->Sysroot == "")
1332ec34544SRui Ueyama     return false;
1342ec34544SRui Ueyama   for (; !Path.empty(); Path = sys::path::parent_path(Path))
1352ec34544SRui Ueyama     if (sys::fs::equivalent(Config->Sysroot, Path))
1362ec34544SRui Ueyama       return true;
1372ec34544SRui Ueyama   return false;
1382ec34544SRui Ueyama }
1392ec34544SRui Ueyama 
1402ec34544SRui Ueyama // Some operations only support one non absolute value. Move the
1412ec34544SRui Ueyama // absolute one to the right hand side for convenience.
1422ec34544SRui Ueyama static void moveAbsRight(ExprValue &A, ExprValue &B) {
14323be5e8dSRafael Espindola   if (A.Sec == nullptr || (A.ForceAbsolute && !B.isAbsolute()))
1442ec34544SRui Ueyama     std::swap(A, B);
1452ec34544SRui Ueyama   if (!B.isAbsolute())
14641c7ab4aSGeorge Rimar     error(A.Loc + ": at least one side of the expression must be absolute");
1472ec34544SRui Ueyama }
1482ec34544SRui Ueyama 
1492ec34544SRui Ueyama static ExprValue add(ExprValue A, ExprValue B) {
1502ec34544SRui Ueyama   moveAbsRight(A, B);
151a6acd23cSRafael Espindola   return {A.Sec, A.ForceAbsolute, A.getSectionOffset() + B.getValue(), A.Loc};
1522ec34544SRui Ueyama }
1532ec34544SRui Ueyama 
1542ec34544SRui Ueyama static ExprValue sub(ExprValue A, ExprValue B) {
15563a4a98eSRafael Espindola   // The distance between two symbols in sections is absolute.
1569cbb6dd1SRafael Espindola   if (!A.isAbsolute() && !B.isAbsolute())
1579cbb6dd1SRafael Espindola     return A.getValue() - B.getValue();
1584fbe3518SRui Ueyama   return {A.Sec, false, A.getSectionOffset() - B.getValue(), A.Loc};
1592ec34544SRui Ueyama }
1602ec34544SRui Ueyama 
1612ec34544SRui Ueyama static ExprValue bitAnd(ExprValue A, ExprValue B) {
1622ec34544SRui Ueyama   moveAbsRight(A, B);
1632ec34544SRui Ueyama   return {A.Sec, A.ForceAbsolute,
16441c7ab4aSGeorge Rimar           (A.getValue() & B.getValue()) - A.getSecAddr(), A.Loc};
1652ec34544SRui Ueyama }
1662ec34544SRui Ueyama 
1672ec34544SRui Ueyama static ExprValue bitOr(ExprValue A, ExprValue B) {
1682ec34544SRui Ueyama   moveAbsRight(A, B);
1692ec34544SRui Ueyama   return {A.Sec, A.ForceAbsolute,
17041c7ab4aSGeorge Rimar           (A.getValue() | B.getValue()) - A.getSecAddr(), A.Loc};
1712ec34544SRui Ueyama }
1722ec34544SRui Ueyama 
1732ec34544SRui Ueyama void ScriptParser::readDynamicList() {
1748016bdfdSRafael Espindola   Config->HasDynamicList = true;
1752ec34544SRui Ueyama   expect("{");
176d72d97b3SRafael Espindola   std::vector<SymbolVersion> Locals;
177d72d97b3SRafael Espindola   std::vector<SymbolVersion> Globals;
178d72d97b3SRafael Espindola   std::tie(Locals, Globals) = readSymbols();
179d72d97b3SRafael Espindola   expect(";");
180d72d97b3SRafael Espindola 
181d72d97b3SRafael Espindola   if (!atEOF()) {
1822ec34544SRui Ueyama     setError("EOF expected, but got " + next());
183d72d97b3SRafael Espindola     return;
184d72d97b3SRafael Espindola   }
185d72d97b3SRafael Espindola   if (!Locals.empty()) {
186d72d97b3SRafael Espindola     setError("\"local:\" scope not supported in --dynamic-list");
187d72d97b3SRafael Espindola     return;
188d72d97b3SRafael Espindola   }
189d72d97b3SRafael Espindola 
190d72d97b3SRafael Espindola   for (SymbolVersion V : Globals)
191d72d97b3SRafael Espindola     Config->DynamicList.push_back(V);
1922ec34544SRui Ueyama }
1932ec34544SRui Ueyama 
1942ec34544SRui Ueyama void ScriptParser::readVersionScript() {
1952ec34544SRui Ueyama   readVersionScriptCommand();
1962ec34544SRui Ueyama   if (!atEOF())
1972ec34544SRui Ueyama     setError("EOF expected, but got " + next());
1982ec34544SRui Ueyama }
1992ec34544SRui Ueyama 
2002ec34544SRui Ueyama void ScriptParser::readVersionScriptCommand() {
2012ec34544SRui Ueyama   if (consume("{")) {
2022ec34544SRui Ueyama     readAnonymousDeclaration();
2032ec34544SRui Ueyama     return;
2042ec34544SRui Ueyama   }
2052ec34544SRui Ueyama 
206b8a59c8aSBob Haarman   while (!atEOF() && !errorCount() && peek() != "}") {
2072ec34544SRui Ueyama     StringRef VerStr = next();
2082ec34544SRui Ueyama     if (VerStr == "{") {
2092ec34544SRui Ueyama       setError("anonymous version definition is used in "
2102ec34544SRui Ueyama                "combination with other version definitions");
2112ec34544SRui Ueyama       return;
2122ec34544SRui Ueyama     }
2132ec34544SRui Ueyama     expect("{");
2142ec34544SRui Ueyama     readVersionDeclaration(VerStr);
2152ec34544SRui Ueyama   }
2162ec34544SRui Ueyama }
2172ec34544SRui Ueyama 
2182ec34544SRui Ueyama void ScriptParser::readVersion() {
2192ec34544SRui Ueyama   expect("{");
2202ec34544SRui Ueyama   readVersionScriptCommand();
2212ec34544SRui Ueyama   expect("}");
2222ec34544SRui Ueyama }
2232ec34544SRui Ueyama 
2242ec34544SRui Ueyama void ScriptParser::readLinkerScript() {
2252ec34544SRui Ueyama   while (!atEOF()) {
2262ec34544SRui Ueyama     StringRef Tok = next();
2272ec34544SRui Ueyama     if (Tok == ";")
2282ec34544SRui Ueyama       continue;
2292ec34544SRui Ueyama 
2302ec34544SRui Ueyama     if (Tok == "ASSERT") {
2316b394caaSRui Ueyama       Script->SectionCommands.push_back(readAssert());
2322ec34544SRui Ueyama     } else if (Tok == "ENTRY") {
2332ec34544SRui Ueyama       readEntry();
2342ec34544SRui Ueyama     } else if (Tok == "EXTERN") {
2352ec34544SRui Ueyama       readExtern();
2362ec34544SRui Ueyama     } else if (Tok == "GROUP" || Tok == "INPUT") {
2372ec34544SRui Ueyama       readGroup();
2382ec34544SRui Ueyama     } else if (Tok == "INCLUDE") {
2392ec34544SRui Ueyama       readInclude();
2402ec34544SRui Ueyama     } else if (Tok == "MEMORY") {
2412ec34544SRui Ueyama       readMemory();
2422ec34544SRui Ueyama     } else if (Tok == "OUTPUT") {
2432ec34544SRui Ueyama       readOutput();
2442ec34544SRui Ueyama     } else if (Tok == "OUTPUT_ARCH") {
2452ec34544SRui Ueyama       readOutputArch();
2462ec34544SRui Ueyama     } else if (Tok == "OUTPUT_FORMAT") {
2472ec34544SRui Ueyama       readOutputFormat();
2482ec34544SRui Ueyama     } else if (Tok == "PHDRS") {
2492ec34544SRui Ueyama       readPhdrs();
2505f37541cSGeorge Rimar     } else if (Tok == "REGION_ALIAS") {
2515f37541cSGeorge Rimar       readRegionAlias();
2522ec34544SRui Ueyama     } else if (Tok == "SEARCH_DIR") {
2532ec34544SRui Ueyama       readSearchDir();
2542ec34544SRui Ueyama     } else if (Tok == "SECTIONS") {
2552ec34544SRui Ueyama       readSections();
2562ec34544SRui Ueyama     } else if (Tok == "VERSION") {
2572ec34544SRui Ueyama       readVersion();
2582ec34544SRui Ueyama     } else if (SymbolAssignment *Cmd = readProvideOrAssignment(Tok)) {
2596b394caaSRui Ueyama       Script->SectionCommands.push_back(Cmd);
2602ec34544SRui Ueyama     } else {
2612ec34544SRui Ueyama       setError("unknown directive: " + Tok);
2622ec34544SRui Ueyama     }
2632ec34544SRui Ueyama   }
2642ec34544SRui Ueyama }
2652ec34544SRui Ueyama 
2668c7e8cceSPetr Hosek void ScriptParser::readDefsym(StringRef Name) {
2678c7e8cceSPetr Hosek   Expr E = readExpr();
2688c7e8cceSPetr Hosek   if (!atEOF())
2698c7e8cceSPetr Hosek     setError("EOF expected, but got " + next());
27084bcabcbSGeorge Rimar   SymbolAssignment *Cmd = make<SymbolAssignment>(Name, E, getCurrentLocation(),
27184bcabcbSGeorge Rimar                                                  "" /*CommandString*/);
2728c7e8cceSPetr Hosek   Script->SectionCommands.push_back(Cmd);
2738c7e8cceSPetr Hosek }
2748c7e8cceSPetr Hosek 
2752ec34544SRui Ueyama void ScriptParser::addFile(StringRef S) {
2762ec34544SRui Ueyama   if (IsUnderSysroot && S.startswith("/")) {
2772ec34544SRui Ueyama     SmallString<128> PathData;
2782ec34544SRui Ueyama     StringRef Path = (Config->Sysroot + S).toStringRef(PathData);
2792ec34544SRui Ueyama     if (sys::fs::exists(Path)) {
280a76349bfSEvgeniy Stepanov       Driver->addFile(Saver.save(Path), /*WithLOption=*/false);
2812ec34544SRui Ueyama       return;
2822ec34544SRui Ueyama     }
2832ec34544SRui Ueyama   }
2842ec34544SRui Ueyama 
285875ae82bSRui Ueyama   if (S.startswith("/")) {
286a76349bfSEvgeniy Stepanov     Driver->addFile(S, /*WithLOption=*/false);
2872ec34544SRui Ueyama   } else if (S.startswith("=")) {
2882ec34544SRui Ueyama     if (Config->Sysroot.empty())
289a76349bfSEvgeniy Stepanov       Driver->addFile(S.substr(1), /*WithLOption=*/false);
2902ec34544SRui Ueyama     else
291a76349bfSEvgeniy Stepanov       Driver->addFile(Saver.save(Config->Sysroot + "/" + S.substr(1)),
292a76349bfSEvgeniy Stepanov                       /*WithLOption=*/false);
2932ec34544SRui Ueyama   } else if (S.startswith("-l")) {
2942ec34544SRui Ueyama     Driver->addLibrary(S.substr(2));
2952ec34544SRui Ueyama   } else if (sys::fs::exists(S)) {
296a76349bfSEvgeniy Stepanov     Driver->addFile(S, /*WithLOption=*/false);
2972ec34544SRui Ueyama   } else {
2982ec34544SRui Ueyama     if (Optional<std::string> Path = findFromSearchPaths(S))
299a76349bfSEvgeniy Stepanov       Driver->addFile(Saver.save(*Path), /*WithLOption=*/true);
3002ec34544SRui Ueyama     else
3012ec34544SRui Ueyama       setError("unable to find " + S);
3022ec34544SRui Ueyama   }
3032ec34544SRui Ueyama }
3042ec34544SRui Ueyama 
3052ec34544SRui Ueyama void ScriptParser::readAsNeeded() {
3062ec34544SRui Ueyama   expect("(");
3072ec34544SRui Ueyama   bool Orig = Config->AsNeeded;
3082ec34544SRui Ueyama   Config->AsNeeded = true;
309b8a59c8aSBob Haarman   while (!errorCount() && !consume(")"))
3102ec34544SRui Ueyama     addFile(unquote(next()));
3112ec34544SRui Ueyama   Config->AsNeeded = Orig;
3122ec34544SRui Ueyama }
3132ec34544SRui Ueyama 
3142ec34544SRui Ueyama void ScriptParser::readEntry() {
3152ec34544SRui Ueyama   // -e <symbol> takes predecence over ENTRY(<symbol>).
3162ec34544SRui Ueyama   expect("(");
3172ec34544SRui Ueyama   StringRef Tok = next();
3182ec34544SRui Ueyama   if (Config->Entry.empty())
3192ec34544SRui Ueyama     Config->Entry = Tok;
3202ec34544SRui Ueyama   expect(")");
3212ec34544SRui Ueyama }
3222ec34544SRui Ueyama 
3232ec34544SRui Ueyama void ScriptParser::readExtern() {
3242ec34544SRui Ueyama   expect("(");
325b8a59c8aSBob Haarman   while (!errorCount() && !consume(")"))
3262ec34544SRui Ueyama     Config->Undefined.push_back(next());
3272ec34544SRui Ueyama }
3282ec34544SRui Ueyama 
3292ec34544SRui Ueyama void ScriptParser::readGroup() {
3302ec34544SRui Ueyama   expect("(");
331b8a59c8aSBob Haarman   while (!errorCount() && !consume(")")) {
332b579c439SRui Ueyama     if (consume("AS_NEEDED"))
3332ec34544SRui Ueyama       readAsNeeded();
3342ec34544SRui Ueyama     else
335b579c439SRui Ueyama       addFile(unquote(next()));
3362ec34544SRui Ueyama   }
3372ec34544SRui Ueyama }
3382ec34544SRui Ueyama 
3392ec34544SRui Ueyama void ScriptParser::readInclude() {
3402ec34544SRui Ueyama   StringRef Tok = unquote(next());
3412ec34544SRui Ueyama 
3420440be4aSRui Ueyama   if (!Seen.insert(Tok).second) {
3430440be4aSRui Ueyama     setError("there is a cycle in linker script INCLUDEs");
3440440be4aSRui Ueyama     return;
3450440be4aSRui Ueyama   }
3460440be4aSRui Ueyama 
3471de78471SAlexander Richardson   if (Optional<std::string> Path = searchLinkerScript(Tok)) {
3482ec34544SRui Ueyama     if (Optional<MemoryBufferRef> MB = readFile(*Path))
3492ec34544SRui Ueyama       tokenize(*MB);
3502ec34544SRui Ueyama     return;
3512ec34544SRui Ueyama   }
3521de78471SAlexander Richardson   setError("cannot find linker script " + Tok);
3532ec34544SRui Ueyama }
3542ec34544SRui Ueyama 
3552ec34544SRui Ueyama void ScriptParser::readOutput() {
3562ec34544SRui Ueyama   // -o <file> takes predecence over OUTPUT(<file>).
3572ec34544SRui Ueyama   expect("(");
3582ec34544SRui Ueyama   StringRef Tok = next();
3592ec34544SRui Ueyama   if (Config->OutputFile.empty())
3602ec34544SRui Ueyama     Config->OutputFile = unquote(Tok);
3612ec34544SRui Ueyama   expect(")");
3622ec34544SRui Ueyama }
3632ec34544SRui Ueyama 
3642ec34544SRui Ueyama void ScriptParser::readOutputArch() {
3652ec34544SRui Ueyama   // OUTPUT_ARCH is ignored for now.
3662ec34544SRui Ueyama   expect("(");
367b8a59c8aSBob Haarman   while (!errorCount() && !consume(")"))
3682ec34544SRui Ueyama     skip();
3692ec34544SRui Ueyama }
3702ec34544SRui Ueyama 
3712ec34544SRui Ueyama void ScriptParser::readOutputFormat() {
3722ec34544SRui Ueyama   // Error checking only for now.
3732ec34544SRui Ueyama   expect("(");
3742ec34544SRui Ueyama   skip();
375b579c439SRui Ueyama   if (consume(")"))
3762ec34544SRui Ueyama     return;
377b579c439SRui Ueyama   expect(",");
3782ec34544SRui Ueyama   skip();
3792ec34544SRui Ueyama   expect(",");
3802ec34544SRui Ueyama   skip();
3812ec34544SRui Ueyama   expect(")");
3822ec34544SRui Ueyama }
3832ec34544SRui Ueyama 
3842ec34544SRui Ueyama void ScriptParser::readPhdrs() {
3852ec34544SRui Ueyama   expect("{");
3862ec34544SRui Ueyama 
387b8a59c8aSBob Haarman   while (!errorCount() && !consume("}")) {
3880ae2c24cSRui Ueyama     PhdrsCommand Cmd;
3890ae2c24cSRui Ueyama     Cmd.Name = next();
3900ae2c24cSRui Ueyama     Cmd.Type = readPhdrType();
391b579c439SRui Ueyama 
392b8a59c8aSBob Haarman     while (!errorCount() && !consume(";")) {
393b579c439SRui Ueyama       if (consume("FILEHDR"))
3940ae2c24cSRui Ueyama         Cmd.HasFilehdr = true;
395b579c439SRui Ueyama       else if (consume("PHDRS"))
3960ae2c24cSRui Ueyama         Cmd.HasPhdrs = true;
397b579c439SRui Ueyama       else if (consume("AT"))
3980ae2c24cSRui Ueyama         Cmd.LMAExpr = readParenExpr();
399b579c439SRui Ueyama       else if (consume("FLAGS"))
4000ae2c24cSRui Ueyama         Cmd.Flags = readParenExpr()().getValue();
401b579c439SRui Ueyama       else
402b579c439SRui Ueyama         setError("unexpected header attribute: " + next());
403b579c439SRui Ueyama     }
4040ae2c24cSRui Ueyama 
405ac27de9dSRui Ueyama     Script->PhdrsCommands.push_back(Cmd);
4062ec34544SRui Ueyama   }
4072ec34544SRui Ueyama }
4082ec34544SRui Ueyama 
4095f37541cSGeorge Rimar void ScriptParser::readRegionAlias() {
4105f37541cSGeorge Rimar   expect("(");
4115f37541cSGeorge Rimar   StringRef Alias = unquote(next());
4125f37541cSGeorge Rimar   expect(",");
4135f37541cSGeorge Rimar   StringRef Name = next();
4145f37541cSGeorge Rimar   expect(")");
4155f37541cSGeorge Rimar 
416ac27de9dSRui Ueyama   if (Script->MemoryRegions.count(Alias))
4175f37541cSGeorge Rimar     setError("redefinition of memory region '" + Alias + "'");
418ac27de9dSRui Ueyama   if (!Script->MemoryRegions.count(Name))
4195f37541cSGeorge Rimar     setError("memory region '" + Name + "' is not defined");
4208c825db2SGeorge Rimar   Script->MemoryRegions.insert({Alias, Script->MemoryRegions[Name]});
4215f37541cSGeorge Rimar }
4225f37541cSGeorge Rimar 
4232ec34544SRui Ueyama void ScriptParser::readSearchDir() {
4242ec34544SRui Ueyama   expect("(");
4252ec34544SRui Ueyama   StringRef Tok = next();
4262ec34544SRui Ueyama   if (!Config->Nostdlib)
4272ec34544SRui Ueyama     Config->SearchPaths.push_back(unquote(Tok));
4282ec34544SRui Ueyama   expect(")");
4292ec34544SRui Ueyama }
4302ec34544SRui Ueyama 
4312ec34544SRui Ueyama void ScriptParser::readSections() {
432a323e2a7SRui Ueyama   Script->HasSectionsCommand = true;
433b579c439SRui Ueyama 
4342ec34544SRui Ueyama   // -no-rosegment is used to avoid placing read only non-executable sections in
4352ec34544SRui Ueyama   // their own segment. We do the same if SECTIONS command is present in linker
4362ec34544SRui Ueyama   // script. See comment for computeFlags().
4372ec34544SRui Ueyama   Config->SingleRoRx = true;
4382ec34544SRui Ueyama 
4392ec34544SRui Ueyama   expect("{");
4409e2c8a9dSGeorge Rimar   std::vector<BaseCommand *> V;
441b8a59c8aSBob Haarman   while (!errorCount() && !consume("}")) {
4422ec34544SRui Ueyama     StringRef Tok = next();
4432ec34544SRui Ueyama     BaseCommand *Cmd = readProvideOrAssignment(Tok);
4442ec34544SRui Ueyama     if (!Cmd) {
4452ec34544SRui Ueyama       if (Tok == "ASSERT")
44623af89ccSRui Ueyama         Cmd = readAssert();
4472ec34544SRui Ueyama       else
4482ec34544SRui Ueyama         Cmd = readOutputSectionDescription(Tok);
4492ec34544SRui Ueyama     }
4509e2c8a9dSGeorge Rimar     V.push_back(Cmd);
4512ec34544SRui Ueyama   }
4529e2c8a9dSGeorge Rimar 
4539e2c8a9dSGeorge Rimar   if (!atEOF() && consume("INSERT")) {
454796684b4SGeorge Rimar     std::vector<BaseCommand *> *Dest = nullptr;
455796684b4SGeorge Rimar     if (consume("AFTER"))
456796684b4SGeorge Rimar       Dest = &Script->InsertAfterCommands[next()];
457796684b4SGeorge Rimar     else if (consume("BEFORE"))
458796684b4SGeorge Rimar       Dest = &Script->InsertBeforeCommands[next()];
459796684b4SGeorge Rimar     else
460796684b4SGeorge Rimar       setError("expected AFTER/BEFORE, but got '" + next() + "'");
461796684b4SGeorge Rimar     if (Dest)
462796684b4SGeorge Rimar       Dest->insert(Dest->end(), V.begin(), V.end());
4639e2c8a9dSGeorge Rimar     return;
4649e2c8a9dSGeorge Rimar   }
4659e2c8a9dSGeorge Rimar 
4669e2c8a9dSGeorge Rimar   Script->SectionCommands.insert(Script->SectionCommands.end(), V.begin(),
4679e2c8a9dSGeorge Rimar                                  V.end());
4682ec34544SRui Ueyama }
4692ec34544SRui Ueyama 
4702ec34544SRui Ueyama static int precedence(StringRef Op) {
4712ec34544SRui Ueyama   return StringSwitch<int>(Op)
472*aa92fca8SRui Ueyama       .Cases("*", "/", "%", 6)
473*aa92fca8SRui Ueyama       .Cases("+", "-", 5)
474*aa92fca8SRui Ueyama       .Cases("<<", ">>", 4)
475*aa92fca8SRui Ueyama       .Cases("<", "<=", ">", ">=", "==", "!=", 3)
476*aa92fca8SRui Ueyama       .Case("&", 2)
477*aa92fca8SRui Ueyama       .Case("|", 1)
4782ec34544SRui Ueyama       .Default(-1);
4792ec34544SRui Ueyama }
4802ec34544SRui Ueyama 
4812ec34544SRui Ueyama StringMatcher ScriptParser::readFilePatterns() {
4822ec34544SRui Ueyama   std::vector<StringRef> V;
483b8a59c8aSBob Haarman   while (!errorCount() && !consume(")"))
4842ec34544SRui Ueyama     V.push_back(next());
4852ec34544SRui Ueyama   return StringMatcher(V);
4862ec34544SRui Ueyama }
4872ec34544SRui Ueyama 
4882ec34544SRui Ueyama SortSectionPolicy ScriptParser::readSortKind() {
4892ec34544SRui Ueyama   if (consume("SORT") || consume("SORT_BY_NAME"))
4902ec34544SRui Ueyama     return SortSectionPolicy::Name;
4912ec34544SRui Ueyama   if (consume("SORT_BY_ALIGNMENT"))
4922ec34544SRui Ueyama     return SortSectionPolicy::Alignment;
4932ec34544SRui Ueyama   if (consume("SORT_BY_INIT_PRIORITY"))
4942ec34544SRui Ueyama     return SortSectionPolicy::Priority;
4952ec34544SRui Ueyama   if (consume("SORT_NONE"))
4962ec34544SRui Ueyama     return SortSectionPolicy::None;
4972ec34544SRui Ueyama   return SortSectionPolicy::Default;
4982ec34544SRui Ueyama }
4992ec34544SRui Ueyama 
50003fc8d1eSRui Ueyama // Reads SECTIONS command contents in the following form:
50103fc8d1eSRui Ueyama //
50203fc8d1eSRui Ueyama // <contents> ::= <elem>*
50303fc8d1eSRui Ueyama // <elem>     ::= <exclude>? <glob-pattern>
50403fc8d1eSRui Ueyama // <exclude>  ::= "EXCLUDE_FILE" "(" <glob-pattern>+ ")"
50503fc8d1eSRui Ueyama //
50603fc8d1eSRui Ueyama // For example,
50703fc8d1eSRui Ueyama //
50803fc8d1eSRui Ueyama // *(.foo EXCLUDE_FILE (a.o) .bar EXCLUDE_FILE (b.o) .baz)
50903fc8d1eSRui Ueyama //
51003fc8d1eSRui Ueyama // is parsed as ".foo", ".bar" with "a.o", and ".baz" with "b.o".
51103fc8d1eSRui Ueyama // The semantics of that is section .foo in any file, section .bar in
51203fc8d1eSRui Ueyama // any file but a.o, and section .baz in any file but b.o.
5132ec34544SRui Ueyama std::vector<SectionPattern> ScriptParser::readInputSectionsList() {
5142ec34544SRui Ueyama   std::vector<SectionPattern> Ret;
515b8a59c8aSBob Haarman   while (!errorCount() && peek() != ")") {
5162ec34544SRui Ueyama     StringMatcher ExcludeFilePat;
5172ec34544SRui Ueyama     if (consume("EXCLUDE_FILE")) {
5182ec34544SRui Ueyama       expect("(");
5192ec34544SRui Ueyama       ExcludeFilePat = readFilePatterns();
5202ec34544SRui Ueyama     }
5212ec34544SRui Ueyama 
5222ec34544SRui Ueyama     std::vector<StringRef> V;
523b8a59c8aSBob Haarman     while (!errorCount() && peek() != ")" && peek() != "EXCLUDE_FILE")
5242ec34544SRui Ueyama       V.push_back(next());
5252ec34544SRui Ueyama 
5262ec34544SRui Ueyama     if (!V.empty())
5272ec34544SRui Ueyama       Ret.push_back({std::move(ExcludeFilePat), StringMatcher(V)});
5282ec34544SRui Ueyama     else
5292ec34544SRui Ueyama       setError("section pattern is expected");
5302ec34544SRui Ueyama   }
5312ec34544SRui Ueyama   return Ret;
5322ec34544SRui Ueyama }
5332ec34544SRui Ueyama 
5342ec34544SRui Ueyama // Reads contents of "SECTIONS" directive. That directive contains a
5352ec34544SRui Ueyama // list of glob patterns for input sections. The grammar is as follows.
5362ec34544SRui Ueyama //
5372ec34544SRui Ueyama // <patterns> ::= <section-list>
5382ec34544SRui Ueyama //              | <sort> "(" <section-list> ")"
5392ec34544SRui Ueyama //              | <sort> "(" <sort> "(" <section-list> ")" ")"
5402ec34544SRui Ueyama //
5412ec34544SRui Ueyama // <sort>     ::= "SORT" | "SORT_BY_NAME" | "SORT_BY_ALIGNMENT"
5422ec34544SRui Ueyama //              | "SORT_BY_INIT_PRIORITY" | "SORT_NONE"
5432ec34544SRui Ueyama //
5442ec34544SRui Ueyama // <section-list> is parsed by readInputSectionsList().
5452ec34544SRui Ueyama InputSectionDescription *
5462ec34544SRui Ueyama ScriptParser::readInputSectionRules(StringRef FilePattern) {
5472ec34544SRui Ueyama   auto *Cmd = make<InputSectionDescription>(FilePattern);
5482ec34544SRui Ueyama   expect("(");
5492ec34544SRui Ueyama 
550b8a59c8aSBob Haarman   while (!errorCount() && !consume(")")) {
5512ec34544SRui Ueyama     SortSectionPolicy Outer = readSortKind();
5522ec34544SRui Ueyama     SortSectionPolicy Inner = SortSectionPolicy::Default;
5532ec34544SRui Ueyama     std::vector<SectionPattern> V;
5542ec34544SRui Ueyama     if (Outer != SortSectionPolicy::Default) {
5552ec34544SRui Ueyama       expect("(");
5562ec34544SRui Ueyama       Inner = readSortKind();
5572ec34544SRui Ueyama       if (Inner != SortSectionPolicy::Default) {
5582ec34544SRui Ueyama         expect("(");
5592ec34544SRui Ueyama         V = readInputSectionsList();
5602ec34544SRui Ueyama         expect(")");
5612ec34544SRui Ueyama       } else {
5622ec34544SRui Ueyama         V = readInputSectionsList();
5632ec34544SRui Ueyama       }
5642ec34544SRui Ueyama       expect(")");
5652ec34544SRui Ueyama     } else {
5662ec34544SRui Ueyama       V = readInputSectionsList();
5672ec34544SRui Ueyama     }
5682ec34544SRui Ueyama 
5692ec34544SRui Ueyama     for (SectionPattern &Pat : V) {
5702ec34544SRui Ueyama       Pat.SortInner = Inner;
5712ec34544SRui Ueyama       Pat.SortOuter = Outer;
5722ec34544SRui Ueyama     }
5732ec34544SRui Ueyama 
5742ec34544SRui Ueyama     std::move(V.begin(), V.end(), std::back_inserter(Cmd->SectionPatterns));
5752ec34544SRui Ueyama   }
5762ec34544SRui Ueyama   return Cmd;
5772ec34544SRui Ueyama }
5782ec34544SRui Ueyama 
5792ec34544SRui Ueyama InputSectionDescription *
5802ec34544SRui Ueyama ScriptParser::readInputSectionDescription(StringRef Tok) {
5812ec34544SRui Ueyama   // Input section wildcard can be surrounded by KEEP.
5822ec34544SRui Ueyama   // https://sourceware.org/binutils/docs/ld/Input-Section-Keep.html#Input-Section-Keep
5832ec34544SRui Ueyama   if (Tok == "KEEP") {
5842ec34544SRui Ueyama     expect("(");
5852ec34544SRui Ueyama     StringRef FilePattern = next();
5862ec34544SRui Ueyama     InputSectionDescription *Cmd = readInputSectionRules(FilePattern);
5872ec34544SRui Ueyama     expect(")");
588ac27de9dSRui Ueyama     Script->KeptSections.push_back(Cmd);
5892ec34544SRui Ueyama     return Cmd;
5902ec34544SRui Ueyama   }
5912ec34544SRui Ueyama   return readInputSectionRules(Tok);
5922ec34544SRui Ueyama }
5932ec34544SRui Ueyama 
5942ec34544SRui Ueyama void ScriptParser::readSort() {
5952ec34544SRui Ueyama   expect("(");
5962ec34544SRui Ueyama   expect("CONSTRUCTORS");
5972ec34544SRui Ueyama   expect(")");
5982ec34544SRui Ueyama }
5992ec34544SRui Ueyama 
60023af89ccSRui Ueyama AssertCommand *ScriptParser::readAssert() {
60123af89ccSRui Ueyama   return make<AssertCommand>(readAssertExpr());
60223af89ccSRui Ueyama }
60323af89ccSRui Ueyama 
60423af89ccSRui Ueyama Expr ScriptParser::readAssertExpr() {
6052ec34544SRui Ueyama   expect("(");
6062ec34544SRui Ueyama   Expr E = readExpr();
6072ec34544SRui Ueyama   expect(",");
6082ec34544SRui Ueyama   StringRef Msg = unquote(next());
6092ec34544SRui Ueyama   expect(")");
610b579c439SRui Ueyama 
6112ec34544SRui Ueyama   return [=] {
6122ec34544SRui Ueyama     if (!E().getValue())
6132ec34544SRui Ueyama       error(Msg);
6142ec34544SRui Ueyama     return Script->getDot();
6152ec34544SRui Ueyama   };
6162ec34544SRui Ueyama }
6172ec34544SRui Ueyama 
6182ec34544SRui Ueyama // Reads a FILL(expr) command. We handle the FILL command as an
6192ec34544SRui Ueyama // alias for =fillexp section attribute, which is different from
6202ec34544SRui Ueyama // what GNU linkers do.
6212ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Data.html
6222ec34544SRui Ueyama uint32_t ScriptParser::readFill() {
6232ec34544SRui Ueyama   expect("(");
6248acbf1ccSRui Ueyama   uint32_t V = parseFill(next());
6252ec34544SRui Ueyama   expect(")");
6262ec34544SRui Ueyama   return V;
6272ec34544SRui Ueyama }
6282ec34544SRui Ueyama 
6291c08e9f5SGeorge Rimar // Reads an expression and/or the special directive for an output
6301c08e9f5SGeorge Rimar // section definition. Directive is one of following: "(NOLOAD)",
6311c08e9f5SGeorge Rimar // "(COPY)", "(INFO)" or "(OVERLAY)".
6323271d370SRui Ueyama //
6333271d370SRui Ueyama // An output section name can be followed by an address expression
6341c08e9f5SGeorge Rimar // and/or directive. This grammar is not LL(1) because "(" can be
63597f4d158SGeorge Rimar // interpreted as either the beginning of some expression or beginning
6361c08e9f5SGeorge Rimar // of directive.
6373271d370SRui Ueyama //
638b579c439SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Address.html
639fbb0463fSGeorge Rimar // https://sourceware.org/binutils/docs/ld/Output-Section-Type.html
6408c022ca7SRafael Espindola void ScriptParser::readSectionAddressType(OutputSection *Cmd) {
6413271d370SRui Ueyama   if (consume("(")) {
6423271d370SRui Ueyama     if (consume("NOLOAD")) {
6433271d370SRui Ueyama       expect(")");
6443271d370SRui Ueyama       Cmd->Noload = true;
6453271d370SRui Ueyama       return;
6463271d370SRui Ueyama     }
6471c08e9f5SGeorge Rimar     if (consume("COPY") || consume("INFO") || consume("OVERLAY")) {
6481c08e9f5SGeorge Rimar       expect(")");
6491c08e9f5SGeorge Rimar       Cmd->NonAlloc = true;
6501c08e9f5SGeorge Rimar       return;
6511c08e9f5SGeorge Rimar     }
6523271d370SRui Ueyama     Cmd->AddrExpr = readExpr();
6533271d370SRui Ueyama     expect(")");
6543271d370SRui Ueyama   } else {
6553271d370SRui Ueyama     Cmd->AddrExpr = readExpr();
6563271d370SRui Ueyama   }
6573271d370SRui Ueyama 
658fbb0463fSGeorge Rimar   if (consume("(")) {
659fbb0463fSGeorge Rimar     expect("NOLOAD");
660fbb0463fSGeorge Rimar     expect(")");
661fbb0463fSGeorge Rimar     Cmd->Noload = true;
662fbb0463fSGeorge Rimar   }
663fbb0463fSGeorge Rimar }
664fbb0463fSGeorge Rimar 
665f22ec9ddSGeorge Rimar static Expr checkAlignment(Expr E, std::string &Loc) {
666f22ec9ddSGeorge Rimar   return [=] {
667f22ec9ddSGeorge Rimar     uint64_t Alignment = std::max((uint64_t)1, E().getValue());
668f22ec9ddSGeorge Rimar     if (!isPowerOf2_64(Alignment)) {
669f22ec9ddSGeorge Rimar       error(Loc + ": alignment must be power of 2");
670f22ec9ddSGeorge Rimar       return (uint64_t)1; // Return a dummy value.
671f22ec9ddSGeorge Rimar     }
672f22ec9ddSGeorge Rimar     return Alignment;
673f22ec9ddSGeorge Rimar   };
674f22ec9ddSGeorge Rimar }
675f22ec9ddSGeorge Rimar 
6768c022ca7SRafael Espindola OutputSection *ScriptParser::readOutputSectionDescription(StringRef OutSec) {
6778c022ca7SRafael Espindola   OutputSection *Cmd =
6788c022ca7SRafael Espindola       Script->createOutputSection(OutSec, getCurrentLocation());
6793271d370SRui Ueyama 
680c4df670dSGeorge Rimar   size_t SymbolsReferenced = Script->ReferencedSymbols.size();
681c4df670dSGeorge Rimar 
6823271d370SRui Ueyama   if (peek() != ":")
6833271d370SRui Ueyama     readSectionAddressType(Cmd);
6842ec34544SRui Ueyama   expect(":");
6852ec34544SRui Ueyama 
686f22ec9ddSGeorge Rimar   std::string Location = getCurrentLocation();
6872ec34544SRui Ueyama   if (consume("AT"))
6882ec34544SRui Ueyama     Cmd->LMAExpr = readParenExpr();
6892ec34544SRui Ueyama   if (consume("ALIGN"))
690f22ec9ddSGeorge Rimar     Cmd->AlignExpr = checkAlignment(readParenExpr(), Location);
6912ec34544SRui Ueyama   if (consume("SUBALIGN"))
692f22ec9ddSGeorge Rimar     Cmd->SubalignExpr = checkAlignment(readParenExpr(), Location);
6932ec34544SRui Ueyama 
6942ec34544SRui Ueyama   // Parse constraints.
6952ec34544SRui Ueyama   if (consume("ONLY_IF_RO"))
6962ec34544SRui Ueyama     Cmd->Constraint = ConstraintKind::ReadOnly;
6972ec34544SRui Ueyama   if (consume("ONLY_IF_RW"))
6982ec34544SRui Ueyama     Cmd->Constraint = ConstraintKind::ReadWrite;
6992ec34544SRui Ueyama   expect("{");
7002ec34544SRui Ueyama 
701b8a59c8aSBob Haarman   while (!errorCount() && !consume("}")) {
7022ec34544SRui Ueyama     StringRef Tok = next();
7032ec34544SRui Ueyama     if (Tok == ";") {
7042ec34544SRui Ueyama       // Empty commands are allowed. Do nothing here.
705b579c439SRui Ueyama     } else if (SymbolAssignment *Assign = readProvideOrAssignment(Tok)) {
7066b394caaSRui Ueyama       Cmd->SectionCommands.push_back(Assign);
707f0403c60SRui Ueyama     } else if (ByteCommand *Data = readByteCommand(Tok)) {
7086b394caaSRui Ueyama       Cmd->SectionCommands.push_back(Data);
7092ec34544SRui Ueyama     } else if (Tok == "ASSERT") {
7106b394caaSRui Ueyama       Cmd->SectionCommands.push_back(readAssert());
7112ec34544SRui Ueyama       expect(";");
7122ec34544SRui Ueyama     } else if (Tok == "CONSTRUCTORS") {
7132ec34544SRui Ueyama       // CONSTRUCTORS is a keyword to make the linker recognize C++ ctors/dtors
7142ec34544SRui Ueyama       // by name. This is for very old file formats such as ECOFF/XCOFF.
7152ec34544SRui Ueyama       // For ELF, we should ignore.
7162ec34544SRui Ueyama     } else if (Tok == "FILL") {
7172ec34544SRui Ueyama       Cmd->Filler = readFill();
7182ec34544SRui Ueyama     } else if (Tok == "SORT") {
7192ec34544SRui Ueyama       readSort();
7202ec34544SRui Ueyama     } else if (peek() == "(") {
7216b394caaSRui Ueyama       Cmd->SectionCommands.push_back(readInputSectionDescription(Tok));
7222ec34544SRui Ueyama     } else {
7232ec34544SRui Ueyama       setError("unknown command " + Tok);
7242ec34544SRui Ueyama     }
7252ec34544SRui Ueyama   }
7262ec34544SRui Ueyama 
7272ec34544SRui Ueyama   if (consume(">"))
7282ec34544SRui Ueyama     Cmd->MemoryRegionName = next();
7292ec34544SRui Ueyama 
7305d01a8beSGeorge Rimar   if (consume("AT")) {
7315d01a8beSGeorge Rimar     expect(">");
7325d01a8beSGeorge Rimar     Cmd->LMARegionName = next();
7335d01a8beSGeorge Rimar   }
7345d01a8beSGeorge Rimar 
7355d01a8beSGeorge Rimar   if (Cmd->LMAExpr && !Cmd->LMARegionName.empty())
7365d01a8beSGeorge Rimar     error("section can't have both LMA and a load region");
7375d01a8beSGeorge Rimar 
7382ec34544SRui Ueyama   Cmd->Phdrs = readOutputSectionPhdrs();
7392ec34544SRui Ueyama 
7402ec34544SRui Ueyama   if (consume("="))
7418acbf1ccSRui Ueyama     Cmd->Filler = parseFill(next());
7422ec34544SRui Ueyama   else if (peek().startswith("="))
7438acbf1ccSRui Ueyama     Cmd->Filler = parseFill(next().drop_front());
7442ec34544SRui Ueyama 
7452ec34544SRui Ueyama   // Consume optional comma following output section command.
7462ec34544SRui Ueyama   consume(",");
7472ec34544SRui Ueyama 
748c4df670dSGeorge Rimar   if (Script->ReferencedSymbols.size() > SymbolsReferenced)
749c4df670dSGeorge Rimar     Cmd->ExpressionsUseSymbols = true;
7502ec34544SRui Ueyama   return Cmd;
7512ec34544SRui Ueyama }
7522ec34544SRui Ueyama 
7538acbf1ccSRui Ueyama // Parses a given string as a octal/decimal/hexadecimal number and
7548acbf1ccSRui Ueyama // returns it as a big-endian number. Used for `=<fillexp>`.
7552ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Fill.html
7562ec34544SRui Ueyama //
7578acbf1ccSRui Ueyama // When reading a hexstring, ld.bfd handles it as a blob of arbitrary
7588acbf1ccSRui Ueyama // size, while ld.gold always handles it as a 32-bit big-endian number.
7598acbf1ccSRui Ueyama // We are compatible with ld.gold because it's easier to implement.
7608acbf1ccSRui Ueyama uint32_t ScriptParser::parseFill(StringRef Tok) {
761b58079d4SRui Ueyama   uint32_t V = 0;
762ab94768cSGeorge Rimar   if (!to_integer(Tok, V))
7632ec34544SRui Ueyama     setError("invalid filler expression: " + Tok);
764b58079d4SRui Ueyama 
765b58079d4SRui Ueyama   uint32_t Buf;
766b58079d4SRui Ueyama   write32be(&Buf, V);
767b58079d4SRui Ueyama   return Buf;
7682ec34544SRui Ueyama }
7692ec34544SRui Ueyama 
7702ec34544SRui Ueyama SymbolAssignment *ScriptParser::readProvideHidden(bool Provide, bool Hidden) {
7712ec34544SRui Ueyama   expect("(");
7722ec34544SRui Ueyama   SymbolAssignment *Cmd = readAssignment(next());
7732ec34544SRui Ueyama   Cmd->Provide = Provide;
7742ec34544SRui Ueyama   Cmd->Hidden = Hidden;
7752ec34544SRui Ueyama   expect(")");
7762ec34544SRui Ueyama   expect(";");
7772ec34544SRui Ueyama   return Cmd;
7782ec34544SRui Ueyama }
7792ec34544SRui Ueyama 
7802ec34544SRui Ueyama SymbolAssignment *ScriptParser::readProvideOrAssignment(StringRef Tok) {
7812ec34544SRui Ueyama   SymbolAssignment *Cmd = nullptr;
7822ec34544SRui Ueyama   if (peek() == "=" || peek() == "+=") {
7832ec34544SRui Ueyama     Cmd = readAssignment(Tok);
7842ec34544SRui Ueyama     expect(";");
7852ec34544SRui Ueyama   } else if (Tok == "PROVIDE") {
7862ec34544SRui Ueyama     Cmd = readProvideHidden(true, false);
7872ec34544SRui Ueyama   } else if (Tok == "HIDDEN") {
7882ec34544SRui Ueyama     Cmd = readProvideHidden(false, true);
7892ec34544SRui Ueyama   } else if (Tok == "PROVIDE_HIDDEN") {
7902ec34544SRui Ueyama     Cmd = readProvideHidden(true, true);
7912ec34544SRui Ueyama   }
7922ec34544SRui Ueyama   return Cmd;
7932ec34544SRui Ueyama }
7942ec34544SRui Ueyama 
7952ec34544SRui Ueyama SymbolAssignment *ScriptParser::readAssignment(StringRef Name) {
79684bcabcbSGeorge Rimar   size_t OldPos = Pos;
7972ec34544SRui Ueyama   StringRef Op = next();
7982ec34544SRui Ueyama   assert(Op == "=" || Op == "+=");
7992ec34544SRui Ueyama   Expr E = readExpr();
8002ec34544SRui Ueyama   if (Op == "+=") {
8012ec34544SRui Ueyama     std::string Loc = getCurrentLocation();
802722221f5SRui Ueyama     E = [=] { return add(Script->getSymbolValue(Name, Loc), E()); };
8032ec34544SRui Ueyama   }
80484bcabcbSGeorge Rimar 
80584bcabcbSGeorge Rimar   std::string CommandString =
80684bcabcbSGeorge Rimar       Name.str() + " " +
80784bcabcbSGeorge Rimar       llvm::join(Tokens.begin() + OldPos, Tokens.begin() + Pos, " ");
80884bcabcbSGeorge Rimar   return make<SymbolAssignment>(Name, E, getCurrentLocation(), CommandString);
8092ec34544SRui Ueyama }
8102ec34544SRui Ueyama 
8112ec34544SRui Ueyama // This is an operator-precedence parser to parse a linker
8122ec34544SRui Ueyama // script expression.
8132ec34544SRui Ueyama Expr ScriptParser::readExpr() {
8142ec34544SRui Ueyama   // Our lexer is context-aware. Set the in-expression bit so that
8152ec34544SRui Ueyama   // they apply different tokenization rules.
8162ec34544SRui Ueyama   bool Orig = InExpr;
8172ec34544SRui Ueyama   InExpr = true;
8182ec34544SRui Ueyama   Expr E = readExpr1(readPrimary(), 0);
8192ec34544SRui Ueyama   InExpr = Orig;
8202ec34544SRui Ueyama   return E;
8212ec34544SRui Ueyama }
8222ec34544SRui Ueyama 
8237b91e213SGeorge Rimar Expr ScriptParser::combine(StringRef Op, Expr L, Expr R) {
8242ec34544SRui Ueyama   if (Op == "+")
8252ec34544SRui Ueyama     return [=] { return add(L(), R()); };
8262ec34544SRui Ueyama   if (Op == "-")
8272ec34544SRui Ueyama     return [=] { return sub(L(), R()); };
828b579c439SRui Ueyama   if (Op == "*")
8291d20222aSRui Ueyama     return [=] { return L().getValue() * R().getValue(); };
8307b91e213SGeorge Rimar   if (Op == "/") {
8317b91e213SGeorge Rimar     std::string Loc = getCurrentLocation();
8327b91e213SGeorge Rimar     return [=]() -> uint64_t {
8337b91e213SGeorge Rimar       if (uint64_t RV = R().getValue())
8347b91e213SGeorge Rimar         return L().getValue() / RV;
8357b91e213SGeorge Rimar       error(Loc + ": division by zero");
836067617f9SRui Ueyama       return 0;
8377b91e213SGeorge Rimar     };
8387b91e213SGeorge Rimar   }
8397b91e213SGeorge Rimar   if (Op == "%") {
8407b91e213SGeorge Rimar     std::string Loc = getCurrentLocation();
8417b91e213SGeorge Rimar     return [=]() -> uint64_t {
8427b91e213SGeorge Rimar       if (uint64_t RV = R().getValue())
8437b91e213SGeorge Rimar         return L().getValue() % RV;
8447b91e213SGeorge Rimar       error(Loc + ": modulo by zero");
845067617f9SRui Ueyama       return 0;
8467b91e213SGeorge Rimar     };
8477b91e213SGeorge Rimar   }
8482ec34544SRui Ueyama   if (Op == "<<")
8497e915511SRui Ueyama     return [=] { return L().getValue() << R().getValue(); };
8502ec34544SRui Ueyama   if (Op == ">>")
8517e915511SRui Ueyama     return [=] { return L().getValue() >> R().getValue(); };
8522ec34544SRui Ueyama   if (Op == "<")
8532ec34544SRui Ueyama     return [=] { return L().getValue() < R().getValue(); };
8542ec34544SRui Ueyama   if (Op == ">")
8552ec34544SRui Ueyama     return [=] { return L().getValue() > R().getValue(); };
8562ec34544SRui Ueyama   if (Op == ">=")
8572ec34544SRui Ueyama     return [=] { return L().getValue() >= R().getValue(); };
8582ec34544SRui Ueyama   if (Op == "<=")
8592ec34544SRui Ueyama     return [=] { return L().getValue() <= R().getValue(); };
8602ec34544SRui Ueyama   if (Op == "==")
8612ec34544SRui Ueyama     return [=] { return L().getValue() == R().getValue(); };
8622ec34544SRui Ueyama   if (Op == "!=")
8632ec34544SRui Ueyama     return [=] { return L().getValue() != R().getValue(); };
8642ec34544SRui Ueyama   if (Op == "&")
8652ec34544SRui Ueyama     return [=] { return bitAnd(L(), R()); };
8662ec34544SRui Ueyama   if (Op == "|")
8672ec34544SRui Ueyama     return [=] { return bitOr(L(), R()); };
8682ec34544SRui Ueyama   llvm_unreachable("invalid operator");
8692ec34544SRui Ueyama }
8702ec34544SRui Ueyama 
8712ec34544SRui Ueyama // This is a part of the operator-precedence parser. This function
8722ec34544SRui Ueyama // assumes that the remaining token stream starts with an operator.
8732ec34544SRui Ueyama Expr ScriptParser::readExpr1(Expr Lhs, int MinPrec) {
874b8a59c8aSBob Haarman   while (!atEOF() && !errorCount()) {
8752ec34544SRui Ueyama     // Read an operator and an expression.
8762ec34544SRui Ueyama     if (consume("?"))
8772ec34544SRui Ueyama       return readTernary(Lhs);
8782ec34544SRui Ueyama     StringRef Op1 = peek();
8792ec34544SRui Ueyama     if (precedence(Op1) < MinPrec)
8802ec34544SRui Ueyama       break;
8812ec34544SRui Ueyama     skip();
8822ec34544SRui Ueyama     Expr Rhs = readPrimary();
8832ec34544SRui Ueyama 
8842ec34544SRui Ueyama     // Evaluate the remaining part of the expression first if the
8852ec34544SRui Ueyama     // next operator has greater precedence than the previous one.
8862ec34544SRui Ueyama     // For example, if we have read "+" and "3", and if the next
8872ec34544SRui Ueyama     // operator is "*", then we'll evaluate 3 * ... part first.
8882ec34544SRui Ueyama     while (!atEOF()) {
8892ec34544SRui Ueyama       StringRef Op2 = peek();
8902ec34544SRui Ueyama       if (precedence(Op2) <= precedence(Op1))
8912ec34544SRui Ueyama         break;
8922ec34544SRui Ueyama       Rhs = readExpr1(Rhs, precedence(Op2));
8932ec34544SRui Ueyama     }
8942ec34544SRui Ueyama 
8952ec34544SRui Ueyama     Lhs = combine(Op1, Lhs, Rhs);
8962ec34544SRui Ueyama   }
8972ec34544SRui Ueyama   return Lhs;
8982ec34544SRui Ueyama }
8992ec34544SRui Ueyama 
9005fb17128SGeorge Rimar Expr ScriptParser::getPageSize() {
9015fb17128SGeorge Rimar   std::string Location = getCurrentLocation();
9025fb17128SGeorge Rimar   return [=]() -> uint64_t {
9035fb17128SGeorge Rimar     if (Target)
9042ec34544SRui Ueyama       return Target->PageSize;
9055fb17128SGeorge Rimar     error(Location + ": unable to calculate page size");
9065fb17128SGeorge Rimar     return 4096; // Return a dummy value.
9075fb17128SGeorge Rimar   };
9085fb17128SGeorge Rimar }
9095fb17128SGeorge Rimar 
9105fb17128SGeorge Rimar Expr ScriptParser::readConstant() {
9115fb17128SGeorge Rimar   StringRef S = readParenLiteral();
9125fb17128SGeorge Rimar   if (S == "COMMONPAGESIZE")
9135fb17128SGeorge Rimar     return getPageSize();
9142ec34544SRui Ueyama   if (S == "MAXPAGESIZE")
9155fb17128SGeorge Rimar     return [] { return Config->MaxPageSize; };
9165fb17128SGeorge Rimar   setError("unknown constant: " + S);
917b068b037SGeorge Rimar   return [] { return 0; };
9182ec34544SRui Ueyama }
9192ec34544SRui Ueyama 
9205c65088fSRui Ueyama // Parses Tok as an integer. It recognizes hexadecimal (prefixed with
9215c65088fSRui Ueyama // "0x" or suffixed with "H") and decimal numbers. Decimal numbers may
9225c65088fSRui Ueyama // have "K" (Ki) or "M" (Mi) suffixes.
9235c65088fSRui Ueyama static Optional<uint64_t> parseInt(StringRef Tok) {
9242ec34544SRui Ueyama   // Hexadecimal
9255c65088fSRui Ueyama   uint64_t Val;
9264092016bSRui Ueyama   if (Tok.startswith_lower("0x")) {
9274092016bSRui Ueyama     if (!to_integer(Tok.substr(2), Val, 16))
9284092016bSRui Ueyama       return None;
9295c65088fSRui Ueyama     return Val;
9304092016bSRui Ueyama   }
9314092016bSRui Ueyama   if (Tok.endswith_lower("H")) {
9324092016bSRui Ueyama     if (!to_integer(Tok.drop_back(), Val, 16))
9334092016bSRui Ueyama       return None;
9345c65088fSRui Ueyama     return Val;
9354092016bSRui Ueyama   }
9362ec34544SRui Ueyama 
9372ec34544SRui Ueyama   // Decimal
9382ec34544SRui Ueyama   if (Tok.endswith_lower("K")) {
939ab94768cSGeorge Rimar     if (!to_integer(Tok.drop_back(), Val, 10))
9405c65088fSRui Ueyama       return None;
9415c65088fSRui Ueyama     return Val * 1024;
9422ec34544SRui Ueyama   }
9435c65088fSRui Ueyama   if (Tok.endswith_lower("M")) {
944ab94768cSGeorge Rimar     if (!to_integer(Tok.drop_back(), Val, 10))
9455c65088fSRui Ueyama       return None;
9465c65088fSRui Ueyama     return Val * 1024 * 1024;
9475c65088fSRui Ueyama   }
948ab94768cSGeorge Rimar   if (!to_integer(Tok, Val, 10))
9495c65088fSRui Ueyama     return None;
9505c65088fSRui Ueyama   return Val;
9512ec34544SRui Ueyama }
9522ec34544SRui Ueyama 
953f0403c60SRui Ueyama ByteCommand *ScriptParser::readByteCommand(StringRef Tok) {
954b579c439SRui Ueyama   int Size = StringSwitch<int>(Tok)
9552ec34544SRui Ueyama                  .Case("BYTE", 1)
9562ec34544SRui Ueyama                  .Case("SHORT", 2)
9572ec34544SRui Ueyama                  .Case("LONG", 4)
9582ec34544SRui Ueyama                  .Case("QUAD", 8)
9592ec34544SRui Ueyama                  .Default(-1);
9602ec34544SRui Ueyama   if (Size == -1)
9612ec34544SRui Ueyama     return nullptr;
96284bcabcbSGeorge Rimar 
96384bcabcbSGeorge Rimar   size_t OldPos = Pos;
96484bcabcbSGeorge Rimar   Expr E = readParenExpr();
96584bcabcbSGeorge Rimar   std::string CommandString =
96684bcabcbSGeorge Rimar       Tok.str() + " " +
96784bcabcbSGeorge Rimar       llvm::join(Tokens.begin() + OldPos, Tokens.begin() + Pos, " ");
96884bcabcbSGeorge Rimar   return make<ByteCommand>(E, Size, CommandString);
9692ec34544SRui Ueyama }
9702ec34544SRui Ueyama 
9712ec34544SRui Ueyama StringRef ScriptParser::readParenLiteral() {
9722ec34544SRui Ueyama   expect("(");
9735e9c7762SRafael Espindola   bool Orig = InExpr;
9745e9c7762SRafael Espindola   InExpr = false;
9752ec34544SRui Ueyama   StringRef Tok = next();
9765e9c7762SRafael Espindola   InExpr = Orig;
9772ec34544SRui Ueyama   expect(")");
9782ec34544SRui Ueyama   return Tok;
9792ec34544SRui Ueyama }
9802ec34544SRui Ueyama 
981617e2f98SRui Ueyama static void checkIfExists(OutputSection *Cmd, StringRef Location) {
98205c4f67cSRafael Espindola   if (Cmd->Location.empty() && Script->ErrorOnMissingSection)
98305c4f67cSRafael Espindola     error(Location + ": undefined section " + Cmd->Name);
98405c4f67cSRafael Espindola }
98505c4f67cSRafael Espindola 
9862ec34544SRui Ueyama Expr ScriptParser::readPrimary() {
9872ec34544SRui Ueyama   if (peek() == "(")
9882ec34544SRui Ueyama     return readParenExpr();
9892ec34544SRui Ueyama 
9905c65088fSRui Ueyama   if (consume("~")) {
9912ec34544SRui Ueyama     Expr E = readPrimary();
992b2fb84a1SRui Ueyama     return [=] { return ~E().getValue(); };
9932ec34544SRui Ueyama   }
9946f1d954eSHafiz Abid Qadeer   if (consume("!")) {
9956f1d954eSHafiz Abid Qadeer     Expr E = readPrimary();
9966f1d954eSHafiz Abid Qadeer     return [=] { return !E().getValue(); };
9976f1d954eSHafiz Abid Qadeer   }
9985c65088fSRui Ueyama   if (consume("-")) {
9992ec34544SRui Ueyama     Expr E = readPrimary();
1000b2fb84a1SRui Ueyama     return [=] { return -E().getValue(); };
10012ec34544SRui Ueyama   }
10022ec34544SRui Ueyama 
10035c65088fSRui Ueyama   StringRef Tok = next();
10045c65088fSRui Ueyama   std::string Location = getCurrentLocation();
10055c65088fSRui Ueyama 
10062ec34544SRui Ueyama   // Built-in functions are parsed here.
10072ec34544SRui Ueyama   // https://sourceware.org/binutils/docs/ld/Builtin-Functions.html.
10082ec34544SRui Ueyama   if (Tok == "ABSOLUTE") {
10092ec34544SRui Ueyama     Expr Inner = readParenExpr();
10102ec34544SRui Ueyama     return [=] {
10112ec34544SRui Ueyama       ExprValue I = Inner();
10122ec34544SRui Ueyama       I.ForceAbsolute = true;
10132ec34544SRui Ueyama       return I;
10142ec34544SRui Ueyama     };
10152ec34544SRui Ueyama   }
10162ec34544SRui Ueyama   if (Tok == "ADDR") {
10172ec34544SRui Ueyama     StringRef Name = readParenLiteral();
10184fbe3518SRui Ueyama     OutputSection *Sec = Script->getOrCreateOutputSection(Name);
101941c7ab4aSGeorge Rimar     return [=]() -> ExprValue {
10204fbe3518SRui Ueyama       checkIfExists(Sec, Location);
10214fbe3518SRui Ueyama       return {Sec, false, 0, Location};
102241c7ab4aSGeorge Rimar     };
10232ec34544SRui Ueyama   }
10242ec34544SRui Ueyama   if (Tok == "ALIGN") {
10252ec34544SRui Ueyama     expect("(");
10262ec34544SRui Ueyama     Expr E = readExpr();
1027f22ec9ddSGeorge Rimar     if (consume(")")) {
1028f22ec9ddSGeorge Rimar       E = checkAlignment(E, Location);
1029f22ec9ddSGeorge Rimar       return [=] { return alignTo(Script->getDot(), E().getValue()); };
1030f22ec9ddSGeorge Rimar     }
1031b579c439SRui Ueyama     expect(",");
1032f22ec9ddSGeorge Rimar     Expr E2 = checkAlignment(readExpr(), Location);
10332ec34544SRui Ueyama     expect(")");
10343c6de1a6SPetr Hosek     return [=] {
10353c6de1a6SPetr Hosek       ExprValue V = E();
1036f22ec9ddSGeorge Rimar       V.Alignment = E2().getValue();
10373c6de1a6SPetr Hosek       return V;
10383c6de1a6SPetr Hosek     };
10392ec34544SRui Ueyama   }
10402ec34544SRui Ueyama   if (Tok == "ALIGNOF") {
10412ec34544SRui Ueyama     StringRef Name = readParenLiteral();
10428c022ca7SRafael Espindola     OutputSection *Cmd = Script->getOrCreateOutputSection(Name);
1043617e2f98SRui Ueyama     return [=] {
1044617e2f98SRui Ueyama       checkIfExists(Cmd, Location);
1045617e2f98SRui Ueyama       return Cmd->Alignment;
1046617e2f98SRui Ueyama     };
10472ec34544SRui Ueyama   }
10482ec34544SRui Ueyama   if (Tok == "ASSERT")
104923af89ccSRui Ueyama     return readAssertExpr();
10505fb17128SGeorge Rimar   if (Tok == "CONSTANT")
10515fb17128SGeorge Rimar     return readConstant();
10522ec34544SRui Ueyama   if (Tok == "DATA_SEGMENT_ALIGN") {
10532ec34544SRui Ueyama     expect("(");
10542ec34544SRui Ueyama     Expr E = readExpr();
10552ec34544SRui Ueyama     expect(",");
10562ec34544SRui Ueyama     readExpr();
10572ec34544SRui Ueyama     expect(")");
105860833f6eSGeorge Rimar     return [=] {
105960833f6eSGeorge Rimar       return alignTo(Script->getDot(), std::max((uint64_t)1, E().getValue()));
106060833f6eSGeorge Rimar     };
10612ec34544SRui Ueyama   }
10622ec34544SRui Ueyama   if (Tok == "DATA_SEGMENT_END") {
10632ec34544SRui Ueyama     expect("(");
10642ec34544SRui Ueyama     expect(".");
10652ec34544SRui Ueyama     expect(")");
10662ec34544SRui Ueyama     return [] { return Script->getDot(); };
10672ec34544SRui Ueyama   }
10682ec34544SRui Ueyama   if (Tok == "DATA_SEGMENT_RELRO_END") {
10692ec34544SRui Ueyama     // GNU linkers implements more complicated logic to handle
10702ec34544SRui Ueyama     // DATA_SEGMENT_RELRO_END. We instead ignore the arguments and
10712ec34544SRui Ueyama     // just align to the next page boundary for simplicity.
10722ec34544SRui Ueyama     expect("(");
10732ec34544SRui Ueyama     readExpr();
10742ec34544SRui Ueyama     expect(",");
10752ec34544SRui Ueyama     readExpr();
10762ec34544SRui Ueyama     expect(")");
10775fb17128SGeorge Rimar     Expr E = getPageSize();
10785fb17128SGeorge Rimar     return [=] { return alignTo(Script->getDot(), E().getValue()); };
10792ec34544SRui Ueyama   }
10802ec34544SRui Ueyama   if (Tok == "DEFINED") {
10812ec34544SRui Ueyama     StringRef Name = readParenLiteral();
10829b18f50fSRui Ueyama     return [=] { return Symtab->find(Name) ? 1 : 0; };
10832ec34544SRui Ueyama   }
108491b95b61SRui Ueyama   if (Tok == "LENGTH") {
108591b95b61SRui Ueyama     StringRef Name = readParenLiteral();
1086b068b037SGeorge Rimar     if (Script->MemoryRegions.count(Name) == 0) {
108791b95b61SRui Ueyama       setError("memory region not defined: " + Name);
1088b068b037SGeorge Rimar       return [] { return 0; };
1089b068b037SGeorge Rimar     }
1090ac27de9dSRui Ueyama     return [=] { return Script->MemoryRegions[Name]->Length; };
109191b95b61SRui Ueyama   }
10922ec34544SRui Ueyama   if (Tok == "LOADADDR") {
10932ec34544SRui Ueyama     StringRef Name = readParenLiteral();
10948c022ca7SRafael Espindola     OutputSection *Cmd = Script->getOrCreateOutputSection(Name);
1095617e2f98SRui Ueyama     return [=] {
1096617e2f98SRui Ueyama       checkIfExists(Cmd, Location);
1097617e2f98SRui Ueyama       return Cmd->getLMA();
1098617e2f98SRui Ueyama     };
10992ec34544SRui Ueyama   }
110091b95b61SRui Ueyama   if (Tok == "ORIGIN") {
110191b95b61SRui Ueyama     StringRef Name = readParenLiteral();
1102b068b037SGeorge Rimar     if (Script->MemoryRegions.count(Name) == 0) {
110391b95b61SRui Ueyama       setError("memory region not defined: " + Name);
1104b068b037SGeorge Rimar       return [] { return 0; };
1105b068b037SGeorge Rimar     }
1106ac27de9dSRui Ueyama     return [=] { return Script->MemoryRegions[Name]->Origin; };
110791b95b61SRui Ueyama   }
11082ec34544SRui Ueyama   if (Tok == "SEGMENT_START") {
11092ec34544SRui Ueyama     expect("(");
11102ec34544SRui Ueyama     skip();
11112ec34544SRui Ueyama     expect(",");
11122ec34544SRui Ueyama     Expr E = readExpr();
11132ec34544SRui Ueyama     expect(")");
11142ec34544SRui Ueyama     return [=] { return E(); };
11152ec34544SRui Ueyama   }
11162ec34544SRui Ueyama   if (Tok == "SIZEOF") {
11172ec34544SRui Ueyama     StringRef Name = readParenLiteral();
11188c022ca7SRafael Espindola     OutputSection *Cmd = Script->getOrCreateOutputSection(Name);
111905c4f67cSRafael Espindola     // Linker script does not create an output section if its content is empty.
112005c4f67cSRafael Espindola     // We want to allow SIZEOF(.foo) where .foo is a section which happened to
112105c4f67cSRafael Espindola     // be empty.
11228c022ca7SRafael Espindola     return [=] { return Cmd->Size; };
11232ec34544SRui Ueyama   }
11242ec34544SRui Ueyama   if (Tok == "SIZEOF_HEADERS")
11252ec34544SRui Ueyama     return [=] { return elf::getHeaderSize(); };
11262ec34544SRui Ueyama 
11274eb2eccbSRui Ueyama   // Tok is the dot.
11284eb2eccbSRui Ueyama   if (Tok == ".")
1129722221f5SRui Ueyama     return [=] { return Script->getSymbolValue(Tok, Location); };
11304eb2eccbSRui Ueyama 
11312ec34544SRui Ueyama   // Tok is a literal number.
11325c65088fSRui Ueyama   if (Optional<uint64_t> Val = parseInt(Tok))
11335c65088fSRui Ueyama     return [=] { return *Val; };
11342ec34544SRui Ueyama 
11352ec34544SRui Ueyama   // Tok is a symbol name.
11362ec34544SRui Ueyama   if (!isValidCIdentifier(Tok))
11372ec34544SRui Ueyama     setError("malformed number: " + Tok);
1138ac27de9dSRui Ueyama   Script->ReferencedSymbols.push_back(Tok);
1139722221f5SRui Ueyama   return [=] { return Script->getSymbolValue(Tok, Location); };
11402ec34544SRui Ueyama }
11412ec34544SRui Ueyama 
11422ec34544SRui Ueyama Expr ScriptParser::readTernary(Expr Cond) {
11432ec34544SRui Ueyama   Expr L = readExpr();
11442ec34544SRui Ueyama   expect(":");
11452ec34544SRui Ueyama   Expr R = readExpr();
11462ec34544SRui Ueyama   return [=] { return Cond().getValue() ? L() : R(); };
11472ec34544SRui Ueyama }
11482ec34544SRui Ueyama 
11492ec34544SRui Ueyama Expr ScriptParser::readParenExpr() {
11502ec34544SRui Ueyama   expect("(");
11512ec34544SRui Ueyama   Expr E = readExpr();
11522ec34544SRui Ueyama   expect(")");
11532ec34544SRui Ueyama   return E;
11542ec34544SRui Ueyama }
11552ec34544SRui Ueyama 
11562ec34544SRui Ueyama std::vector<StringRef> ScriptParser::readOutputSectionPhdrs() {
11572ec34544SRui Ueyama   std::vector<StringRef> Phdrs;
1158b8a59c8aSBob Haarman   while (!errorCount() && peek().startswith(":")) {
11592ec34544SRui Ueyama     StringRef Tok = next();
11602ec34544SRui Ueyama     Phdrs.push_back((Tok.size() == 1) ? next() : Tok.substr(1));
11612ec34544SRui Ueyama   }
11622ec34544SRui Ueyama   return Phdrs;
11632ec34544SRui Ueyama }
11642ec34544SRui Ueyama 
11652ec34544SRui Ueyama // Read a program header type name. The next token must be a
11662ec34544SRui Ueyama // name of a program header type or a constant (e.g. "0x3").
11672ec34544SRui Ueyama unsigned ScriptParser::readPhdrType() {
11682ec34544SRui Ueyama   StringRef Tok = next();
11695c65088fSRui Ueyama   if (Optional<uint64_t> Val = parseInt(Tok))
11705c65088fSRui Ueyama     return *Val;
11712ec34544SRui Ueyama 
11722ec34544SRui Ueyama   unsigned Ret = StringSwitch<unsigned>(Tok)
11732ec34544SRui Ueyama                      .Case("PT_NULL", PT_NULL)
11742ec34544SRui Ueyama                      .Case("PT_LOAD", PT_LOAD)
11752ec34544SRui Ueyama                      .Case("PT_DYNAMIC", PT_DYNAMIC)
11762ec34544SRui Ueyama                      .Case("PT_INTERP", PT_INTERP)
11772ec34544SRui Ueyama                      .Case("PT_NOTE", PT_NOTE)
11782ec34544SRui Ueyama                      .Case("PT_SHLIB", PT_SHLIB)
11792ec34544SRui Ueyama                      .Case("PT_PHDR", PT_PHDR)
11802ec34544SRui Ueyama                      .Case("PT_TLS", PT_TLS)
11812ec34544SRui Ueyama                      .Case("PT_GNU_EH_FRAME", PT_GNU_EH_FRAME)
11822ec34544SRui Ueyama                      .Case("PT_GNU_STACK", PT_GNU_STACK)
11832ec34544SRui Ueyama                      .Case("PT_GNU_RELRO", PT_GNU_RELRO)
11842ec34544SRui Ueyama                      .Case("PT_OPENBSD_RANDOMIZE", PT_OPENBSD_RANDOMIZE)
11852ec34544SRui Ueyama                      .Case("PT_OPENBSD_WXNEEDED", PT_OPENBSD_WXNEEDED)
11862ec34544SRui Ueyama                      .Case("PT_OPENBSD_BOOTDATA", PT_OPENBSD_BOOTDATA)
11872ec34544SRui Ueyama                      .Default(-1);
11882ec34544SRui Ueyama 
11892ec34544SRui Ueyama   if (Ret == (unsigned)-1) {
11902ec34544SRui Ueyama     setError("invalid program header type: " + Tok);
11912ec34544SRui Ueyama     return PT_NULL;
11922ec34544SRui Ueyama   }
11932ec34544SRui Ueyama   return Ret;
11942ec34544SRui Ueyama }
11952ec34544SRui Ueyama 
11962ec34544SRui Ueyama // Reads an anonymous version declaration.
11972ec34544SRui Ueyama void ScriptParser::readAnonymousDeclaration() {
11982ec34544SRui Ueyama   std::vector<SymbolVersion> Locals;
11992ec34544SRui Ueyama   std::vector<SymbolVersion> Globals;
12002ec34544SRui Ueyama   std::tie(Locals, Globals) = readSymbols();
12012ec34544SRui Ueyama 
12022ec34544SRui Ueyama   for (SymbolVersion V : Locals) {
12032ec34544SRui Ueyama     if (V.Name == "*")
12042ec34544SRui Ueyama       Config->DefaultSymbolVersion = VER_NDX_LOCAL;
12052ec34544SRui Ueyama     else
12062ec34544SRui Ueyama       Config->VersionScriptLocals.push_back(V);
12072ec34544SRui Ueyama   }
12082ec34544SRui Ueyama 
12092ec34544SRui Ueyama   for (SymbolVersion V : Globals)
12102ec34544SRui Ueyama     Config->VersionScriptGlobals.push_back(V);
12112ec34544SRui Ueyama 
12122ec34544SRui Ueyama   expect(";");
12132ec34544SRui Ueyama }
12142ec34544SRui Ueyama 
12152ec34544SRui Ueyama // Reads a non-anonymous version definition,
12162ec34544SRui Ueyama // e.g. "VerStr { global: foo; bar; local: *; };".
12172ec34544SRui Ueyama void ScriptParser::readVersionDeclaration(StringRef VerStr) {
12182ec34544SRui Ueyama   // Read a symbol list.
12192ec34544SRui Ueyama   std::vector<SymbolVersion> Locals;
12202ec34544SRui Ueyama   std::vector<SymbolVersion> Globals;
12212ec34544SRui Ueyama   std::tie(Locals, Globals) = readSymbols();
12222ec34544SRui Ueyama 
12232ec34544SRui Ueyama   for (SymbolVersion V : Locals) {
12242ec34544SRui Ueyama     if (V.Name == "*")
12252ec34544SRui Ueyama       Config->DefaultSymbolVersion = VER_NDX_LOCAL;
12262ec34544SRui Ueyama     else
12272ec34544SRui Ueyama       Config->VersionScriptLocals.push_back(V);
12282ec34544SRui Ueyama   }
12292ec34544SRui Ueyama 
12302ec34544SRui Ueyama   // Create a new version definition and add that to the global symbols.
12312ec34544SRui Ueyama   VersionDefinition Ver;
12322ec34544SRui Ueyama   Ver.Name = VerStr;
12332ec34544SRui Ueyama   Ver.Globals = Globals;
12342ec34544SRui Ueyama 
12352ec34544SRui Ueyama   // User-defined version number starts from 2 because 0 and 1 are
12362ec34544SRui Ueyama   // reserved for VER_NDX_LOCAL and VER_NDX_GLOBAL, respectively.
12372ec34544SRui Ueyama   Ver.Id = Config->VersionDefinitions.size() + 2;
12382ec34544SRui Ueyama   Config->VersionDefinitions.push_back(Ver);
12392ec34544SRui Ueyama 
12402ec34544SRui Ueyama   // Each version may have a parent version. For example, "Ver2"
12412ec34544SRui Ueyama   // defined as "Ver2 { global: foo; local: *; } Ver1;" has "Ver1"
12422ec34544SRui Ueyama   // as a parent. This version hierarchy is, probably against your
12432ec34544SRui Ueyama   // instinct, purely for hint; the runtime doesn't care about it
12442ec34544SRui Ueyama   // at all. In LLD, we simply ignore it.
12452ec34544SRui Ueyama   if (peek() != ";")
12462ec34544SRui Ueyama     skip();
12472ec34544SRui Ueyama   expect(";");
12482ec34544SRui Ueyama }
12492ec34544SRui Ueyama 
12501e77ad14SRui Ueyama static bool hasWildcard(StringRef S) {
12511e77ad14SRui Ueyama   return S.find_first_of("?*[") != StringRef::npos;
12521e77ad14SRui Ueyama }
12531e77ad14SRui Ueyama 
12542ec34544SRui Ueyama // Reads a list of symbols, e.g. "{ global: foo; bar; local: *; };".
12552ec34544SRui Ueyama std::pair<std::vector<SymbolVersion>, std::vector<SymbolVersion>>
12562ec34544SRui Ueyama ScriptParser::readSymbols() {
12572ec34544SRui Ueyama   std::vector<SymbolVersion> Locals;
12582ec34544SRui Ueyama   std::vector<SymbolVersion> Globals;
12592ec34544SRui Ueyama   std::vector<SymbolVersion> *V = &Globals;
12602ec34544SRui Ueyama 
1261b8a59c8aSBob Haarman   while (!errorCount()) {
12622ec34544SRui Ueyama     if (consume("}"))
12632ec34544SRui Ueyama       break;
12642ec34544SRui Ueyama     if (consumeLabel("local")) {
12652ec34544SRui Ueyama       V = &Locals;
12662ec34544SRui Ueyama       continue;
12672ec34544SRui Ueyama     }
12682ec34544SRui Ueyama     if (consumeLabel("global")) {
12692ec34544SRui Ueyama       V = &Globals;
12702ec34544SRui Ueyama       continue;
12712ec34544SRui Ueyama     }
12722ec34544SRui Ueyama 
12732ec34544SRui Ueyama     if (consume("extern")) {
12742ec34544SRui Ueyama       std::vector<SymbolVersion> Ext = readVersionExtern();
12752ec34544SRui Ueyama       V->insert(V->end(), Ext.begin(), Ext.end());
12762ec34544SRui Ueyama     } else {
12772ec34544SRui Ueyama       StringRef Tok = next();
12782ec34544SRui Ueyama       V->push_back({unquote(Tok), false, hasWildcard(Tok)});
12792ec34544SRui Ueyama     }
12802ec34544SRui Ueyama     expect(";");
12812ec34544SRui Ueyama   }
12822ec34544SRui Ueyama   return {Locals, Globals};
12832ec34544SRui Ueyama }
12842ec34544SRui Ueyama 
12852ec34544SRui Ueyama // Reads an "extern C++" directive, e.g.,
12862ec34544SRui Ueyama // "extern "C++" { ns::*; "f(int, double)"; };"
128717324d8bSRui Ueyama //
128817324d8bSRui Ueyama // The last semicolon is optional. E.g. this is OK:
128917324d8bSRui Ueyama // "extern "C++" { ns::*; "f(int, double)" };"
12902ec34544SRui Ueyama std::vector<SymbolVersion> ScriptParser::readVersionExtern() {
12912ec34544SRui Ueyama   StringRef Tok = next();
12922ec34544SRui Ueyama   bool IsCXX = Tok == "\"C++\"";
12932ec34544SRui Ueyama   if (!IsCXX && Tok != "\"C\"")
12942ec34544SRui Ueyama     setError("Unknown language");
12952ec34544SRui Ueyama   expect("{");
12962ec34544SRui Ueyama 
12972ec34544SRui Ueyama   std::vector<SymbolVersion> Ret;
1298b8a59c8aSBob Haarman   while (!errorCount() && peek() != "}") {
12992ec34544SRui Ueyama     StringRef Tok = next();
13002ec34544SRui Ueyama     bool HasWildcard = !Tok.startswith("\"") && hasWildcard(Tok);
13012ec34544SRui Ueyama     Ret.push_back({unquote(Tok), IsCXX, HasWildcard});
130217324d8bSRui Ueyama     if (consume("}"))
130317324d8bSRui Ueyama       return Ret;
13042ec34544SRui Ueyama     expect(";");
13052ec34544SRui Ueyama   }
13062ec34544SRui Ueyama 
13072ec34544SRui Ueyama   expect("}");
13082ec34544SRui Ueyama   return Ret;
13092ec34544SRui Ueyama }
13102ec34544SRui Ueyama 
13112ec34544SRui Ueyama uint64_t ScriptParser::readMemoryAssignment(StringRef S1, StringRef S2,
13122ec34544SRui Ueyama                                             StringRef S3) {
1313b579c439SRui Ueyama   if (!consume(S1) && !consume(S2) && !consume(S3)) {
13142ec34544SRui Ueyama     setError("expected one of: " + S1 + ", " + S2 + ", or " + S3);
13152ec34544SRui Ueyama     return 0;
13162ec34544SRui Ueyama   }
13172ec34544SRui Ueyama   expect("=");
1318040af7deSRui Ueyama   return readExpr()().getValue();
13192ec34544SRui Ueyama }
13202ec34544SRui Ueyama 
13212ec34544SRui Ueyama // Parse the MEMORY command as specified in:
13222ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/MEMORY.html
13232ec34544SRui Ueyama //
13242ec34544SRui Ueyama // MEMORY { name [(attr)] : ORIGIN = origin, LENGTH = len ... }
13252ec34544SRui Ueyama void ScriptParser::readMemory() {
13262ec34544SRui Ueyama   expect("{");
1327b8a59c8aSBob Haarman   while (!errorCount() && !consume("}")) {
13282ec34544SRui Ueyama     StringRef Name = next();
13292ec34544SRui Ueyama 
13302ec34544SRui Ueyama     uint32_t Flags = 0;
13312ec34544SRui Ueyama     uint32_t NegFlags = 0;
13322ec34544SRui Ueyama     if (consume("(")) {
13332ec34544SRui Ueyama       std::tie(Flags, NegFlags) = readMemoryAttributes();
13342ec34544SRui Ueyama       expect(")");
13352ec34544SRui Ueyama     }
13362ec34544SRui Ueyama     expect(":");
13372ec34544SRui Ueyama 
13382ec34544SRui Ueyama     uint64_t Origin = readMemoryAssignment("ORIGIN", "org", "o");
13392ec34544SRui Ueyama     expect(",");
13402ec34544SRui Ueyama     uint64_t Length = readMemoryAssignment("LENGTH", "len", "l");
13412ec34544SRui Ueyama 
13425f37541cSGeorge Rimar     // Add the memory region to the region map.
1343490f0a4dSRafael Espindola     MemoryRegion *MR =
1344490f0a4dSRafael Espindola         make<MemoryRegion>(Name, Origin, Length, Flags, NegFlags);
13450984cfa9SGeorge Rimar     if (!Script->MemoryRegions.insert({Name, MR}).second)
13460984cfa9SGeorge Rimar       setError("region '" + Name + "' already defined");
13472ec34544SRui Ueyama   }
13482ec34544SRui Ueyama }
13492ec34544SRui Ueyama 
13502ec34544SRui Ueyama // This function parses the attributes used to match against section
13512ec34544SRui Ueyama // flags when placing output sections in a memory region. These flags
13522ec34544SRui Ueyama // are only used when an explicit memory region name is not used.
13532ec34544SRui Ueyama std::pair<uint32_t, uint32_t> ScriptParser::readMemoryAttributes() {
13542ec34544SRui Ueyama   uint32_t Flags = 0;
13552ec34544SRui Ueyama   uint32_t NegFlags = 0;
13562ec34544SRui Ueyama   bool Invert = false;
13572ec34544SRui Ueyama 
13582ec34544SRui Ueyama   for (char C : next().lower()) {
13592ec34544SRui Ueyama     uint32_t Flag = 0;
13602ec34544SRui Ueyama     if (C == '!')
13612ec34544SRui Ueyama       Invert = !Invert;
13622ec34544SRui Ueyama     else if (C == 'w')
13632ec34544SRui Ueyama       Flag = SHF_WRITE;
13642ec34544SRui Ueyama     else if (C == 'x')
13652ec34544SRui Ueyama       Flag = SHF_EXECINSTR;
13662ec34544SRui Ueyama     else if (C == 'a')
13672ec34544SRui Ueyama       Flag = SHF_ALLOC;
13682ec34544SRui Ueyama     else if (C != 'r')
13692ec34544SRui Ueyama       setError("invalid memory region attribute");
13702ec34544SRui Ueyama 
13712ec34544SRui Ueyama     if (Invert)
13722ec34544SRui Ueyama       NegFlags |= Flag;
13732ec34544SRui Ueyama     else
13742ec34544SRui Ueyama       Flags |= Flag;
13752ec34544SRui Ueyama   }
13762ec34544SRui Ueyama   return {Flags, NegFlags};
13772ec34544SRui Ueyama }
13782ec34544SRui Ueyama 
13792ec34544SRui Ueyama void elf::readLinkerScript(MemoryBufferRef MB) {
13802ec34544SRui Ueyama   ScriptParser(MB).readLinkerScript();
13812ec34544SRui Ueyama }
13822ec34544SRui Ueyama 
13832ec34544SRui Ueyama void elf::readVersionScript(MemoryBufferRef MB) {
13842ec34544SRui Ueyama   ScriptParser(MB).readVersionScript();
13852ec34544SRui Ueyama }
13862ec34544SRui Ueyama 
13872ec34544SRui Ueyama void elf::readDynamicList(MemoryBufferRef MB) {
13882ec34544SRui Ueyama   ScriptParser(MB).readDynamicList();
13892ec34544SRui Ueyama }
13908c7e8cceSPetr Hosek 
13918c7e8cceSPetr Hosek void elf::readDefsym(StringRef Name, MemoryBufferRef MB) {
13928c7e8cceSPetr Hosek   ScriptParser(MB).readDefsym(Name);
13938c7e8cceSPetr Hosek }
1394