12ec34544SRui Ueyama //===- ScriptParser.cpp ---------------------------------------------------===//
22ec34544SRui Ueyama //
32ec34544SRui Ueyama //                             The LLVM Linker
42ec34544SRui Ueyama //
52ec34544SRui Ueyama // This file is distributed under the University of Illinois Open Source
62ec34544SRui Ueyama // License. See LICENSE.TXT for details.
72ec34544SRui Ueyama //
82ec34544SRui Ueyama //===----------------------------------------------------------------------===//
905f6b852SRui Ueyama //
// This file contains a recursive-descent parser for linker scripts.
1105f6b852SRui Ueyama // Parsed results are stored to Config and Script global objects.
1205f6b852SRui Ueyama //
1305f6b852SRui Ueyama //===----------------------------------------------------------------------===//
142ec34544SRui Ueyama 
152ec34544SRui Ueyama #include "ScriptParser.h"
162ec34544SRui Ueyama #include "Config.h"
172ec34544SRui Ueyama #include "Driver.h"
182ec34544SRui Ueyama #include "InputSection.h"
192ec34544SRui Ueyama #include "LinkerScript.h"
202ec34544SRui Ueyama #include "Memory.h"
212ec34544SRui Ueyama #include "OutputSections.h"
222ec34544SRui Ueyama #include "ScriptLexer.h"
232ec34544SRui Ueyama #include "Symbols.h"
242ec34544SRui Ueyama #include "Target.h"
252ec34544SRui Ueyama #include "llvm/ADT/SmallString.h"
262ec34544SRui Ueyama #include "llvm/ADT/StringRef.h"
272ec34544SRui Ueyama #include "llvm/ADT/StringSwitch.h"
28264b5d9eSZachary Turner #include "llvm/BinaryFormat/ELF.h"
292ec34544SRui Ueyama #include "llvm/Support/Casting.h"
302ec34544SRui Ueyama #include "llvm/Support/ErrorHandling.h"
312ec34544SRui Ueyama #include "llvm/Support/FileSystem.h"
322ec34544SRui Ueyama #include "llvm/Support/Path.h"
332ec34544SRui Ueyama #include <cassert>
342ec34544SRui Ueyama #include <limits>
352ec34544SRui Ueyama #include <vector>
362ec34544SRui Ueyama 
372ec34544SRui Ueyama using namespace llvm;
382ec34544SRui Ueyama using namespace llvm::ELF;
39b58079d4SRui Ueyama using namespace llvm::support::endian;
402ec34544SRui Ueyama using namespace lld;
412ec34544SRui Ueyama using namespace lld::elf;
422ec34544SRui Ueyama 
432ec34544SRui Ueyama static bool isUnderSysroot(StringRef Path);
442ec34544SRui Ueyama 
4596b3fe02SRui Ueyama namespace {
4696b3fe02SRui Ueyama class ScriptParser final : ScriptLexer {
472ec34544SRui Ueyama public:
482ec34544SRui Ueyama   ScriptParser(MemoryBufferRef MB)
492ec34544SRui Ueyama       : ScriptLexer(MB),
502ec34544SRui Ueyama         IsUnderSysroot(isUnderSysroot(MB.getBufferIdentifier())) {}
512ec34544SRui Ueyama 
522ec34544SRui Ueyama   void readLinkerScript();
532ec34544SRui Ueyama   void readVersionScript();
542ec34544SRui Ueyama   void readDynamicList();
552ec34544SRui Ueyama 
562ec34544SRui Ueyama private:
572ec34544SRui Ueyama   void addFile(StringRef Path);
5805c4f67cSRafael Espindola   OutputSection *checkSection(OutputSectionCommand *Cmd, StringRef Loccation);
592ec34544SRui Ueyama 
602ec34544SRui Ueyama   void readAsNeeded();
612ec34544SRui Ueyama   void readEntry();
622ec34544SRui Ueyama   void readExtern();
632ec34544SRui Ueyama   void readGroup();
642ec34544SRui Ueyama   void readInclude();
652ec34544SRui Ueyama   void readMemory();
662ec34544SRui Ueyama   void readOutput();
672ec34544SRui Ueyama   void readOutputArch();
682ec34544SRui Ueyama   void readOutputFormat();
692ec34544SRui Ueyama   void readPhdrs();
702ec34544SRui Ueyama   void readSearchDir();
712ec34544SRui Ueyama   void readSections();
722ec34544SRui Ueyama   void readVersion();
732ec34544SRui Ueyama   void readVersionScriptCommand();
742ec34544SRui Ueyama 
752ec34544SRui Ueyama   SymbolAssignment *readAssignment(StringRef Name);
762ec34544SRui Ueyama   BytesDataCommand *readBytesDataCommand(StringRef Tok);
772ec34544SRui Ueyama   uint32_t readFill();
788acbf1ccSRui Ueyama   uint32_t parseFill(StringRef Tok);
793271d370SRui Ueyama   void readSectionAddressType(OutputSectionCommand *Cmd);
802ec34544SRui Ueyama   OutputSectionCommand *readOutputSectionDescription(StringRef OutSec);
812ec34544SRui Ueyama   std::vector<StringRef> readOutputSectionPhdrs();
822ec34544SRui Ueyama   InputSectionDescription *readInputSectionDescription(StringRef Tok);
832ec34544SRui Ueyama   StringMatcher readFilePatterns();
842ec34544SRui Ueyama   std::vector<SectionPattern> readInputSectionsList();
852ec34544SRui Ueyama   InputSectionDescription *readInputSectionRules(StringRef FilePattern);
862ec34544SRui Ueyama   unsigned readPhdrType();
872ec34544SRui Ueyama   SortSectionPolicy readSortKind();
882ec34544SRui Ueyama   SymbolAssignment *readProvideHidden(bool Provide, bool Hidden);
892ec34544SRui Ueyama   SymbolAssignment *readProvideOrAssignment(StringRef Tok);
902ec34544SRui Ueyama   void readSort();
9123af89ccSRui Ueyama   AssertCommand *readAssert();
9223af89ccSRui Ueyama   Expr readAssertExpr();
932ec34544SRui Ueyama 
942ec34544SRui Ueyama   uint64_t readMemoryAssignment(StringRef, StringRef, StringRef);
952ec34544SRui Ueyama   std::pair<uint32_t, uint32_t> readMemoryAttributes();
962ec34544SRui Ueyama 
972ec34544SRui Ueyama   Expr readExpr();
982ec34544SRui Ueyama   Expr readExpr1(Expr Lhs, int MinPrec);
992ec34544SRui Ueyama   StringRef readParenLiteral();
1002ec34544SRui Ueyama   Expr readPrimary();
1012ec34544SRui Ueyama   Expr readTernary(Expr Cond);
1022ec34544SRui Ueyama   Expr readParenExpr();
1032ec34544SRui Ueyama 
1042ec34544SRui Ueyama   // For parsing version script.
1052ec34544SRui Ueyama   std::vector<SymbolVersion> readVersionExtern();
1062ec34544SRui Ueyama   void readAnonymousDeclaration();
1072ec34544SRui Ueyama   void readVersionDeclaration(StringRef VerStr);
1082ec34544SRui Ueyama 
1092ec34544SRui Ueyama   std::pair<std::vector<SymbolVersion>, std::vector<SymbolVersion>>
1102ec34544SRui Ueyama   readSymbols();
1112ec34544SRui Ueyama 
1122ec34544SRui Ueyama   bool IsUnderSysroot;
1132ec34544SRui Ueyama };
11496b3fe02SRui Ueyama } // namespace
1152ec34544SRui Ueyama 
1161e77ad14SRui Ueyama static StringRef unquote(StringRef S) {
1171e77ad14SRui Ueyama   if (S.startswith("\""))
1181e77ad14SRui Ueyama     return S.substr(1, S.size() - 2);
1191e77ad14SRui Ueyama   return S;
1201e77ad14SRui Ueyama }
1211e77ad14SRui Ueyama 
1222ec34544SRui Ueyama static bool isUnderSysroot(StringRef Path) {
1232ec34544SRui Ueyama   if (Config->Sysroot == "")
1242ec34544SRui Ueyama     return false;
1252ec34544SRui Ueyama   for (; !Path.empty(); Path = sys::path::parent_path(Path))
1262ec34544SRui Ueyama     if (sys::fs::equivalent(Config->Sysroot, Path))
1272ec34544SRui Ueyama       return true;
1282ec34544SRui Ueyama   return false;
1292ec34544SRui Ueyama }
1302ec34544SRui Ueyama 
1312ec34544SRui Ueyama // Some operations only support one non absolute value. Move the
1322ec34544SRui Ueyama // absolute one to the right hand side for convenience.
1332ec34544SRui Ueyama static void moveAbsRight(ExprValue &A, ExprValue &B) {
1342ec34544SRui Ueyama   if (A.isAbsolute())
1352ec34544SRui Ueyama     std::swap(A, B);
1362ec34544SRui Ueyama   if (!B.isAbsolute())
13741c7ab4aSGeorge Rimar     error(A.Loc + ": at least one side of the expression must be absolute");
1382ec34544SRui Ueyama }
1392ec34544SRui Ueyama 
1402ec34544SRui Ueyama static ExprValue add(ExprValue A, ExprValue B) {
1412ec34544SRui Ueyama   moveAbsRight(A, B);
14241c7ab4aSGeorge Rimar   return {A.Sec, A.ForceAbsolute, A.Val + B.getValue(), A.Loc};
1432ec34544SRui Ueyama }
1442ec34544SRui Ueyama 
1452ec34544SRui Ueyama static ExprValue sub(ExprValue A, ExprValue B) {
14641c7ab4aSGeorge Rimar   return {A.Sec, A.Val - B.getValue(), A.Loc};
1472ec34544SRui Ueyama }
1482ec34544SRui Ueyama 
1492ec34544SRui Ueyama static ExprValue mul(ExprValue A, ExprValue B) {
1502ec34544SRui Ueyama   return A.getValue() * B.getValue();
1512ec34544SRui Ueyama }
1522ec34544SRui Ueyama 
1532ec34544SRui Ueyama static ExprValue div(ExprValue A, ExprValue B) {
1542ec34544SRui Ueyama   if (uint64_t BV = B.getValue())
1552ec34544SRui Ueyama     return A.getValue() / BV;
1562ec34544SRui Ueyama   error("division by zero");
1572ec34544SRui Ueyama   return 0;
1582ec34544SRui Ueyama }
1592ec34544SRui Ueyama 
1602ec34544SRui Ueyama static ExprValue bitAnd(ExprValue A, ExprValue B) {
1612ec34544SRui Ueyama   moveAbsRight(A, B);
1622ec34544SRui Ueyama   return {A.Sec, A.ForceAbsolute,
16341c7ab4aSGeorge Rimar           (A.getValue() & B.getValue()) - A.getSecAddr(), A.Loc};
1642ec34544SRui Ueyama }
1652ec34544SRui Ueyama 
1662ec34544SRui Ueyama static ExprValue bitOr(ExprValue A, ExprValue B) {
1672ec34544SRui Ueyama   moveAbsRight(A, B);
1682ec34544SRui Ueyama   return {A.Sec, A.ForceAbsolute,
16941c7ab4aSGeorge Rimar           (A.getValue() | B.getValue()) - A.getSecAddr(), A.Loc};
1702ec34544SRui Ueyama }
1712ec34544SRui Ueyama 
1722ec34544SRui Ueyama void ScriptParser::readDynamicList() {
1732ec34544SRui Ueyama   expect("{");
1742ec34544SRui Ueyama   readAnonymousDeclaration();
1752ec34544SRui Ueyama   if (!atEOF())
1762ec34544SRui Ueyama     setError("EOF expected, but got " + next());
1772ec34544SRui Ueyama }
1782ec34544SRui Ueyama 
1792ec34544SRui Ueyama void ScriptParser::readVersionScript() {
1802ec34544SRui Ueyama   readVersionScriptCommand();
1812ec34544SRui Ueyama   if (!atEOF())
1822ec34544SRui Ueyama     setError("EOF expected, but got " + next());
1832ec34544SRui Ueyama }
1842ec34544SRui Ueyama 
1852ec34544SRui Ueyama void ScriptParser::readVersionScriptCommand() {
1862ec34544SRui Ueyama   if (consume("{")) {
1872ec34544SRui Ueyama     readAnonymousDeclaration();
1882ec34544SRui Ueyama     return;
1892ec34544SRui Ueyama   }
1902ec34544SRui Ueyama 
1912ec34544SRui Ueyama   while (!atEOF() && !Error && peek() != "}") {
1922ec34544SRui Ueyama     StringRef VerStr = next();
1932ec34544SRui Ueyama     if (VerStr == "{") {
1942ec34544SRui Ueyama       setError("anonymous version definition is used in "
1952ec34544SRui Ueyama                "combination with other version definitions");
1962ec34544SRui Ueyama       return;
1972ec34544SRui Ueyama     }
1982ec34544SRui Ueyama     expect("{");
1992ec34544SRui Ueyama     readVersionDeclaration(VerStr);
2002ec34544SRui Ueyama   }
2012ec34544SRui Ueyama }
2022ec34544SRui Ueyama 
2032ec34544SRui Ueyama void ScriptParser::readVersion() {
2042ec34544SRui Ueyama   expect("{");
2052ec34544SRui Ueyama   readVersionScriptCommand();
2062ec34544SRui Ueyama   expect("}");
2072ec34544SRui Ueyama }
2082ec34544SRui Ueyama 
2092ec34544SRui Ueyama void ScriptParser::readLinkerScript() {
2102ec34544SRui Ueyama   while (!atEOF()) {
2112ec34544SRui Ueyama     StringRef Tok = next();
2122ec34544SRui Ueyama     if (Tok == ";")
2132ec34544SRui Ueyama       continue;
2142ec34544SRui Ueyama 
2152ec34544SRui Ueyama     if (Tok == "ASSERT") {
21623af89ccSRui Ueyama       Script->Opt.Commands.push_back(readAssert());
2172ec34544SRui Ueyama     } else if (Tok == "ENTRY") {
2182ec34544SRui Ueyama       readEntry();
2192ec34544SRui Ueyama     } else if (Tok == "EXTERN") {
2202ec34544SRui Ueyama       readExtern();
2212ec34544SRui Ueyama     } else if (Tok == "GROUP" || Tok == "INPUT") {
2222ec34544SRui Ueyama       readGroup();
2232ec34544SRui Ueyama     } else if (Tok == "INCLUDE") {
2242ec34544SRui Ueyama       readInclude();
2252ec34544SRui Ueyama     } else if (Tok == "MEMORY") {
2262ec34544SRui Ueyama       readMemory();
2272ec34544SRui Ueyama     } else if (Tok == "OUTPUT") {
2282ec34544SRui Ueyama       readOutput();
2292ec34544SRui Ueyama     } else if (Tok == "OUTPUT_ARCH") {
2302ec34544SRui Ueyama       readOutputArch();
2312ec34544SRui Ueyama     } else if (Tok == "OUTPUT_FORMAT") {
2322ec34544SRui Ueyama       readOutputFormat();
2332ec34544SRui Ueyama     } else if (Tok == "PHDRS") {
2342ec34544SRui Ueyama       readPhdrs();
2352ec34544SRui Ueyama     } else if (Tok == "SEARCH_DIR") {
2362ec34544SRui Ueyama       readSearchDir();
2372ec34544SRui Ueyama     } else if (Tok == "SECTIONS") {
2382ec34544SRui Ueyama       readSections();
2392ec34544SRui Ueyama     } else if (Tok == "VERSION") {
2402ec34544SRui Ueyama       readVersion();
2412ec34544SRui Ueyama     } else if (SymbolAssignment *Cmd = readProvideOrAssignment(Tok)) {
2422ec34544SRui Ueyama       Script->Opt.Commands.push_back(Cmd);
2432ec34544SRui Ueyama     } else {
2442ec34544SRui Ueyama       setError("unknown directive: " + Tok);
2452ec34544SRui Ueyama     }
2462ec34544SRui Ueyama   }
2472ec34544SRui Ueyama }
2482ec34544SRui Ueyama 
2492ec34544SRui Ueyama void ScriptParser::addFile(StringRef S) {
2502ec34544SRui Ueyama   if (IsUnderSysroot && S.startswith("/")) {
2512ec34544SRui Ueyama     SmallString<128> PathData;
2522ec34544SRui Ueyama     StringRef Path = (Config->Sysroot + S).toStringRef(PathData);
2532ec34544SRui Ueyama     if (sys::fs::exists(Path)) {
254a76349bfSEvgeniy Stepanov       Driver->addFile(Saver.save(Path), /*WithLOption=*/false);
2552ec34544SRui Ueyama       return;
2562ec34544SRui Ueyama     }
2572ec34544SRui Ueyama   }
2582ec34544SRui Ueyama 
259*875ae82bSRui Ueyama   if (S.startswith("/")) {
260a76349bfSEvgeniy Stepanov     Driver->addFile(S, /*WithLOption=*/false);
2612ec34544SRui Ueyama   } else if (S.startswith("=")) {
2622ec34544SRui Ueyama     if (Config->Sysroot.empty())
263a76349bfSEvgeniy Stepanov       Driver->addFile(S.substr(1), /*WithLOption=*/false);
2642ec34544SRui Ueyama     else
265a76349bfSEvgeniy Stepanov       Driver->addFile(Saver.save(Config->Sysroot + "/" + S.substr(1)),
266a76349bfSEvgeniy Stepanov                       /*WithLOption=*/false);
2672ec34544SRui Ueyama   } else if (S.startswith("-l")) {
2682ec34544SRui Ueyama     Driver->addLibrary(S.substr(2));
2692ec34544SRui Ueyama   } else if (sys::fs::exists(S)) {
270a76349bfSEvgeniy Stepanov     Driver->addFile(S, /*WithLOption=*/false);
2712ec34544SRui Ueyama   } else {
2722ec34544SRui Ueyama     if (Optional<std::string> Path = findFromSearchPaths(S))
273a76349bfSEvgeniy Stepanov       Driver->addFile(Saver.save(*Path), /*WithLOption=*/true);
2742ec34544SRui Ueyama     else
2752ec34544SRui Ueyama       setError("unable to find " + S);
2762ec34544SRui Ueyama   }
2772ec34544SRui Ueyama }
2782ec34544SRui Ueyama 
2792ec34544SRui Ueyama void ScriptParser::readAsNeeded() {
2802ec34544SRui Ueyama   expect("(");
2812ec34544SRui Ueyama   bool Orig = Config->AsNeeded;
2822ec34544SRui Ueyama   Config->AsNeeded = true;
2832ec34544SRui Ueyama   while (!Error && !consume(")"))
2842ec34544SRui Ueyama     addFile(unquote(next()));
2852ec34544SRui Ueyama   Config->AsNeeded = Orig;
2862ec34544SRui Ueyama }
2872ec34544SRui Ueyama 
2882ec34544SRui Ueyama void ScriptParser::readEntry() {
2892ec34544SRui Ueyama   // -e <symbol> takes predecence over ENTRY(<symbol>).
2902ec34544SRui Ueyama   expect("(");
2912ec34544SRui Ueyama   StringRef Tok = next();
2922ec34544SRui Ueyama   if (Config->Entry.empty())
2932ec34544SRui Ueyama     Config->Entry = Tok;
2942ec34544SRui Ueyama   expect(")");
2952ec34544SRui Ueyama }
2962ec34544SRui Ueyama 
2972ec34544SRui Ueyama void ScriptParser::readExtern() {
2982ec34544SRui Ueyama   expect("(");
2992ec34544SRui Ueyama   while (!Error && !consume(")"))
3002ec34544SRui Ueyama     Config->Undefined.push_back(next());
3012ec34544SRui Ueyama }
3022ec34544SRui Ueyama 
3032ec34544SRui Ueyama void ScriptParser::readGroup() {
3042ec34544SRui Ueyama   expect("(");
3052ec34544SRui Ueyama   while (!Error && !consume(")")) {
306b579c439SRui Ueyama     if (consume("AS_NEEDED"))
3072ec34544SRui Ueyama       readAsNeeded();
3082ec34544SRui Ueyama     else
309b579c439SRui Ueyama       addFile(unquote(next()));
3102ec34544SRui Ueyama   }
3112ec34544SRui Ueyama }
3122ec34544SRui Ueyama 
3132ec34544SRui Ueyama void ScriptParser::readInclude() {
3142ec34544SRui Ueyama   StringRef Tok = unquote(next());
3152ec34544SRui Ueyama 
3162ec34544SRui Ueyama   // https://sourceware.org/binutils/docs/ld/File-Commands.html:
3172ec34544SRui Ueyama   // The file will be searched for in the current directory, and in any
3182ec34544SRui Ueyama   // directory specified with the -L option.
3192ec34544SRui Ueyama   if (sys::fs::exists(Tok)) {
3202ec34544SRui Ueyama     if (Optional<MemoryBufferRef> MB = readFile(Tok))
3212ec34544SRui Ueyama       tokenize(*MB);
3222ec34544SRui Ueyama     return;
3232ec34544SRui Ueyama   }
3242ec34544SRui Ueyama   if (Optional<std::string> Path = findFromSearchPaths(Tok)) {
3252ec34544SRui Ueyama     if (Optional<MemoryBufferRef> MB = readFile(*Path))
3262ec34544SRui Ueyama       tokenize(*MB);
3272ec34544SRui Ueyama     return;
3282ec34544SRui Ueyama   }
3292ec34544SRui Ueyama   setError("cannot open " + Tok);
3302ec34544SRui Ueyama }
3312ec34544SRui Ueyama 
3322ec34544SRui Ueyama void ScriptParser::readOutput() {
3332ec34544SRui Ueyama   // -o <file> takes predecence over OUTPUT(<file>).
3342ec34544SRui Ueyama   expect("(");
3352ec34544SRui Ueyama   StringRef Tok = next();
3362ec34544SRui Ueyama   if (Config->OutputFile.empty())
3372ec34544SRui Ueyama     Config->OutputFile = unquote(Tok);
3382ec34544SRui Ueyama   expect(")");
3392ec34544SRui Ueyama }
3402ec34544SRui Ueyama 
3412ec34544SRui Ueyama void ScriptParser::readOutputArch() {
3422ec34544SRui Ueyama   // OUTPUT_ARCH is ignored for now.
3432ec34544SRui Ueyama   expect("(");
3442ec34544SRui Ueyama   while (!Error && !consume(")"))
3452ec34544SRui Ueyama     skip();
3462ec34544SRui Ueyama }
3472ec34544SRui Ueyama 
3482ec34544SRui Ueyama void ScriptParser::readOutputFormat() {
3492ec34544SRui Ueyama   // Error checking only for now.
3502ec34544SRui Ueyama   expect("(");
3512ec34544SRui Ueyama   skip();
352b579c439SRui Ueyama   if (consume(")"))
3532ec34544SRui Ueyama     return;
354b579c439SRui Ueyama   expect(",");
3552ec34544SRui Ueyama   skip();
3562ec34544SRui Ueyama   expect(",");
3572ec34544SRui Ueyama   skip();
3582ec34544SRui Ueyama   expect(")");
3592ec34544SRui Ueyama }
3602ec34544SRui Ueyama 
3612ec34544SRui Ueyama void ScriptParser::readPhdrs() {
3622ec34544SRui Ueyama   expect("{");
3632ec34544SRui Ueyama   while (!Error && !consume("}")) {
3642ec34544SRui Ueyama     Script->Opt.PhdrsCommands.push_back(
365b579c439SRui Ueyama         {next(), PT_NULL, false, false, UINT_MAX, nullptr});
3662ec34544SRui Ueyama 
367b579c439SRui Ueyama     PhdrsCommand &PhdrCmd = Script->Opt.PhdrsCommands.back();
3682ec34544SRui Ueyama     PhdrCmd.Type = readPhdrType();
369b579c439SRui Ueyama 
370b579c439SRui Ueyama     while (!Error && !consume(";")) {
371b579c439SRui Ueyama       if (consume("FILEHDR"))
3722ec34544SRui Ueyama         PhdrCmd.HasFilehdr = true;
373b579c439SRui Ueyama       else if (consume("PHDRS"))
3742ec34544SRui Ueyama         PhdrCmd.HasPhdrs = true;
375b579c439SRui Ueyama       else if (consume("AT"))
3762ec34544SRui Ueyama         PhdrCmd.LMAExpr = readParenExpr();
377b579c439SRui Ueyama       else if (consume("FLAGS"))
378b579c439SRui Ueyama         PhdrCmd.Flags = readParenExpr()().getValue();
379b579c439SRui Ueyama       else
380b579c439SRui Ueyama         setError("unexpected header attribute: " + next());
381b579c439SRui Ueyama     }
3822ec34544SRui Ueyama   }
3832ec34544SRui Ueyama }
3842ec34544SRui Ueyama 
3852ec34544SRui Ueyama void ScriptParser::readSearchDir() {
3862ec34544SRui Ueyama   expect("(");
3872ec34544SRui Ueyama   StringRef Tok = next();
3882ec34544SRui Ueyama   if (!Config->Nostdlib)
3892ec34544SRui Ueyama     Config->SearchPaths.push_back(unquote(Tok));
3902ec34544SRui Ueyama   expect(")");
3912ec34544SRui Ueyama }
3922ec34544SRui Ueyama 
3932ec34544SRui Ueyama void ScriptParser::readSections() {
3942ec34544SRui Ueyama   Script->Opt.HasSections = true;
395b579c439SRui Ueyama 
3962ec34544SRui Ueyama   // -no-rosegment is used to avoid placing read only non-executable sections in
3972ec34544SRui Ueyama   // their own segment. We do the same if SECTIONS command is present in linker
3982ec34544SRui Ueyama   // script. See comment for computeFlags().
3992ec34544SRui Ueyama   Config->SingleRoRx = true;
4002ec34544SRui Ueyama 
4012ec34544SRui Ueyama   expect("{");
4022ec34544SRui Ueyama   while (!Error && !consume("}")) {
4032ec34544SRui Ueyama     StringRef Tok = next();
4042ec34544SRui Ueyama     BaseCommand *Cmd = readProvideOrAssignment(Tok);
4052ec34544SRui Ueyama     if (!Cmd) {
4062ec34544SRui Ueyama       if (Tok == "ASSERT")
40723af89ccSRui Ueyama         Cmd = readAssert();
4082ec34544SRui Ueyama       else
4092ec34544SRui Ueyama         Cmd = readOutputSectionDescription(Tok);
4102ec34544SRui Ueyama     }
4112ec34544SRui Ueyama     Script->Opt.Commands.push_back(Cmd);
4122ec34544SRui Ueyama   }
4132ec34544SRui Ueyama }
4142ec34544SRui Ueyama 
4152ec34544SRui Ueyama static int precedence(StringRef Op) {
4162ec34544SRui Ueyama   return StringSwitch<int>(Op)
4172ec34544SRui Ueyama       .Cases("*", "/", 5)
4182ec34544SRui Ueyama       .Cases("+", "-", 4)
4192ec34544SRui Ueyama       .Cases("<<", ">>", 3)
4202ec34544SRui Ueyama       .Cases("<", "<=", ">", ">=", "==", "!=", 2)
4212ec34544SRui Ueyama       .Cases("&", "|", 1)
4222ec34544SRui Ueyama       .Default(-1);
4232ec34544SRui Ueyama }
4242ec34544SRui Ueyama 
4252ec34544SRui Ueyama StringMatcher ScriptParser::readFilePatterns() {
4262ec34544SRui Ueyama   std::vector<StringRef> V;
4272ec34544SRui Ueyama   while (!Error && !consume(")"))
4282ec34544SRui Ueyama     V.push_back(next());
4292ec34544SRui Ueyama   return StringMatcher(V);
4302ec34544SRui Ueyama }
4312ec34544SRui Ueyama 
4322ec34544SRui Ueyama SortSectionPolicy ScriptParser::readSortKind() {
4332ec34544SRui Ueyama   if (consume("SORT") || consume("SORT_BY_NAME"))
4342ec34544SRui Ueyama     return SortSectionPolicy::Name;
4352ec34544SRui Ueyama   if (consume("SORT_BY_ALIGNMENT"))
4362ec34544SRui Ueyama     return SortSectionPolicy::Alignment;
4372ec34544SRui Ueyama   if (consume("SORT_BY_INIT_PRIORITY"))
4382ec34544SRui Ueyama     return SortSectionPolicy::Priority;
4392ec34544SRui Ueyama   if (consume("SORT_NONE"))
4402ec34544SRui Ueyama     return SortSectionPolicy::None;
4412ec34544SRui Ueyama   return SortSectionPolicy::Default;
4422ec34544SRui Ueyama }
4432ec34544SRui Ueyama 
44403fc8d1eSRui Ueyama // Reads SECTIONS command contents in the following form:
44503fc8d1eSRui Ueyama //
44603fc8d1eSRui Ueyama // <contents> ::= <elem>*
44703fc8d1eSRui Ueyama // <elem>     ::= <exclude>? <glob-pattern>
44803fc8d1eSRui Ueyama // <exclude>  ::= "EXCLUDE_FILE" "(" <glob-pattern>+ ")"
44903fc8d1eSRui Ueyama //
45003fc8d1eSRui Ueyama // For example,
45103fc8d1eSRui Ueyama //
45203fc8d1eSRui Ueyama // *(.foo EXCLUDE_FILE (a.o) .bar EXCLUDE_FILE (b.o) .baz)
45303fc8d1eSRui Ueyama //
45403fc8d1eSRui Ueyama // is parsed as ".foo", ".bar" with "a.o", and ".baz" with "b.o".
45503fc8d1eSRui Ueyama // The semantics of that is section .foo in any file, section .bar in
45603fc8d1eSRui Ueyama // any file but a.o, and section .baz in any file but b.o.
4572ec34544SRui Ueyama std::vector<SectionPattern> ScriptParser::readInputSectionsList() {
4582ec34544SRui Ueyama   std::vector<SectionPattern> Ret;
4592ec34544SRui Ueyama   while (!Error && peek() != ")") {
4602ec34544SRui Ueyama     StringMatcher ExcludeFilePat;
4612ec34544SRui Ueyama     if (consume("EXCLUDE_FILE")) {
4622ec34544SRui Ueyama       expect("(");
4632ec34544SRui Ueyama       ExcludeFilePat = readFilePatterns();
4642ec34544SRui Ueyama     }
4652ec34544SRui Ueyama 
4662ec34544SRui Ueyama     std::vector<StringRef> V;
4672ec34544SRui Ueyama     while (!Error && peek() != ")" && peek() != "EXCLUDE_FILE")
4682ec34544SRui Ueyama       V.push_back(next());
4692ec34544SRui Ueyama 
4702ec34544SRui Ueyama     if (!V.empty())
4712ec34544SRui Ueyama       Ret.push_back({std::move(ExcludeFilePat), StringMatcher(V)});
4722ec34544SRui Ueyama     else
4732ec34544SRui Ueyama       setError("section pattern is expected");
4742ec34544SRui Ueyama   }
4752ec34544SRui Ueyama   return Ret;
4762ec34544SRui Ueyama }
4772ec34544SRui Ueyama 
4782ec34544SRui Ueyama // Reads contents of "SECTIONS" directive. That directive contains a
4792ec34544SRui Ueyama // list of glob patterns for input sections. The grammar is as follows.
4802ec34544SRui Ueyama //
4812ec34544SRui Ueyama // <patterns> ::= <section-list>
4822ec34544SRui Ueyama //              | <sort> "(" <section-list> ")"
4832ec34544SRui Ueyama //              | <sort> "(" <sort> "(" <section-list> ")" ")"
4842ec34544SRui Ueyama //
4852ec34544SRui Ueyama // <sort>     ::= "SORT" | "SORT_BY_NAME" | "SORT_BY_ALIGNMENT"
4862ec34544SRui Ueyama //              | "SORT_BY_INIT_PRIORITY" | "SORT_NONE"
4872ec34544SRui Ueyama //
4882ec34544SRui Ueyama // <section-list> is parsed by readInputSectionsList().
4892ec34544SRui Ueyama InputSectionDescription *
4902ec34544SRui Ueyama ScriptParser::readInputSectionRules(StringRef FilePattern) {
4912ec34544SRui Ueyama   auto *Cmd = make<InputSectionDescription>(FilePattern);
4922ec34544SRui Ueyama   expect("(");
4932ec34544SRui Ueyama 
4942ec34544SRui Ueyama   while (!Error && !consume(")")) {
4952ec34544SRui Ueyama     SortSectionPolicy Outer = readSortKind();
4962ec34544SRui Ueyama     SortSectionPolicy Inner = SortSectionPolicy::Default;
4972ec34544SRui Ueyama     std::vector<SectionPattern> V;
4982ec34544SRui Ueyama     if (Outer != SortSectionPolicy::Default) {
4992ec34544SRui Ueyama       expect("(");
5002ec34544SRui Ueyama       Inner = readSortKind();
5012ec34544SRui Ueyama       if (Inner != SortSectionPolicy::Default) {
5022ec34544SRui Ueyama         expect("(");
5032ec34544SRui Ueyama         V = readInputSectionsList();
5042ec34544SRui Ueyama         expect(")");
5052ec34544SRui Ueyama       } else {
5062ec34544SRui Ueyama         V = readInputSectionsList();
5072ec34544SRui Ueyama       }
5082ec34544SRui Ueyama       expect(")");
5092ec34544SRui Ueyama     } else {
5102ec34544SRui Ueyama       V = readInputSectionsList();
5112ec34544SRui Ueyama     }
5122ec34544SRui Ueyama 
5132ec34544SRui Ueyama     for (SectionPattern &Pat : V) {
5142ec34544SRui Ueyama       Pat.SortInner = Inner;
5152ec34544SRui Ueyama       Pat.SortOuter = Outer;
5162ec34544SRui Ueyama     }
5172ec34544SRui Ueyama 
5182ec34544SRui Ueyama     std::move(V.begin(), V.end(), std::back_inserter(Cmd->SectionPatterns));
5192ec34544SRui Ueyama   }
5202ec34544SRui Ueyama   return Cmd;
5212ec34544SRui Ueyama }
5222ec34544SRui Ueyama 
5232ec34544SRui Ueyama InputSectionDescription *
5242ec34544SRui Ueyama ScriptParser::readInputSectionDescription(StringRef Tok) {
5252ec34544SRui Ueyama   // Input section wildcard can be surrounded by KEEP.
5262ec34544SRui Ueyama   // https://sourceware.org/binutils/docs/ld/Input-Section-Keep.html#Input-Section-Keep
5272ec34544SRui Ueyama   if (Tok == "KEEP") {
5282ec34544SRui Ueyama     expect("(");
5292ec34544SRui Ueyama     StringRef FilePattern = next();
5302ec34544SRui Ueyama     InputSectionDescription *Cmd = readInputSectionRules(FilePattern);
5312ec34544SRui Ueyama     expect(")");
5322ec34544SRui Ueyama     Script->Opt.KeptSections.push_back(Cmd);
5332ec34544SRui Ueyama     return Cmd;
5342ec34544SRui Ueyama   }
5352ec34544SRui Ueyama   return readInputSectionRules(Tok);
5362ec34544SRui Ueyama }
5372ec34544SRui Ueyama 
5382ec34544SRui Ueyama void ScriptParser::readSort() {
5392ec34544SRui Ueyama   expect("(");
5402ec34544SRui Ueyama   expect("CONSTRUCTORS");
5412ec34544SRui Ueyama   expect(")");
5422ec34544SRui Ueyama }
5432ec34544SRui Ueyama 
54423af89ccSRui Ueyama AssertCommand *ScriptParser::readAssert() {
54523af89ccSRui Ueyama   return make<AssertCommand>(readAssertExpr());
54623af89ccSRui Ueyama }
54723af89ccSRui Ueyama 
54823af89ccSRui Ueyama Expr ScriptParser::readAssertExpr() {
5492ec34544SRui Ueyama   expect("(");
5502ec34544SRui Ueyama   Expr E = readExpr();
5512ec34544SRui Ueyama   expect(",");
5522ec34544SRui Ueyama   StringRef Msg = unquote(next());
5532ec34544SRui Ueyama   expect(")");
554b579c439SRui Ueyama 
5552ec34544SRui Ueyama   return [=] {
5562ec34544SRui Ueyama     if (!E().getValue())
5572ec34544SRui Ueyama       error(Msg);
5582ec34544SRui Ueyama     return Script->getDot();
5592ec34544SRui Ueyama   };
5602ec34544SRui Ueyama }
5612ec34544SRui Ueyama 
5622ec34544SRui Ueyama // Reads a FILL(expr) command. We handle the FILL command as an
5632ec34544SRui Ueyama // alias for =fillexp section attribute, which is different from
5642ec34544SRui Ueyama // what GNU linkers do.
5652ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Data.html
5662ec34544SRui Ueyama uint32_t ScriptParser::readFill() {
5672ec34544SRui Ueyama   expect("(");
5688acbf1ccSRui Ueyama   uint32_t V = parseFill(next());
5692ec34544SRui Ueyama   expect(")");
5702ec34544SRui Ueyama   return V;
5712ec34544SRui Ueyama }
5722ec34544SRui Ueyama 
5733271d370SRui Ueyama // Reads an expression and/or the special directive "(NOLOAD)" for an
5743271d370SRui Ueyama // output section definition.
5753271d370SRui Ueyama //
5763271d370SRui Ueyama // An output section name can be followed by an address expression
5773271d370SRui Ueyama // and/or by "(NOLOAD)". This grammar is not LL(1) because "(" can be
5783271d370SRui Ueyama // interpreted as either the beginning of some expression or "(NOLOAD)".
5793271d370SRui Ueyama //
580b579c439SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Address.html
581fbb0463fSGeorge Rimar // https://sourceware.org/binutils/docs/ld/Output-Section-Type.html
5823271d370SRui Ueyama void ScriptParser::readSectionAddressType(OutputSectionCommand *Cmd) {
5833271d370SRui Ueyama   if (consume("(")) {
5843271d370SRui Ueyama     if (consume("NOLOAD")) {
5853271d370SRui Ueyama       expect(")");
5863271d370SRui Ueyama       Cmd->Noload = true;
5873271d370SRui Ueyama       return;
5883271d370SRui Ueyama     }
5893271d370SRui Ueyama     Cmd->AddrExpr = readExpr();
5903271d370SRui Ueyama     expect(")");
5913271d370SRui Ueyama   } else {
5923271d370SRui Ueyama     Cmd->AddrExpr = readExpr();
5933271d370SRui Ueyama   }
5943271d370SRui Ueyama 
595fbb0463fSGeorge Rimar   if (consume("(")) {
596fbb0463fSGeorge Rimar     expect("NOLOAD");
597fbb0463fSGeorge Rimar     expect(")");
598fbb0463fSGeorge Rimar     Cmd->Noload = true;
599fbb0463fSGeorge Rimar   }
600fbb0463fSGeorge Rimar }
601fbb0463fSGeorge Rimar 
6023271d370SRui Ueyama OutputSectionCommand *
6033271d370SRui Ueyama ScriptParser::readOutputSectionDescription(StringRef OutSec) {
6043271d370SRui Ueyama   OutputSectionCommand *Cmd =
6053271d370SRui Ueyama       Script->createOutputSectionCommand(OutSec, getCurrentLocation());
6063271d370SRui Ueyama 
6073271d370SRui Ueyama   if (peek() != ":")
6083271d370SRui Ueyama     readSectionAddressType(Cmd);
6092ec34544SRui Ueyama   expect(":");
6102ec34544SRui Ueyama 
6112ec34544SRui Ueyama   if (consume("AT"))
6122ec34544SRui Ueyama     Cmd->LMAExpr = readParenExpr();
6132ec34544SRui Ueyama   if (consume("ALIGN"))
6142ec34544SRui Ueyama     Cmd->AlignExpr = readParenExpr();
6152ec34544SRui Ueyama   if (consume("SUBALIGN"))
6162ec34544SRui Ueyama     Cmd->SubalignExpr = readParenExpr();
6172ec34544SRui Ueyama 
6182ec34544SRui Ueyama   // Parse constraints.
6192ec34544SRui Ueyama   if (consume("ONLY_IF_RO"))
6202ec34544SRui Ueyama     Cmd->Constraint = ConstraintKind::ReadOnly;
6212ec34544SRui Ueyama   if (consume("ONLY_IF_RW"))
6222ec34544SRui Ueyama     Cmd->Constraint = ConstraintKind::ReadWrite;
6232ec34544SRui Ueyama   expect("{");
6242ec34544SRui Ueyama 
6252ec34544SRui Ueyama   while (!Error && !consume("}")) {
6262ec34544SRui Ueyama     StringRef Tok = next();
6272ec34544SRui Ueyama     if (Tok == ";") {
6282ec34544SRui Ueyama       // Empty commands are allowed. Do nothing here.
629b579c439SRui Ueyama     } else if (SymbolAssignment *Assign = readProvideOrAssignment(Tok)) {
630b579c439SRui Ueyama       Cmd->Commands.push_back(Assign);
6312ec34544SRui Ueyama     } else if (BytesDataCommand *Data = readBytesDataCommand(Tok)) {
6322ec34544SRui Ueyama       Cmd->Commands.push_back(Data);
6332ec34544SRui Ueyama     } else if (Tok == "ASSERT") {
63423af89ccSRui Ueyama       Cmd->Commands.push_back(readAssert());
6352ec34544SRui Ueyama       expect(";");
6362ec34544SRui Ueyama     } else if (Tok == "CONSTRUCTORS") {
6372ec34544SRui Ueyama       // CONSTRUCTORS is a keyword to make the linker recognize C++ ctors/dtors
6382ec34544SRui Ueyama       // by name. This is for very old file formats such as ECOFF/XCOFF.
6392ec34544SRui Ueyama       // For ELF, we should ignore.
6402ec34544SRui Ueyama     } else if (Tok == "FILL") {
6412ec34544SRui Ueyama       Cmd->Filler = readFill();
6422ec34544SRui Ueyama     } else if (Tok == "SORT") {
6432ec34544SRui Ueyama       readSort();
6442ec34544SRui Ueyama     } else if (peek() == "(") {
6452ec34544SRui Ueyama       Cmd->Commands.push_back(readInputSectionDescription(Tok));
6462ec34544SRui Ueyama     } else {
6472ec34544SRui Ueyama       setError("unknown command " + Tok);
6482ec34544SRui Ueyama     }
6492ec34544SRui Ueyama   }
6502ec34544SRui Ueyama 
6512ec34544SRui Ueyama   if (consume(">"))
6522ec34544SRui Ueyama     Cmd->MemoryRegionName = next();
6532ec34544SRui Ueyama 
6542ec34544SRui Ueyama   Cmd->Phdrs = readOutputSectionPhdrs();
6552ec34544SRui Ueyama 
6562ec34544SRui Ueyama   if (consume("="))
6578acbf1ccSRui Ueyama     Cmd->Filler = parseFill(next());
6582ec34544SRui Ueyama   else if (peek().startswith("="))
6598acbf1ccSRui Ueyama     Cmd->Filler = parseFill(next().drop_front());
6602ec34544SRui Ueyama 
6612ec34544SRui Ueyama   // Consume optional comma following output section command.
6622ec34544SRui Ueyama   consume(",");
6632ec34544SRui Ueyama 
6642ec34544SRui Ueyama   return Cmd;
6652ec34544SRui Ueyama }
6662ec34544SRui Ueyama 
6678acbf1ccSRui Ueyama // Parses a given string as a octal/decimal/hexadecimal number and
6688acbf1ccSRui Ueyama // returns it as a big-endian number. Used for `=<fillexp>`.
6692ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Fill.html
6702ec34544SRui Ueyama //
6718acbf1ccSRui Ueyama // When reading a hexstring, ld.bfd handles it as a blob of arbitrary
6728acbf1ccSRui Ueyama // size, while ld.gold always handles it as a 32-bit big-endian number.
6738acbf1ccSRui Ueyama // We are compatible with ld.gold because it's easier to implement.
6748acbf1ccSRui Ueyama uint32_t ScriptParser::parseFill(StringRef Tok) {
675b58079d4SRui Ueyama   uint32_t V = 0;
676ab94768cSGeorge Rimar   if (!to_integer(Tok, V))
6772ec34544SRui Ueyama     setError("invalid filler expression: " + Tok);
678b58079d4SRui Ueyama 
679b58079d4SRui Ueyama   uint32_t Buf;
680b58079d4SRui Ueyama   write32be(&Buf, V);
681b58079d4SRui Ueyama   return Buf;
6822ec34544SRui Ueyama }
6832ec34544SRui Ueyama 
6842ec34544SRui Ueyama SymbolAssignment *ScriptParser::readProvideHidden(bool Provide, bool Hidden) {
6852ec34544SRui Ueyama   expect("(");
6862ec34544SRui Ueyama   SymbolAssignment *Cmd = readAssignment(next());
6872ec34544SRui Ueyama   Cmd->Provide = Provide;
6882ec34544SRui Ueyama   Cmd->Hidden = Hidden;
6892ec34544SRui Ueyama   expect(")");
6902ec34544SRui Ueyama   expect(";");
6912ec34544SRui Ueyama   return Cmd;
6922ec34544SRui Ueyama }
6932ec34544SRui Ueyama 
6942ec34544SRui Ueyama SymbolAssignment *ScriptParser::readProvideOrAssignment(StringRef Tok) {
6952ec34544SRui Ueyama   SymbolAssignment *Cmd = nullptr;
6962ec34544SRui Ueyama   if (peek() == "=" || peek() == "+=") {
6972ec34544SRui Ueyama     Cmd = readAssignment(Tok);
6982ec34544SRui Ueyama     expect(";");
6992ec34544SRui Ueyama   } else if (Tok == "PROVIDE") {
7002ec34544SRui Ueyama     Cmd = readProvideHidden(true, false);
7012ec34544SRui Ueyama   } else if (Tok == "HIDDEN") {
7022ec34544SRui Ueyama     Cmd = readProvideHidden(false, true);
7032ec34544SRui Ueyama   } else if (Tok == "PROVIDE_HIDDEN") {
7042ec34544SRui Ueyama     Cmd = readProvideHidden(true, true);
7052ec34544SRui Ueyama   }
7062ec34544SRui Ueyama   return Cmd;
7072ec34544SRui Ueyama }
7082ec34544SRui Ueyama 
7092ec34544SRui Ueyama SymbolAssignment *ScriptParser::readAssignment(StringRef Name) {
7102ec34544SRui Ueyama   StringRef Op = next();
7112ec34544SRui Ueyama   assert(Op == "=" || Op == "+=");
7122ec34544SRui Ueyama   Expr E = readExpr();
7132ec34544SRui Ueyama   if (Op == "+=") {
7142ec34544SRui Ueyama     std::string Loc = getCurrentLocation();
7152ec34544SRui Ueyama     E = [=] { return add(Script->getSymbolValue(Loc, Name), E()); };
7162ec34544SRui Ueyama   }
7172ec34544SRui Ueyama   return make<SymbolAssignment>(Name, E, getCurrentLocation());
7182ec34544SRui Ueyama }
7192ec34544SRui Ueyama 
7202ec34544SRui Ueyama // This is an operator-precedence parser to parse a linker
7212ec34544SRui Ueyama // script expression.
7222ec34544SRui Ueyama Expr ScriptParser::readExpr() {
7232ec34544SRui Ueyama   // Our lexer is context-aware. Set the in-expression bit so that
7242ec34544SRui Ueyama   // they apply different tokenization rules.
7252ec34544SRui Ueyama   bool Orig = InExpr;
7262ec34544SRui Ueyama   InExpr = true;
7272ec34544SRui Ueyama   Expr E = readExpr1(readPrimary(), 0);
7282ec34544SRui Ueyama   InExpr = Orig;
7292ec34544SRui Ueyama   return E;
7302ec34544SRui Ueyama }
7312ec34544SRui Ueyama 
7322ec34544SRui Ueyama static Expr combine(StringRef Op, Expr L, Expr R) {
7332ec34544SRui Ueyama   if (Op == "+")
7342ec34544SRui Ueyama     return [=] { return add(L(), R()); };
7352ec34544SRui Ueyama   if (Op == "-")
7362ec34544SRui Ueyama     return [=] { return sub(L(), R()); };
737b579c439SRui Ueyama   if (Op == "*")
738b579c439SRui Ueyama     return [=] { return mul(L(), R()); };
739b579c439SRui Ueyama   if (Op == "/")
740b579c439SRui Ueyama     return [=] { return div(L(), R()); };
7412ec34544SRui Ueyama   if (Op == "<<")
7427e915511SRui Ueyama     return [=] { return L().getValue() << R().getValue(); };
7432ec34544SRui Ueyama   if (Op == ">>")
7447e915511SRui Ueyama     return [=] { return L().getValue() >> R().getValue(); };
7452ec34544SRui Ueyama   if (Op == "<")
7462ec34544SRui Ueyama     return [=] { return L().getValue() < R().getValue(); };
7472ec34544SRui Ueyama   if (Op == ">")
7482ec34544SRui Ueyama     return [=] { return L().getValue() > R().getValue(); };
7492ec34544SRui Ueyama   if (Op == ">=")
7502ec34544SRui Ueyama     return [=] { return L().getValue() >= R().getValue(); };
7512ec34544SRui Ueyama   if (Op == "<=")
7522ec34544SRui Ueyama     return [=] { return L().getValue() <= R().getValue(); };
7532ec34544SRui Ueyama   if (Op == "==")
7542ec34544SRui Ueyama     return [=] { return L().getValue() == R().getValue(); };
7552ec34544SRui Ueyama   if (Op == "!=")
7562ec34544SRui Ueyama     return [=] { return L().getValue() != R().getValue(); };
7572ec34544SRui Ueyama   if (Op == "&")
7582ec34544SRui Ueyama     return [=] { return bitAnd(L(), R()); };
7592ec34544SRui Ueyama   if (Op == "|")
7602ec34544SRui Ueyama     return [=] { return bitOr(L(), R()); };
7612ec34544SRui Ueyama   llvm_unreachable("invalid operator");
7622ec34544SRui Ueyama }
7632ec34544SRui Ueyama 
7642ec34544SRui Ueyama // This is a part of the operator-precedence parser. This function
7652ec34544SRui Ueyama // assumes that the remaining token stream starts with an operator.
7662ec34544SRui Ueyama Expr ScriptParser::readExpr1(Expr Lhs, int MinPrec) {
7672ec34544SRui Ueyama   while (!atEOF() && !Error) {
7682ec34544SRui Ueyama     // Read an operator and an expression.
7692ec34544SRui Ueyama     if (consume("?"))
7702ec34544SRui Ueyama       return readTernary(Lhs);
7712ec34544SRui Ueyama     StringRef Op1 = peek();
7722ec34544SRui Ueyama     if (precedence(Op1) < MinPrec)
7732ec34544SRui Ueyama       break;
7742ec34544SRui Ueyama     skip();
7752ec34544SRui Ueyama     Expr Rhs = readPrimary();
7762ec34544SRui Ueyama 
7772ec34544SRui Ueyama     // Evaluate the remaining part of the expression first if the
7782ec34544SRui Ueyama     // next operator has greater precedence than the previous one.
7792ec34544SRui Ueyama     // For example, if we have read "+" and "3", and if the next
7802ec34544SRui Ueyama     // operator is "*", then we'll evaluate 3 * ... part first.
7812ec34544SRui Ueyama     while (!atEOF()) {
7822ec34544SRui Ueyama       StringRef Op2 = peek();
7832ec34544SRui Ueyama       if (precedence(Op2) <= precedence(Op1))
7842ec34544SRui Ueyama         break;
7852ec34544SRui Ueyama       Rhs = readExpr1(Rhs, precedence(Op2));
7862ec34544SRui Ueyama     }
7872ec34544SRui Ueyama 
7882ec34544SRui Ueyama     Lhs = combine(Op1, Lhs, Rhs);
7892ec34544SRui Ueyama   }
7902ec34544SRui Ueyama   return Lhs;
7912ec34544SRui Ueyama }
7922ec34544SRui Ueyama 
7932ec34544SRui Ueyama uint64_t static getConstant(StringRef S) {
7942ec34544SRui Ueyama   if (S == "COMMONPAGESIZE")
7952ec34544SRui Ueyama     return Target->PageSize;
7962ec34544SRui Ueyama   if (S == "MAXPAGESIZE")
7972ec34544SRui Ueyama     return Config->MaxPageSize;
7982ec34544SRui Ueyama   error("unknown constant: " + S);
7992ec34544SRui Ueyama   return 0;
8002ec34544SRui Ueyama }
8012ec34544SRui Ueyama 
8025c65088fSRui Ueyama // Parses Tok as an integer. It recognizes hexadecimal (prefixed with
8035c65088fSRui Ueyama // "0x" or suffixed with "H") and decimal numbers. Decimal numbers may
8045c65088fSRui Ueyama // have "K" (Ki) or "M" (Mi) suffixes.
8055c65088fSRui Ueyama static Optional<uint64_t> parseInt(StringRef Tok) {
8062ec34544SRui Ueyama   // Negative number
8072ec34544SRui Ueyama   if (Tok.startswith("-")) {
8085c65088fSRui Ueyama     if (Optional<uint64_t> Val = parseInt(Tok.substr(1)))
8095c65088fSRui Ueyama       return -*Val;
8105c65088fSRui Ueyama     return None;
8112ec34544SRui Ueyama   }
8122ec34544SRui Ueyama 
8132ec34544SRui Ueyama   // Hexadecimal
8145c65088fSRui Ueyama   uint64_t Val;
815ab94768cSGeorge Rimar   if (Tok.startswith_lower("0x") && to_integer(Tok.substr(2), Val, 16))
8165c65088fSRui Ueyama     return Val;
817ab94768cSGeorge Rimar   if (Tok.endswith_lower("H") && to_integer(Tok.drop_back(), Val, 16))
8185c65088fSRui Ueyama     return Val;
8192ec34544SRui Ueyama 
8202ec34544SRui Ueyama   // Decimal
8212ec34544SRui Ueyama   if (Tok.endswith_lower("K")) {
822ab94768cSGeorge Rimar     if (!to_integer(Tok.drop_back(), Val, 10))
8235c65088fSRui Ueyama       return None;
8245c65088fSRui Ueyama     return Val * 1024;
8252ec34544SRui Ueyama   }
8265c65088fSRui Ueyama   if (Tok.endswith_lower("M")) {
827ab94768cSGeorge Rimar     if (!to_integer(Tok.drop_back(), Val, 10))
8285c65088fSRui Ueyama       return None;
8295c65088fSRui Ueyama     return Val * 1024 * 1024;
8305c65088fSRui Ueyama   }
831ab94768cSGeorge Rimar   if (!to_integer(Tok, Val, 10))
8325c65088fSRui Ueyama     return None;
8335c65088fSRui Ueyama   return Val;
8342ec34544SRui Ueyama }
8352ec34544SRui Ueyama 
8362ec34544SRui Ueyama BytesDataCommand *ScriptParser::readBytesDataCommand(StringRef Tok) {
837b579c439SRui Ueyama   int Size = StringSwitch<int>(Tok)
8382ec34544SRui Ueyama                  .Case("BYTE", 1)
8392ec34544SRui Ueyama                  .Case("SHORT", 2)
8402ec34544SRui Ueyama                  .Case("LONG", 4)
8412ec34544SRui Ueyama                  .Case("QUAD", 8)
8422ec34544SRui Ueyama                  .Default(-1);
8432ec34544SRui Ueyama   if (Size == -1)
8442ec34544SRui Ueyama     return nullptr;
8452ec34544SRui Ueyama 
8462ec34544SRui Ueyama   return make<BytesDataCommand>(readParenExpr(), Size);
8472ec34544SRui Ueyama }
8482ec34544SRui Ueyama 
8492ec34544SRui Ueyama StringRef ScriptParser::readParenLiteral() {
8502ec34544SRui Ueyama   expect("(");
8512ec34544SRui Ueyama   StringRef Tok = next();
8522ec34544SRui Ueyama   expect(")");
8532ec34544SRui Ueyama   return Tok;
8542ec34544SRui Ueyama }
8552ec34544SRui Ueyama 
85605c4f67cSRafael Espindola OutputSection *ScriptParser::checkSection(OutputSectionCommand *Cmd,
85705c4f67cSRafael Espindola                                           StringRef Location) {
85805c4f67cSRafael Espindola   if (Cmd->Location.empty() && Script->ErrorOnMissingSection)
85905c4f67cSRafael Espindola     error(Location + ": undefined section " + Cmd->Name);
86005c4f67cSRafael Espindola   if (Cmd->Sec)
86105c4f67cSRafael Espindola     return Cmd->Sec;
86205c4f67cSRafael Espindola   static OutputSection Dummy("", 0, 0);
86305c4f67cSRafael Espindola   return &Dummy;
86405c4f67cSRafael Espindola }
86505c4f67cSRafael Espindola 
8662ec34544SRui Ueyama Expr ScriptParser::readPrimary() {
8672ec34544SRui Ueyama   if (peek() == "(")
8682ec34544SRui Ueyama     return readParenExpr();
8692ec34544SRui Ueyama 
8705c65088fSRui Ueyama   if (consume("~")) {
8712ec34544SRui Ueyama     Expr E = readPrimary();
872b2fb84a1SRui Ueyama     return [=] { return ~E().getValue(); };
8732ec34544SRui Ueyama   }
8745c65088fSRui Ueyama   if (consume("-")) {
8752ec34544SRui Ueyama     Expr E = readPrimary();
876b2fb84a1SRui Ueyama     return [=] { return -E().getValue(); };
8772ec34544SRui Ueyama   }
8782ec34544SRui Ueyama 
8795c65088fSRui Ueyama   StringRef Tok = next();
8805c65088fSRui Ueyama   std::string Location = getCurrentLocation();
8815c65088fSRui Ueyama 
8822ec34544SRui Ueyama   // Built-in functions are parsed here.
8832ec34544SRui Ueyama   // https://sourceware.org/binutils/docs/ld/Builtin-Functions.html.
8842ec34544SRui Ueyama   if (Tok == "ABSOLUTE") {
8852ec34544SRui Ueyama     Expr Inner = readParenExpr();
8862ec34544SRui Ueyama     return [=] {
8872ec34544SRui Ueyama       ExprValue I = Inner();
8882ec34544SRui Ueyama       I.ForceAbsolute = true;
8892ec34544SRui Ueyama       return I;
8902ec34544SRui Ueyama     };
8912ec34544SRui Ueyama   }
8922ec34544SRui Ueyama   if (Tok == "ADDR") {
8932ec34544SRui Ueyama     StringRef Name = readParenLiteral();
89405c4f67cSRafael Espindola     OutputSectionCommand *Cmd = Script->getOrCreateOutputSectionCommand(Name);
89541c7ab4aSGeorge Rimar     return [=]() -> ExprValue {
89641c7ab4aSGeorge Rimar       return {checkSection(Cmd, Location), 0, Location};
89741c7ab4aSGeorge Rimar     };
8982ec34544SRui Ueyama   }
8992ec34544SRui Ueyama   if (Tok == "ALIGN") {
9002ec34544SRui Ueyama     expect("(");
9012ec34544SRui Ueyama     Expr E = readExpr();
902b579c439SRui Ueyama     if (consume(")"))
903b579c439SRui Ueyama       return [=] { return alignTo(Script->getDot(), E().getValue()); };
904b579c439SRui Ueyama     expect(",");
9052ec34544SRui Ueyama     Expr E2 = readExpr();
9062ec34544SRui Ueyama     expect(")");
9073c6de1a6SPetr Hosek     return [=] {
9083c6de1a6SPetr Hosek       ExprValue V = E();
9093c6de1a6SPetr Hosek       V.Alignment = E2().getValue();
9103c6de1a6SPetr Hosek       return V;
9113c6de1a6SPetr Hosek     };
9122ec34544SRui Ueyama   }
9132ec34544SRui Ueyama   if (Tok == "ALIGNOF") {
9142ec34544SRui Ueyama     StringRef Name = readParenLiteral();
91505c4f67cSRafael Espindola     OutputSectionCommand *Cmd = Script->getOrCreateOutputSectionCommand(Name);
91605c4f67cSRafael Espindola     return [=] { return checkSection(Cmd, Location)->Alignment; };
9172ec34544SRui Ueyama   }
9182ec34544SRui Ueyama   if (Tok == "ASSERT")
91923af89ccSRui Ueyama     return readAssertExpr();
9202ec34544SRui Ueyama   if (Tok == "CONSTANT") {
9212ec34544SRui Ueyama     StringRef Name = readParenLiteral();
9222ec34544SRui Ueyama     return [=] { return getConstant(Name); };
9232ec34544SRui Ueyama   }
9242ec34544SRui Ueyama   if (Tok == "DATA_SEGMENT_ALIGN") {
9252ec34544SRui Ueyama     expect("(");
9262ec34544SRui Ueyama     Expr E = readExpr();
9272ec34544SRui Ueyama     expect(",");
9282ec34544SRui Ueyama     readExpr();
9292ec34544SRui Ueyama     expect(")");
9302ec34544SRui Ueyama     return [=] { return alignTo(Script->getDot(), E().getValue()); };
9312ec34544SRui Ueyama   }
9322ec34544SRui Ueyama   if (Tok == "DATA_SEGMENT_END") {
9332ec34544SRui Ueyama     expect("(");
9342ec34544SRui Ueyama     expect(".");
9352ec34544SRui Ueyama     expect(")");
9362ec34544SRui Ueyama     return [] { return Script->getDot(); };
9372ec34544SRui Ueyama   }
9382ec34544SRui Ueyama   if (Tok == "DATA_SEGMENT_RELRO_END") {
9392ec34544SRui Ueyama     // GNU linkers implements more complicated logic to handle
9402ec34544SRui Ueyama     // DATA_SEGMENT_RELRO_END. We instead ignore the arguments and
9412ec34544SRui Ueyama     // just align to the next page boundary for simplicity.
9422ec34544SRui Ueyama     expect("(");
9432ec34544SRui Ueyama     readExpr();
9442ec34544SRui Ueyama     expect(",");
9452ec34544SRui Ueyama     readExpr();
9462ec34544SRui Ueyama     expect(")");
9472ec34544SRui Ueyama     return [] { return alignTo(Script->getDot(), Target->PageSize); };
9482ec34544SRui Ueyama   }
9492ec34544SRui Ueyama   if (Tok == "DEFINED") {
9502ec34544SRui Ueyama     StringRef Name = readParenLiteral();
9512ec34544SRui Ueyama     return [=] { return Script->isDefined(Name) ? 1 : 0; };
9522ec34544SRui Ueyama   }
95391b95b61SRui Ueyama   if (Tok == "LENGTH") {
95491b95b61SRui Ueyama     StringRef Name = readParenLiteral();
95591b95b61SRui Ueyama     if (Script->Opt.MemoryRegions.count(Name) == 0)
95691b95b61SRui Ueyama       setError("memory region not defined: " + Name);
95791b95b61SRui Ueyama     return [=] { return Script->Opt.MemoryRegions[Name].Length; };
95891b95b61SRui Ueyama   }
9592ec34544SRui Ueyama   if (Tok == "LOADADDR") {
9602ec34544SRui Ueyama     StringRef Name = readParenLiteral();
96105c4f67cSRafael Espindola     OutputSectionCommand *Cmd = Script->getOrCreateOutputSectionCommand(Name);
96205c4f67cSRafael Espindola     return [=] { return checkSection(Cmd, Location)->getLMA(); };
9632ec34544SRui Ueyama   }
96491b95b61SRui Ueyama   if (Tok == "ORIGIN") {
96591b95b61SRui Ueyama     StringRef Name = readParenLiteral();
96691b95b61SRui Ueyama     if (Script->Opt.MemoryRegions.count(Name) == 0)
96791b95b61SRui Ueyama       setError("memory region not defined: " + Name);
96891b95b61SRui Ueyama     return [=] { return Script->Opt.MemoryRegions[Name].Origin; };
96991b95b61SRui Ueyama   }
9702ec34544SRui Ueyama   if (Tok == "SEGMENT_START") {
9712ec34544SRui Ueyama     expect("(");
9722ec34544SRui Ueyama     skip();
9732ec34544SRui Ueyama     expect(",");
9742ec34544SRui Ueyama     Expr E = readExpr();
9752ec34544SRui Ueyama     expect(")");
9762ec34544SRui Ueyama     return [=] { return E(); };
9772ec34544SRui Ueyama   }
9782ec34544SRui Ueyama   if (Tok == "SIZEOF") {
9792ec34544SRui Ueyama     StringRef Name = readParenLiteral();
98005c4f67cSRafael Espindola     OutputSectionCommand *Cmd = Script->getOrCreateOutputSectionCommand(Name);
98105c4f67cSRafael Espindola     // Linker script does not create an output section if its content is empty.
98205c4f67cSRafael Espindola     // We want to allow SIZEOF(.foo) where .foo is a section which happened to
98305c4f67cSRafael Espindola     // be empty.
98405c4f67cSRafael Espindola     return [=] { return Cmd->Sec ? Cmd->Sec->Size : 0; };
9852ec34544SRui Ueyama   }
9862ec34544SRui Ueyama   if (Tok == "SIZEOF_HEADERS")
9872ec34544SRui Ueyama     return [=] { return elf::getHeaderSize(); };
9882ec34544SRui Ueyama 
9894eb2eccbSRui Ueyama   // Tok is the dot.
9904eb2eccbSRui Ueyama   if (Tok == ".")
9914eb2eccbSRui Ueyama     return [=] { return Script->getSymbolValue(Location, Tok); };
9924eb2eccbSRui Ueyama 
9932ec34544SRui Ueyama   // Tok is a literal number.
9945c65088fSRui Ueyama   if (Optional<uint64_t> Val = parseInt(Tok))
9955c65088fSRui Ueyama     return [=] { return *Val; };
9962ec34544SRui Ueyama 
9972ec34544SRui Ueyama   // Tok is a symbol name.
9982ec34544SRui Ueyama   if (!isValidCIdentifier(Tok))
9992ec34544SRui Ueyama     setError("malformed number: " + Tok);
10004eb2eccbSRui Ueyama   Script->Opt.ReferencedSymbols.push_back(Tok);
10012ec34544SRui Ueyama   return [=] { return Script->getSymbolValue(Location, Tok); };
10022ec34544SRui Ueyama }
10032ec34544SRui Ueyama 
10042ec34544SRui Ueyama Expr ScriptParser::readTernary(Expr Cond) {
10052ec34544SRui Ueyama   Expr L = readExpr();
10062ec34544SRui Ueyama   expect(":");
10072ec34544SRui Ueyama   Expr R = readExpr();
10082ec34544SRui Ueyama   return [=] { return Cond().getValue() ? L() : R(); };
10092ec34544SRui Ueyama }
10102ec34544SRui Ueyama 
10112ec34544SRui Ueyama Expr ScriptParser::readParenExpr() {
10122ec34544SRui Ueyama   expect("(");
10132ec34544SRui Ueyama   Expr E = readExpr();
10142ec34544SRui Ueyama   expect(")");
10152ec34544SRui Ueyama   return E;
10162ec34544SRui Ueyama }
10172ec34544SRui Ueyama 
10182ec34544SRui Ueyama std::vector<StringRef> ScriptParser::readOutputSectionPhdrs() {
10192ec34544SRui Ueyama   std::vector<StringRef> Phdrs;
10202ec34544SRui Ueyama   while (!Error && peek().startswith(":")) {
10212ec34544SRui Ueyama     StringRef Tok = next();
10222ec34544SRui Ueyama     Phdrs.push_back((Tok.size() == 1) ? next() : Tok.substr(1));
10232ec34544SRui Ueyama   }
10242ec34544SRui Ueyama   return Phdrs;
10252ec34544SRui Ueyama }
10262ec34544SRui Ueyama 
10272ec34544SRui Ueyama // Read a program header type name. The next token must be a
10282ec34544SRui Ueyama // name of a program header type or a constant (e.g. "0x3").
10292ec34544SRui Ueyama unsigned ScriptParser::readPhdrType() {
10302ec34544SRui Ueyama   StringRef Tok = next();
10315c65088fSRui Ueyama   if (Optional<uint64_t> Val = parseInt(Tok))
10325c65088fSRui Ueyama     return *Val;
10332ec34544SRui Ueyama 
10342ec34544SRui Ueyama   unsigned Ret = StringSwitch<unsigned>(Tok)
10352ec34544SRui Ueyama                      .Case("PT_NULL", PT_NULL)
10362ec34544SRui Ueyama                      .Case("PT_LOAD", PT_LOAD)
10372ec34544SRui Ueyama                      .Case("PT_DYNAMIC", PT_DYNAMIC)
10382ec34544SRui Ueyama                      .Case("PT_INTERP", PT_INTERP)
10392ec34544SRui Ueyama                      .Case("PT_NOTE", PT_NOTE)
10402ec34544SRui Ueyama                      .Case("PT_SHLIB", PT_SHLIB)
10412ec34544SRui Ueyama                      .Case("PT_PHDR", PT_PHDR)
10422ec34544SRui Ueyama                      .Case("PT_TLS", PT_TLS)
10432ec34544SRui Ueyama                      .Case("PT_GNU_EH_FRAME", PT_GNU_EH_FRAME)
10442ec34544SRui Ueyama                      .Case("PT_GNU_STACK", PT_GNU_STACK)
10452ec34544SRui Ueyama                      .Case("PT_GNU_RELRO", PT_GNU_RELRO)
10462ec34544SRui Ueyama                      .Case("PT_OPENBSD_RANDOMIZE", PT_OPENBSD_RANDOMIZE)
10472ec34544SRui Ueyama                      .Case("PT_OPENBSD_WXNEEDED", PT_OPENBSD_WXNEEDED)
10482ec34544SRui Ueyama                      .Case("PT_OPENBSD_BOOTDATA", PT_OPENBSD_BOOTDATA)
10492ec34544SRui Ueyama                      .Default(-1);
10502ec34544SRui Ueyama 
10512ec34544SRui Ueyama   if (Ret == (unsigned)-1) {
10522ec34544SRui Ueyama     setError("invalid program header type: " + Tok);
10532ec34544SRui Ueyama     return PT_NULL;
10542ec34544SRui Ueyama   }
10552ec34544SRui Ueyama   return Ret;
10562ec34544SRui Ueyama }
10572ec34544SRui Ueyama 
10582ec34544SRui Ueyama // Reads an anonymous version declaration.
10592ec34544SRui Ueyama void ScriptParser::readAnonymousDeclaration() {
10602ec34544SRui Ueyama   std::vector<SymbolVersion> Locals;
10612ec34544SRui Ueyama   std::vector<SymbolVersion> Globals;
10622ec34544SRui Ueyama   std::tie(Locals, Globals) = readSymbols();
10632ec34544SRui Ueyama 
10642ec34544SRui Ueyama   for (SymbolVersion V : Locals) {
10652ec34544SRui Ueyama     if (V.Name == "*")
10662ec34544SRui Ueyama       Config->DefaultSymbolVersion = VER_NDX_LOCAL;
10672ec34544SRui Ueyama     else
10682ec34544SRui Ueyama       Config->VersionScriptLocals.push_back(V);
10692ec34544SRui Ueyama   }
10702ec34544SRui Ueyama 
10712ec34544SRui Ueyama   for (SymbolVersion V : Globals)
10722ec34544SRui Ueyama     Config->VersionScriptGlobals.push_back(V);
10732ec34544SRui Ueyama 
10742ec34544SRui Ueyama   expect(";");
10752ec34544SRui Ueyama }
10762ec34544SRui Ueyama 
10772ec34544SRui Ueyama // Reads a non-anonymous version definition,
10782ec34544SRui Ueyama // e.g. "VerStr { global: foo; bar; local: *; };".
10792ec34544SRui Ueyama void ScriptParser::readVersionDeclaration(StringRef VerStr) {
10802ec34544SRui Ueyama   // Read a symbol list.
10812ec34544SRui Ueyama   std::vector<SymbolVersion> Locals;
10822ec34544SRui Ueyama   std::vector<SymbolVersion> Globals;
10832ec34544SRui Ueyama   std::tie(Locals, Globals) = readSymbols();
10842ec34544SRui Ueyama 
10852ec34544SRui Ueyama   for (SymbolVersion V : Locals) {
10862ec34544SRui Ueyama     if (V.Name == "*")
10872ec34544SRui Ueyama       Config->DefaultSymbolVersion = VER_NDX_LOCAL;
10882ec34544SRui Ueyama     else
10892ec34544SRui Ueyama       Config->VersionScriptLocals.push_back(V);
10902ec34544SRui Ueyama   }
10912ec34544SRui Ueyama 
10922ec34544SRui Ueyama   // Create a new version definition and add that to the global symbols.
10932ec34544SRui Ueyama   VersionDefinition Ver;
10942ec34544SRui Ueyama   Ver.Name = VerStr;
10952ec34544SRui Ueyama   Ver.Globals = Globals;
10962ec34544SRui Ueyama 
10972ec34544SRui Ueyama   // User-defined version number starts from 2 because 0 and 1 are
10982ec34544SRui Ueyama   // reserved for VER_NDX_LOCAL and VER_NDX_GLOBAL, respectively.
10992ec34544SRui Ueyama   Ver.Id = Config->VersionDefinitions.size() + 2;
11002ec34544SRui Ueyama   Config->VersionDefinitions.push_back(Ver);
11012ec34544SRui Ueyama 
11022ec34544SRui Ueyama   // Each version may have a parent version. For example, "Ver2"
11032ec34544SRui Ueyama   // defined as "Ver2 { global: foo; local: *; } Ver1;" has "Ver1"
11042ec34544SRui Ueyama   // as a parent. This version hierarchy is, probably against your
11052ec34544SRui Ueyama   // instinct, purely for hint; the runtime doesn't care about it
11062ec34544SRui Ueyama   // at all. In LLD, we simply ignore it.
11072ec34544SRui Ueyama   if (peek() != ";")
11082ec34544SRui Ueyama     skip();
11092ec34544SRui Ueyama   expect(";");
11102ec34544SRui Ueyama }
11112ec34544SRui Ueyama 
11121e77ad14SRui Ueyama static bool hasWildcard(StringRef S) {
11131e77ad14SRui Ueyama   return S.find_first_of("?*[") != StringRef::npos;
11141e77ad14SRui Ueyama }
11151e77ad14SRui Ueyama 
11162ec34544SRui Ueyama // Reads a list of symbols, e.g. "{ global: foo; bar; local: *; };".
11172ec34544SRui Ueyama std::pair<std::vector<SymbolVersion>, std::vector<SymbolVersion>>
11182ec34544SRui Ueyama ScriptParser::readSymbols() {
11192ec34544SRui Ueyama   std::vector<SymbolVersion> Locals;
11202ec34544SRui Ueyama   std::vector<SymbolVersion> Globals;
11212ec34544SRui Ueyama   std::vector<SymbolVersion> *V = &Globals;
11222ec34544SRui Ueyama 
11232ec34544SRui Ueyama   while (!Error) {
11242ec34544SRui Ueyama     if (consume("}"))
11252ec34544SRui Ueyama       break;
11262ec34544SRui Ueyama     if (consumeLabel("local")) {
11272ec34544SRui Ueyama       V = &Locals;
11282ec34544SRui Ueyama       continue;
11292ec34544SRui Ueyama     }
11302ec34544SRui Ueyama     if (consumeLabel("global")) {
11312ec34544SRui Ueyama       V = &Globals;
11322ec34544SRui Ueyama       continue;
11332ec34544SRui Ueyama     }
11342ec34544SRui Ueyama 
11352ec34544SRui Ueyama     if (consume("extern")) {
11362ec34544SRui Ueyama       std::vector<SymbolVersion> Ext = readVersionExtern();
11372ec34544SRui Ueyama       V->insert(V->end(), Ext.begin(), Ext.end());
11382ec34544SRui Ueyama     } else {
11392ec34544SRui Ueyama       StringRef Tok = next();
11402ec34544SRui Ueyama       V->push_back({unquote(Tok), false, hasWildcard(Tok)});
11412ec34544SRui Ueyama     }
11422ec34544SRui Ueyama     expect(";");
11432ec34544SRui Ueyama   }
11442ec34544SRui Ueyama   return {Locals, Globals};
11452ec34544SRui Ueyama }
11462ec34544SRui Ueyama 
11472ec34544SRui Ueyama // Reads an "extern C++" directive, e.g.,
11482ec34544SRui Ueyama // "extern "C++" { ns::*; "f(int, double)"; };"
11492ec34544SRui Ueyama std::vector<SymbolVersion> ScriptParser::readVersionExtern() {
11502ec34544SRui Ueyama   StringRef Tok = next();
11512ec34544SRui Ueyama   bool IsCXX = Tok == "\"C++\"";
11522ec34544SRui Ueyama   if (!IsCXX && Tok != "\"C\"")
11532ec34544SRui Ueyama     setError("Unknown language");
11542ec34544SRui Ueyama   expect("{");
11552ec34544SRui Ueyama 
11562ec34544SRui Ueyama   std::vector<SymbolVersion> Ret;
11572ec34544SRui Ueyama   while (!Error && peek() != "}") {
11582ec34544SRui Ueyama     StringRef Tok = next();
11592ec34544SRui Ueyama     bool HasWildcard = !Tok.startswith("\"") && hasWildcard(Tok);
11602ec34544SRui Ueyama     Ret.push_back({unquote(Tok), IsCXX, HasWildcard});
11612ec34544SRui Ueyama     expect(";");
11622ec34544SRui Ueyama   }
11632ec34544SRui Ueyama 
11642ec34544SRui Ueyama   expect("}");
11652ec34544SRui Ueyama   return Ret;
11662ec34544SRui Ueyama }
11672ec34544SRui Ueyama 
11682ec34544SRui Ueyama uint64_t ScriptParser::readMemoryAssignment(StringRef S1, StringRef S2,
11692ec34544SRui Ueyama                                             StringRef S3) {
1170b579c439SRui Ueyama   if (!consume(S1) && !consume(S2) && !consume(S3)) {
11712ec34544SRui Ueyama     setError("expected one of: " + S1 + ", " + S2 + ", or " + S3);
11722ec34544SRui Ueyama     return 0;
11732ec34544SRui Ueyama   }
11742ec34544SRui Ueyama   expect("=");
1175040af7deSRui Ueyama   return readExpr()().getValue();
11762ec34544SRui Ueyama }
11772ec34544SRui Ueyama 
11782ec34544SRui Ueyama // Parse the MEMORY command as specified in:
11792ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/MEMORY.html
11802ec34544SRui Ueyama //
11812ec34544SRui Ueyama // MEMORY { name [(attr)] : ORIGIN = origin, LENGTH = len ... }
11822ec34544SRui Ueyama void ScriptParser::readMemory() {
11832ec34544SRui Ueyama   expect("{");
11842ec34544SRui Ueyama   while (!Error && !consume("}")) {
11852ec34544SRui Ueyama     StringRef Name = next();
11862ec34544SRui Ueyama 
11872ec34544SRui Ueyama     uint32_t Flags = 0;
11882ec34544SRui Ueyama     uint32_t NegFlags = 0;
11892ec34544SRui Ueyama     if (consume("(")) {
11902ec34544SRui Ueyama       std::tie(Flags, NegFlags) = readMemoryAttributes();
11912ec34544SRui Ueyama       expect(")");
11922ec34544SRui Ueyama     }
11932ec34544SRui Ueyama     expect(":");
11942ec34544SRui Ueyama 
11952ec34544SRui Ueyama     uint64_t Origin = readMemoryAssignment("ORIGIN", "org", "o");
11962ec34544SRui Ueyama     expect(",");
11972ec34544SRui Ueyama     uint64_t Length = readMemoryAssignment("LENGTH", "len", "l");
11982ec34544SRui Ueyama 
11992ec34544SRui Ueyama     // Add the memory region to the region map (if it doesn't already exist).
12002ec34544SRui Ueyama     auto It = Script->Opt.MemoryRegions.find(Name);
12012ec34544SRui Ueyama     if (It != Script->Opt.MemoryRegions.end())
12022ec34544SRui Ueyama       setError("region '" + Name + "' already defined");
12032ec34544SRui Ueyama     else
1204906e9a18SPeter Smith       Script->Opt.MemoryRegions[Name] = {Name, Origin, Length, Flags, NegFlags};
12052ec34544SRui Ueyama   }
12062ec34544SRui Ueyama }
12072ec34544SRui Ueyama 
12082ec34544SRui Ueyama // This function parses the attributes used to match against section
12092ec34544SRui Ueyama // flags when placing output sections in a memory region. These flags
12102ec34544SRui Ueyama // are only used when an explicit memory region name is not used.
12112ec34544SRui Ueyama std::pair<uint32_t, uint32_t> ScriptParser::readMemoryAttributes() {
12122ec34544SRui Ueyama   uint32_t Flags = 0;
12132ec34544SRui Ueyama   uint32_t NegFlags = 0;
12142ec34544SRui Ueyama   bool Invert = false;
12152ec34544SRui Ueyama 
12162ec34544SRui Ueyama   for (char C : next().lower()) {
12172ec34544SRui Ueyama     uint32_t Flag = 0;
12182ec34544SRui Ueyama     if (C == '!')
12192ec34544SRui Ueyama       Invert = !Invert;
12202ec34544SRui Ueyama     else if (C == 'w')
12212ec34544SRui Ueyama       Flag = SHF_WRITE;
12222ec34544SRui Ueyama     else if (C == 'x')
12232ec34544SRui Ueyama       Flag = SHF_EXECINSTR;
12242ec34544SRui Ueyama     else if (C == 'a')
12252ec34544SRui Ueyama       Flag = SHF_ALLOC;
12262ec34544SRui Ueyama     else if (C != 'r')
12272ec34544SRui Ueyama       setError("invalid memory region attribute");
12282ec34544SRui Ueyama 
12292ec34544SRui Ueyama     if (Invert)
12302ec34544SRui Ueyama       NegFlags |= Flag;
12312ec34544SRui Ueyama     else
12322ec34544SRui Ueyama       Flags |= Flag;
12332ec34544SRui Ueyama   }
12342ec34544SRui Ueyama   return {Flags, NegFlags};
12352ec34544SRui Ueyama }
12362ec34544SRui Ueyama 
12372ec34544SRui Ueyama void elf::readLinkerScript(MemoryBufferRef MB) {
12382ec34544SRui Ueyama   ScriptParser(MB).readLinkerScript();
12392ec34544SRui Ueyama }
12402ec34544SRui Ueyama 
12412ec34544SRui Ueyama void elf::readVersionScript(MemoryBufferRef MB) {
12422ec34544SRui Ueyama   ScriptParser(MB).readVersionScript();
12432ec34544SRui Ueyama }
12442ec34544SRui Ueyama 
12452ec34544SRui Ueyama void elf::readDynamicList(MemoryBufferRef MB) {
12462ec34544SRui Ueyama   ScriptParser(MB).readDynamicList();
12472ec34544SRui Ueyama }
1248