12ec34544SRui Ueyama //===- ScriptParser.cpp ---------------------------------------------------===// 22ec34544SRui Ueyama // 32ec34544SRui Ueyama // The LLVM Linker 42ec34544SRui Ueyama // 52ec34544SRui Ueyama // This file is distributed under the University of Illinois Open Source 62ec34544SRui Ueyama // License. See LICENSE.TXT for details. 72ec34544SRui Ueyama // 82ec34544SRui Ueyama //===----------------------------------------------------------------------===// 905f6b852SRui Ueyama // 1005f6b852SRui Ueyama // This file contains a recursive-descendent parser for linker scripts. 1105f6b852SRui Ueyama // Parsed results are stored to Config and Script global objects. 1205f6b852SRui Ueyama // 1305f6b852SRui Ueyama //===----------------------------------------------------------------------===// 142ec34544SRui Ueyama 152ec34544SRui Ueyama #include "ScriptParser.h" 162ec34544SRui Ueyama #include "Config.h" 172ec34544SRui Ueyama #include "Driver.h" 182ec34544SRui Ueyama #include "InputSection.h" 192ec34544SRui Ueyama #include "LinkerScript.h" 202ec34544SRui Ueyama #include "OutputSections.h" 212ec34544SRui Ueyama #include "ScriptLexer.h" 222ec34544SRui Ueyama #include "Symbols.h" 232ec34544SRui Ueyama #include "Target.h" 242017d52bSRui Ueyama #include "lld/Common/Memory.h" 252ec34544SRui Ueyama #include "llvm/ADT/SmallString.h" 262ec34544SRui Ueyama #include "llvm/ADT/StringRef.h" 270440be4aSRui Ueyama #include "llvm/ADT/StringSet.h" 282ec34544SRui Ueyama #include "llvm/ADT/StringSwitch.h" 29264b5d9eSZachary Turner #include "llvm/BinaryFormat/ELF.h" 302ec34544SRui Ueyama #include "llvm/Support/Casting.h" 312ec34544SRui Ueyama #include "llvm/Support/ErrorHandling.h" 322ec34544SRui Ueyama #include "llvm/Support/FileSystem.h" 332ec34544SRui Ueyama #include "llvm/Support/Path.h" 342ec34544SRui Ueyama #include <cassert> 352ec34544SRui Ueyama #include <limits> 362ec34544SRui Ueyama #include <vector> 372ec34544SRui Ueyama 382ec34544SRui Ueyama using namespace llvm; 392ec34544SRui Ueyama using namespace llvm::ELF; 40b58079d4SRui Ueyama using namespace llvm::support::endian; 412ec34544SRui Ueyama using namespace lld; 422ec34544SRui Ueyama using namespace lld::elf; 432ec34544SRui Ueyama 442ec34544SRui Ueyama static bool isUnderSysroot(StringRef Path); 452ec34544SRui Ueyama 4696b3fe02SRui Ueyama namespace { 4796b3fe02SRui Ueyama class ScriptParser final : ScriptLexer { 482ec34544SRui Ueyama public: 492ec34544SRui Ueyama ScriptParser(MemoryBufferRef MB) 502ec34544SRui Ueyama : ScriptLexer(MB), 512ec34544SRui Ueyama IsUnderSysroot(isUnderSysroot(MB.getBufferIdentifier())) {} 522ec34544SRui Ueyama 532ec34544SRui Ueyama void readLinkerScript(); 542ec34544SRui Ueyama void readVersionScript(); 552ec34544SRui Ueyama void readDynamicList(); 568c7e8cceSPetr Hosek void readDefsym(StringRef Name); 572ec34544SRui Ueyama 582ec34544SRui Ueyama private: 592ec34544SRui Ueyama void addFile(StringRef Path); 602ec34544SRui Ueyama 612ec34544SRui Ueyama void readAsNeeded(); 622ec34544SRui Ueyama void readEntry(); 632ec34544SRui Ueyama void readExtern(); 642ec34544SRui Ueyama void readGroup(); 652ec34544SRui Ueyama void readInclude(); 661d92aa73SRui Ueyama void readInput(); 672ec34544SRui Ueyama void readMemory(); 682ec34544SRui Ueyama void readOutput(); 692ec34544SRui Ueyama void readOutputArch(); 702ec34544SRui Ueyama void readOutputFormat(); 712ec34544SRui Ueyama void readPhdrs(); 725f37541cSGeorge Rimar void readRegionAlias(); 732ec34544SRui Ueyama void readSearchDir(); 742ec34544SRui Ueyama void readSections(); 75*e262bb1aSRui Ueyama void readTarget(); 762ec34544SRui Ueyama void readVersion(); 772ec34544SRui Ueyama void readVersionScriptCommand(); 782ec34544SRui Ueyama 79d30a78b3SGeorge Rimar SymbolAssignment *readSymbolAssignment(StringRef Name); 80f0403c60SRui Ueyama ByteCommand *readByteCommand(StringRef Tok); 812ec34544SRui Ueyama uint32_t readFill(); 828acbf1ccSRui Ueyama uint32_t parseFill(StringRef Tok); 838c022ca7SRafael Espindola void readSectionAddressType(OutputSection *Cmd); 84a582419aSGeorge Rimar OutputSection *readOverlaySectionDescription(); 858c022ca7SRafael Espindola OutputSection *readOutputSectionDescription(StringRef OutSec); 86a582419aSGeorge Rimar std::vector<BaseCommand *> readOverlay(); 872ec34544SRui Ueyama std::vector<StringRef> readOutputSectionPhdrs(); 882ec34544SRui Ueyama InputSectionDescription *readInputSectionDescription(StringRef Tok); 892ec34544SRui Ueyama StringMatcher readFilePatterns(); 902ec34544SRui Ueyama std::vector<SectionPattern> readInputSectionsList(); 912ec34544SRui Ueyama InputSectionDescription *readInputSectionRules(StringRef FilePattern); 922ec34544SRui Ueyama unsigned readPhdrType(); 932ec34544SRui Ueyama SortSectionPolicy readSortKind(); 942ec34544SRui Ueyama SymbolAssignment *readProvideHidden(bool Provide, bool Hidden); 95d30a78b3SGeorge Rimar SymbolAssignment *readAssignment(StringRef Tok); 962ec34544SRui Ueyama void readSort(); 97d30a78b3SGeorge Rimar Expr readAssert(); 985fb17128SGeorge Rimar Expr readConstant(); 995fb17128SGeorge Rimar Expr getPageSize(); 1002ec34544SRui Ueyama 1012ec34544SRui Ueyama uint64_t readMemoryAssignment(StringRef, StringRef, StringRef); 1022ec34544SRui Ueyama std::pair<uint32_t, uint32_t> readMemoryAttributes(); 1032ec34544SRui Ueyama 1047b91e213SGeorge Rimar Expr combine(StringRef Op, Expr L, Expr R); 1052ec34544SRui Ueyama Expr readExpr(); 1062ec34544SRui Ueyama Expr readExpr1(Expr Lhs, int MinPrec); 1072ec34544SRui Ueyama StringRef readParenLiteral(); 1082ec34544SRui Ueyama Expr readPrimary(); 1092ec34544SRui Ueyama Expr readTernary(Expr Cond); 1102ec34544SRui Ueyama Expr readParenExpr(); 1112ec34544SRui Ueyama 1122ec34544SRui Ueyama // For parsing version script. 1132ec34544SRui Ueyama std::vector<SymbolVersion> readVersionExtern(); 1142ec34544SRui Ueyama void readAnonymousDeclaration(); 1152ec34544SRui Ueyama void readVersionDeclaration(StringRef VerStr); 1162ec34544SRui Ueyama 1172ec34544SRui Ueyama std::pair<std::vector<SymbolVersion>, std::vector<SymbolVersion>> 1182ec34544SRui Ueyama readSymbols(); 1192ec34544SRui Ueyama 120fd06b025SRui Ueyama // True if a script being read is in a subdirectory specified by -sysroot. 1212ec34544SRui Ueyama bool IsUnderSysroot; 1220440be4aSRui Ueyama 1230440be4aSRui Ueyama // A set to detect an INCLUDE() cycle. 1240440be4aSRui Ueyama StringSet<> Seen; 1252ec34544SRui Ueyama }; 12696b3fe02SRui Ueyama } // namespace 1272ec34544SRui Ueyama 1281e77ad14SRui Ueyama static StringRef unquote(StringRef S) { 1291e77ad14SRui Ueyama if (S.startswith("\"")) 1301e77ad14SRui Ueyama return S.substr(1, S.size() - 2); 1311e77ad14SRui Ueyama return S; 1321e77ad14SRui Ueyama } 1331e77ad14SRui Ueyama 1342ec34544SRui Ueyama static bool isUnderSysroot(StringRef Path) { 1352ec34544SRui Ueyama if (Config->Sysroot == "") 1362ec34544SRui Ueyama return false; 1372ec34544SRui Ueyama for (; !Path.empty(); Path = sys::path::parent_path(Path)) 1382ec34544SRui Ueyama if (sys::fs::equivalent(Config->Sysroot, Path)) 1392ec34544SRui Ueyama return true; 1402ec34544SRui Ueyama return false; 1412ec34544SRui Ueyama } 1422ec34544SRui Ueyama 1432ec34544SRui Ueyama // Some operations only support one non absolute value. Move the 1442ec34544SRui Ueyama // absolute one to the right hand side for convenience. 1452ec34544SRui Ueyama static void moveAbsRight(ExprValue &A, ExprValue &B) { 14623be5e8dSRafael Espindola if (A.Sec == nullptr || (A.ForceAbsolute && !B.isAbsolute())) 1472ec34544SRui Ueyama std::swap(A, B); 1482ec34544SRui Ueyama if (!B.isAbsolute()) 14941c7ab4aSGeorge Rimar error(A.Loc + ": at least one side of the expression must be absolute"); 1502ec34544SRui Ueyama } 1512ec34544SRui Ueyama 1522ec34544SRui Ueyama static ExprValue add(ExprValue A, ExprValue B) { 1532ec34544SRui Ueyama moveAbsRight(A, B); 154a6acd23cSRafael Espindola return {A.Sec, A.ForceAbsolute, A.getSectionOffset() + B.getValue(), A.Loc}; 1552ec34544SRui Ueyama } 1562ec34544SRui Ueyama 1572ec34544SRui Ueyama static ExprValue sub(ExprValue A, ExprValue B) { 15863a4a98eSRafael Espindola // The distance between two symbols in sections is absolute. 1599cbb6dd1SRafael Espindola if (!A.isAbsolute() && !B.isAbsolute()) 1609cbb6dd1SRafael Espindola return A.getValue() - B.getValue(); 1614fbe3518SRui Ueyama return {A.Sec, false, A.getSectionOffset() - B.getValue(), A.Loc}; 1622ec34544SRui Ueyama } 1632ec34544SRui Ueyama 1642ec34544SRui Ueyama static ExprValue bitAnd(ExprValue A, ExprValue B) { 1652ec34544SRui Ueyama moveAbsRight(A, B); 1662ec34544SRui Ueyama return {A.Sec, A.ForceAbsolute, 16741c7ab4aSGeorge Rimar (A.getValue() & B.getValue()) - A.getSecAddr(), A.Loc}; 1682ec34544SRui Ueyama } 1692ec34544SRui Ueyama 1702ec34544SRui Ueyama static ExprValue bitOr(ExprValue A, ExprValue B) { 1712ec34544SRui Ueyama moveAbsRight(A, B); 1722ec34544SRui Ueyama return {A.Sec, A.ForceAbsolute, 17341c7ab4aSGeorge Rimar (A.getValue() | B.getValue()) - A.getSecAddr(), A.Loc}; 1742ec34544SRui Ueyama } 1752ec34544SRui Ueyama 1762ec34544SRui Ueyama void ScriptParser::readDynamicList() { 1778016bdfdSRafael Espindola Config->HasDynamicList = true; 1782ec34544SRui Ueyama expect("{"); 179d72d97b3SRafael Espindola std::vector<SymbolVersion> Locals; 180d72d97b3SRafael Espindola std::vector<SymbolVersion> Globals; 181d72d97b3SRafael Espindola std::tie(Locals, Globals) = readSymbols(); 182d72d97b3SRafael Espindola expect(";"); 183d72d97b3SRafael Espindola 184d72d97b3SRafael Espindola if (!atEOF()) { 1852ec34544SRui Ueyama setError("EOF expected, but got " + next()); 186d72d97b3SRafael Espindola return; 187d72d97b3SRafael Espindola } 188d72d97b3SRafael Espindola if (!Locals.empty()) { 189d72d97b3SRafael Espindola setError("\"local:\" scope not supported in --dynamic-list"); 190d72d97b3SRafael Espindola return; 191d72d97b3SRafael Espindola } 192d72d97b3SRafael Espindola 193d72d97b3SRafael Espindola for (SymbolVersion V : Globals) 194d72d97b3SRafael Espindola Config->DynamicList.push_back(V); 1952ec34544SRui Ueyama } 1962ec34544SRui Ueyama 1972ec34544SRui Ueyama void ScriptParser::readVersionScript() { 1982ec34544SRui Ueyama readVersionScriptCommand(); 1992ec34544SRui Ueyama if (!atEOF()) 2002ec34544SRui Ueyama setError("EOF expected, but got " + next()); 2012ec34544SRui Ueyama } 2022ec34544SRui Ueyama 2032ec34544SRui Ueyama void ScriptParser::readVersionScriptCommand() { 2042ec34544SRui Ueyama if (consume("{")) { 2052ec34544SRui Ueyama readAnonymousDeclaration(); 2062ec34544SRui Ueyama return; 2072ec34544SRui Ueyama } 2082ec34544SRui Ueyama 209b8a59c8aSBob Haarman while (!atEOF() && !errorCount() && peek() != "}") { 2102ec34544SRui Ueyama StringRef VerStr = next(); 2112ec34544SRui Ueyama if (VerStr == "{") { 2122ec34544SRui Ueyama setError("anonymous version definition is used in " 2132ec34544SRui Ueyama "combination with other version definitions"); 2142ec34544SRui Ueyama return; 2152ec34544SRui Ueyama } 2162ec34544SRui Ueyama expect("{"); 2172ec34544SRui Ueyama readVersionDeclaration(VerStr); 2182ec34544SRui Ueyama } 2192ec34544SRui Ueyama } 2202ec34544SRui Ueyama 2212ec34544SRui Ueyama void ScriptParser::readVersion() { 2222ec34544SRui Ueyama expect("{"); 2232ec34544SRui Ueyama readVersionScriptCommand(); 2242ec34544SRui Ueyama expect("}"); 2252ec34544SRui Ueyama } 2262ec34544SRui Ueyama 2272ec34544SRui Ueyama void ScriptParser::readLinkerScript() { 2282ec34544SRui Ueyama while (!atEOF()) { 2292ec34544SRui Ueyama StringRef Tok = next(); 2302ec34544SRui Ueyama if (Tok == ";") 2312ec34544SRui Ueyama continue; 2322ec34544SRui Ueyama 233d30a78b3SGeorge Rimar if (Tok == "ENTRY") { 2342ec34544SRui Ueyama readEntry(); 2352ec34544SRui Ueyama } else if (Tok == "EXTERN") { 2362ec34544SRui Ueyama readExtern(); 2371d92aa73SRui Ueyama } else if (Tok == "GROUP") { 2382ec34544SRui Ueyama readGroup(); 2392ec34544SRui Ueyama } else if (Tok == "INCLUDE") { 2402ec34544SRui Ueyama readInclude(); 2411d92aa73SRui Ueyama } else if (Tok == "INPUT") { 2421d92aa73SRui Ueyama readInput(); 2432ec34544SRui Ueyama } else if (Tok == "MEMORY") { 2442ec34544SRui Ueyama readMemory(); 2452ec34544SRui Ueyama } else if (Tok == "OUTPUT") { 2462ec34544SRui Ueyama readOutput(); 2472ec34544SRui Ueyama } else if (Tok == "OUTPUT_ARCH") { 2482ec34544SRui Ueyama readOutputArch(); 2492ec34544SRui Ueyama } else if (Tok == "OUTPUT_FORMAT") { 2502ec34544SRui Ueyama readOutputFormat(); 2512ec34544SRui Ueyama } else if (Tok == "PHDRS") { 2522ec34544SRui Ueyama readPhdrs(); 2535f37541cSGeorge Rimar } else if (Tok == "REGION_ALIAS") { 2545f37541cSGeorge Rimar readRegionAlias(); 2552ec34544SRui Ueyama } else if (Tok == "SEARCH_DIR") { 2562ec34544SRui Ueyama readSearchDir(); 2572ec34544SRui Ueyama } else if (Tok == "SECTIONS") { 2582ec34544SRui Ueyama readSections(); 259*e262bb1aSRui Ueyama } else if (Tok == "TARGET") { 260*e262bb1aSRui Ueyama readTarget(); 2612ec34544SRui Ueyama } else if (Tok == "VERSION") { 2622ec34544SRui Ueyama readVersion(); 263d30a78b3SGeorge Rimar } else if (SymbolAssignment *Cmd = readAssignment(Tok)) { 2646b394caaSRui Ueyama Script->SectionCommands.push_back(Cmd); 2652ec34544SRui Ueyama } else { 2662ec34544SRui Ueyama setError("unknown directive: " + Tok); 2672ec34544SRui Ueyama } 2682ec34544SRui Ueyama } 2692ec34544SRui Ueyama } 2702ec34544SRui Ueyama 2718c7e8cceSPetr Hosek void ScriptParser::readDefsym(StringRef Name) { 2728c7e8cceSPetr Hosek Expr E = readExpr(); 2738c7e8cceSPetr Hosek if (!atEOF()) 2748c7e8cceSPetr Hosek setError("EOF expected, but got " + next()); 275e88b76a9SGeorge Rimar SymbolAssignment *Cmd = make<SymbolAssignment>(Name, E, getCurrentLocation()); 2768c7e8cceSPetr Hosek Script->SectionCommands.push_back(Cmd); 2778c7e8cceSPetr Hosek } 2788c7e8cceSPetr Hosek 2792ec34544SRui Ueyama void ScriptParser::addFile(StringRef S) { 2802ec34544SRui Ueyama if (IsUnderSysroot && S.startswith("/")) { 2812ec34544SRui Ueyama SmallString<128> PathData; 2822ec34544SRui Ueyama StringRef Path = (Config->Sysroot + S).toStringRef(PathData); 2832ec34544SRui Ueyama if (sys::fs::exists(Path)) { 284a76349bfSEvgeniy Stepanov Driver->addFile(Saver.save(Path), /*WithLOption=*/false); 2852ec34544SRui Ueyama return; 2862ec34544SRui Ueyama } 2872ec34544SRui Ueyama } 2882ec34544SRui Ueyama 289875ae82bSRui Ueyama if (S.startswith("/")) { 290a76349bfSEvgeniy Stepanov Driver->addFile(S, /*WithLOption=*/false); 2912ec34544SRui Ueyama } else if (S.startswith("=")) { 2922ec34544SRui Ueyama if (Config->Sysroot.empty()) 293a76349bfSEvgeniy Stepanov Driver->addFile(S.substr(1), /*WithLOption=*/false); 2942ec34544SRui Ueyama else 295a76349bfSEvgeniy Stepanov Driver->addFile(Saver.save(Config->Sysroot + "/" + S.substr(1)), 296a76349bfSEvgeniy Stepanov /*WithLOption=*/false); 2972ec34544SRui Ueyama } else if (S.startswith("-l")) { 2982ec34544SRui Ueyama Driver->addLibrary(S.substr(2)); 2992ec34544SRui Ueyama } else if (sys::fs::exists(S)) { 300a76349bfSEvgeniy Stepanov Driver->addFile(S, /*WithLOption=*/false); 3012ec34544SRui Ueyama } else { 3022ec34544SRui Ueyama if (Optional<std::string> Path = findFromSearchPaths(S)) 303a76349bfSEvgeniy Stepanov Driver->addFile(Saver.save(*Path), /*WithLOption=*/true); 3042ec34544SRui Ueyama else 3052ec34544SRui Ueyama setError("unable to find " + S); 3062ec34544SRui Ueyama } 3072ec34544SRui Ueyama } 3082ec34544SRui Ueyama 3092ec34544SRui Ueyama void ScriptParser::readAsNeeded() { 3102ec34544SRui Ueyama expect("("); 3112ec34544SRui Ueyama bool Orig = Config->AsNeeded; 3122ec34544SRui Ueyama Config->AsNeeded = true; 313b8a59c8aSBob Haarman while (!errorCount() && !consume(")")) 3142ec34544SRui Ueyama addFile(unquote(next())); 3152ec34544SRui Ueyama Config->AsNeeded = Orig; 3162ec34544SRui Ueyama } 3172ec34544SRui Ueyama 3182ec34544SRui Ueyama void ScriptParser::readEntry() { 3192ec34544SRui Ueyama // -e <symbol> takes predecence over ENTRY(<symbol>). 3202ec34544SRui Ueyama expect("("); 3212ec34544SRui Ueyama StringRef Tok = next(); 3222ec34544SRui Ueyama if (Config->Entry.empty()) 3232ec34544SRui Ueyama Config->Entry = Tok; 3242ec34544SRui Ueyama expect(")"); 3252ec34544SRui Ueyama } 3262ec34544SRui Ueyama 3272ec34544SRui Ueyama void ScriptParser::readExtern() { 3282ec34544SRui Ueyama expect("("); 329b8a59c8aSBob Haarman while (!errorCount() && !consume(")")) 3302ec34544SRui Ueyama Config->Undefined.push_back(next()); 3312ec34544SRui Ueyama } 3322ec34544SRui Ueyama 3332ec34544SRui Ueyama void ScriptParser::readGroup() { 3341d92aa73SRui Ueyama bool Orig = InputFile::IsInGroup; 3351d92aa73SRui Ueyama InputFile::IsInGroup = true; 3361d92aa73SRui Ueyama readInput(); 3371d92aa73SRui Ueyama InputFile::IsInGroup = Orig; 338b72daf00SFangrui Song if (!Orig) 339b72daf00SFangrui Song ++InputFile::NextGroupId; 3402ec34544SRui Ueyama } 3412ec34544SRui Ueyama 3422ec34544SRui Ueyama void ScriptParser::readInclude() { 3432ec34544SRui Ueyama StringRef Tok = unquote(next()); 3442ec34544SRui Ueyama 3450440be4aSRui Ueyama if (!Seen.insert(Tok).second) { 3460440be4aSRui Ueyama setError("there is a cycle in linker script INCLUDEs"); 3470440be4aSRui Ueyama return; 3480440be4aSRui Ueyama } 3490440be4aSRui Ueyama 350c60f85d0SFangrui Song if (Optional<std::string> Path = searchScript(Tok)) { 3512ec34544SRui Ueyama if (Optional<MemoryBufferRef> MB = readFile(*Path)) 3522ec34544SRui Ueyama tokenize(*MB); 3532ec34544SRui Ueyama return; 3542ec34544SRui Ueyama } 3551de78471SAlexander Richardson setError("cannot find linker script " + Tok); 3562ec34544SRui Ueyama } 3572ec34544SRui Ueyama 3581d92aa73SRui Ueyama void ScriptParser::readInput() { 3591d92aa73SRui Ueyama expect("("); 3601d92aa73SRui Ueyama while (!errorCount() && !consume(")")) { 3611d92aa73SRui Ueyama if (consume("AS_NEEDED")) 3621d92aa73SRui Ueyama readAsNeeded(); 3631d92aa73SRui Ueyama else 3641d92aa73SRui Ueyama addFile(unquote(next())); 3651d92aa73SRui Ueyama } 3661d92aa73SRui Ueyama } 3671d92aa73SRui Ueyama 3682ec34544SRui Ueyama void ScriptParser::readOutput() { 3692ec34544SRui Ueyama // -o <file> takes predecence over OUTPUT(<file>). 3702ec34544SRui Ueyama expect("("); 3712ec34544SRui Ueyama StringRef Tok = next(); 3722ec34544SRui Ueyama if (Config->OutputFile.empty()) 3732ec34544SRui Ueyama Config->OutputFile = unquote(Tok); 3742ec34544SRui Ueyama expect(")"); 3752ec34544SRui Ueyama } 3762ec34544SRui Ueyama 3772ec34544SRui Ueyama void ScriptParser::readOutputArch() { 3782ec34544SRui Ueyama // OUTPUT_ARCH is ignored for now. 3792ec34544SRui Ueyama expect("("); 380b8a59c8aSBob Haarman while (!errorCount() && !consume(")")) 3812ec34544SRui Ueyama skip(); 3822ec34544SRui Ueyama } 3832ec34544SRui Ueyama 3842ec34544SRui Ueyama void ScriptParser::readOutputFormat() { 3852ec34544SRui Ueyama // Error checking only for now. 3862ec34544SRui Ueyama expect("("); 3872ec34544SRui Ueyama skip(); 388b579c439SRui Ueyama if (consume(")")) 3892ec34544SRui Ueyama return; 390b579c439SRui Ueyama expect(","); 3912ec34544SRui Ueyama skip(); 3922ec34544SRui Ueyama expect(","); 3932ec34544SRui Ueyama skip(); 3942ec34544SRui Ueyama expect(")"); 3952ec34544SRui Ueyama } 3962ec34544SRui Ueyama 3972ec34544SRui Ueyama void ScriptParser::readPhdrs() { 3982ec34544SRui Ueyama expect("{"); 3992ec34544SRui Ueyama 400b8a59c8aSBob Haarman while (!errorCount() && !consume("}")) { 4010ae2c24cSRui Ueyama PhdrsCommand Cmd; 4020ae2c24cSRui Ueyama Cmd.Name = next(); 4030ae2c24cSRui Ueyama Cmd.Type = readPhdrType(); 404b579c439SRui Ueyama 405b8a59c8aSBob Haarman while (!errorCount() && !consume(";")) { 406b579c439SRui Ueyama if (consume("FILEHDR")) 4070ae2c24cSRui Ueyama Cmd.HasFilehdr = true; 408b579c439SRui Ueyama else if (consume("PHDRS")) 4090ae2c24cSRui Ueyama Cmd.HasPhdrs = true; 410b579c439SRui Ueyama else if (consume("AT")) 4110ae2c24cSRui Ueyama Cmd.LMAExpr = readParenExpr(); 412b579c439SRui Ueyama else if (consume("FLAGS")) 4130ae2c24cSRui Ueyama Cmd.Flags = readParenExpr()().getValue(); 414b579c439SRui Ueyama else 415b579c439SRui Ueyama setError("unexpected header attribute: " + next()); 416b579c439SRui Ueyama } 4170ae2c24cSRui Ueyama 418ac27de9dSRui Ueyama Script->PhdrsCommands.push_back(Cmd); 4192ec34544SRui Ueyama } 4202ec34544SRui Ueyama } 4212ec34544SRui Ueyama 4225f37541cSGeorge Rimar void ScriptParser::readRegionAlias() { 4235f37541cSGeorge Rimar expect("("); 4245f37541cSGeorge Rimar StringRef Alias = unquote(next()); 4255f37541cSGeorge Rimar expect(","); 4265f37541cSGeorge Rimar StringRef Name = next(); 4275f37541cSGeorge Rimar expect(")"); 4285f37541cSGeorge Rimar 429ac27de9dSRui Ueyama if (Script->MemoryRegions.count(Alias)) 4305f37541cSGeorge Rimar setError("redefinition of memory region '" + Alias + "'"); 431ac27de9dSRui Ueyama if (!Script->MemoryRegions.count(Name)) 4325f37541cSGeorge Rimar setError("memory region '" + Name + "' is not defined"); 4338c825db2SGeorge Rimar Script->MemoryRegions.insert({Alias, Script->MemoryRegions[Name]}); 4345f37541cSGeorge Rimar } 4355f37541cSGeorge Rimar 4362ec34544SRui Ueyama void ScriptParser::readSearchDir() { 4372ec34544SRui Ueyama expect("("); 4382ec34544SRui Ueyama StringRef Tok = next(); 4392ec34544SRui Ueyama if (!Config->Nostdlib) 4402ec34544SRui Ueyama Config->SearchPaths.push_back(unquote(Tok)); 4412ec34544SRui Ueyama expect(")"); 4422ec34544SRui Ueyama } 4432ec34544SRui Ueyama 444a582419aSGeorge Rimar // This reads an overlay description. Overlays are used to describe output 445a582419aSGeorge Rimar // sections that use the same virtual memory range and normally would trigger 446a582419aSGeorge Rimar // linker's sections sanity check failures. 447a582419aSGeorge Rimar // https://sourceware.org/binutils/docs/ld/Overlay-Description.html#Overlay-Description 448a582419aSGeorge Rimar std::vector<BaseCommand *> ScriptParser::readOverlay() { 449a582419aSGeorge Rimar // VA and LMA expressions are optional, though for simplicity of 450a582419aSGeorge Rimar // implementation we assume they are not. That is what OVERLAY was designed 451a582419aSGeorge Rimar // for first of all: to allow sections with overlapping VAs at different LMAs. 452a582419aSGeorge Rimar Expr AddrExpr = readExpr(); 453a582419aSGeorge Rimar expect(":"); 454a582419aSGeorge Rimar expect("AT"); 455a582419aSGeorge Rimar Expr LMAExpr = readParenExpr(); 456a582419aSGeorge Rimar expect("{"); 457a582419aSGeorge Rimar 458a582419aSGeorge Rimar std::vector<BaseCommand *> V; 459a582419aSGeorge Rimar OutputSection *Prev = nullptr; 460a582419aSGeorge Rimar while (!errorCount() && !consume("}")) { 461a582419aSGeorge Rimar // VA is the same for all sections. The LMAs are consecutive in memory 462a582419aSGeorge Rimar // starting from the base load address specified. 463a582419aSGeorge Rimar OutputSection *OS = readOverlaySectionDescription(); 464a582419aSGeorge Rimar OS->AddrExpr = AddrExpr; 465a582419aSGeorge Rimar if (Prev) 466a582419aSGeorge Rimar OS->LMAExpr = [=] { return Prev->getLMA() + Prev->Size; }; 467a582419aSGeorge Rimar else 468a582419aSGeorge Rimar OS->LMAExpr = LMAExpr; 469a582419aSGeorge Rimar V.push_back(OS); 470a582419aSGeorge Rimar Prev = OS; 471a582419aSGeorge Rimar } 472a582419aSGeorge Rimar 473a582419aSGeorge Rimar // According to the specification, at the end of the overlay, the location 474a582419aSGeorge Rimar // counter should be equal to the overlay base address plus size of the 475a582419aSGeorge Rimar // largest section seen in the overlay. 476a582419aSGeorge Rimar // Here we want to create the Dot assignment command to achieve that. 477a582419aSGeorge Rimar Expr MoveDot = [=] { 478a582419aSGeorge Rimar uint64_t Max = 0; 479a582419aSGeorge Rimar for (BaseCommand *Cmd : V) 480a582419aSGeorge Rimar Max = std::max(Max, cast<OutputSection>(Cmd)->Size); 481a582419aSGeorge Rimar return AddrExpr().getValue() + Max; 482a582419aSGeorge Rimar }; 483a582419aSGeorge Rimar V.push_back(make<SymbolAssignment>(".", MoveDot, getCurrentLocation())); 484a582419aSGeorge Rimar return V; 485a582419aSGeorge Rimar } 486a582419aSGeorge Rimar 4872ec34544SRui Ueyama void ScriptParser::readSections() { 488a323e2a7SRui Ueyama Script->HasSectionsCommand = true; 489b579c439SRui Ueyama 4902ec34544SRui Ueyama // -no-rosegment is used to avoid placing read only non-executable sections in 4912ec34544SRui Ueyama // their own segment. We do the same if SECTIONS command is present in linker 4922ec34544SRui Ueyama // script. See comment for computeFlags(). 4932ec34544SRui Ueyama Config->SingleRoRx = true; 4942ec34544SRui Ueyama 4952ec34544SRui Ueyama expect("{"); 4969e2c8a9dSGeorge Rimar std::vector<BaseCommand *> V; 497b8a59c8aSBob Haarman while (!errorCount() && !consume("}")) { 4982ec34544SRui Ueyama StringRef Tok = next(); 499a582419aSGeorge Rimar if (Tok == "OVERLAY") { 500a582419aSGeorge Rimar for (BaseCommand *Cmd : readOverlay()) 501a582419aSGeorge Rimar V.push_back(Cmd); 502a582419aSGeorge Rimar continue; 503a582419aSGeorge Rimar } 504a582419aSGeorge Rimar 505d30a78b3SGeorge Rimar if (BaseCommand *Cmd = readAssignment(Tok)) 5069e2c8a9dSGeorge Rimar V.push_back(Cmd); 507d30a78b3SGeorge Rimar else 508d30a78b3SGeorge Rimar V.push_back(readOutputSectionDescription(Tok)); 5092ec34544SRui Ueyama } 5109e2c8a9dSGeorge Rimar 5119e2c8a9dSGeorge Rimar if (!atEOF() && consume("INSERT")) { 512796684b4SGeorge Rimar std::vector<BaseCommand *> *Dest = nullptr; 513796684b4SGeorge Rimar if (consume("AFTER")) 514796684b4SGeorge Rimar Dest = &Script->InsertAfterCommands[next()]; 515796684b4SGeorge Rimar else if (consume("BEFORE")) 516796684b4SGeorge Rimar Dest = &Script->InsertBeforeCommands[next()]; 517796684b4SGeorge Rimar else 518796684b4SGeorge Rimar setError("expected AFTER/BEFORE, but got '" + next() + "'"); 519796684b4SGeorge Rimar if (Dest) 520796684b4SGeorge Rimar Dest->insert(Dest->end(), V.begin(), V.end()); 5219e2c8a9dSGeorge Rimar return; 5229e2c8a9dSGeorge Rimar } 5239e2c8a9dSGeorge Rimar 5249e2c8a9dSGeorge Rimar Script->SectionCommands.insert(Script->SectionCommands.end(), V.begin(), 5259e2c8a9dSGeorge Rimar V.end()); 5262ec34544SRui Ueyama } 5272ec34544SRui Ueyama 528*e262bb1aSRui Ueyama void ScriptParser::readTarget() { 529*e262bb1aSRui Ueyama // TARGET(foo) is an alias for "--format foo". Unlike GNU linkers, 530*e262bb1aSRui Ueyama // we accept only a limited set of BFD names (i.e. "elf" or "binary") 531*e262bb1aSRui Ueyama // for --format. We recognize only /^elf/ and "binary" in the linker 532*e262bb1aSRui Ueyama // script as well. 533*e262bb1aSRui Ueyama expect("("); 534*e262bb1aSRui Ueyama StringRef Tok = next(); 535*e262bb1aSRui Ueyama expect(")"); 536*e262bb1aSRui Ueyama 537*e262bb1aSRui Ueyama if (Tok.startswith("elf")) 538*e262bb1aSRui Ueyama Config->FormatBinary = false; 539*e262bb1aSRui Ueyama else if (Tok == "binary") 540*e262bb1aSRui Ueyama Config->FormatBinary = true; 541*e262bb1aSRui Ueyama else 542*e262bb1aSRui Ueyama setError("unknown target: " + Tok); 543*e262bb1aSRui Ueyama } 544*e262bb1aSRui Ueyama 5452ec34544SRui Ueyama static int precedence(StringRef Op) { 5462ec34544SRui Ueyama return StringSwitch<int>(Op) 547a5005482SGeorge Rimar .Cases("*", "/", "%", 8) 548a5005482SGeorge Rimar .Cases("+", "-", 7) 549a5005482SGeorge Rimar .Cases("<<", ">>", 6) 550a5005482SGeorge Rimar .Cases("<", "<=", ">", ">=", "==", "!=", 5) 551a5005482SGeorge Rimar .Case("&", 4) 552a5005482SGeorge Rimar .Case("|", 3) 553a5005482SGeorge Rimar .Case("&&", 2) 554a5005482SGeorge Rimar .Case("||", 1) 5552ec34544SRui Ueyama .Default(-1); 5562ec34544SRui Ueyama } 5572ec34544SRui Ueyama 5582ec34544SRui Ueyama StringMatcher ScriptParser::readFilePatterns() { 5592ec34544SRui Ueyama std::vector<StringRef> V; 560b8a59c8aSBob Haarman while (!errorCount() && !consume(")")) 5612ec34544SRui Ueyama V.push_back(next()); 5622ec34544SRui Ueyama return StringMatcher(V); 5632ec34544SRui Ueyama } 5642ec34544SRui Ueyama 5652ec34544SRui Ueyama SortSectionPolicy ScriptParser::readSortKind() { 5662ec34544SRui Ueyama if (consume("SORT") || consume("SORT_BY_NAME")) 5672ec34544SRui Ueyama return SortSectionPolicy::Name; 5682ec34544SRui Ueyama if (consume("SORT_BY_ALIGNMENT")) 5692ec34544SRui Ueyama return SortSectionPolicy::Alignment; 5702ec34544SRui Ueyama if (consume("SORT_BY_INIT_PRIORITY")) 5712ec34544SRui Ueyama return SortSectionPolicy::Priority; 5722ec34544SRui Ueyama if (consume("SORT_NONE")) 5732ec34544SRui Ueyama return SortSectionPolicy::None; 5742ec34544SRui Ueyama return SortSectionPolicy::Default; 5752ec34544SRui Ueyama } 5762ec34544SRui Ueyama 57703fc8d1eSRui Ueyama // Reads SECTIONS command contents in the following form: 57803fc8d1eSRui Ueyama // 57903fc8d1eSRui Ueyama // <contents> ::= <elem>* 58003fc8d1eSRui Ueyama // <elem> ::= <exclude>? <glob-pattern> 58103fc8d1eSRui Ueyama // <exclude> ::= "EXCLUDE_FILE" "(" <glob-pattern>+ ")" 58203fc8d1eSRui Ueyama // 58303fc8d1eSRui Ueyama // For example, 58403fc8d1eSRui Ueyama // 58503fc8d1eSRui Ueyama // *(.foo EXCLUDE_FILE (a.o) .bar EXCLUDE_FILE (b.o) .baz) 58603fc8d1eSRui Ueyama // 58703fc8d1eSRui Ueyama // is parsed as ".foo", ".bar" with "a.o", and ".baz" with "b.o". 58803fc8d1eSRui Ueyama // The semantics of that is section .foo in any file, section .bar in 58903fc8d1eSRui Ueyama // any file but a.o, and section .baz in any file but b.o. 5902ec34544SRui Ueyama std::vector<SectionPattern> ScriptParser::readInputSectionsList() { 5912ec34544SRui Ueyama std::vector<SectionPattern> Ret; 592b8a59c8aSBob Haarman while (!errorCount() && peek() != ")") { 5932ec34544SRui Ueyama StringMatcher ExcludeFilePat; 5942ec34544SRui Ueyama if (consume("EXCLUDE_FILE")) { 5952ec34544SRui Ueyama expect("("); 5962ec34544SRui Ueyama ExcludeFilePat = readFilePatterns(); 5972ec34544SRui Ueyama } 5982ec34544SRui Ueyama 5992ec34544SRui Ueyama std::vector<StringRef> V; 600b8a59c8aSBob Haarman while (!errorCount() && peek() != ")" && peek() != "EXCLUDE_FILE") 6012ec34544SRui Ueyama V.push_back(next()); 6022ec34544SRui Ueyama 6032ec34544SRui Ueyama if (!V.empty()) 6042ec34544SRui Ueyama Ret.push_back({std::move(ExcludeFilePat), StringMatcher(V)}); 6052ec34544SRui Ueyama else 6062ec34544SRui Ueyama setError("section pattern is expected"); 6072ec34544SRui Ueyama } 6082ec34544SRui Ueyama return Ret; 6092ec34544SRui Ueyama } 6102ec34544SRui Ueyama 6112ec34544SRui Ueyama // Reads contents of "SECTIONS" directive. That directive contains a 6122ec34544SRui Ueyama // list of glob patterns for input sections. The grammar is as follows. 6132ec34544SRui Ueyama // 6142ec34544SRui Ueyama // <patterns> ::= <section-list> 6152ec34544SRui Ueyama // | <sort> "(" <section-list> ")" 6162ec34544SRui Ueyama // | <sort> "(" <sort> "(" <section-list> ")" ")" 6172ec34544SRui Ueyama // 6182ec34544SRui Ueyama // <sort> ::= "SORT" | "SORT_BY_NAME" | "SORT_BY_ALIGNMENT" 6192ec34544SRui Ueyama // | "SORT_BY_INIT_PRIORITY" | "SORT_NONE" 6202ec34544SRui Ueyama // 6212ec34544SRui Ueyama // <section-list> is parsed by readInputSectionsList(). 6222ec34544SRui Ueyama InputSectionDescription * 6232ec34544SRui Ueyama ScriptParser::readInputSectionRules(StringRef FilePattern) { 6242ec34544SRui Ueyama auto *Cmd = make<InputSectionDescription>(FilePattern); 6252ec34544SRui Ueyama expect("("); 6262ec34544SRui Ueyama 627b8a59c8aSBob Haarman while (!errorCount() && !consume(")")) { 6282ec34544SRui Ueyama SortSectionPolicy Outer = readSortKind(); 6292ec34544SRui Ueyama SortSectionPolicy Inner = SortSectionPolicy::Default; 6302ec34544SRui Ueyama std::vector<SectionPattern> V; 6312ec34544SRui Ueyama if (Outer != SortSectionPolicy::Default) { 6322ec34544SRui Ueyama expect("("); 6332ec34544SRui Ueyama Inner = readSortKind(); 6342ec34544SRui Ueyama if (Inner != SortSectionPolicy::Default) { 6352ec34544SRui Ueyama expect("("); 6362ec34544SRui Ueyama V = readInputSectionsList(); 6372ec34544SRui Ueyama expect(")"); 6382ec34544SRui Ueyama } else { 6392ec34544SRui Ueyama V = readInputSectionsList(); 6402ec34544SRui Ueyama } 6412ec34544SRui Ueyama expect(")"); 6422ec34544SRui Ueyama } else { 6432ec34544SRui Ueyama V = readInputSectionsList(); 6442ec34544SRui Ueyama } 6452ec34544SRui Ueyama 6462ec34544SRui Ueyama for (SectionPattern &Pat : V) { 6472ec34544SRui Ueyama Pat.SortInner = Inner; 6482ec34544SRui Ueyama Pat.SortOuter = Outer; 6492ec34544SRui Ueyama } 6502ec34544SRui Ueyama 6512ec34544SRui Ueyama std::move(V.begin(), V.end(), std::back_inserter(Cmd->SectionPatterns)); 6522ec34544SRui Ueyama } 6532ec34544SRui Ueyama return Cmd; 6542ec34544SRui Ueyama } 6552ec34544SRui Ueyama 6562ec34544SRui Ueyama InputSectionDescription * 6572ec34544SRui Ueyama ScriptParser::readInputSectionDescription(StringRef Tok) { 6582ec34544SRui Ueyama // Input section wildcard can be surrounded by KEEP. 6592ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/Input-Section-Keep.html#Input-Section-Keep 6602ec34544SRui Ueyama if (Tok == "KEEP") { 6612ec34544SRui Ueyama expect("("); 6622ec34544SRui Ueyama StringRef FilePattern = next(); 6632ec34544SRui Ueyama InputSectionDescription *Cmd = readInputSectionRules(FilePattern); 6642ec34544SRui Ueyama expect(")"); 665ac27de9dSRui Ueyama Script->KeptSections.push_back(Cmd); 6662ec34544SRui Ueyama return Cmd; 6672ec34544SRui Ueyama } 6682ec34544SRui Ueyama return readInputSectionRules(Tok); 6692ec34544SRui Ueyama } 6702ec34544SRui Ueyama 6712ec34544SRui Ueyama void ScriptParser::readSort() { 6722ec34544SRui Ueyama expect("("); 6732ec34544SRui Ueyama expect("CONSTRUCTORS"); 6742ec34544SRui Ueyama expect(")"); 6752ec34544SRui Ueyama } 6762ec34544SRui Ueyama 677d30a78b3SGeorge Rimar Expr ScriptParser::readAssert() { 6782ec34544SRui Ueyama expect("("); 6792ec34544SRui Ueyama Expr E = readExpr(); 6802ec34544SRui Ueyama expect(","); 6812ec34544SRui Ueyama StringRef Msg = unquote(next()); 6822ec34544SRui Ueyama expect(")"); 683b579c439SRui Ueyama 6842ec34544SRui Ueyama return [=] { 6852ec34544SRui Ueyama if (!E().getValue()) 6862ec34544SRui Ueyama error(Msg); 6872ec34544SRui Ueyama return Script->getDot(); 6882ec34544SRui Ueyama }; 6892ec34544SRui Ueyama } 6902ec34544SRui Ueyama 6912ec34544SRui Ueyama // Reads a FILL(expr) command. We handle the FILL command as an 6922ec34544SRui Ueyama // alias for =fillexp section attribute, which is different from 6932ec34544SRui Ueyama // what GNU linkers do. 6942ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Data.html 6952ec34544SRui Ueyama uint32_t ScriptParser::readFill() { 6962ec34544SRui Ueyama expect("("); 6978acbf1ccSRui Ueyama uint32_t V = parseFill(next()); 6982ec34544SRui Ueyama expect(")"); 6992ec34544SRui Ueyama return V; 7002ec34544SRui Ueyama } 7012ec34544SRui Ueyama 7021c08e9f5SGeorge Rimar // Reads an expression and/or the special directive for an output 7031c08e9f5SGeorge Rimar // section definition. Directive is one of following: "(NOLOAD)", 7041c08e9f5SGeorge Rimar // "(COPY)", "(INFO)" or "(OVERLAY)". 7053271d370SRui Ueyama // 7063271d370SRui Ueyama // An output section name can be followed by an address expression 7071c08e9f5SGeorge Rimar // and/or directive. This grammar is not LL(1) because "(" can be 70897f4d158SGeorge Rimar // interpreted as either the beginning of some expression or beginning 7091c08e9f5SGeorge Rimar // of directive. 7103271d370SRui Ueyama // 711b579c439SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Address.html 712fbb0463fSGeorge Rimar // https://sourceware.org/binutils/docs/ld/Output-Section-Type.html 7138c022ca7SRafael Espindola void ScriptParser::readSectionAddressType(OutputSection *Cmd) { 7143271d370SRui Ueyama if (consume("(")) { 7153271d370SRui Ueyama if (consume("NOLOAD")) { 7163271d370SRui Ueyama expect(")"); 7173271d370SRui Ueyama Cmd->Noload = true; 7183271d370SRui Ueyama return; 7193271d370SRui Ueyama } 7201c08e9f5SGeorge Rimar if (consume("COPY") || consume("INFO") || consume("OVERLAY")) { 7211c08e9f5SGeorge Rimar expect(")"); 7221c08e9f5SGeorge Rimar Cmd->NonAlloc = true; 7231c08e9f5SGeorge Rimar return; 7241c08e9f5SGeorge Rimar } 7253271d370SRui Ueyama Cmd->AddrExpr = readExpr(); 7263271d370SRui Ueyama expect(")"); 7273271d370SRui Ueyama } else { 7283271d370SRui Ueyama Cmd->AddrExpr = readExpr(); 7293271d370SRui Ueyama } 7303271d370SRui Ueyama 731fbb0463fSGeorge Rimar if (consume("(")) { 732fbb0463fSGeorge Rimar expect("NOLOAD"); 733fbb0463fSGeorge Rimar expect(")"); 734fbb0463fSGeorge Rimar Cmd->Noload = true; 735fbb0463fSGeorge Rimar } 736fbb0463fSGeorge Rimar } 737fbb0463fSGeorge Rimar 738f22ec9ddSGeorge Rimar static Expr checkAlignment(Expr E, std::string &Loc) { 739f22ec9ddSGeorge Rimar return [=] { 740f22ec9ddSGeorge Rimar uint64_t Alignment = std::max((uint64_t)1, E().getValue()); 741f22ec9ddSGeorge Rimar if (!isPowerOf2_64(Alignment)) { 742f22ec9ddSGeorge Rimar error(Loc + ": alignment must be power of 2"); 743f22ec9ddSGeorge Rimar return (uint64_t)1; // Return a dummy value. 744f22ec9ddSGeorge Rimar } 745f22ec9ddSGeorge Rimar return Alignment; 746f22ec9ddSGeorge Rimar }; 747f22ec9ddSGeorge Rimar } 748f22ec9ddSGeorge Rimar 749a582419aSGeorge Rimar OutputSection *ScriptParser::readOverlaySectionDescription() { 750a582419aSGeorge Rimar OutputSection *Cmd = 751a582419aSGeorge Rimar Script->createOutputSection(next(), getCurrentLocation()); 752a582419aSGeorge Rimar Cmd->InOverlay = true; 753a582419aSGeorge Rimar expect("{"); 754a582419aSGeorge Rimar while (!errorCount() && !consume("}")) 755a582419aSGeorge Rimar Cmd->SectionCommands.push_back(readInputSectionRules(next())); 756a582419aSGeorge Rimar Cmd->Phdrs = readOutputSectionPhdrs(); 757a582419aSGeorge Rimar return Cmd; 758a582419aSGeorge Rimar } 759a582419aSGeorge Rimar 7608c022ca7SRafael Espindola OutputSection *ScriptParser::readOutputSectionDescription(StringRef OutSec) { 7618c022ca7SRafael Espindola OutputSection *Cmd = 7628c022ca7SRafael Espindola Script->createOutputSection(OutSec, getCurrentLocation()); 7633271d370SRui Ueyama 764c4df670dSGeorge Rimar size_t SymbolsReferenced = Script->ReferencedSymbols.size(); 765c4df670dSGeorge Rimar 7663271d370SRui Ueyama if (peek() != ":") 7673271d370SRui Ueyama readSectionAddressType(Cmd); 7682ec34544SRui Ueyama expect(":"); 7692ec34544SRui Ueyama 770f22ec9ddSGeorge Rimar std::string Location = getCurrentLocation(); 7712ec34544SRui Ueyama if (consume("AT")) 7722ec34544SRui Ueyama Cmd->LMAExpr = readParenExpr(); 7732ec34544SRui Ueyama if (consume("ALIGN")) 774f22ec9ddSGeorge Rimar Cmd->AlignExpr = checkAlignment(readParenExpr(), Location); 7752ec34544SRui Ueyama if (consume("SUBALIGN")) 776f22ec9ddSGeorge Rimar Cmd->SubalignExpr = checkAlignment(readParenExpr(), Location); 7772ec34544SRui Ueyama 7782ec34544SRui Ueyama // Parse constraints. 7792ec34544SRui Ueyama if (consume("ONLY_IF_RO")) 7802ec34544SRui Ueyama Cmd->Constraint = ConstraintKind::ReadOnly; 7812ec34544SRui Ueyama if (consume("ONLY_IF_RW")) 7822ec34544SRui Ueyama Cmd->Constraint = ConstraintKind::ReadWrite; 7832ec34544SRui Ueyama expect("{"); 7842ec34544SRui Ueyama 785b8a59c8aSBob Haarman while (!errorCount() && !consume("}")) { 7862ec34544SRui Ueyama StringRef Tok = next(); 7872ec34544SRui Ueyama if (Tok == ";") { 7882ec34544SRui Ueyama // Empty commands are allowed. Do nothing here. 789d30a78b3SGeorge Rimar } else if (SymbolAssignment *Assign = readAssignment(Tok)) { 7906b394caaSRui Ueyama Cmd->SectionCommands.push_back(Assign); 791f0403c60SRui Ueyama } else if (ByteCommand *Data = readByteCommand(Tok)) { 7926b394caaSRui Ueyama Cmd->SectionCommands.push_back(Data); 7932ec34544SRui Ueyama } else if (Tok == "CONSTRUCTORS") { 7942ec34544SRui Ueyama // CONSTRUCTORS is a keyword to make the linker recognize C++ ctors/dtors 7952ec34544SRui Ueyama // by name. This is for very old file formats such as ECOFF/XCOFF. 7962ec34544SRui Ueyama // For ELF, we should ignore. 7972ec34544SRui Ueyama } else if (Tok == "FILL") { 7982ec34544SRui Ueyama Cmd->Filler = readFill(); 7992ec34544SRui Ueyama } else if (Tok == "SORT") { 8002ec34544SRui Ueyama readSort(); 8012ec34544SRui Ueyama } else if (peek() == "(") { 8026b394caaSRui Ueyama Cmd->SectionCommands.push_back(readInputSectionDescription(Tok)); 8032ec34544SRui Ueyama } else { 8042ec34544SRui Ueyama setError("unknown command " + Tok); 8052ec34544SRui Ueyama } 8062ec34544SRui Ueyama } 8072ec34544SRui Ueyama 8082ec34544SRui Ueyama if (consume(">")) 8092ec34544SRui Ueyama Cmd->MemoryRegionName = next(); 8102ec34544SRui Ueyama 8115d01a8beSGeorge Rimar if (consume("AT")) { 8125d01a8beSGeorge Rimar expect(">"); 8135d01a8beSGeorge Rimar Cmd->LMARegionName = next(); 8145d01a8beSGeorge Rimar } 8155d01a8beSGeorge Rimar 8165d01a8beSGeorge Rimar if (Cmd->LMAExpr && !Cmd->LMARegionName.empty()) 8175d01a8beSGeorge Rimar error("section can't have both LMA and a load region"); 8185d01a8beSGeorge Rimar 8192ec34544SRui Ueyama Cmd->Phdrs = readOutputSectionPhdrs(); 8202ec34544SRui Ueyama 8212ec34544SRui Ueyama if (consume("=")) 8228acbf1ccSRui Ueyama Cmd->Filler = parseFill(next()); 8232ec34544SRui Ueyama else if (peek().startswith("=")) 8248acbf1ccSRui Ueyama Cmd->Filler = parseFill(next().drop_front()); 8252ec34544SRui Ueyama 8262ec34544SRui Ueyama // Consume optional comma following output section command. 8272ec34544SRui Ueyama consume(","); 8282ec34544SRui Ueyama 829c4df670dSGeorge Rimar if (Script->ReferencedSymbols.size() > SymbolsReferenced) 830c4df670dSGeorge Rimar Cmd->ExpressionsUseSymbols = true; 8312ec34544SRui Ueyama return Cmd; 8322ec34544SRui Ueyama } 8332ec34544SRui Ueyama 8348acbf1ccSRui Ueyama // Parses a given string as a octal/decimal/hexadecimal number and 8358acbf1ccSRui Ueyama // returns it as a big-endian number. Used for `=<fillexp>`. 8362ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Fill.html 8372ec34544SRui Ueyama // 8388acbf1ccSRui Ueyama // When reading a hexstring, ld.bfd handles it as a blob of arbitrary 8398acbf1ccSRui Ueyama // size, while ld.gold always handles it as a 32-bit big-endian number. 8408acbf1ccSRui Ueyama // We are compatible with ld.gold because it's easier to implement. 8418acbf1ccSRui Ueyama uint32_t ScriptParser::parseFill(StringRef Tok) { 842b58079d4SRui Ueyama uint32_t V = 0; 843ab94768cSGeorge Rimar if (!to_integer(Tok, V)) 8442ec34544SRui Ueyama setError("invalid filler expression: " + Tok); 845b58079d4SRui Ueyama 846b58079d4SRui Ueyama uint32_t Buf; 847b58079d4SRui Ueyama write32be(&Buf, V); 848b58079d4SRui Ueyama return Buf; 8492ec34544SRui Ueyama } 8502ec34544SRui Ueyama 8512ec34544SRui Ueyama SymbolAssignment *ScriptParser::readProvideHidden(bool Provide, bool Hidden) { 8522ec34544SRui Ueyama expect("("); 853d30a78b3SGeorge Rimar SymbolAssignment *Cmd = readSymbolAssignment(next()); 8542ec34544SRui Ueyama Cmd->Provide = Provide; 8552ec34544SRui Ueyama Cmd->Hidden = Hidden; 8562ec34544SRui Ueyama expect(")"); 8572ec34544SRui Ueyama return Cmd; 8582ec34544SRui Ueyama } 8592ec34544SRui Ueyama 860d30a78b3SGeorge Rimar SymbolAssignment *ScriptParser::readAssignment(StringRef Tok) { 861d30a78b3SGeorge Rimar // Assert expression returns Dot, so this is equal to ".=." 862d30a78b3SGeorge Rimar if (Tok == "ASSERT") 863d30a78b3SGeorge Rimar return make<SymbolAssignment>(".", readAssert(), getCurrentLocation()); 864d30a78b3SGeorge Rimar 865e88b76a9SGeorge Rimar size_t OldPos = Pos; 8662ec34544SRui Ueyama SymbolAssignment *Cmd = nullptr; 867e88b76a9SGeorge Rimar if (peek() == "=" || peek() == "+=") 868d30a78b3SGeorge Rimar Cmd = readSymbolAssignment(Tok); 869e88b76a9SGeorge Rimar else if (Tok == "PROVIDE") 8702ec34544SRui Ueyama Cmd = readProvideHidden(true, false); 871e88b76a9SGeorge Rimar else if (Tok == "HIDDEN") 8722ec34544SRui Ueyama Cmd = readProvideHidden(false, true); 873e88b76a9SGeorge Rimar else if (Tok == "PROVIDE_HIDDEN") 8742ec34544SRui Ueyama Cmd = readProvideHidden(true, true); 875e88b76a9SGeorge Rimar 876e88b76a9SGeorge Rimar if (Cmd) { 877e88b76a9SGeorge Rimar Cmd->CommandString = 878e88b76a9SGeorge Rimar Tok.str() + " " + 879e88b76a9SGeorge Rimar llvm::join(Tokens.begin() + OldPos, Tokens.begin() + Pos, " "); 880e88b76a9SGeorge Rimar expect(";"); 8812ec34544SRui Ueyama } 8822ec34544SRui Ueyama return Cmd; 8832ec34544SRui Ueyama } 8842ec34544SRui Ueyama 885d30a78b3SGeorge Rimar SymbolAssignment *ScriptParser::readSymbolAssignment(StringRef Name) { 8862ec34544SRui Ueyama StringRef Op = next(); 8872ec34544SRui Ueyama assert(Op == "=" || Op == "+="); 8882ec34544SRui Ueyama Expr E = readExpr(); 8892ec34544SRui Ueyama if (Op == "+=") { 8902ec34544SRui Ueyama std::string Loc = getCurrentLocation(); 891722221f5SRui Ueyama E = [=] { return add(Script->getSymbolValue(Name, Loc), E()); }; 8922ec34544SRui Ueyama } 893e88b76a9SGeorge Rimar return make<SymbolAssignment>(Name, E, getCurrentLocation()); 8942ec34544SRui Ueyama } 8952ec34544SRui Ueyama 8962ec34544SRui Ueyama // This is an operator-precedence parser to parse a linker 8972ec34544SRui Ueyama // script expression. 8982ec34544SRui Ueyama Expr ScriptParser::readExpr() { 8992ec34544SRui Ueyama // Our lexer is context-aware. Set the in-expression bit so that 9002ec34544SRui Ueyama // they apply different tokenization rules. 9012ec34544SRui Ueyama bool Orig = InExpr; 9022ec34544SRui Ueyama InExpr = true; 9032ec34544SRui Ueyama Expr E = readExpr1(readPrimary(), 0); 9042ec34544SRui Ueyama InExpr = Orig; 9052ec34544SRui Ueyama return E; 9062ec34544SRui Ueyama } 9072ec34544SRui Ueyama 9087b91e213SGeorge Rimar Expr ScriptParser::combine(StringRef Op, Expr L, Expr R) { 9092ec34544SRui Ueyama if (Op == "+") 9102ec34544SRui Ueyama return [=] { return add(L(), R()); }; 9112ec34544SRui Ueyama if (Op == "-") 9122ec34544SRui Ueyama return [=] { return sub(L(), R()); }; 913b579c439SRui Ueyama if (Op == "*") 9141d20222aSRui Ueyama return [=] { return L().getValue() * R().getValue(); }; 9157b91e213SGeorge Rimar if (Op == "/") { 9167b91e213SGeorge Rimar std::string Loc = getCurrentLocation(); 9177b91e213SGeorge Rimar return [=]() -> uint64_t { 9187b91e213SGeorge Rimar if (uint64_t RV = R().getValue()) 9197b91e213SGeorge Rimar return L().getValue() / RV; 9207b91e213SGeorge Rimar error(Loc + ": division by zero"); 921067617f9SRui Ueyama return 0; 9227b91e213SGeorge Rimar }; 9237b91e213SGeorge Rimar } 9247b91e213SGeorge Rimar if (Op == "%") { 9257b91e213SGeorge Rimar std::string Loc = getCurrentLocation(); 9267b91e213SGeorge Rimar return [=]() -> uint64_t { 9277b91e213SGeorge Rimar if (uint64_t RV = R().getValue()) 9287b91e213SGeorge Rimar return L().getValue() % RV; 9297b91e213SGeorge Rimar error(Loc + ": modulo by zero"); 930067617f9SRui Ueyama return 0; 9317b91e213SGeorge Rimar }; 9327b91e213SGeorge Rimar } 9332ec34544SRui Ueyama if (Op == "<<") 9347e915511SRui Ueyama return [=] { return L().getValue() << R().getValue(); }; 9352ec34544SRui Ueyama if (Op == ">>") 9367e915511SRui Ueyama return [=] { return L().getValue() >> R().getValue(); }; 9372ec34544SRui Ueyama if (Op == "<") 9382ec34544SRui Ueyama return [=] { return L().getValue() < R().getValue(); }; 9392ec34544SRui Ueyama if (Op == ">") 9402ec34544SRui Ueyama return [=] { return L().getValue() > R().getValue(); }; 9412ec34544SRui Ueyama if (Op == ">=") 9422ec34544SRui Ueyama return [=] { return L().getValue() >= R().getValue(); }; 9432ec34544SRui Ueyama if (Op == "<=") 9442ec34544SRui Ueyama return [=] { return L().getValue() <= R().getValue(); }; 9452ec34544SRui Ueyama if (Op == "==") 9462ec34544SRui Ueyama return [=] { return L().getValue() == R().getValue(); }; 9472ec34544SRui Ueyama if (Op == "!=") 9482ec34544SRui Ueyama return [=] { return L().getValue() != R().getValue(); }; 949a5005482SGeorge Rimar if (Op == "||") 950a5005482SGeorge Rimar return [=] { return L().getValue() || R().getValue(); }; 951a5005482SGeorge Rimar if (Op == "&&") 952a5005482SGeorge Rimar return [=] { return L().getValue() && R().getValue(); }; 9532ec34544SRui Ueyama if (Op == "&") 9542ec34544SRui Ueyama return [=] { return bitAnd(L(), R()); }; 9552ec34544SRui Ueyama if (Op == "|") 9562ec34544SRui Ueyama return [=] { return bitOr(L(), R()); }; 9572ec34544SRui Ueyama llvm_unreachable("invalid operator"); 9582ec34544SRui Ueyama } 9592ec34544SRui Ueyama 9602ec34544SRui Ueyama // This is a part of the operator-precedence parser. This function 9612ec34544SRui Ueyama // assumes that the remaining token stream starts with an operator. 9622ec34544SRui Ueyama Expr ScriptParser::readExpr1(Expr Lhs, int MinPrec) { 963b8a59c8aSBob Haarman while (!atEOF() && !errorCount()) { 9642ec34544SRui Ueyama // Read an operator and an expression. 9652ec34544SRui Ueyama if (consume("?")) 9662ec34544SRui Ueyama return readTernary(Lhs); 9672ec34544SRui Ueyama StringRef Op1 = peek(); 9682ec34544SRui Ueyama if (precedence(Op1) < MinPrec) 9692ec34544SRui Ueyama break; 9702ec34544SRui Ueyama skip(); 9712ec34544SRui Ueyama Expr Rhs = readPrimary(); 9722ec34544SRui Ueyama 9732ec34544SRui Ueyama // Evaluate the remaining part of the expression first if the 9742ec34544SRui Ueyama // next operator has greater precedence than the previous one. 9752ec34544SRui Ueyama // For example, if we have read "+" and "3", and if the next 9762ec34544SRui Ueyama // operator is "*", then we'll evaluate 3 * ... part first. 9772ec34544SRui Ueyama while (!atEOF()) { 9782ec34544SRui Ueyama StringRef Op2 = peek(); 9792ec34544SRui Ueyama if (precedence(Op2) <= precedence(Op1)) 9802ec34544SRui Ueyama break; 9812ec34544SRui Ueyama Rhs = readExpr1(Rhs, precedence(Op2)); 9822ec34544SRui Ueyama } 9832ec34544SRui Ueyama 9842ec34544SRui Ueyama Lhs = combine(Op1, Lhs, Rhs); 9852ec34544SRui Ueyama } 9862ec34544SRui Ueyama return Lhs; 9872ec34544SRui Ueyama } 9882ec34544SRui Ueyama 9895fb17128SGeorge Rimar Expr ScriptParser::getPageSize() { 9905fb17128SGeorge Rimar std::string Location = getCurrentLocation(); 9915fb17128SGeorge Rimar return [=]() -> uint64_t { 9925fb17128SGeorge Rimar if (Target) 9932ec34544SRui Ueyama return Target->PageSize; 9945fb17128SGeorge Rimar error(Location + ": unable to calculate page size"); 9955fb17128SGeorge Rimar return 4096; // Return a dummy value. 9965fb17128SGeorge Rimar }; 9975fb17128SGeorge Rimar } 9985fb17128SGeorge Rimar 9995fb17128SGeorge Rimar Expr ScriptParser::readConstant() { 10005fb17128SGeorge Rimar StringRef S = readParenLiteral(); 10015fb17128SGeorge Rimar if (S == "COMMONPAGESIZE") 10025fb17128SGeorge Rimar return getPageSize(); 10032ec34544SRui Ueyama if (S == "MAXPAGESIZE") 10045fb17128SGeorge Rimar return [] { return Config->MaxPageSize; }; 10055fb17128SGeorge Rimar setError("unknown constant: " + S); 1006b068b037SGeorge Rimar return [] { return 0; }; 10072ec34544SRui Ueyama } 10082ec34544SRui Ueyama 10095c65088fSRui Ueyama // Parses Tok as an integer. It recognizes hexadecimal (prefixed with 10105c65088fSRui Ueyama // "0x" or suffixed with "H") and decimal numbers. Decimal numbers may 10115c65088fSRui Ueyama // have "K" (Ki) or "M" (Mi) suffixes. 10125c65088fSRui Ueyama static Optional<uint64_t> parseInt(StringRef Tok) { 10132ec34544SRui Ueyama // Hexadecimal 10145c65088fSRui Ueyama uint64_t Val; 10154092016bSRui Ueyama if (Tok.startswith_lower("0x")) { 10164092016bSRui Ueyama if (!to_integer(Tok.substr(2), Val, 16)) 10174092016bSRui Ueyama return None; 10185c65088fSRui Ueyama return Val; 10194092016bSRui Ueyama } 10204092016bSRui Ueyama if (Tok.endswith_lower("H")) { 10214092016bSRui Ueyama if (!to_integer(Tok.drop_back(), Val, 16)) 10224092016bSRui Ueyama return None; 10235c65088fSRui Ueyama return Val; 10244092016bSRui Ueyama } 10252ec34544SRui Ueyama 10262ec34544SRui Ueyama // Decimal 10272ec34544SRui Ueyama if (Tok.endswith_lower("K")) { 1028ab94768cSGeorge Rimar if (!to_integer(Tok.drop_back(), Val, 10)) 10295c65088fSRui Ueyama return None; 10305c65088fSRui Ueyama return Val * 1024; 10312ec34544SRui Ueyama } 10325c65088fSRui Ueyama if (Tok.endswith_lower("M")) { 1033ab94768cSGeorge Rimar if (!to_integer(Tok.drop_back(), Val, 10)) 10345c65088fSRui Ueyama return None; 10355c65088fSRui Ueyama return Val * 1024 * 1024; 10365c65088fSRui Ueyama } 1037ab94768cSGeorge Rimar if (!to_integer(Tok, Val, 10)) 10385c65088fSRui Ueyama return None; 10395c65088fSRui Ueyama return Val; 10402ec34544SRui Ueyama } 10412ec34544SRui Ueyama 1042f0403c60SRui Ueyama ByteCommand *ScriptParser::readByteCommand(StringRef Tok) { 1043b579c439SRui Ueyama int Size = StringSwitch<int>(Tok) 10442ec34544SRui Ueyama .Case("BYTE", 1) 10452ec34544SRui Ueyama .Case("SHORT", 2) 10462ec34544SRui Ueyama .Case("LONG", 4) 10472ec34544SRui Ueyama .Case("QUAD", 8) 10482ec34544SRui Ueyama .Default(-1); 10492ec34544SRui Ueyama if (Size == -1) 10502ec34544SRui Ueyama return nullptr; 105184bcabcbSGeorge Rimar 105284bcabcbSGeorge Rimar size_t OldPos = Pos; 105384bcabcbSGeorge Rimar Expr E = readParenExpr(); 105484bcabcbSGeorge Rimar std::string CommandString = 105584bcabcbSGeorge Rimar Tok.str() + " " + 105684bcabcbSGeorge Rimar llvm::join(Tokens.begin() + OldPos, Tokens.begin() + Pos, " "); 105784bcabcbSGeorge Rimar return make<ByteCommand>(E, Size, CommandString); 10582ec34544SRui Ueyama } 10592ec34544SRui Ueyama 10602ec34544SRui Ueyama StringRef ScriptParser::readParenLiteral() { 10612ec34544SRui Ueyama expect("("); 10625e9c7762SRafael Espindola bool Orig = InExpr; 10635e9c7762SRafael Espindola InExpr = false; 10642ec34544SRui Ueyama StringRef Tok = next(); 10655e9c7762SRafael Espindola InExpr = Orig; 10662ec34544SRui Ueyama expect(")"); 10672ec34544SRui Ueyama return Tok; 10682ec34544SRui Ueyama } 10692ec34544SRui Ueyama 1070617e2f98SRui Ueyama static void checkIfExists(OutputSection *Cmd, StringRef Location) { 107105c4f67cSRafael Espindola if (Cmd->Location.empty() && Script->ErrorOnMissingSection) 107205c4f67cSRafael Espindola error(Location + ": undefined section " + Cmd->Name); 107305c4f67cSRafael Espindola } 107405c4f67cSRafael Espindola 10752ec34544SRui Ueyama Expr ScriptParser::readPrimary() { 10762ec34544SRui Ueyama if (peek() == "(") 10772ec34544SRui Ueyama return readParenExpr(); 10782ec34544SRui Ueyama 10795c65088fSRui Ueyama if (consume("~")) { 10802ec34544SRui Ueyama Expr E = readPrimary(); 1081b2fb84a1SRui Ueyama return [=] { return ~E().getValue(); }; 10822ec34544SRui Ueyama } 10836f1d954eSHafiz Abid Qadeer if (consume("!")) { 10846f1d954eSHafiz Abid Qadeer Expr E = readPrimary(); 10856f1d954eSHafiz Abid Qadeer return [=] { return !E().getValue(); }; 10866f1d954eSHafiz Abid Qadeer } 10875c65088fSRui Ueyama if (consume("-")) { 10882ec34544SRui Ueyama Expr E = readPrimary(); 1089b2fb84a1SRui Ueyama return [=] { return -E().getValue(); }; 10902ec34544SRui Ueyama } 10912ec34544SRui Ueyama 10925c65088fSRui Ueyama StringRef Tok = next(); 10935c65088fSRui Ueyama std::string Location = getCurrentLocation(); 10945c65088fSRui Ueyama 10952ec34544SRui Ueyama // Built-in functions are parsed here. 10962ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/Builtin-Functions.html. 10972ec34544SRui Ueyama if (Tok == "ABSOLUTE") { 10982ec34544SRui Ueyama Expr Inner = readParenExpr(); 10992ec34544SRui Ueyama return [=] { 11002ec34544SRui Ueyama ExprValue I = Inner(); 11012ec34544SRui Ueyama I.ForceAbsolute = true; 11022ec34544SRui Ueyama return I; 11032ec34544SRui Ueyama }; 11042ec34544SRui Ueyama } 11052ec34544SRui Ueyama if (Tok == "ADDR") { 11062ec34544SRui Ueyama StringRef Name = readParenLiteral(); 11074fbe3518SRui Ueyama OutputSection *Sec = Script->getOrCreateOutputSection(Name); 110841c7ab4aSGeorge Rimar return [=]() -> ExprValue { 11094fbe3518SRui Ueyama checkIfExists(Sec, Location); 11104fbe3518SRui Ueyama return {Sec, false, 0, Location}; 111141c7ab4aSGeorge Rimar }; 11122ec34544SRui Ueyama } 11132ec34544SRui Ueyama if (Tok == "ALIGN") { 11142ec34544SRui Ueyama expect("("); 11152ec34544SRui Ueyama Expr E = readExpr(); 1116f22ec9ddSGeorge Rimar if (consume(")")) { 1117f22ec9ddSGeorge Rimar E = checkAlignment(E, Location); 1118f22ec9ddSGeorge Rimar return [=] { return alignTo(Script->getDot(), E().getValue()); }; 1119f22ec9ddSGeorge Rimar } 1120b579c439SRui Ueyama expect(","); 1121f22ec9ddSGeorge Rimar Expr E2 = checkAlignment(readExpr(), Location); 11222ec34544SRui Ueyama expect(")"); 11233c6de1a6SPetr Hosek return [=] { 11243c6de1a6SPetr Hosek ExprValue V = E(); 1125f22ec9ddSGeorge Rimar V.Alignment = E2().getValue(); 11263c6de1a6SPetr Hosek return V; 11273c6de1a6SPetr Hosek }; 11282ec34544SRui Ueyama } 11292ec34544SRui Ueyama if (Tok == "ALIGNOF") { 11302ec34544SRui Ueyama StringRef Name = readParenLiteral(); 11318c022ca7SRafael Espindola OutputSection *Cmd = Script->getOrCreateOutputSection(Name); 1132617e2f98SRui Ueyama return [=] { 1133617e2f98SRui Ueyama checkIfExists(Cmd, Location); 1134617e2f98SRui Ueyama return Cmd->Alignment; 1135617e2f98SRui Ueyama }; 11362ec34544SRui Ueyama } 11372ec34544SRui Ueyama if (Tok == "ASSERT") 1138d30a78b3SGeorge Rimar return readAssert(); 11395fb17128SGeorge Rimar if (Tok == "CONSTANT") 11405fb17128SGeorge Rimar return readConstant(); 11412ec34544SRui Ueyama if (Tok == "DATA_SEGMENT_ALIGN") { 11422ec34544SRui Ueyama expect("("); 11432ec34544SRui Ueyama Expr E = readExpr(); 11442ec34544SRui Ueyama expect(","); 11452ec34544SRui Ueyama readExpr(); 11462ec34544SRui Ueyama expect(")"); 114760833f6eSGeorge Rimar return [=] { 114860833f6eSGeorge Rimar return alignTo(Script->getDot(), std::max((uint64_t)1, E().getValue())); 114960833f6eSGeorge Rimar }; 11502ec34544SRui Ueyama } 11512ec34544SRui Ueyama if (Tok == "DATA_SEGMENT_END") { 11522ec34544SRui Ueyama expect("("); 11532ec34544SRui Ueyama expect("."); 11542ec34544SRui Ueyama expect(")"); 11552ec34544SRui Ueyama return [] { return Script->getDot(); }; 11562ec34544SRui Ueyama } 11572ec34544SRui Ueyama if (Tok == "DATA_SEGMENT_RELRO_END") { 11582ec34544SRui Ueyama // GNU linkers implements more complicated logic to handle 11592ec34544SRui Ueyama // DATA_SEGMENT_RELRO_END. We instead ignore the arguments and 11602ec34544SRui Ueyama // just align to the next page boundary for simplicity. 11612ec34544SRui Ueyama expect("("); 11622ec34544SRui Ueyama readExpr(); 11632ec34544SRui Ueyama expect(","); 11642ec34544SRui Ueyama readExpr(); 11652ec34544SRui Ueyama expect(")"); 11665fb17128SGeorge Rimar Expr E = getPageSize(); 11675fb17128SGeorge Rimar return [=] { return alignTo(Script->getDot(), E().getValue()); }; 11682ec34544SRui Ueyama } 11692ec34544SRui Ueyama if (Tok == "DEFINED") { 11702ec34544SRui Ueyama StringRef Name = readParenLiteral(); 11719b18f50fSRui Ueyama return [=] { return Symtab->find(Name) ? 1 : 0; }; 11722ec34544SRui Ueyama } 117391b95b61SRui Ueyama if (Tok == "LENGTH") { 117491b95b61SRui Ueyama StringRef Name = readParenLiteral(); 1175b068b037SGeorge Rimar if (Script->MemoryRegions.count(Name) == 0) { 117691b95b61SRui Ueyama setError("memory region not defined: " + Name); 1177b068b037SGeorge Rimar return [] { return 0; }; 1178b068b037SGeorge Rimar } 1179ac27de9dSRui Ueyama return [=] { return Script->MemoryRegions[Name]->Length; }; 118091b95b61SRui Ueyama } 11812ec34544SRui Ueyama if (Tok == "LOADADDR") { 11822ec34544SRui Ueyama StringRef Name = readParenLiteral(); 11838c022ca7SRafael Espindola OutputSection *Cmd = Script->getOrCreateOutputSection(Name); 1184617e2f98SRui Ueyama return [=] { 1185617e2f98SRui Ueyama checkIfExists(Cmd, Location); 1186617e2f98SRui Ueyama return Cmd->getLMA(); 1187617e2f98SRui Ueyama }; 11882ec34544SRui Ueyama } 1189fd11560fSGeorge Rimar if (Tok == "MAX" || Tok == "MIN") { 1190fd11560fSGeorge Rimar expect("("); 1191fd11560fSGeorge Rimar Expr A = readExpr(); 1192fd11560fSGeorge Rimar expect(","); 1193fd11560fSGeorge Rimar Expr B = readExpr(); 1194fd11560fSGeorge Rimar expect(")"); 1195fd11560fSGeorge Rimar if (Tok == "MIN") 1196fd11560fSGeorge Rimar return [=] { return std::min(A().getValue(), B().getValue()); }; 1197fd11560fSGeorge Rimar return [=] { return std::max(A().getValue(), B().getValue()); }; 1198fd11560fSGeorge Rimar } 119991b95b61SRui Ueyama if (Tok == "ORIGIN") { 120091b95b61SRui Ueyama StringRef Name = readParenLiteral(); 1201b068b037SGeorge Rimar if (Script->MemoryRegions.count(Name) == 0) { 120291b95b61SRui Ueyama setError("memory region not defined: " + Name); 1203b068b037SGeorge Rimar return [] { return 0; }; 1204b068b037SGeorge Rimar } 1205ac27de9dSRui Ueyama return [=] { return Script->MemoryRegions[Name]->Origin; }; 120691b95b61SRui Ueyama } 12072ec34544SRui Ueyama if (Tok == "SEGMENT_START") { 12082ec34544SRui Ueyama expect("("); 12092ec34544SRui Ueyama skip(); 12102ec34544SRui Ueyama expect(","); 12112ec34544SRui Ueyama Expr E = readExpr(); 12122ec34544SRui Ueyama expect(")"); 12132ec34544SRui Ueyama return [=] { return E(); }; 12142ec34544SRui Ueyama } 12152ec34544SRui Ueyama if (Tok == "SIZEOF") { 12162ec34544SRui Ueyama StringRef Name = readParenLiteral(); 12178c022ca7SRafael Espindola OutputSection *Cmd = Script->getOrCreateOutputSection(Name); 121805c4f67cSRafael Espindola // Linker script does not create an output section if its content is empty. 121905c4f67cSRafael Espindola // We want to allow SIZEOF(.foo) where .foo is a section which happened to 122005c4f67cSRafael Espindola // be empty. 12218c022ca7SRafael Espindola return [=] { return Cmd->Size; }; 12222ec34544SRui Ueyama } 12232ec34544SRui Ueyama if (Tok == "SIZEOF_HEADERS") 12242ec34544SRui Ueyama return [=] { return elf::getHeaderSize(); }; 12252ec34544SRui Ueyama 12264eb2eccbSRui Ueyama // Tok is the dot. 12274eb2eccbSRui Ueyama if (Tok == ".") 1228722221f5SRui Ueyama return [=] { return Script->getSymbolValue(Tok, Location); }; 12294eb2eccbSRui Ueyama 12302ec34544SRui Ueyama // Tok is a literal number. 12315c65088fSRui Ueyama if (Optional<uint64_t> Val = parseInt(Tok)) 12325c65088fSRui Ueyama return [=] { return *Val; }; 12332ec34544SRui Ueyama 12342ec34544SRui Ueyama // Tok is a symbol name. 12352ec34544SRui Ueyama if (!isValidCIdentifier(Tok)) 12362ec34544SRui Ueyama setError("malformed number: " + Tok); 1237ac27de9dSRui Ueyama Script->ReferencedSymbols.push_back(Tok); 1238722221f5SRui Ueyama return [=] { return Script->getSymbolValue(Tok, Location); }; 12392ec34544SRui Ueyama } 12402ec34544SRui Ueyama 12412ec34544SRui Ueyama Expr ScriptParser::readTernary(Expr Cond) { 12422ec34544SRui Ueyama Expr L = readExpr(); 12432ec34544SRui Ueyama expect(":"); 12442ec34544SRui Ueyama Expr R = readExpr(); 12452ec34544SRui Ueyama return [=] { return Cond().getValue() ? L() : R(); }; 12462ec34544SRui Ueyama } 12472ec34544SRui Ueyama 12482ec34544SRui Ueyama Expr ScriptParser::readParenExpr() { 12492ec34544SRui Ueyama expect("("); 12502ec34544SRui Ueyama Expr E = readExpr(); 12512ec34544SRui Ueyama expect(")"); 12522ec34544SRui Ueyama return E; 12532ec34544SRui Ueyama } 12542ec34544SRui Ueyama 12552ec34544SRui Ueyama std::vector<StringRef> ScriptParser::readOutputSectionPhdrs() { 12562ec34544SRui Ueyama std::vector<StringRef> Phdrs; 1257b8a59c8aSBob Haarman while (!errorCount() && peek().startswith(":")) { 12582ec34544SRui Ueyama StringRef Tok = next(); 12592ec34544SRui Ueyama Phdrs.push_back((Tok.size() == 1) ? next() : Tok.substr(1)); 12602ec34544SRui Ueyama } 12612ec34544SRui Ueyama return Phdrs; 12622ec34544SRui Ueyama } 12632ec34544SRui Ueyama 12642ec34544SRui Ueyama // Read a program header type name. The next token must be a 12652ec34544SRui Ueyama // name of a program header type or a constant (e.g. "0x3"). 12662ec34544SRui Ueyama unsigned ScriptParser::readPhdrType() { 12672ec34544SRui Ueyama StringRef Tok = next(); 12685c65088fSRui Ueyama if (Optional<uint64_t> Val = parseInt(Tok)) 12695c65088fSRui Ueyama return *Val; 12702ec34544SRui Ueyama 12712ec34544SRui Ueyama unsigned Ret = StringSwitch<unsigned>(Tok) 12722ec34544SRui Ueyama .Case("PT_NULL", PT_NULL) 12732ec34544SRui Ueyama .Case("PT_LOAD", PT_LOAD) 12742ec34544SRui Ueyama .Case("PT_DYNAMIC", PT_DYNAMIC) 12752ec34544SRui Ueyama .Case("PT_INTERP", PT_INTERP) 12762ec34544SRui Ueyama .Case("PT_NOTE", PT_NOTE) 12772ec34544SRui Ueyama .Case("PT_SHLIB", PT_SHLIB) 12782ec34544SRui Ueyama .Case("PT_PHDR", PT_PHDR) 12792ec34544SRui Ueyama .Case("PT_TLS", PT_TLS) 12802ec34544SRui Ueyama .Case("PT_GNU_EH_FRAME", PT_GNU_EH_FRAME) 12812ec34544SRui Ueyama .Case("PT_GNU_STACK", PT_GNU_STACK) 12822ec34544SRui Ueyama .Case("PT_GNU_RELRO", PT_GNU_RELRO) 12832ec34544SRui Ueyama .Case("PT_OPENBSD_RANDOMIZE", PT_OPENBSD_RANDOMIZE) 12842ec34544SRui Ueyama .Case("PT_OPENBSD_WXNEEDED", PT_OPENBSD_WXNEEDED) 12852ec34544SRui Ueyama .Case("PT_OPENBSD_BOOTDATA", PT_OPENBSD_BOOTDATA) 12862ec34544SRui Ueyama .Default(-1); 12872ec34544SRui Ueyama 12882ec34544SRui Ueyama if (Ret == (unsigned)-1) { 12892ec34544SRui Ueyama setError("invalid program header type: " + Tok); 12902ec34544SRui Ueyama return PT_NULL; 12912ec34544SRui Ueyama } 12922ec34544SRui Ueyama return Ret; 12932ec34544SRui Ueyama } 12942ec34544SRui Ueyama 12952ec34544SRui Ueyama // Reads an anonymous version declaration. 12962ec34544SRui Ueyama void ScriptParser::readAnonymousDeclaration() { 12972ec34544SRui Ueyama std::vector<SymbolVersion> Locals; 12982ec34544SRui Ueyama std::vector<SymbolVersion> Globals; 12992ec34544SRui Ueyama std::tie(Locals, Globals) = readSymbols(); 13002ec34544SRui Ueyama 13012ec34544SRui Ueyama for (SymbolVersion V : Locals) { 13022ec34544SRui Ueyama if (V.Name == "*") 13032ec34544SRui Ueyama Config->DefaultSymbolVersion = VER_NDX_LOCAL; 13042ec34544SRui Ueyama else 13052ec34544SRui Ueyama Config->VersionScriptLocals.push_back(V); 13062ec34544SRui Ueyama } 13072ec34544SRui Ueyama 13082ec34544SRui Ueyama for (SymbolVersion V : Globals) 13092ec34544SRui Ueyama Config->VersionScriptGlobals.push_back(V); 13102ec34544SRui Ueyama 13112ec34544SRui Ueyama expect(";"); 13122ec34544SRui Ueyama } 13132ec34544SRui Ueyama 13142ec34544SRui Ueyama // Reads a non-anonymous version definition, 13152ec34544SRui Ueyama // e.g. "VerStr { global: foo; bar; local: *; };". 13162ec34544SRui Ueyama void ScriptParser::readVersionDeclaration(StringRef VerStr) { 13172ec34544SRui Ueyama // Read a symbol list. 13182ec34544SRui Ueyama std::vector<SymbolVersion> Locals; 13192ec34544SRui Ueyama std::vector<SymbolVersion> Globals; 13202ec34544SRui Ueyama std::tie(Locals, Globals) = readSymbols(); 13212ec34544SRui Ueyama 13222ec34544SRui Ueyama for (SymbolVersion V : Locals) { 13232ec34544SRui Ueyama if (V.Name == "*") 13242ec34544SRui Ueyama Config->DefaultSymbolVersion = VER_NDX_LOCAL; 13252ec34544SRui Ueyama else 13262ec34544SRui Ueyama Config->VersionScriptLocals.push_back(V); 13272ec34544SRui Ueyama } 13282ec34544SRui Ueyama 13292ec34544SRui Ueyama // Create a new version definition and add that to the global symbols. 13302ec34544SRui Ueyama VersionDefinition Ver; 13312ec34544SRui Ueyama Ver.Name = VerStr; 13322ec34544SRui Ueyama Ver.Globals = Globals; 13332ec34544SRui Ueyama 13342ec34544SRui Ueyama // User-defined version number starts from 2 because 0 and 1 are 13352ec34544SRui Ueyama // reserved for VER_NDX_LOCAL and VER_NDX_GLOBAL, respectively. 13362ec34544SRui Ueyama Ver.Id = Config->VersionDefinitions.size() + 2; 13372ec34544SRui Ueyama Config->VersionDefinitions.push_back(Ver); 13382ec34544SRui Ueyama 13392ec34544SRui Ueyama // Each version may have a parent version. For example, "Ver2" 13402ec34544SRui Ueyama // defined as "Ver2 { global: foo; local: *; } Ver1;" has "Ver1" 13412ec34544SRui Ueyama // as a parent. This version hierarchy is, probably against your 13422ec34544SRui Ueyama // instinct, purely for hint; the runtime doesn't care about it 13432ec34544SRui Ueyama // at all. In LLD, we simply ignore it. 13442ec34544SRui Ueyama if (peek() != ";") 13452ec34544SRui Ueyama skip(); 13462ec34544SRui Ueyama expect(";"); 13472ec34544SRui Ueyama } 13482ec34544SRui Ueyama 13491e77ad14SRui Ueyama static bool hasWildcard(StringRef S) { 13501e77ad14SRui Ueyama return S.find_first_of("?*[") != StringRef::npos; 13511e77ad14SRui Ueyama } 13521e77ad14SRui Ueyama 13532ec34544SRui Ueyama // Reads a list of symbols, e.g. "{ global: foo; bar; local: *; };". 13542ec34544SRui Ueyama std::pair<std::vector<SymbolVersion>, std::vector<SymbolVersion>> 13552ec34544SRui Ueyama ScriptParser::readSymbols() { 13562ec34544SRui Ueyama std::vector<SymbolVersion> Locals; 13572ec34544SRui Ueyama std::vector<SymbolVersion> Globals; 13582ec34544SRui Ueyama std::vector<SymbolVersion> *V = &Globals; 13592ec34544SRui Ueyama 1360b8a59c8aSBob Haarman while (!errorCount()) { 13612ec34544SRui Ueyama if (consume("}")) 13622ec34544SRui Ueyama break; 13632ec34544SRui Ueyama if (consumeLabel("local")) { 13642ec34544SRui Ueyama V = &Locals; 13652ec34544SRui Ueyama continue; 13662ec34544SRui Ueyama } 13672ec34544SRui Ueyama if (consumeLabel("global")) { 13682ec34544SRui Ueyama V = &Globals; 13692ec34544SRui Ueyama continue; 13702ec34544SRui Ueyama } 13712ec34544SRui Ueyama 13722ec34544SRui Ueyama if (consume("extern")) { 13732ec34544SRui Ueyama std::vector<SymbolVersion> Ext = readVersionExtern(); 13742ec34544SRui Ueyama V->insert(V->end(), Ext.begin(), Ext.end()); 13752ec34544SRui Ueyama } else { 13762ec34544SRui Ueyama StringRef Tok = next(); 13772ec34544SRui Ueyama V->push_back({unquote(Tok), false, hasWildcard(Tok)}); 13782ec34544SRui Ueyama } 13792ec34544SRui Ueyama expect(";"); 13802ec34544SRui Ueyama } 13812ec34544SRui Ueyama return {Locals, Globals}; 13822ec34544SRui Ueyama } 13832ec34544SRui Ueyama 13842ec34544SRui Ueyama // Reads an "extern C++" directive, e.g., 13852ec34544SRui Ueyama // "extern "C++" { ns::*; "f(int, double)"; };" 138617324d8bSRui Ueyama // 138717324d8bSRui Ueyama // The last semicolon is optional. E.g. this is OK: 138817324d8bSRui Ueyama // "extern "C++" { ns::*; "f(int, double)" };" 13892ec34544SRui Ueyama std::vector<SymbolVersion> ScriptParser::readVersionExtern() { 13902ec34544SRui Ueyama StringRef Tok = next(); 13912ec34544SRui Ueyama bool IsCXX = Tok == "\"C++\""; 13922ec34544SRui Ueyama if (!IsCXX && Tok != "\"C\"") 13932ec34544SRui Ueyama setError("Unknown language"); 13942ec34544SRui Ueyama expect("{"); 13952ec34544SRui Ueyama 13962ec34544SRui Ueyama std::vector<SymbolVersion> Ret; 1397b8a59c8aSBob Haarman while (!errorCount() && peek() != "}") { 13982ec34544SRui Ueyama StringRef Tok = next(); 13992ec34544SRui Ueyama bool HasWildcard = !Tok.startswith("\"") && hasWildcard(Tok); 14002ec34544SRui Ueyama Ret.push_back({unquote(Tok), IsCXX, HasWildcard}); 140117324d8bSRui Ueyama if (consume("}")) 140217324d8bSRui Ueyama return Ret; 14032ec34544SRui Ueyama expect(";"); 14042ec34544SRui Ueyama } 14052ec34544SRui Ueyama 14062ec34544SRui Ueyama expect("}"); 14072ec34544SRui Ueyama return Ret; 14082ec34544SRui Ueyama } 14092ec34544SRui Ueyama 14102ec34544SRui Ueyama uint64_t ScriptParser::readMemoryAssignment(StringRef S1, StringRef S2, 14112ec34544SRui Ueyama StringRef S3) { 1412b579c439SRui Ueyama if (!consume(S1) && !consume(S2) && !consume(S3)) { 14132ec34544SRui Ueyama setError("expected one of: " + S1 + ", " + S2 + ", or " + S3); 14142ec34544SRui Ueyama return 0; 14152ec34544SRui Ueyama } 14162ec34544SRui Ueyama expect("="); 1417040af7deSRui Ueyama return readExpr()().getValue(); 14182ec34544SRui Ueyama } 14192ec34544SRui Ueyama 14202ec34544SRui Ueyama // Parse the MEMORY command as specified in: 14212ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/MEMORY.html 14222ec34544SRui Ueyama // 14232ec34544SRui Ueyama // MEMORY { name [(attr)] : ORIGIN = origin, LENGTH = len ... } 14242ec34544SRui Ueyama void ScriptParser::readMemory() { 14252ec34544SRui Ueyama expect("{"); 1426b8a59c8aSBob Haarman while (!errorCount() && !consume("}")) { 14272ec34544SRui Ueyama StringRef Name = next(); 14282ec34544SRui Ueyama 14292ec34544SRui Ueyama uint32_t Flags = 0; 14302ec34544SRui Ueyama uint32_t NegFlags = 0; 14312ec34544SRui Ueyama if (consume("(")) { 14322ec34544SRui Ueyama std::tie(Flags, NegFlags) = readMemoryAttributes(); 14332ec34544SRui Ueyama expect(")"); 14342ec34544SRui Ueyama } 14352ec34544SRui Ueyama expect(":"); 14362ec34544SRui Ueyama 14372ec34544SRui Ueyama uint64_t Origin = readMemoryAssignment("ORIGIN", "org", "o"); 14382ec34544SRui Ueyama expect(","); 14392ec34544SRui Ueyama uint64_t Length = readMemoryAssignment("LENGTH", "len", "l"); 14402ec34544SRui Ueyama 14415f37541cSGeorge Rimar // Add the memory region to the region map. 1442490f0a4dSRafael Espindola MemoryRegion *MR = 1443490f0a4dSRafael Espindola make<MemoryRegion>(Name, Origin, Length, Flags, NegFlags); 14440984cfa9SGeorge Rimar if (!Script->MemoryRegions.insert({Name, MR}).second) 14450984cfa9SGeorge Rimar setError("region '" + Name + "' already defined"); 14462ec34544SRui Ueyama } 14472ec34544SRui Ueyama } 14482ec34544SRui Ueyama 14492ec34544SRui Ueyama // This function parses the attributes used to match against section 14502ec34544SRui Ueyama // flags when placing output sections in a memory region. These flags 14512ec34544SRui Ueyama // are only used when an explicit memory region name is not used. 14522ec34544SRui Ueyama std::pair<uint32_t, uint32_t> ScriptParser::readMemoryAttributes() { 14532ec34544SRui Ueyama uint32_t Flags = 0; 14542ec34544SRui Ueyama uint32_t NegFlags = 0; 14552ec34544SRui Ueyama bool Invert = false; 14562ec34544SRui Ueyama 14572ec34544SRui Ueyama for (char C : next().lower()) { 14582ec34544SRui Ueyama uint32_t Flag = 0; 14592ec34544SRui Ueyama if (C == '!') 14602ec34544SRui Ueyama Invert = !Invert; 14612ec34544SRui Ueyama else if (C == 'w') 14622ec34544SRui Ueyama Flag = SHF_WRITE; 14632ec34544SRui Ueyama else if (C == 'x') 14642ec34544SRui Ueyama Flag = SHF_EXECINSTR; 14652ec34544SRui Ueyama else if (C == 'a') 14662ec34544SRui Ueyama Flag = SHF_ALLOC; 14672ec34544SRui Ueyama else if (C != 'r') 14682ec34544SRui Ueyama setError("invalid memory region attribute"); 14692ec34544SRui Ueyama 14702ec34544SRui Ueyama if (Invert) 14712ec34544SRui Ueyama NegFlags |= Flag; 14722ec34544SRui Ueyama else 14732ec34544SRui Ueyama Flags |= Flag; 14742ec34544SRui Ueyama } 14752ec34544SRui Ueyama return {Flags, NegFlags}; 14762ec34544SRui Ueyama } 14772ec34544SRui Ueyama 14782ec34544SRui Ueyama void elf::readLinkerScript(MemoryBufferRef MB) { 14792ec34544SRui Ueyama ScriptParser(MB).readLinkerScript(); 14802ec34544SRui Ueyama } 14812ec34544SRui Ueyama 14822ec34544SRui Ueyama void elf::readVersionScript(MemoryBufferRef MB) { 14832ec34544SRui Ueyama ScriptParser(MB).readVersionScript(); 14842ec34544SRui Ueyama } 14852ec34544SRui Ueyama 14862ec34544SRui Ueyama void elf::readDynamicList(MemoryBufferRef MB) { 14872ec34544SRui Ueyama ScriptParser(MB).readDynamicList(); 14882ec34544SRui Ueyama } 14898c7e8cceSPetr Hosek 14908c7e8cceSPetr Hosek void elf::readDefsym(StringRef Name, MemoryBufferRef MB) { 14918c7e8cceSPetr Hosek ScriptParser(MB).readDefsym(Name); 14928c7e8cceSPetr Hosek } 1493