//===- ScriptParser.cpp ---------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file contains a recursive-descent parser for linker scripts.
// Parsed results are stored to Config and Script global objects.
//
//===----------------------------------------------------------------------===//

#include "ScriptParser.h"
#include "Config.h"
#include "Driver.h"
#include "InputSection.h"
#include "LinkerScript.h"
#include "OutputSections.h"
#include "ScriptLexer.h"
#include "Symbols.h"
#include "Target.h"
#include "lld/Common/Memory.h"
#include "llvm/ADT/SmallString.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/ADT/StringSet.h"
#include "llvm/ADT/StringSwitch.h"
#include "llvm/BinaryFormat/ELF.h"
#include "llvm/Support/Casting.h"
#include "llvm/Support/ErrorHandling.h"
#include "llvm/Support/FileSystem.h"
#include "llvm/Support/MathExtras.h"
#include "llvm/Support/Path.h"
#include "llvm/Support/ScopedPrinter.h"
35439341b9SJames Henderson #include "llvm/Support/TimeProfiler.h" 362ec34544SRui Ueyama #include <cassert> 372ec34544SRui Ueyama #include <limits> 382ec34544SRui Ueyama #include <vector> 392ec34544SRui Ueyama 402ec34544SRui Ueyama using namespace llvm; 412ec34544SRui Ueyama using namespace llvm::ELF; 42b58079d4SRui Ueyama using namespace llvm::support::endian; 4307837b8fSFangrui Song using namespace lld; 4407837b8fSFangrui Song using namespace lld::elf; 452ec34544SRui Ueyama 4696b3fe02SRui Ueyama namespace { 4796b3fe02SRui Ueyama class ScriptParser final : ScriptLexer { 482ec34544SRui Ueyama public: 493837f427SRui Ueyama ScriptParser(MemoryBufferRef mb) : ScriptLexer(mb) { 5011ae59f0SRui Ueyama // Initialize IsUnderSysroot 513837f427SRui Ueyama if (config->sysroot == "") 5211ae59f0SRui Ueyama return; 533837f427SRui Ueyama StringRef path = mb.getBufferIdentifier(); 543837f427SRui Ueyama for (; !path.empty(); path = sys::path::parent_path(path)) { 553837f427SRui Ueyama if (!sys::fs::equivalent(config->sysroot, path)) 5611ae59f0SRui Ueyama continue; 573837f427SRui Ueyama isUnderSysroot = true; 5811ae59f0SRui Ueyama return; 5911ae59f0SRui Ueyama } 6011ae59f0SRui Ueyama } 612ec34544SRui Ueyama 622ec34544SRui Ueyama void readLinkerScript(); 632ec34544SRui Ueyama void readVersionScript(); 642ec34544SRui Ueyama void readDynamicList(); 653837f427SRui Ueyama void readDefsym(StringRef name); 662ec34544SRui Ueyama 672ec34544SRui Ueyama private: 683837f427SRui Ueyama void addFile(StringRef path); 692ec34544SRui Ueyama 702ec34544SRui Ueyama void readAsNeeded(); 712ec34544SRui Ueyama void readEntry(); 722ec34544SRui Ueyama void readExtern(); 732ec34544SRui Ueyama void readGroup(); 742ec34544SRui Ueyama void readInclude(); 751d92aa73SRui Ueyama void readInput(); 762ec34544SRui Ueyama void readMemory(); 772ec34544SRui Ueyama void readOutput(); 782ec34544SRui Ueyama void readOutputArch(); 792ec34544SRui Ueyama void readOutputFormat(); 80899fdf54SFangrui Song void 
readOverwriteSections(); 812ec34544SRui Ueyama void readPhdrs(); 825f37541cSGeorge Rimar void readRegionAlias(); 832ec34544SRui Ueyama void readSearchDir(); 842ec34544SRui Ueyama void readSections(); 85e262bb1aSRui Ueyama void readTarget(); 862ec34544SRui Ueyama void readVersion(); 872ec34544SRui Ueyama void readVersionScriptCommand(); 882ec34544SRui Ueyama 893837f427SRui Ueyama SymbolAssignment *readSymbolAssignment(StringRef name); 903837f427SRui Ueyama ByteCommand *readByteCommand(StringRef tok); 91b0486051SSimon Atanasyan std::array<uint8_t, 4> readFill(); 923837f427SRui Ueyama bool readSectionDirective(OutputSection *cmd, StringRef tok1, StringRef tok2); 933837f427SRui Ueyama void readSectionAddressType(OutputSection *cmd); 94a582419aSGeorge Rimar OutputSection *readOverlaySectionDescription(); 953837f427SRui Ueyama OutputSection *readOutputSectionDescription(StringRef outSec); 96*64038ef8SFangrui Song SmallVector<SectionCommand *, 0> readOverlay(); 97a1c2ee01SFangrui Song SmallVector<StringRef, 0> readOutputSectionPhdrs(); 98dbd0ad33SPeter Smith std::pair<uint64_t, uint64_t> readInputSectionFlags(); 993837f427SRui Ueyama InputSectionDescription *readInputSectionDescription(StringRef tok); 1002ec34544SRui Ueyama StringMatcher readFilePatterns(); 101*64038ef8SFangrui Song SmallVector<SectionPattern, 0> readInputSectionsList(); 102dbd0ad33SPeter Smith InputSectionDescription *readInputSectionRules(StringRef filePattern, 103dbd0ad33SPeter Smith uint64_t withFlags, 104dbd0ad33SPeter Smith uint64_t withoutFlags); 1052ec34544SRui Ueyama unsigned readPhdrType(); 1062a9aed0eSFangrui Song SortSectionPolicy peekSortKind(); 1072ec34544SRui Ueyama SortSectionPolicy readSortKind(); 1083837f427SRui Ueyama SymbolAssignment *readProvideHidden(bool provide, bool hidden); 1093837f427SRui Ueyama SymbolAssignment *readAssignment(StringRef tok); 1102ec34544SRui Ueyama void readSort(); 111d30a78b3SGeorge Rimar Expr readAssert(); 1125fb17128SGeorge Rimar Expr readConstant(); 
1135fb17128SGeorge Rimar Expr getPageSize(); 1142ec34544SRui Ueyama 11592b5b980SFangrui Song Expr readMemoryAssignment(StringRef, StringRef, StringRef); 1168cdf1c1eSIgor Kudrin void readMemoryAttributes(uint32_t &flags, uint32_t &invFlags, 1178cdf1c1eSIgor Kudrin uint32_t &negFlags, uint32_t &negInvFlags); 1182ec34544SRui Ueyama 1193837f427SRui Ueyama Expr combine(StringRef op, Expr l, Expr r); 1202ec34544SRui Ueyama Expr readExpr(); 1213837f427SRui Ueyama Expr readExpr1(Expr lhs, int minPrec); 1222ec34544SRui Ueyama StringRef readParenLiteral(); 1232ec34544SRui Ueyama Expr readPrimary(); 1243837f427SRui Ueyama Expr readTernary(Expr cond); 1252ec34544SRui Ueyama Expr readParenExpr(); 1262ec34544SRui Ueyama 1272ec34544SRui Ueyama // For parsing version script. 128*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> readVersionExtern(); 1292ec34544SRui Ueyama void readAnonymousDeclaration(); 1303837f427SRui Ueyama void readVersionDeclaration(StringRef verStr); 1312ec34544SRui Ueyama 132*64038ef8SFangrui Song std::pair<SmallVector<SymbolVersion, 0>, SmallVector<SymbolVersion, 0>> 1332ec34544SRui Ueyama readSymbols(); 1342ec34544SRui Ueyama 135bf6e259bSFangrui Song // True if a script being read is in the --sysroot directory. 1363837f427SRui Ueyama bool isUnderSysroot = false; 1370440be4aSRui Ueyama 1380440be4aSRui Ueyama // A set to detect an INCLUDE() cycle. 1393837f427SRui Ueyama StringSet<> seen; 1402ec34544SRui Ueyama }; 14196b3fe02SRui Ueyama } // namespace 1422ec34544SRui Ueyama 1433837f427SRui Ueyama static StringRef unquote(StringRef s) { 1443837f427SRui Ueyama if (s.startswith("\"")) 1453837f427SRui Ueyama return s.substr(1, s.size() - 2); 1463837f427SRui Ueyama return s; 1471e77ad14SRui Ueyama } 1481e77ad14SRui Ueyama 1492ec34544SRui Ueyama // Some operations only support one non absolute value. Move the 1502ec34544SRui Ueyama // absolute one to the right hand side for convenience. 
1513837f427SRui Ueyama static void moveAbsRight(ExprValue &a, ExprValue &b) { 1523837f427SRui Ueyama if (a.sec == nullptr || (a.forceAbsolute && !b.isAbsolute())) 1533837f427SRui Ueyama std::swap(a, b); 1543837f427SRui Ueyama if (!b.isAbsolute()) 1553837f427SRui Ueyama error(a.loc + ": at least one side of the expression must be absolute"); 1562ec34544SRui Ueyama } 1572ec34544SRui Ueyama 1583837f427SRui Ueyama static ExprValue add(ExprValue a, ExprValue b) { 1593837f427SRui Ueyama moveAbsRight(a, b); 1603837f427SRui Ueyama return {a.sec, a.forceAbsolute, a.getSectionOffset() + b.getValue(), a.loc}; 1612ec34544SRui Ueyama } 1622ec34544SRui Ueyama 1633837f427SRui Ueyama static ExprValue sub(ExprValue a, ExprValue b) { 16463a4a98eSRafael Espindola // The distance between two symbols in sections is absolute. 1653837f427SRui Ueyama if (!a.isAbsolute() && !b.isAbsolute()) 1663837f427SRui Ueyama return a.getValue() - b.getValue(); 1673837f427SRui Ueyama return {a.sec, false, a.getSectionOffset() - b.getValue(), a.loc}; 1682ec34544SRui Ueyama } 1692ec34544SRui Ueyama 1703837f427SRui Ueyama static ExprValue bitAnd(ExprValue a, ExprValue b) { 1713837f427SRui Ueyama moveAbsRight(a, b); 1723837f427SRui Ueyama return {a.sec, a.forceAbsolute, 1733837f427SRui Ueyama (a.getValue() & b.getValue()) - a.getSecAddr(), a.loc}; 1742ec34544SRui Ueyama } 1752ec34544SRui Ueyama 1763837f427SRui Ueyama static ExprValue bitOr(ExprValue a, ExprValue b) { 1773837f427SRui Ueyama moveAbsRight(a, b); 1783837f427SRui Ueyama return {a.sec, a.forceAbsolute, 1793837f427SRui Ueyama (a.getValue() | b.getValue()) - a.getSecAddr(), a.loc}; 1802ec34544SRui Ueyama } 1812ec34544SRui Ueyama 1822ec34544SRui Ueyama void ScriptParser::readDynamicList() { 1832ec34544SRui Ueyama expect("{"); 184*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> locals; 185*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> globals; 1863837f427SRui Ueyama std::tie(locals, globals) = readSymbols(); 187d72d97b3SRafael Espindola 
expect(";"); 188d72d97b3SRafael Espindola 189d72d97b3SRafael Espindola if (!atEOF()) { 1902ec34544SRui Ueyama setError("EOF expected, but got " + next()); 191d72d97b3SRafael Espindola return; 192d72d97b3SRafael Espindola } 1933837f427SRui Ueyama if (!locals.empty()) { 194d72d97b3SRafael Espindola setError("\"local:\" scope not supported in --dynamic-list"); 195d72d97b3SRafael Espindola return; 196d72d97b3SRafael Espindola } 197d72d97b3SRafael Espindola 1983837f427SRui Ueyama for (SymbolVersion v : globals) 1993837f427SRui Ueyama config->dynamicList.push_back(v); 2002ec34544SRui Ueyama } 2012ec34544SRui Ueyama 2022ec34544SRui Ueyama void ScriptParser::readVersionScript() { 2032ec34544SRui Ueyama readVersionScriptCommand(); 2042ec34544SRui Ueyama if (!atEOF()) 2052ec34544SRui Ueyama setError("EOF expected, but got " + next()); 2062ec34544SRui Ueyama } 2072ec34544SRui Ueyama 2082ec34544SRui Ueyama void ScriptParser::readVersionScriptCommand() { 2092ec34544SRui Ueyama if (consume("{")) { 2102ec34544SRui Ueyama readAnonymousDeclaration(); 2112ec34544SRui Ueyama return; 2122ec34544SRui Ueyama } 2132ec34544SRui Ueyama 214b8a59c8aSBob Haarman while (!atEOF() && !errorCount() && peek() != "}") { 2153837f427SRui Ueyama StringRef verStr = next(); 2163837f427SRui Ueyama if (verStr == "{") { 2172ec34544SRui Ueyama setError("anonymous version definition is used in " 2182ec34544SRui Ueyama "combination with other version definitions"); 2192ec34544SRui Ueyama return; 2202ec34544SRui Ueyama } 2212ec34544SRui Ueyama expect("{"); 2223837f427SRui Ueyama readVersionDeclaration(verStr); 2232ec34544SRui Ueyama } 2242ec34544SRui Ueyama } 2252ec34544SRui Ueyama 2262ec34544SRui Ueyama void ScriptParser::readVersion() { 2272ec34544SRui Ueyama expect("{"); 2282ec34544SRui Ueyama readVersionScriptCommand(); 2292ec34544SRui Ueyama expect("}"); 2302ec34544SRui Ueyama } 2312ec34544SRui Ueyama 2322ec34544SRui Ueyama void ScriptParser::readLinkerScript() { 2332ec34544SRui Ueyama while (!atEOF()) { 
2343837f427SRui Ueyama StringRef tok = next(); 2353837f427SRui Ueyama if (tok == ";") 2362ec34544SRui Ueyama continue; 2372ec34544SRui Ueyama 2383837f427SRui Ueyama if (tok == "ENTRY") { 2392ec34544SRui Ueyama readEntry(); 2403837f427SRui Ueyama } else if (tok == "EXTERN") { 2412ec34544SRui Ueyama readExtern(); 2423837f427SRui Ueyama } else if (tok == "GROUP") { 2432ec34544SRui Ueyama readGroup(); 2443837f427SRui Ueyama } else if (tok == "INCLUDE") { 2452ec34544SRui Ueyama readInclude(); 2463837f427SRui Ueyama } else if (tok == "INPUT") { 2471d92aa73SRui Ueyama readInput(); 2483837f427SRui Ueyama } else if (tok == "MEMORY") { 2492ec34544SRui Ueyama readMemory(); 2503837f427SRui Ueyama } else if (tok == "OUTPUT") { 2512ec34544SRui Ueyama readOutput(); 2523837f427SRui Ueyama } else if (tok == "OUTPUT_ARCH") { 2532ec34544SRui Ueyama readOutputArch(); 2543837f427SRui Ueyama } else if (tok == "OUTPUT_FORMAT") { 2552ec34544SRui Ueyama readOutputFormat(); 256899fdf54SFangrui Song } else if (tok == "OVERWRITE_SECTIONS") { 257899fdf54SFangrui Song readOverwriteSections(); 2583837f427SRui Ueyama } else if (tok == "PHDRS") { 2592ec34544SRui Ueyama readPhdrs(); 2603837f427SRui Ueyama } else if (tok == "REGION_ALIAS") { 2615f37541cSGeorge Rimar readRegionAlias(); 2623837f427SRui Ueyama } else if (tok == "SEARCH_DIR") { 2632ec34544SRui Ueyama readSearchDir(); 2643837f427SRui Ueyama } else if (tok == "SECTIONS") { 2652ec34544SRui Ueyama readSections(); 2663837f427SRui Ueyama } else if (tok == "TARGET") { 267e262bb1aSRui Ueyama readTarget(); 2683837f427SRui Ueyama } else if (tok == "VERSION") { 2692ec34544SRui Ueyama readVersion(); 2703837f427SRui Ueyama } else if (SymbolAssignment *cmd = readAssignment(tok)) { 2713837f427SRui Ueyama script->sectionCommands.push_back(cmd); 2722ec34544SRui Ueyama } else { 2733837f427SRui Ueyama setError("unknown directive: " + tok); 2742ec34544SRui Ueyama } 2752ec34544SRui Ueyama } 2762ec34544SRui Ueyama } 2772ec34544SRui Ueyama 2783837f427SRui 
Ueyama void ScriptParser::readDefsym(StringRef name) { 279c1522816SGeorge Rimar if (errorCount()) 280c1522816SGeorge Rimar return; 2813837f427SRui Ueyama Expr e = readExpr(); 2828c7e8cceSPetr Hosek if (!atEOF()) 2838c7e8cceSPetr Hosek setError("EOF expected, but got " + next()); 2843837f427SRui Ueyama SymbolAssignment *cmd = make<SymbolAssignment>(name, e, getCurrentLocation()); 2853837f427SRui Ueyama script->sectionCommands.push_back(cmd); 2868c7e8cceSPetr Hosek } 2878c7e8cceSPetr Hosek 2883837f427SRui Ueyama void ScriptParser::addFile(StringRef s) { 2893837f427SRui Ueyama if (isUnderSysroot && s.startswith("/")) { 2903837f427SRui Ueyama SmallString<128> pathData; 2913837f427SRui Ueyama StringRef path = (config->sysroot + s).toStringRef(pathData); 2922508733eSFangrui Song if (sys::fs::exists(path)) 29349a3ad21SRui Ueyama driver->addFile(saver.save(path), /*withLOption=*/false); 2942508733eSFangrui Song else 2952508733eSFangrui Song setError("cannot find " + s + " inside " + config->sysroot); 2962ec34544SRui Ueyama return; 2972ec34544SRui Ueyama } 2982ec34544SRui Ueyama 2993837f427SRui Ueyama if (s.startswith("/")) { 300c384ca3cSFangrui Song // Case 1: s is an absolute path. Just open it. 30149a3ad21SRui Ueyama driver->addFile(s, /*withLOption=*/false); 3023837f427SRui Ueyama } else if (s.startswith("=")) { 303c384ca3cSFangrui Song // Case 2: relative to the sysroot. 3043837f427SRui Ueyama if (config->sysroot.empty()) 30549a3ad21SRui Ueyama driver->addFile(s.substr(1), /*withLOption=*/false); 3062ec34544SRui Ueyama else 307136d27abSRui Ueyama driver->addFile(saver.save(config->sysroot + "/" + s.substr(1)), 30849a3ad21SRui Ueyama /*withLOption=*/false); 3093837f427SRui Ueyama } else if (s.startswith("-l")) { 310c384ca3cSFangrui Song // Case 3: search in the list of library paths. 3113837f427SRui Ueyama driver->addLibrary(s.substr(2)); 312c384ca3cSFangrui Song } else { 313c384ca3cSFangrui Song // Case 4: s is a relative path. 
Search in the directory of the script file. 314c384ca3cSFangrui Song std::string filename = std::string(getCurrentMB().getBufferIdentifier()); 315c384ca3cSFangrui Song StringRef directory = sys::path::parent_path(filename); 316c384ca3cSFangrui Song if (!directory.empty()) { 317c384ca3cSFangrui Song SmallString<0> path(directory); 318c384ca3cSFangrui Song sys::path::append(path, s); 319c384ca3cSFangrui Song if (sys::fs::exists(path)) { 320c384ca3cSFangrui Song driver->addFile(path, /*withLOption=*/false); 321c384ca3cSFangrui Song return; 322c384ca3cSFangrui Song } 323c384ca3cSFangrui Song } 324c384ca3cSFangrui Song // Then search in the current working directory. 325c384ca3cSFangrui Song if (sys::fs::exists(s)) { 32649a3ad21SRui Ueyama driver->addFile(s, /*withLOption=*/false); 3272ec34544SRui Ueyama } else { 328c384ca3cSFangrui Song // Finally, search in the list of library paths. 3293837f427SRui Ueyama if (Optional<std::string> path = findFromSearchPaths(s)) 33049a3ad21SRui Ueyama driver->addFile(saver.save(*path), /*withLOption=*/true); 3312ec34544SRui Ueyama else 3323837f427SRui Ueyama setError("unable to find " + s); 3332ec34544SRui Ueyama } 3342ec34544SRui Ueyama } 335c384ca3cSFangrui Song } 3362ec34544SRui Ueyama 3372ec34544SRui Ueyama void ScriptParser::readAsNeeded() { 3382ec34544SRui Ueyama expect("("); 3393837f427SRui Ueyama bool orig = config->asNeeded; 3403837f427SRui Ueyama config->asNeeded = true; 341b8a59c8aSBob Haarman while (!errorCount() && !consume(")")) 3422ec34544SRui Ueyama addFile(unquote(next())); 3433837f427SRui Ueyama config->asNeeded = orig; 3442ec34544SRui Ueyama } 3452ec34544SRui Ueyama 3462ec34544SRui Ueyama void ScriptParser::readEntry() { 3472ec34544SRui Ueyama // -e <symbol> takes predecence over ENTRY(<symbol>). 
3482ec34544SRui Ueyama expect("("); 3493837f427SRui Ueyama StringRef tok = next(); 3503837f427SRui Ueyama if (config->entry.empty()) 3513837f427SRui Ueyama config->entry = tok; 3522ec34544SRui Ueyama expect(")"); 3532ec34544SRui Ueyama } 3542ec34544SRui Ueyama 3552ec34544SRui Ueyama void ScriptParser::readExtern() { 3562ec34544SRui Ueyama expect("("); 357b8a59c8aSBob Haarman while (!errorCount() && !consume(")")) 3583837f427SRui Ueyama config->undefined.push_back(unquote(next())); 3592ec34544SRui Ueyama } 3602ec34544SRui Ueyama 3612ec34544SRui Ueyama void ScriptParser::readGroup() { 3623837f427SRui Ueyama bool orig = InputFile::isInGroup; 3633837f427SRui Ueyama InputFile::isInGroup = true; 3641d92aa73SRui Ueyama readInput(); 3653837f427SRui Ueyama InputFile::isInGroup = orig; 3663837f427SRui Ueyama if (!orig) 3673837f427SRui Ueyama ++InputFile::nextGroupId; 3682ec34544SRui Ueyama } 3692ec34544SRui Ueyama 3702ec34544SRui Ueyama void ScriptParser::readInclude() { 3713837f427SRui Ueyama StringRef tok = unquote(next()); 3722ec34544SRui Ueyama 3733837f427SRui Ueyama if (!seen.insert(tok).second) { 3740440be4aSRui Ueyama setError("there is a cycle in linker script INCLUDEs"); 3750440be4aSRui Ueyama return; 3760440be4aSRui Ueyama } 3770440be4aSRui Ueyama 3783837f427SRui Ueyama if (Optional<std::string> path = searchScript(tok)) { 3793837f427SRui Ueyama if (Optional<MemoryBufferRef> mb = readFile(*path)) 3803837f427SRui Ueyama tokenize(*mb); 3812ec34544SRui Ueyama return; 3822ec34544SRui Ueyama } 3833837f427SRui Ueyama setError("cannot find linker script " + tok); 3842ec34544SRui Ueyama } 3852ec34544SRui Ueyama 3861d92aa73SRui Ueyama void ScriptParser::readInput() { 3871d92aa73SRui Ueyama expect("("); 3881d92aa73SRui Ueyama while (!errorCount() && !consume(")")) { 3891d92aa73SRui Ueyama if (consume("AS_NEEDED")) 3901d92aa73SRui Ueyama readAsNeeded(); 3911d92aa73SRui Ueyama else 3921d92aa73SRui Ueyama addFile(unquote(next())); 3931d92aa73SRui Ueyama } 3941d92aa73SRui Ueyama 
} 3951d92aa73SRui Ueyama 3962ec34544SRui Ueyama void ScriptParser::readOutput() { 3972ec34544SRui Ueyama // -o <file> takes predecence over OUTPUT(<file>). 3982ec34544SRui Ueyama expect("("); 3993837f427SRui Ueyama StringRef tok = next(); 4003837f427SRui Ueyama if (config->outputFile.empty()) 4013837f427SRui Ueyama config->outputFile = unquote(tok); 4022ec34544SRui Ueyama expect(")"); 4032ec34544SRui Ueyama } 4042ec34544SRui Ueyama 4052ec34544SRui Ueyama void ScriptParser::readOutputArch() { 4062ec34544SRui Ueyama // OUTPUT_ARCH is ignored for now. 4072ec34544SRui Ueyama expect("("); 408b8a59c8aSBob Haarman while (!errorCount() && !consume(")")) 4092ec34544SRui Ueyama skip(); 4102ec34544SRui Ueyama } 4112ec34544SRui Ueyama 4123837f427SRui Ueyama static std::pair<ELFKind, uint16_t> parseBfdName(StringRef s) { 4133837f427SRui Ueyama return StringSwitch<std::pair<ELFKind, uint16_t>>(s) 4144f8c8228SRui Ueyama .Case("elf32-i386", {ELF32LEKind, EM_386}) 4154f8c8228SRui Ueyama .Case("elf32-iamcu", {ELF32LEKind, EM_IAMCU}) 4164f8c8228SRui Ueyama .Case("elf32-littlearm", {ELF32LEKind, EM_ARM}) 4174f8c8228SRui Ueyama .Case("elf32-x86-64", {ELF32LEKind, EM_X86_64}) 41819b134ccSDimitry Andric .Case("elf64-aarch64", {ELF64LEKind, EM_AARCH64}) 4194f8c8228SRui Ueyama .Case("elf64-littleaarch64", {ELF64LEKind, EM_AARCH64}) 4207605a9a0SFangrui Song .Case("elf64-bigaarch64", {ELF64BEKind, EM_AARCH64}) 4214134143cSRui Ueyama .Case("elf32-powerpc", {ELF32BEKind, EM_PPC}) 422275eb828SBrandon Bergren .Case("elf32-powerpcle", {ELF32LEKind, EM_PPC}) 4234f8c8228SRui Ueyama .Case("elf64-powerpc", {ELF64BEKind, EM_PPC64}) 4244f8c8228SRui Ueyama .Case("elf64-powerpcle", {ELF64LEKind, EM_PPC64}) 4254f8c8228SRui Ueyama .Case("elf64-x86-64", {ELF64LEKind, EM_X86_64}) 4264134143cSRui Ueyama .Cases("elf32-tradbigmips", "elf32-bigmips", {ELF32BEKind, EM_MIPS}) 4274f8c8228SRui Ueyama .Case("elf32-ntradbigmips", {ELF32BEKind, EM_MIPS}) 4284f8c8228SRui Ueyama .Case("elf32-tradlittlemips", 
{ELF32LEKind, EM_MIPS}) 4294f8c8228SRui Ueyama .Case("elf32-ntradlittlemips", {ELF32LEKind, EM_MIPS}) 4304f8c8228SRui Ueyama .Case("elf64-tradbigmips", {ELF64BEKind, EM_MIPS}) 4314f8c8228SRui Ueyama .Case("elf64-tradlittlemips", {ELF64LEKind, EM_MIPS}) 43244d908d7SFangrui Song .Case("elf32-littleriscv", {ELF32LEKind, EM_RISCV}) 43344d908d7SFangrui Song .Case("elf64-littleriscv", {ELF64LEKind, EM_RISCV}) 434aff950e9SLemonBoy .Case("elf64-sparc", {ELF64BEKind, EM_SPARCV9}) 43592c6141cSLemonBoy .Case("elf32-msp430", {ELF32LEKind, EM_MSP430}) 4364f8c8228SRui Ueyama .Default({ELFNoneKind, EM_NONE}); 437ea8cd00aSRui Ueyama } 438ea8cd00aSRui Ueyama 439eea34aaeSFangrui Song // Parse OUTPUT_FORMAT(bfdname) or OUTPUT_FORMAT(default, big, little). Choose 440eea34aaeSFangrui Song // big if -EB is specified, little if -EL is specified, or default if neither is 441eea34aaeSFangrui Song // specified. 4422ec34544SRui Ueyama void ScriptParser::readOutputFormat() { 4432ec34544SRui Ueyama expect("("); 444ea8cd00aSRui Ueyama 445eea34aaeSFangrui Song StringRef s; 4462822852fSShoaib Meenai config->bfdname = unquote(next()); 447eea34aaeSFangrui Song if (!consume(")")) { 448eea34aaeSFangrui Song expect(","); 449eea34aaeSFangrui Song s = unquote(next()); 450eea34aaeSFangrui Song if (config->optEB) 451eea34aaeSFangrui Song config->bfdname = s; 452eea34aaeSFangrui Song expect(","); 453eea34aaeSFangrui Song s = unquote(next()); 454eea34aaeSFangrui Song if (config->optEL) 455eea34aaeSFangrui Song config->bfdname = s; 456eea34aaeSFangrui Song consume(")"); 457eea34aaeSFangrui Song } 458eea34aaeSFangrui Song s = config->bfdname; 4593837f427SRui Ueyama if (s.consume_back("-freebsd")) 4603837f427SRui Ueyama config->osabi = ELFOSABI_FREEBSD; 4614f8c8228SRui Ueyama 4623837f427SRui Ueyama std::tie(config->ekind, config->emachine) = parseBfdName(s); 4633837f427SRui Ueyama if (config->emachine == EM_NONE) 4642822852fSShoaib Meenai setError("unknown output format name: " + config->bfdname); 
4653837f427SRui Ueyama if (s == "elf32-ntradlittlemips" || s == "elf32-ntradbigmips") 4663837f427SRui Ueyama config->mipsN32Abi = true; 46792c6141cSLemonBoy if (config->emachine == EM_MSP430) 46892c6141cSLemonBoy config->osabi = ELFOSABI_STANDALONE; 4692ec34544SRui Ueyama } 4702ec34544SRui Ueyama 4712ec34544SRui Ueyama void ScriptParser::readPhdrs() { 4722ec34544SRui Ueyama expect("{"); 4732ec34544SRui Ueyama 474b8a59c8aSBob Haarman while (!errorCount() && !consume("}")) { 4753837f427SRui Ueyama PhdrsCommand cmd; 4763837f427SRui Ueyama cmd.name = next(); 4773837f427SRui Ueyama cmd.type = readPhdrType(); 478b579c439SRui Ueyama 479b8a59c8aSBob Haarman while (!errorCount() && !consume(";")) { 480b579c439SRui Ueyama if (consume("FILEHDR")) 4813837f427SRui Ueyama cmd.hasFilehdr = true; 482b579c439SRui Ueyama else if (consume("PHDRS")) 4833837f427SRui Ueyama cmd.hasPhdrs = true; 484b579c439SRui Ueyama else if (consume("AT")) 4853837f427SRui Ueyama cmd.lmaExpr = readParenExpr(); 486b579c439SRui Ueyama else if (consume("FLAGS")) 4873837f427SRui Ueyama cmd.flags = readParenExpr()().getValue(); 488b579c439SRui Ueyama else 489b579c439SRui Ueyama setError("unexpected header attribute: " + next()); 490b579c439SRui Ueyama } 4910ae2c24cSRui Ueyama 4923837f427SRui Ueyama script->phdrsCommands.push_back(cmd); 4932ec34544SRui Ueyama } 4942ec34544SRui Ueyama } 4952ec34544SRui Ueyama 4965f37541cSGeorge Rimar void ScriptParser::readRegionAlias() { 4975f37541cSGeorge Rimar expect("("); 4983837f427SRui Ueyama StringRef alias = unquote(next()); 4995f37541cSGeorge Rimar expect(","); 5003837f427SRui Ueyama StringRef name = next(); 5015f37541cSGeorge Rimar expect(")"); 5025f37541cSGeorge Rimar 5033837f427SRui Ueyama if (script->memoryRegions.count(alias)) 5043837f427SRui Ueyama setError("redefinition of memory region '" + alias + "'"); 5053837f427SRui Ueyama if (!script->memoryRegions.count(name)) 5063837f427SRui Ueyama setError("memory region '" + name + "' is not defined"); 5073837f427SRui 
Ueyama script->memoryRegions.insert({alias, script->memoryRegions[name]}); 5085f37541cSGeorge Rimar } 5095f37541cSGeorge Rimar 5102ec34544SRui Ueyama void ScriptParser::readSearchDir() { 5112ec34544SRui Ueyama expect("("); 5123837f427SRui Ueyama StringRef tok = next(); 5133837f427SRui Ueyama if (!config->nostdlib) 5143837f427SRui Ueyama config->searchPaths.push_back(unquote(tok)); 5152ec34544SRui Ueyama expect(")"); 5162ec34544SRui Ueyama } 5172ec34544SRui Ueyama 518a582419aSGeorge Rimar // This reads an overlay description. Overlays are used to describe output 519a582419aSGeorge Rimar // sections that use the same virtual memory range and normally would trigger 520a582419aSGeorge Rimar // linker's sections sanity check failures. 521a582419aSGeorge Rimar // https://sourceware.org/binutils/docs/ld/Overlay-Description.html#Overlay-Description 522*64038ef8SFangrui Song SmallVector<SectionCommand *, 0> ScriptParser::readOverlay() { 523a582419aSGeorge Rimar // VA and LMA expressions are optional, though for simplicity of 524a582419aSGeorge Rimar // implementation we assume they are not. That is what OVERLAY was designed 525a582419aSGeorge Rimar // for first of all: to allow sections with overlapping VAs at different LMAs. 5263837f427SRui Ueyama Expr addrExpr = readExpr(); 527a582419aSGeorge Rimar expect(":"); 528a582419aSGeorge Rimar expect("AT"); 5293837f427SRui Ueyama Expr lmaExpr = readParenExpr(); 530a582419aSGeorge Rimar expect("{"); 531a582419aSGeorge Rimar 532*64038ef8SFangrui Song SmallVector<SectionCommand *, 0> v; 5333837f427SRui Ueyama OutputSection *prev = nullptr; 534a582419aSGeorge Rimar while (!errorCount() && !consume("}")) { 535a582419aSGeorge Rimar // VA is the same for all sections. The LMAs are consecutive in memory 536a582419aSGeorge Rimar // starting from the base load address specified. 
5373837f427SRui Ueyama OutputSection *os = readOverlaySectionDescription(); 5383837f427SRui Ueyama os->addrExpr = addrExpr; 5393837f427SRui Ueyama if (prev) 5403837f427SRui Ueyama os->lmaExpr = [=] { return prev->getLMA() + prev->size; }; 541a582419aSGeorge Rimar else 5423837f427SRui Ueyama os->lmaExpr = lmaExpr; 5433837f427SRui Ueyama v.push_back(os); 5443837f427SRui Ueyama prev = os; 545a582419aSGeorge Rimar } 546a582419aSGeorge Rimar 547a582419aSGeorge Rimar // According to the specification, at the end of the overlay, the location 548a582419aSGeorge Rimar // counter should be equal to the overlay base address plus size of the 549a582419aSGeorge Rimar // largest section seen in the overlay. 550a582419aSGeorge Rimar // Here we want to create the Dot assignment command to achieve that. 5513837f427SRui Ueyama Expr moveDot = [=] { 5523837f427SRui Ueyama uint64_t max = 0; 5537051aeefSFangrui Song for (SectionCommand *cmd : v) 5543837f427SRui Ueyama max = std::max(max, cast<OutputSection>(cmd)->size); 5553837f427SRui Ueyama return addrExpr().getValue() + max; 556a582419aSGeorge Rimar }; 5573837f427SRui Ueyama v.push_back(make<SymbolAssignment>(".", moveDot, getCurrentLocation())); 5583837f427SRui Ueyama return v; 559a582419aSGeorge Rimar } 560a582419aSGeorge Rimar 561899fdf54SFangrui Song void ScriptParser::readOverwriteSections() { 562899fdf54SFangrui Song expect("{"); 563899fdf54SFangrui Song while (!errorCount() && !consume("}")) 564899fdf54SFangrui Song script->overwriteSections.push_back(readOutputSectionDescription(next())); 565899fdf54SFangrui Song } 566899fdf54SFangrui Song 5672ec34544SRui Ueyama void ScriptParser::readSections() { 5682ec34544SRui Ueyama expect("{"); 569*64038ef8SFangrui Song SmallVector<SectionCommand *, 0> v; 570b8a59c8aSBob Haarman while (!errorCount() && !consume("}")) { 5713837f427SRui Ueyama StringRef tok = next(); 5723837f427SRui Ueyama if (tok == "OVERLAY") { 5737051aeefSFangrui Song for (SectionCommand *cmd : readOverlay()) 
5743837f427SRui Ueyama v.push_back(cmd); 575a582419aSGeorge Rimar continue; 5763837f427SRui Ueyama } else if (tok == "INCLUDE") { 5772e9d40d5SRui Ueyama readInclude(); 5782e9d40d5SRui Ueyama continue; 579a582419aSGeorge Rimar } 580a582419aSGeorge Rimar 5817051aeefSFangrui Song if (SectionCommand *cmd = readAssignment(tok)) 5823837f427SRui Ueyama v.push_back(cmd); 583d30a78b3SGeorge Rimar else 5843837f427SRui Ueyama v.push_back(readOutputSectionDescription(tok)); 5852ec34544SRui Ueyama } 5867c426fb1SFangrui Song script->sectionCommands.insert(script->sectionCommands.end(), v.begin(), 5877c426fb1SFangrui Song v.end()); 5889e2c8a9dSGeorge Rimar 5897c426fb1SFangrui Song if (atEOF() || !consume("INSERT")) { 5907c426fb1SFangrui Song script->hasSectionsCommand = true; 5919e2c8a9dSGeorge Rimar return; 5929e2c8a9dSGeorge Rimar } 5939e2c8a9dSGeorge Rimar 5947c426fb1SFangrui Song bool isAfter = false; 5957c426fb1SFangrui Song if (consume("AFTER")) 5967c426fb1SFangrui Song isAfter = true; 5977c426fb1SFangrui Song else if (!consume("BEFORE")) 5987c426fb1SFangrui Song setError("expected AFTER/BEFORE, but got '" + next() + "'"); 5997c426fb1SFangrui Song StringRef where = next(); 600a1c2ee01SFangrui Song SmallVector<StringRef, 0> names; 6017051aeefSFangrui Song for (SectionCommand *cmd : v) 6027c426fb1SFangrui Song if (auto *os = dyn_cast<OutputSection>(cmd)) 60303051f7aSFangrui Song names.push_back(os->name); 60403051f7aSFangrui Song if (!names.empty()) 60503051f7aSFangrui Song script->insertCommands.push_back({std::move(names), isAfter, where}); 6062ec34544SRui Ueyama } 6072ec34544SRui Ueyama 608e262bb1aSRui Ueyama void ScriptParser::readTarget() { 609e262bb1aSRui Ueyama // TARGET(foo) is an alias for "--format foo". Unlike GNU linkers, 610e262bb1aSRui Ueyama // we accept only a limited set of BFD names (i.e. "elf" or "binary") 611e262bb1aSRui Ueyama // for --format. We recognize only /^elf/ and "binary" in the linker 612e262bb1aSRui Ueyama // script as well. 
613e262bb1aSRui Ueyama expect("("); 6143837f427SRui Ueyama StringRef tok = next(); 615e262bb1aSRui Ueyama expect(")"); 616e262bb1aSRui Ueyama 6173837f427SRui Ueyama if (tok.startswith("elf")) 6183837f427SRui Ueyama config->formatBinary = false; 6193837f427SRui Ueyama else if (tok == "binary") 6203837f427SRui Ueyama config->formatBinary = true; 621e262bb1aSRui Ueyama else 6223837f427SRui Ueyama setError("unknown target: " + tok); 623e262bb1aSRui Ueyama } 624e262bb1aSRui Ueyama 6253837f427SRui Ueyama static int precedence(StringRef op) { 6263837f427SRui Ueyama return StringSwitch<int>(op) 627a5005482SGeorge Rimar .Cases("*", "/", "%", 8) 628a5005482SGeorge Rimar .Cases("+", "-", 7) 629a5005482SGeorge Rimar .Cases("<<", ">>", 6) 630a5005482SGeorge Rimar .Cases("<", "<=", ">", ">=", "==", "!=", 5) 631a5005482SGeorge Rimar .Case("&", 4) 632a5005482SGeorge Rimar .Case("|", 3) 633a5005482SGeorge Rimar .Case("&&", 2) 634a5005482SGeorge Rimar .Case("||", 1) 6352ec34544SRui Ueyama .Default(-1); 6362ec34544SRui Ueyama } 6372ec34544SRui Ueyama 6382ec34544SRui Ueyama StringMatcher ScriptParser::readFilePatterns() { 639c42fe247SThomas Preud'homme StringMatcher Matcher; 640c42fe247SThomas Preud'homme 641b8a59c8aSBob Haarman while (!errorCount() && !consume(")")) 642c42fe247SThomas Preud'homme Matcher.addPattern(SingleStringMatcher(next())); 643c42fe247SThomas Preud'homme return Matcher; 6442ec34544SRui Ueyama } 6452ec34544SRui Ueyama 6462a9aed0eSFangrui Song SortSectionPolicy ScriptParser::peekSortKind() { 6472a9aed0eSFangrui Song return StringSwitch<SortSectionPolicy>(peek()) 6482a9aed0eSFangrui Song .Cases("SORT", "SORT_BY_NAME", SortSectionPolicy::Name) 6492a9aed0eSFangrui Song .Case("SORT_BY_ALIGNMENT", SortSectionPolicy::Alignment) 6502a9aed0eSFangrui Song .Case("SORT_BY_INIT_PRIORITY", SortSectionPolicy::Priority) 6512a9aed0eSFangrui Song .Case("SORT_NONE", SortSectionPolicy::None) 6522a9aed0eSFangrui Song .Default(SortSectionPolicy::Default); 6532a9aed0eSFangrui Song } 
6542a9aed0eSFangrui Song 6552ec34544SRui Ueyama SortSectionPolicy ScriptParser::readSortKind() { 6562a9aed0eSFangrui Song SortSectionPolicy ret = peekSortKind(); 6572a9aed0eSFangrui Song if (ret != SortSectionPolicy::Default) 6582a9aed0eSFangrui Song skip(); 6592a9aed0eSFangrui Song return ret; 6602ec34544SRui Ueyama } 6612ec34544SRui Ueyama 66203fc8d1eSRui Ueyama // Reads SECTIONS command contents in the following form: 66303fc8d1eSRui Ueyama // 66403fc8d1eSRui Ueyama // <contents> ::= <elem>* 66503fc8d1eSRui Ueyama // <elem> ::= <exclude>? <glob-pattern> 66603fc8d1eSRui Ueyama // <exclude> ::= "EXCLUDE_FILE" "(" <glob-pattern>+ ")" 66703fc8d1eSRui Ueyama // 66803fc8d1eSRui Ueyama // For example, 66903fc8d1eSRui Ueyama // 67003fc8d1eSRui Ueyama // *(.foo EXCLUDE_FILE (a.o) .bar EXCLUDE_FILE (b.o) .baz) 67103fc8d1eSRui Ueyama // 67203fc8d1eSRui Ueyama // is parsed as ".foo", ".bar" with "a.o", and ".baz" with "b.o". 67303fc8d1eSRui Ueyama // The semantics of that is section .foo in any file, section .bar in 67403fc8d1eSRui Ueyama // any file but a.o, and section .baz in any file but b.o. 675*64038ef8SFangrui Song SmallVector<SectionPattern, 0> ScriptParser::readInputSectionsList() { 676*64038ef8SFangrui Song SmallVector<SectionPattern, 0> ret; 677b8a59c8aSBob Haarman while (!errorCount() && peek() != ")") { 6783837f427SRui Ueyama StringMatcher excludeFilePat; 6792ec34544SRui Ueyama if (consume("EXCLUDE_FILE")) { 6802ec34544SRui Ueyama expect("("); 6813837f427SRui Ueyama excludeFilePat = readFilePatterns(); 6822ec34544SRui Ueyama } 6832ec34544SRui Ueyama 684c42fe247SThomas Preud'homme StringMatcher SectionMatcher; 6852a9aed0eSFangrui Song // Break if the next token is ), EXCLUDE_FILE, or SORT*. 
6862a9aed0eSFangrui Song while (!errorCount() && peek() != ")" && peek() != "EXCLUDE_FILE" && 6872a9aed0eSFangrui Song peekSortKind() == SortSectionPolicy::Default) 688c42fe247SThomas Preud'homme SectionMatcher.addPattern(unquote(next())); 6892ec34544SRui Ueyama 690c42fe247SThomas Preud'homme if (!SectionMatcher.empty()) 691c42fe247SThomas Preud'homme ret.push_back({std::move(excludeFilePat), std::move(SectionMatcher)}); 6922a9aed0eSFangrui Song else if (excludeFilePat.empty()) 6932a9aed0eSFangrui Song break; 6942ec34544SRui Ueyama else 6952ec34544SRui Ueyama setError("section pattern is expected"); 6962ec34544SRui Ueyama } 6973837f427SRui Ueyama return ret; 6982ec34544SRui Ueyama } 6992ec34544SRui Ueyama 7002ec34544SRui Ueyama // Reads contents of "SECTIONS" directive. That directive contains a 7012ec34544SRui Ueyama // list of glob patterns for input sections. The grammar is as follows. 7022ec34544SRui Ueyama // 7032ec34544SRui Ueyama // <patterns> ::= <section-list> 7042ec34544SRui Ueyama // | <sort> "(" <section-list> ")" 7052ec34544SRui Ueyama // | <sort> "(" <sort> "(" <section-list> ")" ")" 7062ec34544SRui Ueyama // 7072ec34544SRui Ueyama // <sort> ::= "SORT" | "SORT_BY_NAME" | "SORT_BY_ALIGNMENT" 7082ec34544SRui Ueyama // | "SORT_BY_INIT_PRIORITY" | "SORT_NONE" 7092ec34544SRui Ueyama // 7102ec34544SRui Ueyama // <section-list> is parsed by readInputSectionsList(). 
7112ec34544SRui Ueyama InputSectionDescription * 712dbd0ad33SPeter Smith ScriptParser::readInputSectionRules(StringRef filePattern, uint64_t withFlags, 713dbd0ad33SPeter Smith uint64_t withoutFlags) { 714dbd0ad33SPeter Smith auto *cmd = 715dbd0ad33SPeter Smith make<InputSectionDescription>(filePattern, withFlags, withoutFlags); 7162ec34544SRui Ueyama expect("("); 7172ec34544SRui Ueyama 718b8a59c8aSBob Haarman while (!errorCount() && !consume(")")) { 7193837f427SRui Ueyama SortSectionPolicy outer = readSortKind(); 7203837f427SRui Ueyama SortSectionPolicy inner = SortSectionPolicy::Default; 721*64038ef8SFangrui Song SmallVector<SectionPattern, 0> v; 7223837f427SRui Ueyama if (outer != SortSectionPolicy::Default) { 7232ec34544SRui Ueyama expect("("); 7243837f427SRui Ueyama inner = readSortKind(); 7253837f427SRui Ueyama if (inner != SortSectionPolicy::Default) { 7262ec34544SRui Ueyama expect("("); 7273837f427SRui Ueyama v = readInputSectionsList(); 7282ec34544SRui Ueyama expect(")"); 7292ec34544SRui Ueyama } else { 7303837f427SRui Ueyama v = readInputSectionsList(); 7312ec34544SRui Ueyama } 7322ec34544SRui Ueyama expect(")"); 7332ec34544SRui Ueyama } else { 7343837f427SRui Ueyama v = readInputSectionsList(); 7352ec34544SRui Ueyama } 7362ec34544SRui Ueyama 7373837f427SRui Ueyama for (SectionPattern &pat : v) { 7383837f427SRui Ueyama pat.sortInner = inner; 7393837f427SRui Ueyama pat.sortOuter = outer; 7402ec34544SRui Ueyama } 7412ec34544SRui Ueyama 7423837f427SRui Ueyama std::move(v.begin(), v.end(), std::back_inserter(cmd->sectionPatterns)); 7432ec34544SRui Ueyama } 7443837f427SRui Ueyama return cmd; 7452ec34544SRui Ueyama } 7462ec34544SRui Ueyama 7472ec34544SRui Ueyama InputSectionDescription * 7483837f427SRui Ueyama ScriptParser::readInputSectionDescription(StringRef tok) { 7492ec34544SRui Ueyama // Input section wildcard can be surrounded by KEEP. 
7502ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/Input-Section-Keep.html#Input-Section-Keep 751dbd0ad33SPeter Smith uint64_t withFlags = 0; 752dbd0ad33SPeter Smith uint64_t withoutFlags = 0; 7533837f427SRui Ueyama if (tok == "KEEP") { 7542ec34544SRui Ueyama expect("("); 755dbd0ad33SPeter Smith if (consume("INPUT_SECTION_FLAGS")) 756dbd0ad33SPeter Smith std::tie(withFlags, withoutFlags) = readInputSectionFlags(); 757dbd0ad33SPeter Smith InputSectionDescription *cmd = 758dbd0ad33SPeter Smith readInputSectionRules(next(), withFlags, withoutFlags); 7592ec34544SRui Ueyama expect(")"); 7603837f427SRui Ueyama script->keptSections.push_back(cmd); 7613837f427SRui Ueyama return cmd; 7622ec34544SRui Ueyama } 763dbd0ad33SPeter Smith if (tok == "INPUT_SECTION_FLAGS") { 764dbd0ad33SPeter Smith std::tie(withFlags, withoutFlags) = readInputSectionFlags(); 765dbd0ad33SPeter Smith tok = next(); 766dbd0ad33SPeter Smith } 767dbd0ad33SPeter Smith return readInputSectionRules(tok, withFlags, withoutFlags); 7682ec34544SRui Ueyama } 7692ec34544SRui Ueyama 7702ec34544SRui Ueyama void ScriptParser::readSort() { 7712ec34544SRui Ueyama expect("("); 7722ec34544SRui Ueyama expect("CONSTRUCTORS"); 7732ec34544SRui Ueyama expect(")"); 7742ec34544SRui Ueyama } 7752ec34544SRui Ueyama 776d30a78b3SGeorge Rimar Expr ScriptParser::readAssert() { 7772ec34544SRui Ueyama expect("("); 7783837f427SRui Ueyama Expr e = readExpr(); 7792ec34544SRui Ueyama expect(","); 7803837f427SRui Ueyama StringRef msg = unquote(next()); 7812ec34544SRui Ueyama expect(")"); 782b579c439SRui Ueyama 7832ec34544SRui Ueyama return [=] { 7843837f427SRui Ueyama if (!e().getValue()) 7852682bc3cSFangrui Song errorOrWarn(msg); 7863837f427SRui Ueyama return script->getDot(); 7872ec34544SRui Ueyama }; 7882ec34544SRui Ueyama } 7892ec34544SRui Ueyama 790a46d08ebSGeorge Rimar // Tries to read the special directive for an output section definition which 791a46d08ebSGeorge Rimar // can be one of following: "(NOLOAD)", "(COPY)", 
"(INFO)" or "(OVERLAY)". 792a46d08ebSGeorge Rimar // Tok1 and Tok2 are next 2 tokens peeked. See comment for readSectionAddressType below. 7933837f427SRui Ueyama bool ScriptParser::readSectionDirective(OutputSection *cmd, StringRef tok1, StringRef tok2) { 7943837f427SRui Ueyama if (tok1 != "(") 795a46d08ebSGeorge Rimar return false; 7963837f427SRui Ueyama if (tok2 != "NOLOAD" && tok2 != "COPY" && tok2 != "INFO" && tok2 != "OVERLAY") 797a46d08ebSGeorge Rimar return false; 798a46d08ebSGeorge Rimar 799a46d08ebSGeorge Rimar expect("("); 800a46d08ebSGeorge Rimar if (consume("NOLOAD")) { 8013837f427SRui Ueyama cmd->noload = true; 802fdc41aa2SMatt Schulte cmd->type = SHT_NOBITS; 803a46d08ebSGeorge Rimar } else { 804a46d08ebSGeorge Rimar skip(); // This is "COPY", "INFO" or "OVERLAY". 8053837f427SRui Ueyama cmd->nonAlloc = true; 806a46d08ebSGeorge Rimar } 807a46d08ebSGeorge Rimar expect(")"); 808a46d08ebSGeorge Rimar return true; 809a46d08ebSGeorge Rimar } 810a46d08ebSGeorge Rimar 8111c08e9f5SGeorge Rimar // Reads an expression and/or the special directive for an output 8121c08e9f5SGeorge Rimar // section definition. Directive is one of following: "(NOLOAD)", 8131c08e9f5SGeorge Rimar // "(COPY)", "(INFO)" or "(OVERLAY)". 8143271d370SRui Ueyama // 8153271d370SRui Ueyama // An output section name can be followed by an address expression 8161c08e9f5SGeorge Rimar // and/or directive. This grammar is not LL(1) because "(" can be 81797f4d158SGeorge Rimar // interpreted as either the beginning of some expression or beginning 8181c08e9f5SGeorge Rimar // of directive. 
8193271d370SRui Ueyama // 820b579c439SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Address.html 821fbb0463fSGeorge Rimar // https://sourceware.org/binutils/docs/ld/Output-Section-Type.html 8223837f427SRui Ueyama void ScriptParser::readSectionAddressType(OutputSection *cmd) { 8233837f427SRui Ueyama if (readSectionDirective(cmd, peek(), peek2())) 8243271d370SRui Ueyama return; 8253271d370SRui Ueyama 8263837f427SRui Ueyama cmd->addrExpr = readExpr(); 8273837f427SRui Ueyama if (peek() == "(" && !readSectionDirective(cmd, "(", peek2())) 828a46d08ebSGeorge Rimar setError("unknown section directive: " + peek2()); 829fbb0463fSGeorge Rimar } 830fbb0463fSGeorge Rimar 8313837f427SRui Ueyama static Expr checkAlignment(Expr e, std::string &loc) { 832f22ec9ddSGeorge Rimar return [=] { 8333837f427SRui Ueyama uint64_t alignment = std::max((uint64_t)1, e().getValue()); 8343837f427SRui Ueyama if (!isPowerOf2_64(alignment)) { 8353837f427SRui Ueyama error(loc + ": alignment must be power of 2"); 836f22ec9ddSGeorge Rimar return (uint64_t)1; // Return a dummy value. 
837f22ec9ddSGeorge Rimar } 8383837f427SRui Ueyama return alignment; 839f22ec9ddSGeorge Rimar }; 840f22ec9ddSGeorge Rimar } 841f22ec9ddSGeorge Rimar 842a582419aSGeorge Rimar OutputSection *ScriptParser::readOverlaySectionDescription() { 8433837f427SRui Ueyama OutputSection *cmd = 8443837f427SRui Ueyama script->createOutputSection(next(), getCurrentLocation()); 8453837f427SRui Ueyama cmd->inOverlay = true; 846a582419aSGeorge Rimar expect("{"); 847dbd0ad33SPeter Smith while (!errorCount() && !consume("}")) { 848dbd0ad33SPeter Smith uint64_t withFlags = 0; 849dbd0ad33SPeter Smith uint64_t withoutFlags = 0; 850dbd0ad33SPeter Smith if (consume("INPUT_SECTION_FLAGS")) 851dbd0ad33SPeter Smith std::tie(withFlags, withoutFlags) = readInputSectionFlags(); 8526188fd49SFangrui Song cmd->commands.push_back( 853dbd0ad33SPeter Smith readInputSectionRules(next(), withFlags, withoutFlags)); 854dbd0ad33SPeter Smith } 8553837f427SRui Ueyama return cmd; 856a582419aSGeorge Rimar } 857a582419aSGeorge Rimar 8583837f427SRui Ueyama OutputSection *ScriptParser::readOutputSectionDescription(StringRef outSec) { 8593837f427SRui Ueyama OutputSection *cmd = 8603837f427SRui Ueyama script->createOutputSection(outSec, getCurrentLocation()); 8613271d370SRui Ueyama 8623837f427SRui Ueyama size_t symbolsReferenced = script->referencedSymbols.size(); 863c4df670dSGeorge Rimar 8643271d370SRui Ueyama if (peek() != ":") 8653837f427SRui Ueyama readSectionAddressType(cmd); 8662ec34544SRui Ueyama expect(":"); 8672ec34544SRui Ueyama 8683837f427SRui Ueyama std::string location = getCurrentLocation(); 8692ec34544SRui Ueyama if (consume("AT")) 8703837f427SRui Ueyama cmd->lmaExpr = readParenExpr(); 8712ec34544SRui Ueyama if (consume("ALIGN")) 8723837f427SRui Ueyama cmd->alignExpr = checkAlignment(readParenExpr(), location); 8732ec34544SRui Ueyama if (consume("SUBALIGN")) 8743837f427SRui Ueyama cmd->subalignExpr = checkAlignment(readParenExpr(), location); 8752ec34544SRui Ueyama 8762ec34544SRui Ueyama // Parse 
constraints. 8772ec34544SRui Ueyama if (consume("ONLY_IF_RO")) 8783837f427SRui Ueyama cmd->constraint = ConstraintKind::ReadOnly; 8792ec34544SRui Ueyama if (consume("ONLY_IF_RW")) 8803837f427SRui Ueyama cmd->constraint = ConstraintKind::ReadWrite; 8812ec34544SRui Ueyama expect("{"); 8822ec34544SRui Ueyama 883b8a59c8aSBob Haarman while (!errorCount() && !consume("}")) { 8843837f427SRui Ueyama StringRef tok = next(); 8853837f427SRui Ueyama if (tok == ";") { 8862ec34544SRui Ueyama // Empty commands are allowed. Do nothing here. 8873837f427SRui Ueyama } else if (SymbolAssignment *assign = readAssignment(tok)) { 8886188fd49SFangrui Song cmd->commands.push_back(assign); 8893837f427SRui Ueyama } else if (ByteCommand *data = readByteCommand(tok)) { 8906188fd49SFangrui Song cmd->commands.push_back(data); 8913837f427SRui Ueyama } else if (tok == "CONSTRUCTORS") { 8922ec34544SRui Ueyama // CONSTRUCTORS is a keyword to make the linker recognize C++ ctors/dtors 8932ec34544SRui Ueyama // by name. This is for very old file formats such as ECOFF/XCOFF. 8942ec34544SRui Ueyama // For ELF, we should ignore. 8953837f427SRui Ueyama } else if (tok == "FILL") { 8960810f16fSGeorge Rimar // We handle the FILL command as an alias for =fillexp section attribute, 8970810f16fSGeorge Rimar // which is different from what GNU linkers do. 
8980810f16fSGeorge Rimar // https://sourceware.org/binutils/docs/ld/Output-Section-Data.html 899bb7d2b17SGeorgii Rymar if (peek() != "(") 900bb7d2b17SGeorgii Rymar setError("( expected, but got " + peek()); 9013837f427SRui Ueyama cmd->filler = readFill(); 9023837f427SRui Ueyama } else if (tok == "SORT") { 9032ec34544SRui Ueyama readSort(); 9043837f427SRui Ueyama } else if (tok == "INCLUDE") { 9052e9d40d5SRui Ueyama readInclude(); 9062ec34544SRui Ueyama } else if (peek() == "(") { 9076188fd49SFangrui Song cmd->commands.push_back(readInputSectionDescription(tok)); 9082ec34544SRui Ueyama } else { 909f49fe218SGeorge Rimar // We have a file name and no input sections description. It is not a 910f49fe218SGeorge Rimar // commonly used syntax, but still acceptable. In that case, all sections 911f49fe218SGeorge Rimar // from the file will be included. 912dbd0ad33SPeter Smith // FIXME: GNU ld permits INPUT_SECTION_FLAGS to be used here. We do not 913dbd0ad33SPeter Smith // handle this case here as it will already have been matched by the 914dbd0ad33SPeter Smith // case above. 
9153837f427SRui Ueyama auto *isd = make<InputSectionDescription>(tok); 916c42fe247SThomas Preud'homme isd->sectionPatterns.push_back({{}, StringMatcher("*")}); 9176188fd49SFangrui Song cmd->commands.push_back(isd); 9182ec34544SRui Ueyama } 9192ec34544SRui Ueyama } 9202ec34544SRui Ueyama 9212ec34544SRui Ueyama if (consume(">")) 922adcd0268SBenjamin Kramer cmd->memoryRegionName = std::string(next()); 9232ec34544SRui Ueyama 9245d01a8beSGeorge Rimar if (consume("AT")) { 9255d01a8beSGeorge Rimar expect(">"); 926adcd0268SBenjamin Kramer cmd->lmaRegionName = std::string(next()); 9275d01a8beSGeorge Rimar } 9285d01a8beSGeorge Rimar 9293837f427SRui Ueyama if (cmd->lmaExpr && !cmd->lmaRegionName.empty()) 9305d01a8beSGeorge Rimar error("section can't have both LMA and a load region"); 9315d01a8beSGeorge Rimar 9323837f427SRui Ueyama cmd->phdrs = readOutputSectionPhdrs(); 9332ec34544SRui Ueyama 9340810f16fSGeorge Rimar if (peek() == "=" || peek().startswith("=")) { 9353837f427SRui Ueyama inExpr = true; 9360810f16fSGeorge Rimar consume("="); 9373837f427SRui Ueyama cmd->filler = readFill(); 9383837f427SRui Ueyama inExpr = false; 9390810f16fSGeorge Rimar } 9402ec34544SRui Ueyama 9412ec34544SRui Ueyama // Consume optional comma following output section command. 9422ec34544SRui Ueyama consume(","); 9432ec34544SRui Ueyama 9443837f427SRui Ueyama if (script->referencedSymbols.size() > symbolsReferenced) 9453837f427SRui Ueyama cmd->expressionsUseSymbols = true; 9463837f427SRui Ueyama return cmd; 9472ec34544SRui Ueyama } 9482ec34544SRui Ueyama 9490810f16fSGeorge Rimar // Reads a `=<fillexp>` expression and returns its value as a big-endian number. 9502ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/Output-Section-Fill.html 9510810f16fSGeorge Rimar // We do not support using symbols in such expressions. 
9522ec34544SRui Ueyama // 9538acbf1ccSRui Ueyama // When reading a hexstring, ld.bfd handles it as a blob of arbitrary 9548acbf1ccSRui Ueyama // size, while ld.gold always handles it as a 32-bit big-endian number. 9558acbf1ccSRui Ueyama // We are compatible with ld.gold because it's easier to implement. 956bb7d2b17SGeorgii Rymar // Also, we require that expressions with operators must be wrapped into 957bb7d2b17SGeorgii Rymar // round brackets. We did it to resolve the ambiguity when parsing scripts like: 958bb7d2b17SGeorgii Rymar // SECTIONS { .foo : { ... } =120+3 /DISCARD/ : { ... } } 9590810f16fSGeorge Rimar std::array<uint8_t, 4> ScriptParser::readFill() { 960bb7d2b17SGeorgii Rymar uint64_t value = readPrimary()().val; 9613837f427SRui Ueyama if (value > UINT32_MAX) 9620810f16fSGeorge Rimar setError("filler expression result does not fit 32-bit: 0x" + 9633837f427SRui Ueyama Twine::utohexstr(value)); 964b58079d4SRui Ueyama 9653837f427SRui Ueyama std::array<uint8_t, 4> buf; 9663837f427SRui Ueyama write32be(buf.data(), (uint32_t)value); 9673837f427SRui Ueyama return buf; 9682ec34544SRui Ueyama } 9692ec34544SRui Ueyama 9703837f427SRui Ueyama SymbolAssignment *ScriptParser::readProvideHidden(bool provide, bool hidden) { 9712ec34544SRui Ueyama expect("("); 9723837f427SRui Ueyama SymbolAssignment *cmd = readSymbolAssignment(next()); 9733837f427SRui Ueyama cmd->provide = provide; 9743837f427SRui Ueyama cmd->hidden = hidden; 9752ec34544SRui Ueyama expect(")"); 9763837f427SRui Ueyama return cmd; 9772ec34544SRui Ueyama } 9782ec34544SRui Ueyama 9793837f427SRui Ueyama SymbolAssignment *ScriptParser::readAssignment(StringRef tok) { 980d30a78b3SGeorge Rimar // Assert expression returns Dot, so this is equal to ".=." 
9813837f427SRui Ueyama if (tok == "ASSERT") 982d30a78b3SGeorge Rimar return make<SymbolAssignment>(".", readAssert(), getCurrentLocation()); 983d30a78b3SGeorge Rimar 9843837f427SRui Ueyama size_t oldPos = pos; 9853837f427SRui Ueyama SymbolAssignment *cmd = nullptr; 986e88b76a9SGeorge Rimar if (peek() == "=" || peek() == "+=") 9873837f427SRui Ueyama cmd = readSymbolAssignment(tok); 9883837f427SRui Ueyama else if (tok == "PROVIDE") 9893837f427SRui Ueyama cmd = readProvideHidden(true, false); 9903837f427SRui Ueyama else if (tok == "HIDDEN") 9913837f427SRui Ueyama cmd = readProvideHidden(false, true); 9923837f427SRui Ueyama else if (tok == "PROVIDE_HIDDEN") 9933837f427SRui Ueyama cmd = readProvideHidden(true, true); 994e88b76a9SGeorge Rimar 9953837f427SRui Ueyama if (cmd) { 9963837f427SRui Ueyama cmd->commandString = 9973837f427SRui Ueyama tok.str() + " " + 9983837f427SRui Ueyama llvm::join(tokens.begin() + oldPos, tokens.begin() + pos, " "); 999e88b76a9SGeorge Rimar expect(";"); 10002ec34544SRui Ueyama } 10013837f427SRui Ueyama return cmd; 10022ec34544SRui Ueyama } 10032ec34544SRui Ueyama 10043837f427SRui Ueyama SymbolAssignment *ScriptParser::readSymbolAssignment(StringRef name) { 1005e7a7ad13SFangrui Song name = unquote(name); 10063837f427SRui Ueyama StringRef op = next(); 10073837f427SRui Ueyama assert(op == "=" || op == "+="); 10083837f427SRui Ueyama Expr e = readExpr(); 10093837f427SRui Ueyama if (op == "+=") { 10103837f427SRui Ueyama std::string loc = getCurrentLocation(); 10113837f427SRui Ueyama e = [=] { return add(script->getSymbolValue(name, loc), e()); }; 10122ec34544SRui Ueyama } 10133837f427SRui Ueyama return make<SymbolAssignment>(name, e, getCurrentLocation()); 10142ec34544SRui Ueyama } 10152ec34544SRui Ueyama 10162ec34544SRui Ueyama // This is an operator-precedence parser to parse a linker 10172ec34544SRui Ueyama // script expression. 10182ec34544SRui Ueyama Expr ScriptParser::readExpr() { 10192ec34544SRui Ueyama // Our lexer is context-aware. 
Set the in-expression bit so that 10202ec34544SRui Ueyama // they apply different tokenization rules. 10213837f427SRui Ueyama bool orig = inExpr; 10223837f427SRui Ueyama inExpr = true; 10233837f427SRui Ueyama Expr e = readExpr1(readPrimary(), 0); 10243837f427SRui Ueyama inExpr = orig; 10253837f427SRui Ueyama return e; 10262ec34544SRui Ueyama } 10272ec34544SRui Ueyama 10283837f427SRui Ueyama Expr ScriptParser::combine(StringRef op, Expr l, Expr r) { 10293837f427SRui Ueyama if (op == "+") 10303837f427SRui Ueyama return [=] { return add(l(), r()); }; 10313837f427SRui Ueyama if (op == "-") 10323837f427SRui Ueyama return [=] { return sub(l(), r()); }; 10333837f427SRui Ueyama if (op == "*") 10343837f427SRui Ueyama return [=] { return l().getValue() * r().getValue(); }; 10353837f427SRui Ueyama if (op == "/") { 10363837f427SRui Ueyama std::string loc = getCurrentLocation(); 10377b91e213SGeorge Rimar return [=]() -> uint64_t { 10383837f427SRui Ueyama if (uint64_t rv = r().getValue()) 10393837f427SRui Ueyama return l().getValue() / rv; 10403837f427SRui Ueyama error(loc + ": division by zero"); 1041067617f9SRui Ueyama return 0; 10427b91e213SGeorge Rimar }; 10437b91e213SGeorge Rimar } 10443837f427SRui Ueyama if (op == "%") { 10453837f427SRui Ueyama std::string loc = getCurrentLocation(); 10467b91e213SGeorge Rimar return [=]() -> uint64_t { 10473837f427SRui Ueyama if (uint64_t rv = r().getValue()) 10483837f427SRui Ueyama return l().getValue() % rv; 10493837f427SRui Ueyama error(loc + ": modulo by zero"); 1050067617f9SRui Ueyama return 0; 10517b91e213SGeorge Rimar }; 10527b91e213SGeorge Rimar } 10533837f427SRui Ueyama if (op == "<<") 10543837f427SRui Ueyama return [=] { return l().getValue() << r().getValue(); }; 10553837f427SRui Ueyama if (op == ">>") 10563837f427SRui Ueyama return [=] { return l().getValue() >> r().getValue(); }; 10573837f427SRui Ueyama if (op == "<") 10583837f427SRui Ueyama return [=] { return l().getValue() < r().getValue(); }; 10593837f427SRui Ueyama if (op 
== ">") 10603837f427SRui Ueyama return [=] { return l().getValue() > r().getValue(); }; 10613837f427SRui Ueyama if (op == ">=") 10623837f427SRui Ueyama return [=] { return l().getValue() >= r().getValue(); }; 10633837f427SRui Ueyama if (op == "<=") 10643837f427SRui Ueyama return [=] { return l().getValue() <= r().getValue(); }; 10653837f427SRui Ueyama if (op == "==") 10663837f427SRui Ueyama return [=] { return l().getValue() == r().getValue(); }; 10673837f427SRui Ueyama if (op == "!=") 10683837f427SRui Ueyama return [=] { return l().getValue() != r().getValue(); }; 10693837f427SRui Ueyama if (op == "||") 10703837f427SRui Ueyama return [=] { return l().getValue() || r().getValue(); }; 10713837f427SRui Ueyama if (op == "&&") 10723837f427SRui Ueyama return [=] { return l().getValue() && r().getValue(); }; 10733837f427SRui Ueyama if (op == "&") 10743837f427SRui Ueyama return [=] { return bitAnd(l(), r()); }; 10753837f427SRui Ueyama if (op == "|") 10763837f427SRui Ueyama return [=] { return bitOr(l(), r()); }; 10772ec34544SRui Ueyama llvm_unreachable("invalid operator"); 10782ec34544SRui Ueyama } 10792ec34544SRui Ueyama 10802ec34544SRui Ueyama // This is a part of the operator-precedence parser. This function 10812ec34544SRui Ueyama // assumes that the remaining token stream starts with an operator. 10823837f427SRui Ueyama Expr ScriptParser::readExpr1(Expr lhs, int minPrec) { 1083b8a59c8aSBob Haarman while (!atEOF() && !errorCount()) { 10842ec34544SRui Ueyama // Read an operator and an expression. 
10852ec34544SRui Ueyama if (consume("?")) 10863837f427SRui Ueyama return readTernary(lhs); 10873837f427SRui Ueyama StringRef op1 = peek(); 10883837f427SRui Ueyama if (precedence(op1) < minPrec) 10892ec34544SRui Ueyama break; 10902ec34544SRui Ueyama skip(); 10913837f427SRui Ueyama Expr rhs = readPrimary(); 10922ec34544SRui Ueyama 10932ec34544SRui Ueyama // Evaluate the remaining part of the expression first if the 10942ec34544SRui Ueyama // next operator has greater precedence than the previous one. 10952ec34544SRui Ueyama // For example, if we have read "+" and "3", and if the next 10962ec34544SRui Ueyama // operator is "*", then we'll evaluate 3 * ... part first. 10972ec34544SRui Ueyama while (!atEOF()) { 10983837f427SRui Ueyama StringRef op2 = peek(); 10993837f427SRui Ueyama if (precedence(op2) <= precedence(op1)) 11002ec34544SRui Ueyama break; 11013837f427SRui Ueyama rhs = readExpr1(rhs, precedence(op2)); 11022ec34544SRui Ueyama } 11032ec34544SRui Ueyama 11043837f427SRui Ueyama lhs = combine(op1, lhs, rhs); 11052ec34544SRui Ueyama } 11063837f427SRui Ueyama return lhs; 11072ec34544SRui Ueyama } 11082ec34544SRui Ueyama 11095fb17128SGeorge Rimar Expr ScriptParser::getPageSize() { 11103837f427SRui Ueyama std::string location = getCurrentLocation(); 11115fb17128SGeorge Rimar return [=]() -> uint64_t { 11123837f427SRui Ueyama if (target) 11133837f427SRui Ueyama return config->commonPageSize; 11143837f427SRui Ueyama error(location + ": unable to calculate page size"); 11155fb17128SGeorge Rimar return 4096; // Return a dummy value. 
11165fb17128SGeorge Rimar }; 11175fb17128SGeorge Rimar } 11185fb17128SGeorge Rimar 11195fb17128SGeorge Rimar Expr ScriptParser::readConstant() { 11203837f427SRui Ueyama StringRef s = readParenLiteral(); 11213837f427SRui Ueyama if (s == "COMMONPAGESIZE") 11225fb17128SGeorge Rimar return getPageSize(); 11233837f427SRui Ueyama if (s == "MAXPAGESIZE") 11243837f427SRui Ueyama return [] { return config->maxPageSize; }; 11253837f427SRui Ueyama setError("unknown constant: " + s); 1126b068b037SGeorge Rimar return [] { return 0; }; 11272ec34544SRui Ueyama } 11282ec34544SRui Ueyama 11295c65088fSRui Ueyama // Parses Tok as an integer. It recognizes hexadecimal (prefixed with 11305c65088fSRui Ueyama // "0x" or suffixed with "H") and decimal numbers. Decimal numbers may 11315c65088fSRui Ueyama // have "K" (Ki) or "M" (Mi) suffixes. 11323837f427SRui Ueyama static Optional<uint64_t> parseInt(StringRef tok) { 11332ec34544SRui Ueyama // Hexadecimal 11343837f427SRui Ueyama uint64_t val; 11353c6f8ca7SMartin Storsjö if (tok.startswith_insensitive("0x")) { 11363837f427SRui Ueyama if (!to_integer(tok.substr(2), val, 16)) 11374092016bSRui Ueyama return None; 11383837f427SRui Ueyama return val; 11394092016bSRui Ueyama } 11403c6f8ca7SMartin Storsjö if (tok.endswith_insensitive("H")) { 11413837f427SRui Ueyama if (!to_integer(tok.drop_back(), val, 16)) 11424092016bSRui Ueyama return None; 11433837f427SRui Ueyama return val; 11444092016bSRui Ueyama } 11452ec34544SRui Ueyama 11462ec34544SRui Ueyama // Decimal 11473c6f8ca7SMartin Storsjö if (tok.endswith_insensitive("K")) { 11483837f427SRui Ueyama if (!to_integer(tok.drop_back(), val, 10)) 11495c65088fSRui Ueyama return None; 11503837f427SRui Ueyama return val * 1024; 11512ec34544SRui Ueyama } 11523c6f8ca7SMartin Storsjö if (tok.endswith_insensitive("M")) { 11533837f427SRui Ueyama if (!to_integer(tok.drop_back(), val, 10)) 11545c65088fSRui Ueyama return None; 11553837f427SRui Ueyama return val * 1024 * 1024; 11565c65088fSRui Ueyama } 
11573837f427SRui Ueyama if (!to_integer(tok, val, 10)) 11585c65088fSRui Ueyama return None; 11593837f427SRui Ueyama return val; 11602ec34544SRui Ueyama } 11612ec34544SRui Ueyama 11623837f427SRui Ueyama ByteCommand *ScriptParser::readByteCommand(StringRef tok) { 11633837f427SRui Ueyama int size = StringSwitch<int>(tok) 11642ec34544SRui Ueyama .Case("BYTE", 1) 11652ec34544SRui Ueyama .Case("SHORT", 2) 11662ec34544SRui Ueyama .Case("LONG", 4) 11672ec34544SRui Ueyama .Case("QUAD", 8) 11682ec34544SRui Ueyama .Default(-1); 11693837f427SRui Ueyama if (size == -1) 11702ec34544SRui Ueyama return nullptr; 117184bcabcbSGeorge Rimar 11723837f427SRui Ueyama size_t oldPos = pos; 11733837f427SRui Ueyama Expr e = readParenExpr(); 11743837f427SRui Ueyama std::string commandString = 11753837f427SRui Ueyama tok.str() + " " + 11763837f427SRui Ueyama llvm::join(tokens.begin() + oldPos, tokens.begin() + pos, " "); 11773837f427SRui Ueyama return make<ByteCommand>(e, size, commandString); 11782ec34544SRui Ueyama } 11792ec34544SRui Ueyama 1180dbd0ad33SPeter Smith static llvm::Optional<uint64_t> parseFlag(StringRef tok) { 1181dbd0ad33SPeter Smith if (llvm::Optional<uint64_t> asInt = parseInt(tok)) 1182dbd0ad33SPeter Smith return asInt; 1183dbd0ad33SPeter Smith #define CASE_ENT(enum) #enum, ELF::enum 1184dbd0ad33SPeter Smith return StringSwitch<llvm::Optional<uint64_t>>(tok) 1185dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_WRITE)) 1186dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_ALLOC)) 1187dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_EXECINSTR)) 1188dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_MERGE)) 1189dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_STRINGS)) 1190dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_INFO_LINK)) 1191dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_LINK_ORDER)) 1192dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_OS_NONCONFORMING)) 1193dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_GROUP)) 1194dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_TLS)) 1195dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_COMPRESSED)) 1196dbd0ad33SPeter Smith 
.Case(CASE_ENT(SHF_EXCLUDE)) 1197dbd0ad33SPeter Smith .Case(CASE_ENT(SHF_ARM_PURECODE)) 1198dbd0ad33SPeter Smith .Default(None); 1199dbd0ad33SPeter Smith #undef CASE_ENT 1200dbd0ad33SPeter Smith } 1201dbd0ad33SPeter Smith 1202dbd0ad33SPeter Smith // Reads the '(' <flags> ')' list of section flags in 1203dbd0ad33SPeter Smith // INPUT_SECTION_FLAGS '(' <flags> ')' in the 1204dbd0ad33SPeter Smith // following form: 1205dbd0ad33SPeter Smith // <flags> ::= <flag> 1206dbd0ad33SPeter Smith // | <flags> & flag 1207dbd0ad33SPeter Smith // <flag> ::= Recognized Flag Name, or Integer value of flag. 1208dbd0ad33SPeter Smith // If the first character of <flag> is a ! then this means without flag, 1209dbd0ad33SPeter Smith // otherwise with flag. 1210dbd0ad33SPeter Smith // Example: SHF_EXECINSTR & !SHF_WRITE means with flag SHF_EXECINSTR and 1211dbd0ad33SPeter Smith // without flag SHF_WRITE. 1212dbd0ad33SPeter Smith std::pair<uint64_t, uint64_t> ScriptParser::readInputSectionFlags() { 1213dbd0ad33SPeter Smith uint64_t withFlags = 0; 1214dbd0ad33SPeter Smith uint64_t withoutFlags = 0; 1215dbd0ad33SPeter Smith expect("("); 1216dbd0ad33SPeter Smith while (!errorCount()) { 1217dbd0ad33SPeter Smith StringRef tok = unquote(next()); 1218dbd0ad33SPeter Smith bool without = tok.consume_front("!"); 1219dbd0ad33SPeter Smith if (llvm::Optional<uint64_t> flag = parseFlag(tok)) { 1220dbd0ad33SPeter Smith if (without) 1221dbd0ad33SPeter Smith withoutFlags |= *flag; 1222dbd0ad33SPeter Smith else 1223dbd0ad33SPeter Smith withFlags |= *flag; 1224dbd0ad33SPeter Smith } else { 1225dbd0ad33SPeter Smith setError("unrecognised flag: " + tok); 1226dbd0ad33SPeter Smith } 1227dbd0ad33SPeter Smith if (consume(")")) 1228dbd0ad33SPeter Smith break; 1229dbd0ad33SPeter Smith if (!consume("&")) { 1230dbd0ad33SPeter Smith next(); 1231dbd0ad33SPeter Smith setError("expected & or )"); 1232dbd0ad33SPeter Smith } 1233dbd0ad33SPeter Smith } 1234dbd0ad33SPeter Smith return std::make_pair(withFlags, withoutFlags); 
1235dbd0ad33SPeter Smith } 1236dbd0ad33SPeter Smith 12372ec34544SRui Ueyama StringRef ScriptParser::readParenLiteral() { 12382ec34544SRui Ueyama expect("("); 12393837f427SRui Ueyama bool orig = inExpr; 12403837f427SRui Ueyama inExpr = false; 12413837f427SRui Ueyama StringRef tok = next(); 12423837f427SRui Ueyama inExpr = orig; 12432ec34544SRui Ueyama expect(")"); 12443837f427SRui Ueyama return tok; 12452ec34544SRui Ueyama } 12462ec34544SRui Ueyama 12473837f427SRui Ueyama static void checkIfExists(OutputSection *cmd, StringRef location) { 12483837f427SRui Ueyama if (cmd->location.empty() && script->errorOnMissingSection) 12493837f427SRui Ueyama error(location + ": undefined section " + cmd->name); 125005c4f67cSRafael Espindola } 125105c4f67cSRafael Espindola 1252e4f385d8SFangrui Song static bool isValidSymbolName(StringRef s) { 1253e4f385d8SFangrui Song auto valid = [](char c) { 1254e4f385d8SFangrui Song return isAlnum(c) || c == '$' || c == '.' || c == '_'; 1255e4f385d8SFangrui Song }; 1256e4f385d8SFangrui Song return !s.empty() && !isDigit(s[0]) && llvm::all_of(s, valid); 1257e4f385d8SFangrui Song } 1258e4f385d8SFangrui Song 12592ec34544SRui Ueyama Expr ScriptParser::readPrimary() { 12602ec34544SRui Ueyama if (peek() == "(") 12612ec34544SRui Ueyama return readParenExpr(); 12622ec34544SRui Ueyama 12635c65088fSRui Ueyama if (consume("~")) { 12643837f427SRui Ueyama Expr e = readPrimary(); 12653837f427SRui Ueyama return [=] { return ~e().getValue(); }; 12662ec34544SRui Ueyama } 12676f1d954eSHafiz Abid Qadeer if (consume("!")) { 12683837f427SRui Ueyama Expr e = readPrimary(); 12693837f427SRui Ueyama return [=] { return !e().getValue(); }; 12706f1d954eSHafiz Abid Qadeer } 12715c65088fSRui Ueyama if (consume("-")) { 12723837f427SRui Ueyama Expr e = readPrimary(); 12733837f427SRui Ueyama return [=] { return -e().getValue(); }; 12742ec34544SRui Ueyama } 12752ec34544SRui Ueyama 12763837f427SRui Ueyama StringRef tok = next(); 12773837f427SRui Ueyama std::string location = 
getCurrentLocation(); 12785c65088fSRui Ueyama 12792ec34544SRui Ueyama // Built-in functions are parsed here. 12802ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/Builtin-Functions.html. 12813837f427SRui Ueyama if (tok == "ABSOLUTE") { 12823837f427SRui Ueyama Expr inner = readParenExpr(); 12832ec34544SRui Ueyama return [=] { 12843837f427SRui Ueyama ExprValue i = inner(); 12853837f427SRui Ueyama i.forceAbsolute = true; 12863837f427SRui Ueyama return i; 12872ec34544SRui Ueyama }; 12882ec34544SRui Ueyama } 12893837f427SRui Ueyama if (tok == "ADDR") { 12903837f427SRui Ueyama StringRef name = readParenLiteral(); 12913837f427SRui Ueyama OutputSection *sec = script->getOrCreateOutputSection(name); 12923837f427SRui Ueyama sec->usedInExpression = true; 129341c7ab4aSGeorge Rimar return [=]() -> ExprValue { 12943837f427SRui Ueyama checkIfExists(sec, location); 12953837f427SRui Ueyama return {sec, false, 0, location}; 129641c7ab4aSGeorge Rimar }; 12972ec34544SRui Ueyama } 12983837f427SRui Ueyama if (tok == "ALIGN") { 12992ec34544SRui Ueyama expect("("); 13003837f427SRui Ueyama Expr e = readExpr(); 1301f22ec9ddSGeorge Rimar if (consume(")")) { 13023837f427SRui Ueyama e = checkAlignment(e, location); 13033837f427SRui Ueyama return [=] { return alignTo(script->getDot(), e().getValue()); }; 1304f22ec9ddSGeorge Rimar } 1305b579c439SRui Ueyama expect(","); 13063837f427SRui Ueyama Expr e2 = checkAlignment(readExpr(), location); 13072ec34544SRui Ueyama expect(")"); 13083c6de1a6SPetr Hosek return [=] { 13093837f427SRui Ueyama ExprValue v = e(); 13103837f427SRui Ueyama v.alignment = e2().getValue(); 13113837f427SRui Ueyama return v; 13123c6de1a6SPetr Hosek }; 13132ec34544SRui Ueyama } 13143837f427SRui Ueyama if (tok == "ALIGNOF") { 13153837f427SRui Ueyama StringRef name = readParenLiteral(); 13163837f427SRui Ueyama OutputSection *cmd = script->getOrCreateOutputSection(name); 1317617e2f98SRui Ueyama return [=] { 13183837f427SRui Ueyama checkIfExists(cmd, location); 
13193837f427SRui Ueyama return cmd->alignment; 1320617e2f98SRui Ueyama }; 13212ec34544SRui Ueyama } 13223837f427SRui Ueyama if (tok == "ASSERT") 1323d30a78b3SGeorge Rimar return readAssert(); 13243837f427SRui Ueyama if (tok == "CONSTANT") 13255fb17128SGeorge Rimar return readConstant(); 13263837f427SRui Ueyama if (tok == "DATA_SEGMENT_ALIGN") { 13272ec34544SRui Ueyama expect("("); 13283837f427SRui Ueyama Expr e = readExpr(); 13292ec34544SRui Ueyama expect(","); 13302ec34544SRui Ueyama readExpr(); 13312ec34544SRui Ueyama expect(")"); 133260833f6eSGeorge Rimar return [=] { 13333837f427SRui Ueyama return alignTo(script->getDot(), std::max((uint64_t)1, e().getValue())); 133460833f6eSGeorge Rimar }; 13352ec34544SRui Ueyama } 13363837f427SRui Ueyama if (tok == "DATA_SEGMENT_END") { 13372ec34544SRui Ueyama expect("("); 13382ec34544SRui Ueyama expect("."); 13392ec34544SRui Ueyama expect(")"); 13403837f427SRui Ueyama return [] { return script->getDot(); }; 13412ec34544SRui Ueyama } 13423837f427SRui Ueyama if (tok == "DATA_SEGMENT_RELRO_END") { 13432ec34544SRui Ueyama // GNU linkers implements more complicated logic to handle 13442ec34544SRui Ueyama // DATA_SEGMENT_RELRO_END. We instead ignore the arguments and 13452ec34544SRui Ueyama // just align to the next page boundary for simplicity. 13462ec34544SRui Ueyama expect("("); 13472ec34544SRui Ueyama readExpr(); 13482ec34544SRui Ueyama expect(","); 13492ec34544SRui Ueyama readExpr(); 13502ec34544SRui Ueyama expect(")"); 13513837f427SRui Ueyama Expr e = getPageSize(); 13523837f427SRui Ueyama return [=] { return alignTo(script->getDot(), e().getValue()); }; 13532ec34544SRui Ueyama } 13543837f427SRui Ueyama if (tok == "DEFINED") { 1355e7a7ad13SFangrui Song StringRef name = unquote(readParenLiteral()); 13561f166edeSHafiz Abid Qadeer return [=] { 13571f166edeSHafiz Abid Qadeer Symbol *b = symtab->find(name); 13581f166edeSHafiz Abid Qadeer return (b && b->isDefined()) ? 
1 : 0; 13591f166edeSHafiz Abid Qadeer }; 13602ec34544SRui Ueyama } 13613837f427SRui Ueyama if (tok == "LENGTH") { 13623837f427SRui Ueyama StringRef name = readParenLiteral(); 13633837f427SRui Ueyama if (script->memoryRegions.count(name) == 0) { 13643837f427SRui Ueyama setError("memory region not defined: " + name); 1365b068b037SGeorge Rimar return [] { return 0; }; 1366b068b037SGeorge Rimar } 136792b5b980SFangrui Song return script->memoryRegions[name]->length; 136891b95b61SRui Ueyama } 13693837f427SRui Ueyama if (tok == "LOADADDR") { 13703837f427SRui Ueyama StringRef name = readParenLiteral(); 13713837f427SRui Ueyama OutputSection *cmd = script->getOrCreateOutputSection(name); 13723837f427SRui Ueyama cmd->usedInExpression = true; 1373617e2f98SRui Ueyama return [=] { 13743837f427SRui Ueyama checkIfExists(cmd, location); 13753837f427SRui Ueyama return cmd->getLMA(); 1376617e2f98SRui Ueyama }; 13772ec34544SRui Ueyama } 1378fa1145a8SIsaac Richter if (tok == "LOG2CEIL") { 1379fa1145a8SIsaac Richter expect("("); 1380fa1145a8SIsaac Richter Expr a = readExpr(); 1381fa1145a8SIsaac Richter expect(")"); 1382fa1145a8SIsaac Richter return [=] { 1383fa1145a8SIsaac Richter // LOG2CEIL(0) is defined to be 0. 
1384fa1145a8SIsaac Richter return llvm::Log2_64_Ceil(std::max(a().getValue(), UINT64_C(1))); 1385fa1145a8SIsaac Richter }; 1386fa1145a8SIsaac Richter } 13873837f427SRui Ueyama if (tok == "MAX" || tok == "MIN") { 1388fd11560fSGeorge Rimar expect("("); 13893837f427SRui Ueyama Expr a = readExpr(); 1390fd11560fSGeorge Rimar expect(","); 13913837f427SRui Ueyama Expr b = readExpr(); 1392fd11560fSGeorge Rimar expect(")"); 13933837f427SRui Ueyama if (tok == "MIN") 13943837f427SRui Ueyama return [=] { return std::min(a().getValue(), b().getValue()); }; 13953837f427SRui Ueyama return [=] { return std::max(a().getValue(), b().getValue()); }; 1396fd11560fSGeorge Rimar } 13973837f427SRui Ueyama if (tok == "ORIGIN") { 13983837f427SRui Ueyama StringRef name = readParenLiteral(); 13993837f427SRui Ueyama if (script->memoryRegions.count(name) == 0) { 14003837f427SRui Ueyama setError("memory region not defined: " + name); 1401b068b037SGeorge Rimar return [] { return 0; }; 1402b068b037SGeorge Rimar } 140392b5b980SFangrui Song return script->memoryRegions[name]->origin; 140491b95b61SRui Ueyama } 14053837f427SRui Ueyama if (tok == "SEGMENT_START") { 14062ec34544SRui Ueyama expect("("); 14072ec34544SRui Ueyama skip(); 14082ec34544SRui Ueyama expect(","); 14093837f427SRui Ueyama Expr e = readExpr(); 14102ec34544SRui Ueyama expect(")"); 14113837f427SRui Ueyama return [=] { return e(); }; 14122ec34544SRui Ueyama } 14133837f427SRui Ueyama if (tok == "SIZEOF") { 14143837f427SRui Ueyama StringRef name = readParenLiteral(); 14153837f427SRui Ueyama OutputSection *cmd = script->getOrCreateOutputSection(name); 141605c4f67cSRafael Espindola // Linker script does not create an output section if its content is empty. 141705c4f67cSRafael Espindola // We want to allow SIZEOF(.foo) where .foo is a section which happened to 141805c4f67cSRafael Espindola // be empty. 
14193837f427SRui Ueyama return [=] { return cmd->size; }; 14202ec34544SRui Ueyama } 14213837f427SRui Ueyama if (tok == "SIZEOF_HEADERS") 142207837b8fSFangrui Song return [=] { return elf::getHeaderSize(); }; 14232ec34544SRui Ueyama 14244eb2eccbSRui Ueyama // Tok is the dot. 14253837f427SRui Ueyama if (tok == ".") 14263837f427SRui Ueyama return [=] { return script->getSymbolValue(tok, location); }; 14274eb2eccbSRui Ueyama 14282ec34544SRui Ueyama // Tok is a literal number. 14293837f427SRui Ueyama if (Optional<uint64_t> val = parseInt(tok)) 14303837f427SRui Ueyama return [=] { return *val; }; 14312ec34544SRui Ueyama 14322ec34544SRui Ueyama // Tok is a symbol name. 14332bf06d93SFangrui Song if (tok.startswith("\"")) 1434e7a7ad13SFangrui Song tok = unquote(tok); 14352bf06d93SFangrui Song else if (!isValidSymbolName(tok)) 14363837f427SRui Ueyama setError("malformed number: " + tok); 14373837f427SRui Ueyama script->referencedSymbols.push_back(tok); 14383837f427SRui Ueyama return [=] { return script->getSymbolValue(tok, location); }; 14392ec34544SRui Ueyama } 14402ec34544SRui Ueyama 14413837f427SRui Ueyama Expr ScriptParser::readTernary(Expr cond) { 14423837f427SRui Ueyama Expr l = readExpr(); 14432ec34544SRui Ueyama expect(":"); 14443837f427SRui Ueyama Expr r = readExpr(); 14453837f427SRui Ueyama return [=] { return cond().getValue() ? 
l() : r(); }; 14462ec34544SRui Ueyama } 14472ec34544SRui Ueyama 14482ec34544SRui Ueyama Expr ScriptParser::readParenExpr() { 14492ec34544SRui Ueyama expect("("); 14503837f427SRui Ueyama Expr e = readExpr(); 14512ec34544SRui Ueyama expect(")"); 14523837f427SRui Ueyama return e; 14532ec34544SRui Ueyama } 14542ec34544SRui Ueyama 1455a1c2ee01SFangrui Song SmallVector<StringRef, 0> ScriptParser::readOutputSectionPhdrs() { 1456a1c2ee01SFangrui Song SmallVector<StringRef, 0> phdrs; 1457b8a59c8aSBob Haarman while (!errorCount() && peek().startswith(":")) { 14583837f427SRui Ueyama StringRef tok = next(); 14593837f427SRui Ueyama phdrs.push_back((tok.size() == 1) ? next() : tok.substr(1)); 14602ec34544SRui Ueyama } 14613837f427SRui Ueyama return phdrs; 14622ec34544SRui Ueyama } 14632ec34544SRui Ueyama 14642ec34544SRui Ueyama // Read a program header type name. The next token must be a 14652ec34544SRui Ueyama // name of a program header type or a constant (e.g. "0x3"). 14662ec34544SRui Ueyama unsigned ScriptParser::readPhdrType() { 14673837f427SRui Ueyama StringRef tok = next(); 14683837f427SRui Ueyama if (Optional<uint64_t> val = parseInt(tok)) 14693837f427SRui Ueyama return *val; 14702ec34544SRui Ueyama 14713837f427SRui Ueyama unsigned ret = StringSwitch<unsigned>(tok) 14722ec34544SRui Ueyama .Case("PT_NULL", PT_NULL) 14732ec34544SRui Ueyama .Case("PT_LOAD", PT_LOAD) 14742ec34544SRui Ueyama .Case("PT_DYNAMIC", PT_DYNAMIC) 14752ec34544SRui Ueyama .Case("PT_INTERP", PT_INTERP) 14762ec34544SRui Ueyama .Case("PT_NOTE", PT_NOTE) 14772ec34544SRui Ueyama .Case("PT_SHLIB", PT_SHLIB) 14782ec34544SRui Ueyama .Case("PT_PHDR", PT_PHDR) 14792ec34544SRui Ueyama .Case("PT_TLS", PT_TLS) 14802ec34544SRui Ueyama .Case("PT_GNU_EH_FRAME", PT_GNU_EH_FRAME) 14812ec34544SRui Ueyama .Case("PT_GNU_STACK", PT_GNU_STACK) 14822ec34544SRui Ueyama .Case("PT_GNU_RELRO", PT_GNU_RELRO) 14832ec34544SRui Ueyama .Case("PT_OPENBSD_RANDOMIZE", PT_OPENBSD_RANDOMIZE) 14842ec34544SRui Ueyama 
.Case("PT_OPENBSD_WXNEEDED", PT_OPENBSD_WXNEEDED) 14852ec34544SRui Ueyama .Case("PT_OPENBSD_BOOTDATA", PT_OPENBSD_BOOTDATA) 14862ec34544SRui Ueyama .Default(-1); 14872ec34544SRui Ueyama 14883837f427SRui Ueyama if (ret == (unsigned)-1) { 14893837f427SRui Ueyama setError("invalid program header type: " + tok); 14902ec34544SRui Ueyama return PT_NULL; 14912ec34544SRui Ueyama } 14923837f427SRui Ueyama return ret; 14932ec34544SRui Ueyama } 14942ec34544SRui Ueyama 14952ec34544SRui Ueyama // Reads an anonymous version declaration. 14962ec34544SRui Ueyama void ScriptParser::readAnonymousDeclaration() { 1497*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> locals; 1498*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> globals; 14993837f427SRui Ueyama std::tie(locals, globals) = readSymbols(); 1500e28a70daSFangrui Song for (const SymbolVersion &pat : locals) 150100809c88SFangrui Song config->versionDefinitions[VER_NDX_LOCAL].localPatterns.push_back(pat); 1502e28a70daSFangrui Song for (const SymbolVersion &pat : globals) 150300809c88SFangrui Song config->versionDefinitions[VER_NDX_GLOBAL].nonLocalPatterns.push_back(pat); 15042ec34544SRui Ueyama 15052ec34544SRui Ueyama expect(";"); 15062ec34544SRui Ueyama } 15072ec34544SRui Ueyama 15082ec34544SRui Ueyama // Reads a non-anonymous version definition, 15092ec34544SRui Ueyama // e.g. "VerStr { global: foo; bar; local: *; };". 15103837f427SRui Ueyama void ScriptParser::readVersionDeclaration(StringRef verStr) { 15112ec34544SRui Ueyama // Read a symbol list. 1512*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> locals; 1513*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> globals; 15143837f427SRui Ueyama std::tie(locals, globals) = readSymbols(); 15152ec34544SRui Ueyama 15162ec34544SRui Ueyama // Create a new version definition and add that to the global symbols. 
15173837f427SRui Ueyama VersionDefinition ver; 15183837f427SRui Ueyama ver.name = verStr; 151900809c88SFangrui Song ver.nonLocalPatterns = std::move(globals); 152000809c88SFangrui Song ver.localPatterns = std::move(locals); 1521e28a70daSFangrui Song ver.id = config->versionDefinitions.size(); 15223837f427SRui Ueyama config->versionDefinitions.push_back(ver); 15232ec34544SRui Ueyama 15242ec34544SRui Ueyama // Each version may have a parent version. For example, "Ver2" 15252ec34544SRui Ueyama // defined as "Ver2 { global: foo; local: *; } Ver1;" has "Ver1" 15262ec34544SRui Ueyama // as a parent. This version hierarchy is, probably against your 15272ec34544SRui Ueyama // instinct, purely for hint; the runtime doesn't care about it 15282ec34544SRui Ueyama // at all. In LLD, we simply ignore it. 15295f380403SFangrui Song if (next() != ";") 15302ec34544SRui Ueyama expect(";"); 15312ec34544SRui Ueyama } 15322ec34544SRui Ueyama 153349279ca1SFangrui Song bool elf::hasWildcard(StringRef s) { 15343837f427SRui Ueyama return s.find_first_of("?*[") != StringRef::npos; 15351e77ad14SRui Ueyama } 15361e77ad14SRui Ueyama 15372ec34544SRui Ueyama // Reads a list of symbols, e.g. "{ global: foo; bar; local: *; };". 
1538*64038ef8SFangrui Song std::pair<SmallVector<SymbolVersion, 0>, SmallVector<SymbolVersion, 0>> 15392ec34544SRui Ueyama ScriptParser::readSymbols() { 1540*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> locals; 1541*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> globals; 1542*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> *v = &globals; 15432ec34544SRui Ueyama 1544b8a59c8aSBob Haarman while (!errorCount()) { 15452ec34544SRui Ueyama if (consume("}")) 15462ec34544SRui Ueyama break; 15472ec34544SRui Ueyama if (consumeLabel("local")) { 15483837f427SRui Ueyama v = &locals; 15492ec34544SRui Ueyama continue; 15502ec34544SRui Ueyama } 15512ec34544SRui Ueyama if (consumeLabel("global")) { 15523837f427SRui Ueyama v = &globals; 15532ec34544SRui Ueyama continue; 15542ec34544SRui Ueyama } 15552ec34544SRui Ueyama 15562ec34544SRui Ueyama if (consume("extern")) { 1557*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> ext = readVersionExtern(); 15583837f427SRui Ueyama v->insert(v->end(), ext.begin(), ext.end()); 15592ec34544SRui Ueyama } else { 15603837f427SRui Ueyama StringRef tok = next(); 15613837f427SRui Ueyama v->push_back({unquote(tok), false, hasWildcard(tok)}); 15622ec34544SRui Ueyama } 15632ec34544SRui Ueyama expect(";"); 15642ec34544SRui Ueyama } 15653837f427SRui Ueyama return {locals, globals}; 15662ec34544SRui Ueyama } 15672ec34544SRui Ueyama 15682ec34544SRui Ueyama // Reads an "extern C++" directive, e.g., 15692ec34544SRui Ueyama // "extern "C++" { ns::*; "f(int, double)"; };" 157017324d8bSRui Ueyama // 157117324d8bSRui Ueyama // The last semicolon is optional. E.g. 
this is OK: 157217324d8bSRui Ueyama // "extern "C++" { ns::*; "f(int, double)" };" 1573*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> ScriptParser::readVersionExtern() { 15743837f427SRui Ueyama StringRef tok = next(); 15753837f427SRui Ueyama bool isCXX = tok == "\"C++\""; 15763837f427SRui Ueyama if (!isCXX && tok != "\"C\"") 15772ec34544SRui Ueyama setError("Unknown language"); 15782ec34544SRui Ueyama expect("{"); 15792ec34544SRui Ueyama 1580*64038ef8SFangrui Song SmallVector<SymbolVersion, 0> ret; 1581b8a59c8aSBob Haarman while (!errorCount() && peek() != "}") { 15823837f427SRui Ueyama StringRef tok = next(); 15833837f427SRui Ueyama ret.push_back( 15843837f427SRui Ueyama {unquote(tok), isCXX, !tok.startswith("\"") && hasWildcard(tok)}); 158517324d8bSRui Ueyama if (consume("}")) 15863837f427SRui Ueyama return ret; 15872ec34544SRui Ueyama expect(";"); 15882ec34544SRui Ueyama } 15892ec34544SRui Ueyama 15902ec34544SRui Ueyama expect("}"); 15913837f427SRui Ueyama return ret; 15922ec34544SRui Ueyama } 15932ec34544SRui Ueyama 159492b5b980SFangrui Song Expr ScriptParser::readMemoryAssignment(StringRef s1, StringRef s2, 15953837f427SRui Ueyama StringRef s3) { 15963837f427SRui Ueyama if (!consume(s1) && !consume(s2) && !consume(s3)) { 15973837f427SRui Ueyama setError("expected one of: " + s1 + ", " + s2 + ", or " + s3); 159892b5b980SFangrui Song return [] { return 0; }; 15992ec34544SRui Ueyama } 16002ec34544SRui Ueyama expect("="); 160192b5b980SFangrui Song return readExpr(); 16022ec34544SRui Ueyama } 16032ec34544SRui Ueyama 16042ec34544SRui Ueyama // Parse the MEMORY command as specified in: 16052ec34544SRui Ueyama // https://sourceware.org/binutils/docs/ld/MEMORY.html 16062ec34544SRui Ueyama // 16072ec34544SRui Ueyama // MEMORY { name [(attr)] : ORIGIN = origin, LENGTH = len ... 
} 16082ec34544SRui Ueyama void ScriptParser::readMemory() { 16092ec34544SRui Ueyama expect("{"); 1610b8a59c8aSBob Haarman while (!errorCount() && !consume("}")) { 16113837f427SRui Ueyama StringRef tok = next(); 16123837f427SRui Ueyama if (tok == "INCLUDE") { 16132e9d40d5SRui Ueyama readInclude(); 16142e9d40d5SRui Ueyama continue; 16152e9d40d5SRui Ueyama } 16162ec34544SRui Ueyama 16173837f427SRui Ueyama uint32_t flags = 0; 16188cdf1c1eSIgor Kudrin uint32_t invFlags = 0; 16193837f427SRui Ueyama uint32_t negFlags = 0; 16208cdf1c1eSIgor Kudrin uint32_t negInvFlags = 0; 16212ec34544SRui Ueyama if (consume("(")) { 16228cdf1c1eSIgor Kudrin readMemoryAttributes(flags, invFlags, negFlags, negInvFlags); 16232ec34544SRui Ueyama expect(")"); 16242ec34544SRui Ueyama } 16252ec34544SRui Ueyama expect(":"); 16262ec34544SRui Ueyama 162792b5b980SFangrui Song Expr origin = readMemoryAssignment("ORIGIN", "org", "o"); 16282ec34544SRui Ueyama expect(","); 162992b5b980SFangrui Song Expr length = readMemoryAssignment("LENGTH", "len", "l"); 16302ec34544SRui Ueyama 16315f37541cSGeorge Rimar // Add the memory region to the region map. 16328cdf1c1eSIgor Kudrin MemoryRegion *mr = make<MemoryRegion>(tok, origin, length, flags, invFlags, 16338cdf1c1eSIgor Kudrin negFlags, negInvFlags); 16343837f427SRui Ueyama if (!script->memoryRegions.insert({tok, mr}).second) 16353837f427SRui Ueyama setError("region '" + tok + "' already defined"); 16362ec34544SRui Ueyama } 16372ec34544SRui Ueyama } 16382ec34544SRui Ueyama 16392ec34544SRui Ueyama // This function parses the attributes used to match against section 16402ec34544SRui Ueyama // flags when placing output sections in a memory region. These flags 16412ec34544SRui Ueyama // are only used when an explicit memory region name is not used. 
16428cdf1c1eSIgor Kudrin void ScriptParser::readMemoryAttributes(uint32_t &flags, uint32_t &invFlags, 16438cdf1c1eSIgor Kudrin uint32_t &negFlags, 16448cdf1c1eSIgor Kudrin uint32_t &negInvFlags) { 16453837f427SRui Ueyama bool invert = false; 16462ec34544SRui Ueyama 16473837f427SRui Ueyama for (char c : next().lower()) { 16488cdf1c1eSIgor Kudrin if (c == '!') { 16493837f427SRui Ueyama invert = !invert; 16508cdf1c1eSIgor Kudrin std::swap(flags, negFlags); 16518cdf1c1eSIgor Kudrin std::swap(invFlags, negInvFlags); 16528cdf1c1eSIgor Kudrin continue; 16532ec34544SRui Ueyama } 16548cdf1c1eSIgor Kudrin if (c == 'w') 16558cdf1c1eSIgor Kudrin flags |= SHF_WRITE; 16568cdf1c1eSIgor Kudrin else if (c == 'x') 16578cdf1c1eSIgor Kudrin flags |= SHF_EXECINSTR; 16588cdf1c1eSIgor Kudrin else if (c == 'a') 16598cdf1c1eSIgor Kudrin flags |= SHF_ALLOC; 16608cdf1c1eSIgor Kudrin else if (c == 'r') 16618cdf1c1eSIgor Kudrin invFlags |= SHF_WRITE; 16628cdf1c1eSIgor Kudrin else 16638cdf1c1eSIgor Kudrin setError("invalid memory region attribute"); 16648cdf1c1eSIgor Kudrin } 16658cdf1c1eSIgor Kudrin 16668cdf1c1eSIgor Kudrin if (invert) { 16678cdf1c1eSIgor Kudrin std::swap(flags, negFlags); 16688cdf1c1eSIgor Kudrin std::swap(invFlags, negInvFlags); 16698cdf1c1eSIgor Kudrin } 16702ec34544SRui Ueyama } 16712ec34544SRui Ueyama 167207837b8fSFangrui Song void elf::readLinkerScript(MemoryBufferRef mb) { 1673439341b9SJames Henderson llvm::TimeTraceScope timeScope("Read linker script", 1674439341b9SJames Henderson mb.getBufferIdentifier()); 16753837f427SRui Ueyama ScriptParser(mb).readLinkerScript(); 16762ec34544SRui Ueyama } 16772ec34544SRui Ueyama 167807837b8fSFangrui Song void elf::readVersionScript(MemoryBufferRef mb) { 1679439341b9SJames Henderson llvm::TimeTraceScope timeScope("Read version script", 1680439341b9SJames Henderson mb.getBufferIdentifier()); 16813837f427SRui Ueyama ScriptParser(mb).readVersionScript(); 16822ec34544SRui Ueyama } 16832ec34544SRui Ueyama 168407837b8fSFangrui Song void 
elf::readDynamicList(MemoryBufferRef mb) { 1685439341b9SJames Henderson llvm::TimeTraceScope timeScope("Read dynamic list", mb.getBufferIdentifier()); 168607837b8fSFangrui Song ScriptParser(mb).readDynamicList(); 16878c7e8cceSPetr Hosek } 1688bd8cfe65SFangrui Song 168907837b8fSFangrui Song void elf::readDefsym(StringRef name, MemoryBufferRef mb) { 1690439341b9SJames Henderson llvm::TimeTraceScope timeScope("Read defsym input", name); 169107837b8fSFangrui Song ScriptParser(mb).readDefsym(name); 169207837b8fSFangrui Song } 1693