1 //===- Driver.cpp ---------------------------------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 9 #include "Driver.h" 10 #include "Config.h" 11 #include "ICF.h" 12 #include "InputFiles.h" 13 #include "LTO.h" 14 #include "MarkLive.h" 15 #include "ObjC.h" 16 #include "OutputSection.h" 17 #include "OutputSegment.h" 18 #include "SectionPriorities.h" 19 #include "SymbolTable.h" 20 #include "Symbols.h" 21 #include "SyntheticSections.h" 22 #include "Target.h" 23 #include "UnwindInfoSection.h" 24 #include "Writer.h" 25 26 #include "lld/Common/Args.h" 27 #include "lld/Common/Driver.h" 28 #include "lld/Common/ErrorHandler.h" 29 #include "lld/Common/LLVM.h" 30 #include "lld/Common/Memory.h" 31 #include "lld/Common/Reproduce.h" 32 #include "lld/Common/Version.h" 33 #include "llvm/ADT/DenseSet.h" 34 #include "llvm/ADT/StringExtras.h" 35 #include "llvm/ADT/StringRef.h" 36 #include "llvm/BinaryFormat/MachO.h" 37 #include "llvm/BinaryFormat/Magic.h" 38 #include "llvm/Config/llvm-config.h" 39 #include "llvm/LTO/LTO.h" 40 #include "llvm/Object/Archive.h" 41 #include "llvm/Option/ArgList.h" 42 #include "llvm/Support/CommandLine.h" 43 #include "llvm/Support/FileSystem.h" 44 #include "llvm/Support/Host.h" 45 #include "llvm/Support/MemoryBuffer.h" 46 #include "llvm/Support/Parallel.h" 47 #include "llvm/Support/Path.h" 48 #include "llvm/Support/TarWriter.h" 49 #include "llvm/Support/TargetSelect.h" 50 #include "llvm/Support/TimeProfiler.h" 51 #include "llvm/TextAPI/PackedVersion.h" 52 53 #include <algorithm> 54 55 using namespace llvm; 56 using namespace llvm::MachO; 57 using namespace llvm::object; 58 using namespace llvm::opt; 59 using namespace llvm::sys; 60 using namespace lld; 61 using namespace lld::macho; 62 63 std::unique_ptr<Configuration> macho::config; 64 std::unique_ptr<DependencyTracker> macho::depTracker; 65 66 static HeaderFileType getOutputType(const InputArgList &args) { 67 // TODO: -r, -dylinker, -preload... 68 Arg *outputArg = args.getLastArg(OPT_bundle, OPT_dylib, OPT_execute); 69 if (outputArg == nullptr) 70 return MH_EXECUTE; 71 72 switch (outputArg->getOption().getID()) { 73 case OPT_bundle: 74 return MH_BUNDLE; 75 case OPT_dylib: 76 return MH_DYLIB; 77 case OPT_execute: 78 return MH_EXECUTE; 79 default: 80 llvm_unreachable("internal error"); 81 } 82 } 83 84 static DenseMap<CachedHashStringRef, StringRef> resolvedLibraries; 85 static Optional<StringRef> findLibrary(StringRef name) { 86 CachedHashStringRef key(name); 87 auto entry = resolvedLibraries.find(key); 88 if (entry != resolvedLibraries.end()) 89 return entry->second; 90 91 auto doFind = [&] { 92 if (config->searchDylibsFirst) { 93 if (Optional<StringRef> path = findPathCombination( 94 "lib" + name, config->librarySearchPaths, {".tbd", ".dylib"})) 95 return path; 96 return findPathCombination("lib" + name, config->librarySearchPaths, 97 {".a"}); 98 } 99 return findPathCombination("lib" + name, config->librarySearchPaths, 100 {".tbd", ".dylib", ".a"}); 101 }; 102 103 Optional<StringRef> path = doFind(); 104 if (path) 105 resolvedLibraries[key] = *path; 106 107 return path; 108 } 109 110 static DenseMap<CachedHashStringRef, StringRef> resolvedFrameworks; 111 static Optional<StringRef> findFramework(StringRef name) { 112 CachedHashStringRef key(name); 113 auto entry = resolvedFrameworks.find(key); 114 if (entry != resolvedFrameworks.end()) 115 return entry->second; 116 117 SmallString<260> symlink; 118 StringRef suffix; 119 std::tie(name, suffix) = name.split(","); 120 for (StringRef dir : config->frameworkSearchPaths) { 121 symlink = dir; 122 path::append(symlink, name + ".framework", name); 123 124 if (!suffix.empty()) { 125 // NOTE: we must resolve the symlink before trying the suffixes, because 126 // there are no symlinks for the suffixed paths. 127 SmallString<260> location; 128 if (!fs::real_path(symlink, location)) { 129 // only append suffix if realpath() succeeds 130 Twine suffixed = location + suffix; 131 if (fs::exists(suffixed)) 132 return resolvedFrameworks[key] = saver().save(suffixed.str()); 133 } 134 // Suffix lookup failed, fall through to the no-suffix case. 135 } 136 137 if (Optional<StringRef> path = resolveDylibPath(symlink.str())) 138 return resolvedFrameworks[key] = *path; 139 } 140 return {}; 141 } 142 143 static bool warnIfNotDirectory(StringRef option, StringRef path) { 144 if (!fs::exists(path)) { 145 warn("directory not found for option -" + option + path); 146 return false; 147 } else if (!fs::is_directory(path)) { 148 warn("option -" + option + path + " references a non-directory path"); 149 return false; 150 } 151 return true; 152 } 153 154 static std::vector<StringRef> 155 getSearchPaths(unsigned optionCode, InputArgList &args, 156 const std::vector<StringRef> &roots, 157 const SmallVector<StringRef, 2> &systemPaths) { 158 std::vector<StringRef> paths; 159 StringRef optionLetter{optionCode == OPT_F ? "F" : "L"}; 160 for (StringRef path : args::getStrings(args, optionCode)) { 161 // NOTE: only absolute paths are re-rooted to syslibroot(s) 162 bool found = false; 163 if (path::is_absolute(path, path::Style::posix)) { 164 for (StringRef root : roots) { 165 SmallString<261> buffer(root); 166 path::append(buffer, path); 167 // Do not warn about paths that are computed via the syslib roots 168 if (fs::is_directory(buffer)) { 169 paths.push_back(saver().save(buffer.str())); 170 found = true; 171 } 172 } 173 } 174 if (!found && warnIfNotDirectory(optionLetter, path)) 175 paths.push_back(path); 176 } 177 178 // `-Z` suppresses the standard "system" search paths. 179 if (args.hasArg(OPT_Z)) 180 return paths; 181 182 for (const StringRef &path : systemPaths) { 183 for (const StringRef &root : roots) { 184 SmallString<261> buffer(root); 185 path::append(buffer, path); 186 if (fs::is_directory(buffer)) 187 paths.push_back(saver().save(buffer.str())); 188 } 189 } 190 return paths; 191 } 192 193 static std::vector<StringRef> getSystemLibraryRoots(InputArgList &args) { 194 std::vector<StringRef> roots; 195 for (const Arg *arg : args.filtered(OPT_syslibroot)) 196 roots.push_back(arg->getValue()); 197 // NOTE: the final `-syslibroot` being `/` will ignore all roots 198 if (!roots.empty() && roots.back() == "/") 199 roots.clear(); 200 // NOTE: roots can never be empty - add an empty root to simplify the library 201 // and framework search path computation. 202 if (roots.empty()) 203 roots.emplace_back(""); 204 return roots; 205 } 206 207 static std::vector<StringRef> 208 getLibrarySearchPaths(InputArgList &args, const std::vector<StringRef> &roots) { 209 return getSearchPaths(OPT_L, args, roots, {"/usr/lib", "/usr/local/lib"}); 210 } 211 212 static std::vector<StringRef> 213 getFrameworkSearchPaths(InputArgList &args, 214 const std::vector<StringRef> &roots) { 215 return getSearchPaths(OPT_F, args, roots, 216 {"/Library/Frameworks", "/System/Library/Frameworks"}); 217 } 218 219 static llvm::CachePruningPolicy getLTOCachePolicy(InputArgList &args) { 220 SmallString<128> ltoPolicy; 221 auto add = [<oPolicy](Twine val) { 222 if (!ltoPolicy.empty()) 223 ltoPolicy += ":"; 224 val.toVector(ltoPolicy); 225 }; 226 for (const Arg *arg : 227 args.filtered(OPT_thinlto_cache_policy, OPT_prune_interval_lto, 228 OPT_prune_after_lto, OPT_max_relative_cache_size_lto)) { 229 switch (arg->getOption().getID()) { 230 case OPT_thinlto_cache_policy: 231 add(arg->getValue()); 232 break; 233 case OPT_prune_interval_lto: 234 if (!strcmp("-1", arg->getValue())) 235 add("prune_interval=87600h"); // 10 years 236 else 237 add(Twine("prune_interval=") + arg->getValue() + "s"); 238 break; 239 case OPT_prune_after_lto: 240 add(Twine("prune_after=") + arg->getValue() + "s"); 241 break; 242 case OPT_max_relative_cache_size_lto: 243 add(Twine("cache_size=") + arg->getValue() + "%"); 244 break; 245 } 246 } 247 return CHECK(parseCachePruningPolicy(ltoPolicy), "invalid LTO cache policy"); 248 } 249 250 static DenseMap<StringRef, ArchiveFile *> loadedArchives; 251 252 static InputFile *addFile(StringRef path, ForceLoad forceLoadArchive, 253 bool isLazy = false, bool isExplicit = true, 254 bool isBundleLoader = false) { 255 Optional<MemoryBufferRef> buffer = readFile(path); 256 if (!buffer) 257 return nullptr; 258 MemoryBufferRef mbref = *buffer; 259 InputFile *newFile = nullptr; 260 261 file_magic magic = identify_magic(mbref.getBuffer()); 262 switch (magic) { 263 case file_magic::archive: { 264 // Avoid loading archives twice. If the archives are being force-loaded, 265 // loading them twice would create duplicate symbol errors. In the 266 // non-force-loading case, this is just a minor performance optimization. 267 // We don't take a reference to cachedFile here because the 268 // loadArchiveMember() call below may recursively call addFile() and 269 // invalidate this reference. 270 auto entry = loadedArchives.find(path); 271 if (entry != loadedArchives.end()) 272 return entry->second; 273 274 std::unique_ptr<object::Archive> archive = CHECK( 275 object::Archive::create(mbref), path + ": failed to parse archive"); 276 277 if (!archive->isEmpty() && !archive->hasSymbolTable()) 278 error(path + ": archive has no index; run ranlib to add one"); 279 280 auto *file = make<ArchiveFile>(std::move(archive)); 281 if ((forceLoadArchive == ForceLoad::Default && config->allLoad) || 282 forceLoadArchive == ForceLoad::Yes) { 283 if (Optional<MemoryBufferRef> buffer = readFile(path)) { 284 Error e = Error::success(); 285 for (const object::Archive::Child &c : file->getArchive().children(e)) { 286 StringRef reason = 287 forceLoadArchive == ForceLoad::Yes ? "-force_load" : "-all_load"; 288 if (Error e = file->fetch(c, reason)) 289 error(toString(file) + ": " + reason + 290 " failed to load archive member: " + toString(std::move(e))); 291 } 292 if (e) 293 error(toString(file) + 294 ": Archive::children failed: " + toString(std::move(e))); 295 } 296 } else if (forceLoadArchive == ForceLoad::Default && 297 config->forceLoadObjC) { 298 for (const object::Archive::Symbol &sym : file->getArchive().symbols()) 299 if (sym.getName().startswith(objc::klass)) 300 file->fetch(sym); 301 302 // TODO: no need to look for ObjC sections for a given archive member if 303 // we already found that it contains an ObjC symbol. 304 if (Optional<MemoryBufferRef> buffer = readFile(path)) { 305 Error e = Error::success(); 306 for (const object::Archive::Child &c : file->getArchive().children(e)) { 307 Expected<MemoryBufferRef> mb = c.getMemoryBufferRef(); 308 if (!mb || !hasObjCSection(*mb)) 309 continue; 310 if (Error e = file->fetch(c, "-ObjC")) 311 error(toString(file) + ": -ObjC failed to load archive member: " + 312 toString(std::move(e))); 313 } 314 if (e) 315 error(toString(file) + 316 ": Archive::children failed: " + toString(std::move(e))); 317 } 318 } 319 320 file->addLazySymbols(); 321 newFile = loadedArchives[path] = file; 322 break; 323 } 324 case file_magic::macho_object: 325 newFile = make<ObjFile>(mbref, getModTime(path), "", isLazy); 326 break; 327 case file_magic::macho_dynamically_linked_shared_lib: 328 case file_magic::macho_dynamically_linked_shared_lib_stub: 329 case file_magic::tapi_file: 330 if (DylibFile *dylibFile = 331 loadDylib(mbref, nullptr, /*isBundleLoader=*/false, isExplicit)) 332 newFile = dylibFile; 333 break; 334 case file_magic::bitcode: 335 newFile = make<BitcodeFile>(mbref, "", 0, isLazy); 336 break; 337 case file_magic::macho_executable: 338 case file_magic::macho_bundle: 339 // We only allow executable and bundle type here if it is used 340 // as a bundle loader. 341 if (!isBundleLoader) 342 error(path + ": unhandled file type"); 343 if (DylibFile *dylibFile = loadDylib(mbref, nullptr, isBundleLoader)) 344 newFile = dylibFile; 345 break; 346 default: 347 error(path + ": unhandled file type"); 348 } 349 if (newFile && !isa<DylibFile>(newFile)) { 350 if ((isa<ObjFile>(newFile) || isa<BitcodeFile>(newFile)) && newFile->lazy && 351 config->forceLoadObjC) { 352 for (Symbol *sym : newFile->symbols) 353 if (sym && sym->getName().startswith(objc::klass)) { 354 extract(*newFile, "-ObjC"); 355 break; 356 } 357 if (newFile->lazy && hasObjCSection(mbref)) 358 extract(*newFile, "-ObjC"); 359 } 360 361 // printArchiveMemberLoad() prints both .a and .o names, so no need to 362 // print the .a name here. Similarly skip lazy files. 363 if (config->printEachFile && magic != file_magic::archive && !isLazy) 364 message(toString(newFile)); 365 inputFiles.insert(newFile); 366 } 367 return newFile; 368 } 369 370 static void addLibrary(StringRef name, bool isNeeded, bool isWeak, 371 bool isReexport, bool isExplicit, 372 ForceLoad forceLoadArchive) { 373 if (Optional<StringRef> path = findLibrary(name)) { 374 if (auto *dylibFile = dyn_cast_or_null<DylibFile>( 375 addFile(*path, forceLoadArchive, /*isLazy=*/false, isExplicit))) { 376 if (isNeeded) 377 dylibFile->forceNeeded = true; 378 if (isWeak) 379 dylibFile->forceWeakImport = true; 380 if (isReexport) { 381 config->hasReexports = true; 382 dylibFile->reexport = true; 383 } 384 } 385 return; 386 } 387 error("library not found for -l" + name); 388 } 389 390 static DenseSet<StringRef> loadedObjectFrameworks; 391 static void addFramework(StringRef name, bool isNeeded, bool isWeak, 392 bool isReexport, bool isExplicit, 393 ForceLoad forceLoadArchive) { 394 if (Optional<StringRef> path = findFramework(name)) { 395 if (loadedObjectFrameworks.contains(*path)) 396 return; 397 398 InputFile *file = 399 addFile(*path, forceLoadArchive, /*isLazy=*/false, isExplicit); 400 if (auto *dylibFile = dyn_cast_or_null<DylibFile>(file)) { 401 if (isNeeded) 402 dylibFile->forceNeeded = true; 403 if (isWeak) 404 dylibFile->forceWeakImport = true; 405 if (isReexport) { 406 config->hasReexports = true; 407 dylibFile->reexport = true; 408 } 409 } else if (isa_and_nonnull<ObjFile>(file) || 410 isa_and_nonnull<BitcodeFile>(file)) { 411 // Cache frameworks containing object or bitcode files to avoid duplicate 412 // symbols. Frameworks containing static archives are cached separately 413 // in addFile() to share caching with libraries, and frameworks 414 // containing dylibs should allow overwriting of attributes such as 415 // forceNeeded by subsequent loads 416 loadedObjectFrameworks.insert(*path); 417 } 418 return; 419 } 420 error("framework not found for -framework " + name); 421 } 422 423 // Parses LC_LINKER_OPTION contents, which can add additional command line 424 // flags. This directly parses the flags instead of using the standard argument 425 // parser to improve performance. 426 void macho::parseLCLinkerOption(InputFile *f, unsigned argc, StringRef data) { 427 SmallVector<StringRef, 4> argv; 428 size_t offset = 0; 429 for (unsigned i = 0; i < argc && offset < data.size(); ++i) { 430 argv.push_back(data.data() + offset); 431 offset += strlen(data.data() + offset) + 1; 432 } 433 if (argv.size() != argc || offset > data.size()) 434 fatal(toString(f) + ": invalid LC_LINKER_OPTION"); 435 436 unsigned i = 0; 437 StringRef arg = argv[i]; 438 if (arg.consume_front("-l")) { 439 ForceLoad forceLoadArchive = 440 config->forceLoadSwift && arg.startswith("swift") ? ForceLoad::Yes 441 : ForceLoad::No; 442 addLibrary(arg, /*isNeeded=*/false, /*isWeak=*/false, 443 /*isReexport=*/false, /*isExplicit=*/false, forceLoadArchive); 444 } else if (arg == "-framework") { 445 StringRef name = argv[++i]; 446 addFramework(name, /*isNeeded=*/false, /*isWeak=*/false, 447 /*isReexport=*/false, /*isExplicit=*/false, ForceLoad::No); 448 } else { 449 error(arg + " is not allowed in LC_LINKER_OPTION"); 450 } 451 } 452 453 static void addFileList(StringRef path, bool isLazy) { 454 Optional<MemoryBufferRef> buffer = readFile(path); 455 if (!buffer) 456 return; 457 MemoryBufferRef mbref = *buffer; 458 for (StringRef path : args::getLines(mbref)) 459 addFile(rerootPath(path), ForceLoad::Default, isLazy); 460 } 461 462 // We expect sub-library names of the form "libfoo", which will match a dylib 463 // with a path of .*/libfoo.{dylib, tbd}. 464 // XXX ld64 seems to ignore the extension entirely when matching sub-libraries; 465 // I'm not sure what the use case for that is. 466 static bool markReexport(StringRef searchName, ArrayRef<StringRef> extensions) { 467 for (InputFile *file : inputFiles) { 468 if (auto *dylibFile = dyn_cast<DylibFile>(file)) { 469 StringRef filename = path::filename(dylibFile->getName()); 470 if (filename.consume_front(searchName) && 471 (filename.empty() || 472 find(extensions, filename) != extensions.end())) { 473 dylibFile->reexport = true; 474 return true; 475 } 476 } 477 } 478 return false; 479 } 480 481 // This function is called on startup. We need this for LTO since 482 // LTO calls LLVM functions to compile bitcode files to native code. 483 // Technically this can be delayed until we read bitcode files, but 484 // we don't bother to do lazily because the initialization is fast. 485 static void initLLVM() { 486 InitializeAllTargets(); 487 InitializeAllTargetMCs(); 488 InitializeAllAsmPrinters(); 489 InitializeAllAsmParsers(); 490 } 491 492 static void compileBitcodeFiles() { 493 TimeTraceScope timeScope("LTO"); 494 auto *lto = make<BitcodeCompiler>(); 495 for (InputFile *file : inputFiles) 496 if (auto *bitcodeFile = dyn_cast<BitcodeFile>(file)) 497 if (!file->lazy) 498 lto->add(*bitcodeFile); 499 500 for (ObjFile *file : lto->compile()) 501 inputFiles.insert(file); 502 } 503 504 // Replaces common symbols with defined symbols residing in __common sections. 505 // This function must be called after all symbol names are resolved (i.e. after 506 // all InputFiles have been loaded.) As a result, later operations won't see 507 // any CommonSymbols. 508 static void replaceCommonSymbols() { 509 TimeTraceScope timeScope("Replace common symbols"); 510 ConcatOutputSection *osec = nullptr; 511 for (Symbol *sym : symtab->getSymbols()) { 512 auto *common = dyn_cast<CommonSymbol>(sym); 513 if (common == nullptr) 514 continue; 515 516 // Casting to size_t will truncate large values on 32-bit architectures, 517 // but it's not really worth supporting the linking of 64-bit programs on 518 // 32-bit archs. 519 ArrayRef<uint8_t> data = {nullptr, static_cast<size_t>(common->size)}; 520 // FIXME avoid creating one Section per symbol? 521 auto *section = 522 make<Section>(common->getFile(), segment_names::data, 523 section_names::common, S_ZEROFILL, /*addr=*/0); 524 auto *isec = make<ConcatInputSection>(*section, data, common->align); 525 if (!osec) 526 osec = ConcatOutputSection::getOrCreateForInput(isec); 527 isec->parent = osec; 528 inputSections.push_back(isec); 529 530 // FIXME: CommonSymbol should store isReferencedDynamically, noDeadStrip 531 // and pass them on here. 532 replaceSymbol<Defined>( 533 sym, sym->getName(), common->getFile(), isec, /*value=*/0, /*size=*/0, 534 /*isWeakDef=*/false, /*isExternal=*/true, common->privateExtern, 535 /*includeInSymtab=*/true, /*isThumb=*/false, 536 /*isReferencedDynamically=*/false, /*noDeadStrip=*/false); 537 } 538 } 539 540 static void initializeSectionRenameMap() { 541 if (config->dataConst) { 542 SmallVector<StringRef> v{section_names::got, 543 section_names::authGot, 544 section_names::authPtr, 545 section_names::nonLazySymbolPtr, 546 section_names::const_, 547 section_names::cfString, 548 section_names::moduleInitFunc, 549 section_names::moduleTermFunc, 550 section_names::objcClassList, 551 section_names::objcNonLazyClassList, 552 section_names::objcCatList, 553 section_names::objcNonLazyCatList, 554 section_names::objcProtoList, 555 section_names::objcImageInfo}; 556 for (StringRef s : v) 557 config->sectionRenameMap[{segment_names::data, s}] = { 558 segment_names::dataConst, s}; 559 } 560 config->sectionRenameMap[{segment_names::text, section_names::staticInit}] = { 561 segment_names::text, section_names::text}; 562 config->sectionRenameMap[{segment_names::import, section_names::pointers}] = { 563 config->dataConst ? segment_names::dataConst : segment_names::data, 564 section_names::nonLazySymbolPtr}; 565 } 566 567 static inline char toLowerDash(char x) { 568 if (x >= 'A' && x <= 'Z') 569 return x - 'A' + 'a'; 570 else if (x == ' ') 571 return '-'; 572 return x; 573 } 574 575 static std::string lowerDash(StringRef s) { 576 return std::string(map_iterator(s.begin(), toLowerDash), 577 map_iterator(s.end(), toLowerDash)); 578 } 579 580 struct PlatformVersion { 581 PlatformType platform = PLATFORM_UNKNOWN; 582 llvm::VersionTuple minimum; 583 llvm::VersionTuple sdk; 584 }; 585 586 static PlatformVersion parsePlatformVersion(const Arg *arg) { 587 assert(arg->getOption().getID() == OPT_platform_version); 588 StringRef platformStr = arg->getValue(0); 589 StringRef minVersionStr = arg->getValue(1); 590 StringRef sdkVersionStr = arg->getValue(2); 591 592 PlatformVersion platformVersion; 593 594 // TODO(compnerd) see if we can generate this case list via XMACROS 595 platformVersion.platform = 596 StringSwitch<PlatformType>(lowerDash(platformStr)) 597 .Cases("macos", "1", PLATFORM_MACOS) 598 .Cases("ios", "2", PLATFORM_IOS) 599 .Cases("tvos", "3", PLATFORM_TVOS) 600 .Cases("watchos", "4", PLATFORM_WATCHOS) 601 .Cases("bridgeos", "5", PLATFORM_BRIDGEOS) 602 .Cases("mac-catalyst", "6", PLATFORM_MACCATALYST) 603 .Cases("ios-simulator", "7", PLATFORM_IOSSIMULATOR) 604 .Cases("tvos-simulator", "8", PLATFORM_TVOSSIMULATOR) 605 .Cases("watchos-simulator", "9", PLATFORM_WATCHOSSIMULATOR) 606 .Cases("driverkit", "10", PLATFORM_DRIVERKIT) 607 .Default(PLATFORM_UNKNOWN); 608 if (platformVersion.platform == PLATFORM_UNKNOWN) 609 error(Twine("malformed platform: ") + platformStr); 610 // TODO: check validity of version strings, which varies by platform 611 // NOTE: ld64 accepts version strings with 5 components 612 // llvm::VersionTuple accepts no more than 4 components 613 // Has Apple ever published version strings with 5 components? 614 if (platformVersion.minimum.tryParse(minVersionStr)) 615 error(Twine("malformed minimum version: ") + minVersionStr); 616 if (platformVersion.sdk.tryParse(sdkVersionStr)) 617 error(Twine("malformed sdk version: ") + sdkVersionStr); 618 return platformVersion; 619 } 620 621 // Has the side-effect of setting Config::platformInfo. 622 static PlatformType parsePlatformVersions(const ArgList &args) { 623 std::map<PlatformType, PlatformVersion> platformVersions; 624 const PlatformVersion *lastVersionInfo = nullptr; 625 for (const Arg *arg : args.filtered(OPT_platform_version)) { 626 PlatformVersion version = parsePlatformVersion(arg); 627 628 // For each platform, the last flag wins: 629 // `-platform_version macos 2 3 -platform_version macos 4 5` has the same 630 // effect as just passing `-platform_version macos 4 5`. 631 // FIXME: ld64 warns on multiple flags for one platform. Should we? 632 platformVersions[version.platform] = version; 633 lastVersionInfo = &platformVersions[version.platform]; 634 } 635 636 if (platformVersions.empty()) { 637 error("must specify -platform_version"); 638 return PLATFORM_UNKNOWN; 639 } 640 if (platformVersions.size() > 2) { 641 error("must specify -platform_version at most twice"); 642 return PLATFORM_UNKNOWN; 643 } 644 if (platformVersions.size() == 2) { 645 bool isZipperedCatalyst = platformVersions.count(PLATFORM_MACOS) && 646 platformVersions.count(PLATFORM_MACCATALYST); 647 648 if (!isZipperedCatalyst) { 649 error("lld supports writing zippered outputs only for " 650 "macos and mac-catalyst"); 651 } else if (config->outputType != MH_DYLIB && 652 config->outputType != MH_BUNDLE) { 653 error("writing zippered outputs only valid for -dylib and -bundle"); 654 } else { 655 config->platformInfo.minimum = platformVersions[PLATFORM_MACOS].minimum; 656 config->platformInfo.sdk = platformVersions[PLATFORM_MACOS].sdk; 657 config->secondaryPlatformInfo = PlatformInfo{}; 658 config->secondaryPlatformInfo->minimum = 659 platformVersions[PLATFORM_MACCATALYST].minimum; 660 config->secondaryPlatformInfo->sdk = 661 platformVersions[PLATFORM_MACCATALYST].sdk; 662 } 663 return PLATFORM_MACOS; 664 } 665 666 config->platformInfo.minimum = lastVersionInfo->minimum; 667 config->platformInfo.sdk = lastVersionInfo->sdk; 668 return lastVersionInfo->platform; 669 } 670 671 // Has the side-effect of setting Config::target. 672 static TargetInfo *createTargetInfo(InputArgList &args) { 673 StringRef archName = args.getLastArgValue(OPT_arch); 674 if (archName.empty()) { 675 error("must specify -arch"); 676 return nullptr; 677 } 678 679 PlatformType platform = parsePlatformVersions(args); 680 config->platformInfo.target = 681 MachO::Target(getArchitectureFromName(archName), platform); 682 if (config->secondaryPlatformInfo) { 683 config->secondaryPlatformInfo->target = 684 MachO::Target(getArchitectureFromName(archName), PLATFORM_MACCATALYST); 685 } 686 687 uint32_t cpuType; 688 uint32_t cpuSubtype; 689 std::tie(cpuType, cpuSubtype) = getCPUTypeFromArchitecture(config->arch()); 690 691 switch (cpuType) { 692 case CPU_TYPE_X86_64: 693 return createX86_64TargetInfo(); 694 case CPU_TYPE_ARM64: 695 return createARM64TargetInfo(); 696 case CPU_TYPE_ARM64_32: 697 return createARM64_32TargetInfo(); 698 case CPU_TYPE_ARM: 699 return createARMTargetInfo(cpuSubtype); 700 default: 701 error("missing or unsupported -arch " + archName); 702 return nullptr; 703 } 704 } 705 706 static UndefinedSymbolTreatment 707 getUndefinedSymbolTreatment(const ArgList &args) { 708 StringRef treatmentStr = args.getLastArgValue(OPT_undefined); 709 auto treatment = 710 StringSwitch<UndefinedSymbolTreatment>(treatmentStr) 711 .Cases("error", "", UndefinedSymbolTreatment::error) 712 .Case("warning", UndefinedSymbolTreatment::warning) 713 .Case("suppress", UndefinedSymbolTreatment::suppress) 714 .Case("dynamic_lookup", UndefinedSymbolTreatment::dynamic_lookup) 715 .Default(UndefinedSymbolTreatment::unknown); 716 if (treatment == UndefinedSymbolTreatment::unknown) { 717 warn(Twine("unknown -undefined TREATMENT '") + treatmentStr + 718 "', defaulting to 'error'"); 719 treatment = UndefinedSymbolTreatment::error; 720 } else if (config->namespaceKind == NamespaceKind::twolevel && 721 (treatment == UndefinedSymbolTreatment::warning || 722 treatment == UndefinedSymbolTreatment::suppress)) { 723 if (treatment == UndefinedSymbolTreatment::warning) 724 error("'-undefined warning' only valid with '-flat_namespace'"); 725 else 726 error("'-undefined suppress' only valid with '-flat_namespace'"); 727 treatment = UndefinedSymbolTreatment::error; 728 } 729 return treatment; 730 } 731 732 static ICFLevel getICFLevel(const ArgList &args) { 733 StringRef icfLevelStr = args.getLastArgValue(OPT_icf_eq); 734 auto icfLevel = StringSwitch<ICFLevel>(icfLevelStr) 735 .Cases("none", "", ICFLevel::none) 736 .Case("safe", ICFLevel::safe) 737 .Case("all", ICFLevel::all) 738 .Default(ICFLevel::unknown); 739 if (icfLevel == ICFLevel::unknown) { 740 warn(Twine("unknown --icf=OPTION `") + icfLevelStr + 741 "', defaulting to `none'"); 742 icfLevel = ICFLevel::none; 743 } 744 return icfLevel; 745 } 746 747 static void warnIfDeprecatedOption(const Option &opt) { 748 if (!opt.getGroup().isValid()) 749 return; 750 if (opt.getGroup().getID() == OPT_grp_deprecated) { 751 warn("Option `" + opt.getPrefixedName() + "' is deprecated in ld64:"); 752 warn(opt.getHelpText()); 753 } 754 } 755 756 static void warnIfUnimplementedOption(const Option &opt) { 757 if (!opt.getGroup().isValid() || !opt.hasFlag(DriverFlag::HelpHidden)) 758 return; 759 switch (opt.getGroup().getID()) { 760 case OPT_grp_deprecated: 761 // warn about deprecated options elsewhere 762 break; 763 case OPT_grp_undocumented: 764 warn("Option `" + opt.getPrefixedName() + 765 "' is undocumented. Should lld implement it?"); 766 break; 767 case OPT_grp_obsolete: 768 warn("Option `" + opt.getPrefixedName() + 769 "' is obsolete. Please modernize your usage."); 770 break; 771 case OPT_grp_ignored: 772 warn("Option `" + opt.getPrefixedName() + "' is ignored."); 773 break; 774 case OPT_grp_ignored_silently: 775 break; 776 default: 777 warn("Option `" + opt.getPrefixedName() + 778 "' is not yet implemented. Stay tuned..."); 779 break; 780 } 781 } 782 783 static const char *getReproduceOption(InputArgList &args) { 784 if (const Arg *arg = args.getLastArg(OPT_reproduce)) 785 return arg->getValue(); 786 return getenv("LLD_REPRODUCE"); 787 } 788 789 static void parseClangOption(StringRef opt, const Twine &msg) { 790 std::string err; 791 raw_string_ostream os(err); 792 793 const char *argv[] = {"lld", opt.data()}; 794 if (cl::ParseCommandLineOptions(2, argv, "", &os)) 795 return; 796 os.flush(); 797 error(msg + ": " + StringRef(err).trim()); 798 } 799 800 static uint32_t parseDylibVersion(const ArgList &args, unsigned id) { 801 const Arg *arg = args.getLastArg(id); 802 if (!arg) 803 return 0; 804 805 if (config->outputType != MH_DYLIB) { 806 error(arg->getAsString(args) + ": only valid with -dylib"); 807 return 0; 808 } 809 810 PackedVersion version; 811 if (!version.parse32(arg->getValue())) { 812 error(arg->getAsString(args) + ": malformed version"); 813 return 0; 814 } 815 816 return version.rawValue(); 817 } 818 819 static uint32_t parseProtection(StringRef protStr) { 820 uint32_t prot = 0; 821 for (char c : protStr) { 822 switch (c) { 823 case 'r': 824 prot |= VM_PROT_READ; 825 break; 826 case 'w': 827 prot |= VM_PROT_WRITE; 828 break; 829 case 'x': 830 prot |= VM_PROT_EXECUTE; 831 break; 832 case '-': 833 break; 834 default: 835 error("unknown -segprot letter '" + Twine(c) + "' in " + protStr); 836 return 0; 837 } 838 } 839 return prot; 840 } 841 842 static std::vector<SectionAlign> parseSectAlign(const opt::InputArgList &args) { 843 std::vector<SectionAlign> sectAligns; 844 for (const Arg *arg : args.filtered(OPT_sectalign)) { 845 StringRef segName = arg->getValue(0); 846 StringRef sectName = arg->getValue(1); 847 StringRef alignStr = arg->getValue(2); 848 if (alignStr.startswith("0x") || alignStr.startswith("0X")) 849 alignStr = alignStr.drop_front(2); 850 uint32_t align; 851 if (alignStr.getAsInteger(16, align)) { 852 error("-sectalign: failed to parse '" + StringRef(arg->getValue(2)) + 853 "' as number"); 854 continue; 855 } 856 if (!isPowerOf2_32(align)) { 857 error("-sectalign: '" + StringRef(arg->getValue(2)) + 858 "' (in base 16) not a power of two"); 859 continue; 860 } 861 sectAligns.push_back({segName, sectName, align}); 862 } 863 return sectAligns; 864 } 865 866 PlatformType macho::removeSimulator(PlatformType platform) { 867 switch (platform) { 868 case PLATFORM_IOSSIMULATOR: 869 return PLATFORM_IOS; 870 case PLATFORM_TVOSSIMULATOR: 871 return PLATFORM_TVOS; 872 case PLATFORM_WATCHOSSIMULATOR: 873 return PLATFORM_WATCHOS; 874 default: 875 return platform; 876 } 877 } 878 879 static bool dataConstDefault(const InputArgList &args) { 880 static const std::vector<std::pair<PlatformType, VersionTuple>> minVersion = { 881 {PLATFORM_MACOS, VersionTuple(10, 15)}, 882 {PLATFORM_IOS, VersionTuple(13, 0)}, 883 {PLATFORM_TVOS, VersionTuple(13, 0)}, 884 {PLATFORM_WATCHOS, VersionTuple(6, 0)}, 885 {PLATFORM_BRIDGEOS, VersionTuple(4, 0)}}; 886 PlatformType platform = removeSimulator(config->platformInfo.target.Platform); 887 auto it = llvm::find_if(minVersion, 888 [&](const auto &p) { return p.first == platform; }); 889 if (it != minVersion.end()) 890 if (config->platformInfo.minimum < it->second) 891 return false; 892 893 switch (config->outputType) { 894 case MH_EXECUTE: 895 return !args.hasArg(OPT_no_pie); 896 case MH_BUNDLE: 897 // FIXME: return false when -final_name ... 898 // has prefix "/System/Library/UserEventPlugins/" 899 // or matches "/usr/libexec/locationd" "/usr/libexec/terminusd" 900 return true; 901 case MH_DYLIB: 902 return true; 903 case MH_OBJECT: 904 return false; 905 default: 906 llvm_unreachable( 907 "unsupported output type for determining data-const default"); 908 } 909 return false; 910 } 911 912 void SymbolPatterns::clear() { 913 literals.clear(); 914 globs.clear(); 915 } 916 917 void SymbolPatterns::insert(StringRef symbolName) { 918 if (symbolName.find_first_of("*?[]") == StringRef::npos) 919 literals.insert(CachedHashStringRef(symbolName)); 920 else if (Expected<GlobPattern> pattern = GlobPattern::create(symbolName)) 921 globs.emplace_back(*pattern); 922 else 923 error("invalid symbol-name pattern: " + symbolName); 924 } 925 926 bool SymbolPatterns::matchLiteral(StringRef symbolName) const { 927 return literals.contains(CachedHashStringRef(symbolName)); 928 } 929 930 bool SymbolPatterns::matchGlob(StringRef symbolName) const { 931 for (const GlobPattern &glob : globs) 932 if (glob.match(symbolName)) 933 return true; 934 return false; 935 } 936 937 bool SymbolPatterns::match(StringRef symbolName) const { 938 return matchLiteral(symbolName) || matchGlob(symbolName); 939 } 940 941 static void parseSymbolPatternsFile(const Arg *arg, 942 SymbolPatterns &symbolPatterns) { 943 StringRef path = arg->getValue(); 944 Optional<MemoryBufferRef> buffer = readFile(path); 945 if (!buffer) { 946 error("Could not read symbol file: " + path); 947 return; 948 } 949 MemoryBufferRef mbref = *buffer; 950 for (StringRef line : args::getLines(mbref)) { 951 line = line.take_until([](char c) { return c == '#'; }).trim(); 952 if (!line.empty()) 953 symbolPatterns.insert(line); 954 } 955 } 956 957 static void handleSymbolPatterns(InputArgList &args, 958 SymbolPatterns &symbolPatterns, 959 unsigned singleOptionCode, 960 unsigned listFileOptionCode) { 961 for (const Arg *arg : args.filtered(singleOptionCode)) 962 symbolPatterns.insert(arg->getValue()); 963 for (const Arg *arg : args.filtered(listFileOptionCode)) 964 parseSymbolPatternsFile(arg, symbolPatterns); 965 } 966 967 static void createFiles(const InputArgList &args) { 968 TimeTraceScope timeScope("Load input files"); 969 // This loop should be reserved for options whose exact ordering matters. 970 // Other options should be handled via filtered() and/or getLastArg(). 971 bool isLazy = false; 972 for (const Arg *arg : args) { 973 const Option &opt = arg->getOption(); 974 warnIfDeprecatedOption(opt); 975 warnIfUnimplementedOption(opt); 976 977 switch (opt.getID()) { 978 case OPT_INPUT: 979 addFile(rerootPath(arg->getValue()), ForceLoad::Default, isLazy); 980 break; 981 case OPT_needed_library: 982 if (auto *dylibFile = dyn_cast_or_null<DylibFile>( 983 addFile(rerootPath(arg->getValue()), ForceLoad::Default))) 984 dylibFile->forceNeeded = true; 985 break; 986 case OPT_reexport_library: 987 if (auto *dylibFile = dyn_cast_or_null<DylibFile>( 988 addFile(rerootPath(arg->getValue()), ForceLoad::Default))) { 989 config->hasReexports = true; 990 dylibFile->reexport = true; 991 } 992 break; 993 case OPT_weak_library: 994 if (auto *dylibFile = dyn_cast_or_null<DylibFile>( 995 addFile(rerootPath(arg->getValue()), ForceLoad::Default))) 996 dylibFile->forceWeakImport = true; 997 break; 998 case OPT_filelist: 999 addFileList(arg->getValue(), isLazy); 1000 break; 1001 case OPT_force_load: 1002 addFile(rerootPath(arg->getValue()), ForceLoad::Yes); 1003 break; 1004 case OPT_l: 1005 case OPT_needed_l: 1006 case OPT_reexport_l: 1007 case OPT_weak_l: 1008 addLibrary(arg->getValue(), opt.getID() == OPT_needed_l, 1009 opt.getID() == OPT_weak_l, opt.getID() == OPT_reexport_l, 1010 /*isExplicit=*/true, ForceLoad::Default); 1011 break; 1012 case OPT_framework: 1013 case OPT_needed_framework: 1014 case OPT_reexport_framework: 1015 case OPT_weak_framework: 1016 addFramework(arg->getValue(), opt.getID() == OPT_needed_framework, 1017 opt.getID() == OPT_weak_framework, 1018 opt.getID() == OPT_reexport_framework, /*isExplicit=*/true, 1019 ForceLoad::Default); 1020 break; 1021 case OPT_start_lib: 1022 if (isLazy) 1023 error("nested --start-lib"); 1024 isLazy = true; 1025 break; 1026 case OPT_end_lib: 1027 if (!isLazy) 1028 error("stray --end-lib"); 1029 isLazy = false; 1030 break; 1031 default: 1032 break; 1033 } 1034 } 1035 } 1036 1037 static void gatherInputSections() { 1038 TimeTraceScope timeScope("Gathering input sections"); 1039 int inputOrder = 0; 1040 for (const InputFile *file : inputFiles) { 1041 for (const Section *section : file->sections) { 1042 // Compact unwind entries require special handling elsewhere. (In 1043 // contrast, EH frames are handled like regular ConcatInputSections.) 1044 if (section->name == section_names::compactUnwind) 1045 continue; 1046 ConcatOutputSection *osec = nullptr; 1047 for (const Subsection &subsection : section->subsections) { 1048 if (auto *isec = dyn_cast<ConcatInputSection>(subsection.isec)) { 1049 if (isec->isCoalescedWeak()) 1050 continue; 1051 isec->outSecOff = inputOrder++; 1052 if (!osec) 1053 osec = ConcatOutputSection::getOrCreateForInput(isec); 1054 isec->parent = osec; 1055 inputSections.push_back(isec); 1056 } else if (auto *isec = 1057 dyn_cast<CStringInputSection>(subsection.isec)) { 1058 if (in.cStringSection->inputOrder == UnspecifiedInputOrder) 1059 in.cStringSection->inputOrder = inputOrder++; 1060 in.cStringSection->addInput(isec); 1061 } else if (auto *isec = 1062 dyn_cast<WordLiteralInputSection>(subsection.isec)) { 1063 if (in.wordLiteralSection->inputOrder == UnspecifiedInputOrder) 1064 in.wordLiteralSection->inputOrder = inputOrder++; 1065 in.wordLiteralSection->addInput(isec); 1066 } else { 1067 llvm_unreachable("unexpected input section kind"); 1068 } 1069 } 1070 } 1071 } 1072 assert(inputOrder <= UnspecifiedInputOrder); 1073 } 1074 1075 static void foldIdenticalLiterals() { 1076 // We always create a cStringSection, regardless of whether dedupLiterals is 1077 // true. If it isn't, we simply create a non-deduplicating CStringSection. 1078 // Either way, we must unconditionally finalize it here. 1079 in.cStringSection->finalizeContents(); 1080 if (in.wordLiteralSection) 1081 in.wordLiteralSection->finalizeContents(); 1082 } 1083 1084 static void referenceStubBinder() { 1085 bool needsStubHelper = config->outputType == MH_DYLIB || 1086 config->outputType == MH_EXECUTE || 1087 config->outputType == MH_BUNDLE; 1088 if (!needsStubHelper || !symtab->find("dyld_stub_binder")) 1089 return; 1090 1091 // dyld_stub_binder is used by dyld to resolve lazy bindings. This code here 1092 // adds a opportunistic reference to dyld_stub_binder if it happens to exist. 1093 // dyld_stub_binder is in libSystem.dylib, which is usually linked in. This 1094 // isn't needed for correctness, but the presence of that symbol suppresses 1095 // "no symbols" diagnostics from `nm`. 1096 // StubHelperSection::setup() adds a reference and errors out if 1097 // dyld_stub_binder doesn't exist in case it is actually needed. 1098 symtab->addUndefined("dyld_stub_binder", /*file=*/nullptr, /*isWeak=*/false); 1099 } 1100 1101 bool macho::link(ArrayRef<const char *> argsArr, llvm::raw_ostream &stdoutOS, 1102 llvm::raw_ostream &stderrOS, bool exitEarly, 1103 bool disableOutput) { 1104 // This driver-specific context will be freed later by lldMain(). 1105 auto *ctx = new CommonLinkerContext; 1106 1107 ctx->e.initialize(stdoutOS, stderrOS, exitEarly, disableOutput); 1108 ctx->e.cleanupCallback = []() { 1109 resolvedFrameworks.clear(); 1110 resolvedLibraries.clear(); 1111 cachedReads.clear(); 1112 concatOutputSections.clear(); 1113 inputFiles.clear(); 1114 inputSections.clear(); 1115 loadedArchives.clear(); 1116 loadedObjectFrameworks.clear(); 1117 syntheticSections.clear(); 1118 thunkMap.clear(); 1119 1120 firstTLVDataSection = nullptr; 1121 tar = nullptr; 1122 memset(&in, 0, sizeof(in)); 1123 1124 resetLoadedDylibs(); 1125 resetOutputSegments(); 1126 resetWriter(); 1127 InputFile::resetIdCount(); 1128 }; 1129 1130 ctx->e.logName = args::getFilenameWithoutExe(argsArr[0]); 1131 1132 MachOOptTable parser; 1133 InputArgList args = parser.parse(argsArr.slice(1)); 1134 1135 ctx->e.errorLimitExceededMsg = "too many errors emitted, stopping now " 1136 "(use --error-limit=0 to see all errors)"; 1137 ctx->e.errorLimit = args::getInteger(args, OPT_error_limit_eq, 20); 1138 ctx->e.verbose = args.hasArg(OPT_verbose); 1139 1140 if (args.hasArg(OPT_help_hidden)) { 1141 parser.printHelp(argsArr[0], /*showHidden=*/true); 1142 return true; 1143 } 1144 if (args.hasArg(OPT_help)) { 1145 parser.printHelp(argsArr[0], /*showHidden=*/false); 1146 return true; 1147 } 1148 if (args.hasArg(OPT_version)) { 1149 message(getLLDVersion()); 1150 return true; 1151 } 1152 1153 config = std::make_unique<Configuration>(); 1154 symtab = std::make_unique<SymbolTable>(); 1155 config->outputType = getOutputType(args); 1156 target = createTargetInfo(args); 1157 depTracker = std::make_unique<DependencyTracker>( 1158 args.getLastArgValue(OPT_dependency_info)); 1159 if (errorCount()) 1160 return false; 1161 1162 if (args.hasArg(OPT_pagezero_size)) { 1163 uint64_t pagezeroSize = args::getHex(args, OPT_pagezero_size, 0); 1164 1165 // ld64 does something really weird. It attempts to realign the value to the 1166 // page size, but assumes the the page size is 4K. This doesn't work with 1167 // most of Apple's ARM64 devices, which use a page size of 16K. This means 1168 // that it will first 4K align it by rounding down, then round up to 16K. 1169 // This probably only happened because no one using this arg with anything 1170 // other then 0, so no one checked if it did what is what it says it does. 1171 1172 // So we are not copying this weird behavior and doing the it in a logical 1173 // way, by always rounding down to page size. 1174 if (!isAligned(Align(target->getPageSize()), pagezeroSize)) { 1175 pagezeroSize -= pagezeroSize % target->getPageSize(); 1176 warn("__PAGEZERO size is not page aligned, rounding down to 0x" + 1177 Twine::utohexstr(pagezeroSize)); 1178 } 1179 1180 target->pageZeroSize = pagezeroSize; 1181 } 1182 1183 config->osoPrefix = args.getLastArgValue(OPT_oso_prefix); 1184 if (!config->osoPrefix.empty()) { 1185 // Expand special characters, such as ".", "..", or "~", if present. 1186 // Note: LD64 only expands "." and not other special characters. 1187 // That seems silly to imitate so we will not try to follow it, but rather 1188 // just use real_path() to do it. 1189 1190 // The max path length is 4096, in theory. However that seems quite long 1191 // and seems unlikely that any one would want to strip everything from the 1192 // path. Hence we've picked a reasonably large number here. 1193 SmallString<1024> expanded; 1194 if (!fs::real_path(config->osoPrefix, expanded, 1195 /*expand_tilde=*/true)) { 1196 // Note: LD64 expands "." to be `<current_dir>/` 1197 // (ie., it has a slash suffix) whereas real_path() doesn't. 1198 // So we have to append '/' to be consistent. 1199 StringRef sep = sys::path::get_separator(); 1200 // real_path removes trailing slashes as part of the normalization, but 1201 // these are meaningful for our text based stripping 1202 if (config->osoPrefix.equals(".") || config->osoPrefix.endswith(sep)) 1203 expanded += sep; 1204 config->osoPrefix = saver().save(expanded.str()); 1205 } 1206 } 1207 1208 // Must be set before any InputSections and Symbols are created. 1209 config->deadStrip = args.hasArg(OPT_dead_strip); 1210 1211 config->systemLibraryRoots = getSystemLibraryRoots(args); 1212 if (const char *path = getReproduceOption(args)) { 1213 // Note that --reproduce is a debug option so you can ignore it 1214 // if you are trying to understand the whole picture of the code. 1215 Expected<std::unique_ptr<TarWriter>> errOrWriter = 1216 TarWriter::create(path, path::stem(path)); 1217 if (errOrWriter) { 1218 tar = std::move(*errOrWriter); 1219 tar->append("response.txt", createResponseFile(args)); 1220 tar->append("version.txt", getLLDVersion() + "\n"); 1221 } else { 1222 error("--reproduce: " + toString(errOrWriter.takeError())); 1223 } 1224 } 1225 1226 if (auto *arg = args.getLastArg(OPT_threads_eq)) { 1227 StringRef v(arg->getValue()); 1228 unsigned threads = 0; 1229 if (!llvm::to_integer(v, threads, 0) || threads == 0) 1230 error(arg->getSpelling() + ": expected a positive integer, but got '" + 1231 arg->getValue() + "'"); 1232 parallel::strategy = hardware_concurrency(threads); 1233 config->thinLTOJobs = v; 1234 } 1235 if (auto *arg = args.getLastArg(OPT_thinlto_jobs_eq)) 1236 config->thinLTOJobs = arg->getValue(); 1237 if (!get_threadpool_strategy(config->thinLTOJobs)) 1238 error("--thinlto-jobs: invalid job count: " + config->thinLTOJobs); 1239 1240 for (const Arg *arg : args.filtered(OPT_u)) { 1241 config->explicitUndefineds.push_back(symtab->addUndefined( 1242 arg->getValue(), /*file=*/nullptr, /*isWeakRef=*/false)); 1243 } 1244 1245 for (const Arg *arg : args.filtered(OPT_U)) 1246 config->explicitDynamicLookups.insert(arg->getValue()); 1247 1248 config->mapFile = args.getLastArgValue(OPT_map); 1249 config->optimize = args::getInteger(args, OPT_O, 1); 1250 config->outputFile = args.getLastArgValue(OPT_o, "a.out"); 1251 config->finalOutput = 1252 args.getLastArgValue(OPT_final_output, config->outputFile); 1253 config->astPaths = args.getAllArgValues(OPT_add_ast_path); 1254 config->headerPad = args::getHex(args, OPT_headerpad, /*Default=*/32); 1255 config->headerPadMaxInstallNames = 1256 args.hasArg(OPT_headerpad_max_install_names); 1257 config->printDylibSearch = 1258 args.hasArg(OPT_print_dylib_search) || getenv("RC_TRACE_DYLIB_SEARCHING"); 1259 config->printEachFile = args.hasArg(OPT_t); 1260 config->printWhyLoad = args.hasArg(OPT_why_load); 1261 config->omitDebugInfo = args.hasArg(OPT_S); 1262 config->errorForArchMismatch = args.hasArg(OPT_arch_errors_fatal); 1263 if (const Arg *arg = args.getLastArg(OPT_bundle_loader)) { 1264 if (config->outputType != MH_BUNDLE) 1265 error("-bundle_loader can only be used with MachO bundle output"); 1266 addFile(arg->getValue(), ForceLoad::Default, /*isLazy=*/false, 1267 /*isExplicit=*/false, 1268 /*isBundleLoader=*/true); 1269 } 1270 if (const Arg *arg = args.getLastArg(OPT_umbrella)) { 1271 if (config->outputType != MH_DYLIB) 1272 warn("-umbrella used, but not creating dylib"); 1273 config->umbrella = arg->getValue(); 1274 } 1275 config->ltoObjPath = args.getLastArgValue(OPT_object_path_lto); 1276 config->ltoo = args::getInteger(args, OPT_lto_O, 2); 1277 if (config->ltoo > 3) 1278 error("--lto-O: invalid optimization level: " + Twine(config->ltoo)); 1279 config->thinLTOCacheDir = args.getLastArgValue(OPT_cache_path_lto); 1280 config->thinLTOCachePolicy = getLTOCachePolicy(args); 1281 config->runtimePaths = args::getStrings(args, OPT_rpath); 1282 config->allLoad = args.hasFlag(OPT_all_load, OPT_noall_load, false); 1283 config->archMultiple = args.hasArg(OPT_arch_multiple); 1284 config->applicationExtension = args.hasFlag( 1285 OPT_application_extension, OPT_no_application_extension, false); 1286 config->exportDynamic = args.hasArg(OPT_export_dynamic); 1287 config->forceLoadObjC = args.hasArg(OPT_ObjC); 1288 config->forceLoadSwift = args.hasArg(OPT_force_load_swift_libs); 1289 config->deadStripDylibs = args.hasArg(OPT_dead_strip_dylibs); 1290 config->demangle = args.hasArg(OPT_demangle); 1291 config->implicitDylibs = !args.hasArg(OPT_no_implicit_dylibs); 1292 config->emitFunctionStarts = 1293 args.hasFlag(OPT_function_starts, OPT_no_function_starts, true); 1294 config->emitBitcodeBundle = args.hasArg(OPT_bitcode_bundle); 1295 config->emitDataInCodeInfo = 1296 args.hasFlag(OPT_data_in_code_info, OPT_no_data_in_code_info, true); 1297 config->icfLevel = getICFLevel(args); 1298 config->dedupLiterals = 1299 args.hasFlag(OPT_deduplicate_literals, OPT_icf_eq, false) || 1300 config->icfLevel != ICFLevel::none; 1301 config->warnDylibInstallName = args.hasFlag( 1302 OPT_warn_dylib_install_name, OPT_no_warn_dylib_install_name, false); 1303 config->callGraphProfileSort = args.hasFlag( 1304 OPT_call_graph_profile_sort, OPT_no_call_graph_profile_sort, true); 1305 config->printSymbolOrder = args.getLastArgValue(OPT_print_symbol_order); 1306 config->parseEhFrames = static_cast<bool>(getenv("LLD_IN_TEST")); 1307 1308 // FIXME: Add a commandline flag for this too. 1309 config->zeroModTime = getenv("ZERO_AR_DATE"); 1310 1311 std::array<PlatformType, 3> encryptablePlatforms{ 1312 PLATFORM_IOS, PLATFORM_WATCHOS, PLATFORM_TVOS}; 1313 config->emitEncryptionInfo = 1314 args.hasFlag(OPT_encryptable, OPT_no_encryption, 1315 is_contained(encryptablePlatforms, config->platform())); 1316 1317 #ifndef LLVM_HAVE_LIBXAR 1318 if (config->emitBitcodeBundle) 1319 error("-bitcode_bundle unsupported because LLD wasn't built with libxar"); 1320 #endif 1321 1322 if (const Arg *arg = args.getLastArg(OPT_install_name)) { 1323 if (config->warnDylibInstallName && config->outputType != MH_DYLIB) 1324 warn( 1325 arg->getAsString(args) + 1326 ": ignored, only has effect with -dylib [--warn-dylib-install-name]"); 1327 else 1328 config->installName = arg->getValue(); 1329 } else if (config->outputType == MH_DYLIB) { 1330 config->installName = config->finalOutput; 1331 } 1332 1333 if (args.hasArg(OPT_mark_dead_strippable_dylib)) { 1334 if (config->outputType != MH_DYLIB) 1335 warn("-mark_dead_strippable_dylib: ignored, only has effect with -dylib"); 1336 else 1337 config->markDeadStrippableDylib = true; 1338 } 1339 1340 if (const Arg *arg = args.getLastArg(OPT_static, OPT_dynamic)) 1341 config->staticLink = (arg->getOption().getID() == OPT_static); 1342 1343 if (const Arg *arg = 1344 args.getLastArg(OPT_flat_namespace, OPT_twolevel_namespace)) 1345 config->namespaceKind = arg->getOption().getID() == OPT_twolevel_namespace 1346 ? NamespaceKind::twolevel 1347 : NamespaceKind::flat; 1348 1349 config->undefinedSymbolTreatment = getUndefinedSymbolTreatment(args); 1350 1351 if (config->outputType == MH_EXECUTE) 1352 config->entry = symtab->addUndefined(args.getLastArgValue(OPT_e, "_main"), 1353 /*file=*/nullptr, 1354 /*isWeakRef=*/false); 1355 1356 config->librarySearchPaths = 1357 getLibrarySearchPaths(args, config->systemLibraryRoots); 1358 config->frameworkSearchPaths = 1359 getFrameworkSearchPaths(args, config->systemLibraryRoots); 1360 if (const Arg *arg = 1361 args.getLastArg(OPT_search_paths_first, OPT_search_dylibs_first)) 1362 config->searchDylibsFirst = 1363 arg->getOption().getID() == OPT_search_dylibs_first; 1364 1365 config->dylibCompatibilityVersion = 1366 parseDylibVersion(args, OPT_compatibility_version); 1367 config->dylibCurrentVersion = parseDylibVersion(args, OPT_current_version); 1368 1369 config->dataConst = 1370 args.hasFlag(OPT_data_const, OPT_no_data_const, dataConstDefault(args)); 1371 // Populate config->sectionRenameMap with builtin default renames. 1372 // Options -rename_section and -rename_segment are able to override. 1373 initializeSectionRenameMap(); 1374 // Reject every special character except '.' and '$' 1375 // TODO(gkm): verify that this is the proper set of invalid chars 1376 StringRef invalidNameChars("!\"#%&'()*+,-/:;<=>?@[\\]^`{|}~"); 1377 auto validName = [invalidNameChars](StringRef s) { 1378 if (s.find_first_of(invalidNameChars) != StringRef::npos) 1379 error("invalid name for segment or section: " + s); 1380 return s; 1381 }; 1382 for (const Arg *arg : args.filtered(OPT_rename_section)) { 1383 config->sectionRenameMap[{validName(arg->getValue(0)), 1384 validName(arg->getValue(1))}] = { 1385 validName(arg->getValue(2)), validName(arg->getValue(3))}; 1386 } 1387 for (const Arg *arg : args.filtered(OPT_rename_segment)) { 1388 config->segmentRenameMap[validName(arg->getValue(0))] = 1389 validName(arg->getValue(1)); 1390 } 1391 1392 config->sectionAlignments = parseSectAlign(args); 1393 1394 for (const Arg *arg : args.filtered(OPT_segprot)) { 1395 StringRef segName = arg->getValue(0); 1396 uint32_t maxProt = parseProtection(arg->getValue(1)); 1397 uint32_t initProt = parseProtection(arg->getValue(2)); 1398 if (maxProt != initProt && config->arch() != AK_i386) 1399 error("invalid argument '" + arg->getAsString(args) + 1400 "': max and init must be the same for non-i386 archs"); 1401 if (segName == segment_names::linkEdit) 1402 error("-segprot cannot be used to change __LINKEDIT's protections"); 1403 config->segmentProtections.push_back({segName, maxProt, initProt}); 1404 } 1405 1406 handleSymbolPatterns(args, config->exportedSymbols, OPT_exported_symbol, 1407 OPT_exported_symbols_list); 1408 handleSymbolPatterns(args, config->unexportedSymbols, OPT_unexported_symbol, 1409 OPT_unexported_symbols_list); 1410 if (!config->exportedSymbols.empty() && !config->unexportedSymbols.empty()) { 1411 error("cannot use both -exported_symbol* and -unexported_symbol* options\n" 1412 ">>> ignoring unexports"); 1413 config->unexportedSymbols.clear(); 1414 } 1415 1416 // Imitating LD64's: 1417 // -non_global_symbols_no_strip_list and -non_global_symbols_strip_list can't 1418 // both be present. 1419 // But -x can be used with either of these two, in which case, the last arg 1420 // takes effect. 1421 // (TODO: This is kind of confusing - considering disallowing using them 1422 // together for a more straightforward behaviour) 1423 { 1424 bool includeLocal = false; 1425 bool excludeLocal = false; 1426 for (const Arg *arg : 1427 args.filtered(OPT_x, OPT_non_global_symbols_no_strip_list, 1428 OPT_non_global_symbols_strip_list)) { 1429 switch (arg->getOption().getID()) { 1430 case OPT_x: 1431 config->localSymbolsPresence = SymtabPresence::None; 1432 break; 1433 case OPT_non_global_symbols_no_strip_list: 1434 if (excludeLocal) { 1435 error("cannot use both -non_global_symbols_no_strip_list and " 1436 "-non_global_symbols_strip_list"); 1437 } else { 1438 includeLocal = true; 1439 config->localSymbolsPresence = SymtabPresence::SelectivelyIncluded; 1440 parseSymbolPatternsFile(arg, config->localSymbolPatterns); 1441 } 1442 break; 1443 case OPT_non_global_symbols_strip_list: 1444 if (includeLocal) { 1445 error("cannot use both -non_global_symbols_no_strip_list and " 1446 "-non_global_symbols_strip_list"); 1447 } else { 1448 excludeLocal = true; 1449 config->localSymbolsPresence = SymtabPresence::SelectivelyExcluded; 1450 parseSymbolPatternsFile(arg, config->localSymbolPatterns); 1451 } 1452 break; 1453 default: 1454 llvm_unreachable("unexpected option"); 1455 } 1456 } 1457 } 1458 // Explicitly-exported literal symbols must be defined, but might 1459 // languish in an archive if unreferenced elsewhere or if they are in the 1460 // non-global strip list. Light a fire under those lazy symbols! 1461 for (const CachedHashStringRef &cachedName : config->exportedSymbols.literals) 1462 symtab->addUndefined(cachedName.val(), /*file=*/nullptr, 1463 /*isWeakRef=*/false); 1464 1465 for (const Arg *arg : args.filtered(OPT_why_live)) 1466 config->whyLive.insert(arg->getValue()); 1467 if (!config->whyLive.empty() && !config->deadStrip) 1468 warn("-why_live has no effect without -dead_strip, ignoring"); 1469 1470 config->saveTemps = args.hasArg(OPT_save_temps); 1471 1472 config->adhocCodesign = args.hasFlag( 1473 OPT_adhoc_codesign, OPT_no_adhoc_codesign, 1474 (config->arch() == AK_arm64 || config->arch() == AK_arm64e) && 1475 config->platform() == PLATFORM_MACOS); 1476 1477 if (args.hasArg(OPT_v)) { 1478 message(getLLDVersion(), lld::errs()); 1479 message(StringRef("Library search paths:") + 1480 (config->librarySearchPaths.empty() 1481 ? "" 1482 : "\n\t" + join(config->librarySearchPaths, "\n\t")), 1483 lld::errs()); 1484 message(StringRef("Framework search paths:") + 1485 (config->frameworkSearchPaths.empty() 1486 ? "" 1487 : "\n\t" + join(config->frameworkSearchPaths, "\n\t")), 1488 lld::errs()); 1489 } 1490 1491 config->progName = argsArr[0]; 1492 1493 config->timeTraceEnabled = args.hasArg( 1494 OPT_time_trace, OPT_time_trace_granularity_eq, OPT_time_trace_file_eq); 1495 config->timeTraceGranularity = 1496 args::getInteger(args, OPT_time_trace_granularity_eq, 500); 1497 1498 // Initialize time trace profiler. 1499 if (config->timeTraceEnabled) 1500 timeTraceProfilerInitialize(config->timeTraceGranularity, config->progName); 1501 1502 { 1503 TimeTraceScope timeScope("ExecuteLinker"); 1504 1505 initLLVM(); // must be run before any call to addFile() 1506 createFiles(args); 1507 1508 config->isPic = config->outputType == MH_DYLIB || 1509 config->outputType == MH_BUNDLE || 1510 (config->outputType == MH_EXECUTE && 1511 args.hasFlag(OPT_pie, OPT_no_pie, true)); 1512 1513 // Now that all dylibs have been loaded, search for those that should be 1514 // re-exported. 1515 { 1516 auto reexportHandler = [](const Arg *arg, 1517 const std::vector<StringRef> &extensions) { 1518 config->hasReexports = true; 1519 StringRef searchName = arg->getValue(); 1520 if (!markReexport(searchName, extensions)) 1521 error(arg->getSpelling() + " " + searchName + 1522 " does not match a supplied dylib"); 1523 }; 1524 std::vector<StringRef> extensions = {".tbd"}; 1525 for (const Arg *arg : args.filtered(OPT_sub_umbrella)) 1526 reexportHandler(arg, extensions); 1527 1528 extensions.push_back(".dylib"); 1529 for (const Arg *arg : args.filtered(OPT_sub_library)) 1530 reexportHandler(arg, extensions); 1531 } 1532 1533 cl::ResetAllOptionOccurrences(); 1534 1535 // Parse LTO options. 1536 if (const Arg *arg = args.getLastArg(OPT_mcpu)) 1537 parseClangOption(saver().save("-mcpu=" + StringRef(arg->getValue())), 1538 arg->getSpelling()); 1539 1540 for (const Arg *arg : args.filtered(OPT_mllvm)) 1541 parseClangOption(arg->getValue(), arg->getSpelling()); 1542 1543 compileBitcodeFiles(); 1544 replaceCommonSymbols(); 1545 1546 StringRef orderFile = args.getLastArgValue(OPT_order_file); 1547 if (!orderFile.empty()) 1548 priorityBuilder.parseOrderFile(orderFile); 1549 1550 referenceStubBinder(); 1551 1552 // FIXME: should terminate the link early based on errors encountered so 1553 // far? 1554 1555 createSyntheticSections(); 1556 createSyntheticSymbols(); 1557 1558 if (!config->exportedSymbols.empty()) { 1559 parallelForEach(symtab->getSymbols(), [](Symbol *sym) { 1560 if (auto *defined = dyn_cast<Defined>(sym)) { 1561 StringRef symbolName = defined->getName(); 1562 if (config->exportedSymbols.match(symbolName)) { 1563 if (defined->privateExtern) { 1564 if (defined->weakDefCanBeHidden) { 1565 // weak_def_can_be_hidden symbols behave similarly to 1566 // private_extern symbols in most cases, except for when 1567 // it is explicitly exported. 1568 // The former can be exported but the latter cannot. 1569 defined->privateExtern = false; 1570 } else { 1571 warn("cannot export hidden symbol " + toString(*defined) + 1572 "\n>>> defined in " + toString(defined->getFile())); 1573 } 1574 } 1575 } else { 1576 defined->privateExtern = true; 1577 } 1578 } 1579 }); 1580 } else if (!config->unexportedSymbols.empty()) { 1581 parallelForEach(symtab->getSymbols(), [](Symbol *sym) { 1582 if (auto *defined = dyn_cast<Defined>(sym)) 1583 if (config->unexportedSymbols.match(defined->getName())) 1584 defined->privateExtern = true; 1585 }); 1586 } 1587 1588 for (const Arg *arg : args.filtered(OPT_sectcreate)) { 1589 StringRef segName = arg->getValue(0); 1590 StringRef sectName = arg->getValue(1); 1591 StringRef fileName = arg->getValue(2); 1592 Optional<MemoryBufferRef> buffer = readFile(fileName); 1593 if (buffer) 1594 inputFiles.insert(make<OpaqueFile>(*buffer, segName, sectName)); 1595 } 1596 1597 for (const Arg *arg : args.filtered(OPT_add_empty_section)) { 1598 StringRef segName = arg->getValue(0); 1599 StringRef sectName = arg->getValue(1); 1600 inputFiles.insert(make<OpaqueFile>(MemoryBufferRef(), segName, sectName)); 1601 } 1602 1603 gatherInputSections(); 1604 if (config->callGraphProfileSort) 1605 priorityBuilder.extractCallGraphProfile(); 1606 1607 if (config->deadStrip) 1608 markLive(); 1609 1610 // ICF assumes that all literals have been folded already, so we must run 1611 // foldIdenticalLiterals before foldIdenticalSections. 1612 foldIdenticalLiterals(); 1613 if (config->icfLevel != ICFLevel::none) { 1614 if (config->icfLevel == ICFLevel::safe) 1615 markAddrSigSymbols(); 1616 foldIdenticalSections(); 1617 } 1618 1619 // Write to an output file. 1620 if (target->wordSize == 8) 1621 writeResult<LP64>(); 1622 else 1623 writeResult<ILP32>(); 1624 1625 depTracker->write(getLLDVersion(), inputFiles, config->outputFile); 1626 } 1627 1628 if (config->timeTraceEnabled) { 1629 checkError(timeTraceProfilerWrite( 1630 args.getLastArgValue(OPT_time_trace_file_eq).str(), 1631 config->outputFile)); 1632 1633 timeTraceProfilerCleanup(); 1634 } 1635 return errorCount() == 0; 1636 } 1637