1 //===- Driver.cpp ---------------------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8
9 #include "lld/Common/Driver.h"
10 #include "Config.h"
11 #include "InputChunks.h"
12 #include "InputElement.h"
13 #include "MarkLive.h"
14 #include "SymbolTable.h"
15 #include "Writer.h"
16 #include "lld/Common/Args.h"
17 #include "lld/Common/ErrorHandler.h"
18 #include "lld/Common/Filesystem.h"
19 #include "lld/Common/Memory.h"
20 #include "lld/Common/Reproduce.h"
21 #include "lld/Common/Strings.h"
22 #include "lld/Common/Version.h"
23 #include "llvm/ADT/Twine.h"
24 #include "llvm/Config/llvm-config.h"
25 #include "llvm/Object/Wasm.h"
26 #include "llvm/Option/Arg.h"
27 #include "llvm/Option/ArgList.h"
28 #include "llvm/Support/CommandLine.h"
29 #include "llvm/Support/Host.h"
30 #include "llvm/Support/Parallel.h"
31 #include "llvm/Support/Path.h"
32 #include "llvm/Support/Process.h"
33 #include "llvm/Support/TarWriter.h"
34 #include "llvm/Support/TargetSelect.h"
35
36 #define DEBUG_TYPE "lld"
37
38 using namespace llvm;
39 using namespace llvm::object;
40 using namespace llvm::sys;
41 using namespace llvm::wasm;
42
43 namespace lld {
44 namespace wasm {
45 Configuration *config;
46
47 namespace {
48
49 // Create enum with OPT_xxx values for each option in Options.td
50 enum {
51 OPT_INVALID = 0,
52 #define OPTION(_1, _2, ID, _4, _5, _6, _7, _8, _9, _10, _11, _12) OPT_##ID,
53 #include "Options.inc"
54 #undef OPTION
55 };
56
57 // This function is called on startup. We need this for LTO since
58 // LTO calls LLVM functions to compile bitcode files to native code.
59 // Technically this can be delayed until we read bitcode files, but
60 // we don't bother to do lazily because the initialization is fast.
initLLVM()61 static void initLLVM() {
62 InitializeAllTargets();
63 InitializeAllTargetMCs();
64 InitializeAllAsmPrinters();
65 InitializeAllAsmParsers();
66 }
67
68 class LinkerDriver {
69 public:
70 void linkerMain(ArrayRef<const char *> argsArr);
71
72 private:
73 void createFiles(opt::InputArgList &args);
74 void addFile(StringRef path);
75 void addLibrary(StringRef name);
76
77 // True if we are in --whole-archive and --no-whole-archive.
78 bool inWholeArchive = false;
79
80 std::vector<InputFile *> files;
81 };
82 } // anonymous namespace
83
link(ArrayRef<const char * > args,llvm::raw_ostream & stdoutOS,llvm::raw_ostream & stderrOS,bool exitEarly,bool disableOutput)84 bool link(ArrayRef<const char *> args, llvm::raw_ostream &stdoutOS,
85 llvm::raw_ostream &stderrOS, bool exitEarly, bool disableOutput) {
86 // This driver-specific context will be freed later by lldMain().
87 auto *ctx = new CommonLinkerContext;
88
89 ctx->e.initialize(stdoutOS, stderrOS, exitEarly, disableOutput);
90 ctx->e.logName = args::getFilenameWithoutExe(args[0]);
91 ctx->e.errorLimitExceededMsg = "too many errors emitted, stopping now (use "
92 "-error-limit=0 to see all errors)";
93
94 config = make<Configuration>();
95 symtab = make<SymbolTable>();
96
97 initLLVM();
98 LinkerDriver().linkerMain(args);
99
100 return errorCount() == 0;
101 }
102
103 // Create prefix string literals used in Options.td
104 #define PREFIX(NAME, VALUE) const char *const NAME[] = VALUE;
105 #include "Options.inc"
106 #undef PREFIX
107
108 // Create table mapping all options defined in Options.td
109 static const opt::OptTable::Info optInfo[] = {
110 #define OPTION(X1, X2, ID, KIND, GROUP, ALIAS, X7, X8, X9, X10, X11, X12) \
111 {X1, X2, X10, X11, OPT_##ID, opt::Option::KIND##Class, \
112 X9, X8, OPT_##GROUP, OPT_##ALIAS, X7, X12},
113 #include "Options.inc"
114 #undef OPTION
115 };
116
117 namespace {
118 class WasmOptTable : public llvm::opt::OptTable {
119 public:
WasmOptTable()120 WasmOptTable() : OptTable(optInfo) {}
121 opt::InputArgList parse(ArrayRef<const char *> argv);
122 };
123 } // namespace
124
125 // Set color diagnostics according to -color-diagnostics={auto,always,never}
126 // or -no-color-diagnostics flags.
handleColorDiagnostics(opt::InputArgList & args)127 static void handleColorDiagnostics(opt::InputArgList &args) {
128 auto *arg = args.getLastArg(OPT_color_diagnostics, OPT_color_diagnostics_eq,
129 OPT_no_color_diagnostics);
130 if (!arg)
131 return;
132 if (arg->getOption().getID() == OPT_color_diagnostics) {
133 lld::errs().enable_colors(true);
134 } else if (arg->getOption().getID() == OPT_no_color_diagnostics) {
135 lld::errs().enable_colors(false);
136 } else {
137 StringRef s = arg->getValue();
138 if (s == "always")
139 lld::errs().enable_colors(true);
140 else if (s == "never")
141 lld::errs().enable_colors(false);
142 else if (s != "auto")
143 error("unknown option: --color-diagnostics=" + s);
144 }
145 }
146
getQuotingStyle(opt::InputArgList & args)147 static cl::TokenizerCallback getQuotingStyle(opt::InputArgList &args) {
148 if (auto *arg = args.getLastArg(OPT_rsp_quoting)) {
149 StringRef s = arg->getValue();
150 if (s != "windows" && s != "posix")
151 error("invalid response file quoting: " + s);
152 if (s == "windows")
153 return cl::TokenizeWindowsCommandLine;
154 return cl::TokenizeGNUCommandLine;
155 }
156 if (Triple(sys::getProcessTriple()).isOSWindows())
157 return cl::TokenizeWindowsCommandLine;
158 return cl::TokenizeGNUCommandLine;
159 }
160
161 // Find a file by concatenating given paths.
findFile(StringRef path1,const Twine & path2)162 static Optional<std::string> findFile(StringRef path1, const Twine &path2) {
163 SmallString<128> s;
164 path::append(s, path1, path2);
165 if (fs::exists(s))
166 return std::string(s);
167 return None;
168 }
169
parse(ArrayRef<const char * > argv)170 opt::InputArgList WasmOptTable::parse(ArrayRef<const char *> argv) {
171 SmallVector<const char *, 256> vec(argv.data(), argv.data() + argv.size());
172
173 unsigned missingIndex;
174 unsigned missingCount;
175
176 // We need to get the quoting style for response files before parsing all
177 // options so we parse here before and ignore all the options but
178 // --rsp-quoting.
179 opt::InputArgList args = this->ParseArgs(vec, missingIndex, missingCount);
180
181 // Expand response files (arguments in the form of @<filename>)
182 // and then parse the argument again.
183 cl::ExpandResponseFiles(saver(), getQuotingStyle(args), vec);
184 args = this->ParseArgs(vec, missingIndex, missingCount);
185
186 handleColorDiagnostics(args);
187 if (missingCount)
188 error(Twine(args.getArgString(missingIndex)) + ": missing argument");
189
190 for (auto *arg : args.filtered(OPT_UNKNOWN))
191 error("unknown argument: " + arg->getAsString(args));
192 return args;
193 }
194
195 // Currently we allow a ".imports" to live alongside a library. This can
196 // be used to specify a list of symbols which can be undefined at link
197 // time (imported from the environment. For example libc.a include an
198 // import file that lists the syscall functions it relies on at runtime.
199 // In the long run this information would be better stored as a symbol
200 // attribute/flag in the object file itself.
201 // See: https://github.com/WebAssembly/tool-conventions/issues/35
readImportFile(StringRef filename)202 static void readImportFile(StringRef filename) {
203 if (Optional<MemoryBufferRef> buf = readFile(filename))
204 for (StringRef sym : args::getLines(*buf))
205 config->allowUndefinedSymbols.insert(sym);
206 }
207
208 // Returns slices of MB by parsing MB as an archive file.
209 // Each slice consists of a member file in the archive.
getArchiveMembers(MemoryBufferRef mb)210 std::vector<MemoryBufferRef> static getArchiveMembers(MemoryBufferRef mb) {
211 std::unique_ptr<Archive> file =
212 CHECK(Archive::create(mb),
213 mb.getBufferIdentifier() + ": failed to parse archive");
214
215 std::vector<MemoryBufferRef> v;
216 Error err = Error::success();
217 for (const Archive::Child &c : file->children(err)) {
218 MemoryBufferRef mbref =
219 CHECK(c.getMemoryBufferRef(),
220 mb.getBufferIdentifier() +
221 ": could not get the buffer for a child of the archive");
222 v.push_back(mbref);
223 }
224 if (err)
225 fatal(mb.getBufferIdentifier() +
226 ": Archive::children failed: " + toString(std::move(err)));
227
228 // Take ownership of memory buffers created for members of thin archives.
229 for (std::unique_ptr<MemoryBuffer> &mb : file->takeThinBuffers())
230 make<std::unique_ptr<MemoryBuffer>>(std::move(mb));
231
232 return v;
233 }
234
addFile(StringRef path)235 void LinkerDriver::addFile(StringRef path) {
236 Optional<MemoryBufferRef> buffer = readFile(path);
237 if (!buffer)
238 return;
239 MemoryBufferRef mbref = *buffer;
240
241 switch (identify_magic(mbref.getBuffer())) {
242 case file_magic::archive: {
243 SmallString<128> importFile = path;
244 path::replace_extension(importFile, ".imports");
245 if (fs::exists(importFile))
246 readImportFile(importFile.str());
247
248 // Handle -whole-archive.
249 if (inWholeArchive) {
250 for (MemoryBufferRef &m : getArchiveMembers(mbref)) {
251 auto *object = createObjectFile(m, path);
252 // Mark object as live; object members are normally not
253 // live by default but -whole-archive is designed to treat
254 // them as such.
255 object->markLive();
256 files.push_back(object);
257 }
258
259 return;
260 }
261
262 std::unique_ptr<Archive> file =
263 CHECK(Archive::create(mbref), path + ": failed to parse archive");
264
265 if (!file->isEmpty() && !file->hasSymbolTable()) {
266 error(mbref.getBufferIdentifier() +
267 ": archive has no index; run ranlib to add one");
268 }
269
270 files.push_back(make<ArchiveFile>(mbref));
271 return;
272 }
273 case file_magic::bitcode:
274 case file_magic::wasm_object:
275 files.push_back(createObjectFile(mbref));
276 break;
277 default:
278 error("unknown file type: " + mbref.getBufferIdentifier());
279 }
280 }
281
282 // Add a given library by searching it from input search paths.
addLibrary(StringRef name)283 void LinkerDriver::addLibrary(StringRef name) {
284 for (StringRef dir : config->searchPaths) {
285 if (Optional<std::string> s = findFile(dir, "lib" + name + ".a")) {
286 addFile(*s);
287 return;
288 }
289 }
290
291 error("unable to find library -l" + name);
292 }
293
createFiles(opt::InputArgList & args)294 void LinkerDriver::createFiles(opt::InputArgList &args) {
295 for (auto *arg : args) {
296 switch (arg->getOption().getID()) {
297 case OPT_l:
298 addLibrary(arg->getValue());
299 break;
300 case OPT_INPUT:
301 addFile(arg->getValue());
302 break;
303 case OPT_whole_archive:
304 inWholeArchive = true;
305 break;
306 case OPT_no_whole_archive:
307 inWholeArchive = false;
308 break;
309 }
310 }
311 if (files.empty() && errorCount() == 0)
312 error("no input files");
313 }
314
getEntry(opt::InputArgList & args)315 static StringRef getEntry(opt::InputArgList &args) {
316 auto *arg = args.getLastArg(OPT_entry, OPT_no_entry);
317 if (!arg) {
318 if (args.hasArg(OPT_relocatable))
319 return "";
320 if (args.hasArg(OPT_shared))
321 return "__wasm_call_ctors";
322 return "_start";
323 }
324 if (arg->getOption().getID() == OPT_no_entry)
325 return "";
326 return arg->getValue();
327 }
328
329 // Determines what we should do if there are remaining unresolved
330 // symbols after the name resolution.
getUnresolvedSymbolPolicy(opt::InputArgList & args)331 static UnresolvedPolicy getUnresolvedSymbolPolicy(opt::InputArgList &args) {
332 UnresolvedPolicy errorOrWarn = args.hasFlag(OPT_error_unresolved_symbols,
333 OPT_warn_unresolved_symbols, true)
334 ? UnresolvedPolicy::ReportError
335 : UnresolvedPolicy::Warn;
336
337 if (auto *arg = args.getLastArg(OPT_unresolved_symbols)) {
338 StringRef s = arg->getValue();
339 if (s == "ignore-all")
340 return UnresolvedPolicy::Ignore;
341 if (s == "import-dynamic")
342 return UnresolvedPolicy::ImportDynamic;
343 if (s == "report-all")
344 return errorOrWarn;
345 error("unknown --unresolved-symbols value: " + s);
346 }
347
348 return errorOrWarn;
349 }
350
351 // Initializes Config members by the command line options.
readConfigs(opt::InputArgList & args)352 static void readConfigs(opt::InputArgList &args) {
353 config->bsymbolic = args.hasArg(OPT_Bsymbolic);
354 config->checkFeatures =
355 args.hasFlag(OPT_check_features, OPT_no_check_features, true);
356 config->compressRelocations = args.hasArg(OPT_compress_relocations);
357 config->demangle = args.hasFlag(OPT_demangle, OPT_no_demangle, true);
358 config->disableVerify = args.hasArg(OPT_disable_verify);
359 config->emitRelocs = args.hasArg(OPT_emit_relocs);
360 config->experimentalPic = args.hasArg(OPT_experimental_pic);
361 config->entry = getEntry(args);
362 config->exportAll = args.hasArg(OPT_export_all);
363 config->exportTable = args.hasArg(OPT_export_table);
364 config->growableTable = args.hasArg(OPT_growable_table);
365 config->importMemory = args.hasArg(OPT_import_memory);
366 config->sharedMemory = args.hasArg(OPT_shared_memory);
367 config->importTable = args.hasArg(OPT_import_table);
368 config->importUndefined = args.hasArg(OPT_import_undefined);
369 config->ltoo = args::getInteger(args, OPT_lto_O, 2);
370 config->ltoPartitions = args::getInteger(args, OPT_lto_partitions, 1);
371 config->ltoDebugPassManager = args.hasArg(OPT_lto_debug_pass_manager);
372 config->mapFile = args.getLastArgValue(OPT_Map);
373 config->optimize = args::getInteger(args, OPT_O, 1);
374 config->outputFile = args.getLastArgValue(OPT_o);
375 config->relocatable = args.hasArg(OPT_relocatable);
376 config->gcSections =
377 args.hasFlag(OPT_gc_sections, OPT_no_gc_sections, !config->relocatable);
378 config->mergeDataSegments =
379 args.hasFlag(OPT_merge_data_segments, OPT_no_merge_data_segments,
380 !config->relocatable);
381 config->pie = args.hasFlag(OPT_pie, OPT_no_pie, false);
382 config->printGcSections =
383 args.hasFlag(OPT_print_gc_sections, OPT_no_print_gc_sections, false);
384 config->saveTemps = args.hasArg(OPT_save_temps);
385 config->searchPaths = args::getStrings(args, OPT_L);
386 config->shared = args.hasArg(OPT_shared);
387 config->stripAll = args.hasArg(OPT_strip_all);
388 config->stripDebug = args.hasArg(OPT_strip_debug);
389 config->stackFirst = args.hasArg(OPT_stack_first);
390 config->trace = args.hasArg(OPT_trace);
391 config->thinLTOCacheDir = args.getLastArgValue(OPT_thinlto_cache_dir);
392 config->thinLTOCachePolicy = CHECK(
393 parseCachePruningPolicy(args.getLastArgValue(OPT_thinlto_cache_policy)),
394 "--thinlto-cache-policy: invalid cache policy");
395 config->unresolvedSymbols = getUnresolvedSymbolPolicy(args);
396 errorHandler().verbose = args.hasArg(OPT_verbose);
397 LLVM_DEBUG(errorHandler().verbose = true);
398
399 config->initialMemory = args::getInteger(args, OPT_initial_memory, 0);
400 config->globalBase = args::getInteger(args, OPT_global_base, 1024);
401 config->maxMemory = args::getInteger(args, OPT_max_memory, 0);
402 config->zStackSize =
403 args::getZOptionValue(args, OPT_z, "stack-size", WasmPageSize);
404
405 // Default value of exportDynamic depends on `-shared`
406 config->exportDynamic =
407 args.hasFlag(OPT_export_dynamic, OPT_no_export_dynamic, config->shared);
408
409 // Parse wasm32/64.
410 if (auto *arg = args.getLastArg(OPT_m)) {
411 StringRef s = arg->getValue();
412 if (s == "wasm32")
413 config->is64 = false;
414 else if (s == "wasm64")
415 config->is64 = true;
416 else
417 error("invalid target architecture: " + s);
418 }
419
420 // --threads= takes a positive integer and provides the default value for
421 // --thinlto-jobs=.
422 if (auto *arg = args.getLastArg(OPT_threads)) {
423 StringRef v(arg->getValue());
424 unsigned threads = 0;
425 if (!llvm::to_integer(v, threads, 0) || threads == 0)
426 error(arg->getSpelling() + ": expected a positive integer, but got '" +
427 arg->getValue() + "'");
428 parallel::strategy = hardware_concurrency(threads);
429 config->thinLTOJobs = v;
430 }
431 if (auto *arg = args.getLastArg(OPT_thinlto_jobs))
432 config->thinLTOJobs = arg->getValue();
433
434 if (auto *arg = args.getLastArg(OPT_features)) {
435 config->features =
436 llvm::Optional<std::vector<std::string>>(std::vector<std::string>());
437 for (StringRef s : arg->getValues())
438 config->features->push_back(std::string(s));
439 }
440
441 // Legacy --allow-undefined flag which is equivalent to
442 // --unresolve-symbols=ignore + --import-undefined
443 if (args.hasArg(OPT_allow_undefined)) {
444 config->importUndefined = true;
445 config->unresolvedSymbols = UnresolvedPolicy::Ignore;
446 }
447
448 if (args.hasArg(OPT_print_map))
449 config->mapFile = "-";
450 }
451
452 // Some Config members do not directly correspond to any particular
453 // command line options, but computed based on other Config values.
454 // This function initialize such members. See Config.h for the details
455 // of these values.
setConfigs()456 static void setConfigs() {
457 config->isPic = config->pie || config->shared;
458
459 if (config->isPic) {
460 if (config->exportTable)
461 error("-shared/-pie is incompatible with --export-table");
462 config->importTable = true;
463 }
464
465 if (config->relocatable) {
466 if (config->exportTable)
467 error("--relocatable is incompatible with --export-table");
468 if (config->growableTable)
469 error("--relocatable is incompatible with --growable-table");
470 // Ignore any --import-table, as it's redundant.
471 config->importTable = true;
472 }
473
474 if (config->shared) {
475 config->importMemory = true;
476 config->importUndefined = true;
477 }
478 }
479
480 // Some command line options or some combinations of them are not allowed.
481 // This function checks for such errors.
checkOptions(opt::InputArgList & args)482 static void checkOptions(opt::InputArgList &args) {
483 if (!config->stripDebug && !config->stripAll && config->compressRelocations)
484 error("--compress-relocations is incompatible with output debug"
485 " information. Please pass --strip-debug or --strip-all");
486
487 if (config->ltoo > 3)
488 error("invalid optimization level for LTO: " + Twine(config->ltoo));
489 if (config->ltoPartitions == 0)
490 error("--lto-partitions: number of threads must be > 0");
491 if (!get_threadpool_strategy(config->thinLTOJobs))
492 error("--thinlto-jobs: invalid job count: " + config->thinLTOJobs);
493
494 if (config->pie && config->shared)
495 error("-shared and -pie may not be used together");
496
497 if (config->outputFile.empty())
498 error("no output file specified");
499
500 if (config->importTable && config->exportTable)
501 error("--import-table and --export-table may not be used together");
502
503 if (config->relocatable) {
504 if (!config->entry.empty())
505 error("entry point specified for relocatable output file");
506 if (config->gcSections)
507 error("-r and --gc-sections may not be used together");
508 if (config->compressRelocations)
509 error("-r -and --compress-relocations may not be used together");
510 if (args.hasArg(OPT_undefined))
511 error("-r -and --undefined may not be used together");
512 if (config->pie)
513 error("-r and -pie may not be used together");
514 if (config->sharedMemory)
515 error("-r and --shared-memory may not be used together");
516 }
517
518 // To begin to prepare for Module Linking-style shared libraries, start
519 // warning about uses of `-shared` and related flags outside of Experimental
520 // mode, to give anyone using them a heads-up that they will be changing.
521 //
522 // Also, warn about flags which request explicit exports.
523 if (!config->experimentalPic) {
524 // -shared will change meaning when Module Linking is implemented.
525 if (config->shared) {
526 warn("creating shared libraries, with -shared, is not yet stable");
527 }
528
529 // -pie will change meaning when Module Linking is implemented.
530 if (config->pie) {
531 warn("creating PIEs, with -pie, is not yet stable");
532 }
533
534 if (config->unresolvedSymbols == UnresolvedPolicy::ImportDynamic) {
535 warn("dynamic imports are not yet stable "
536 "(--unresolved-symbols=import-dynamic)");
537 }
538 }
539
540 if (config->bsymbolic && !config->shared) {
541 warn("-Bsymbolic is only meaningful when combined with -shared");
542 }
543 }
544
545 // Force Sym to be entered in the output. Used for -u or equivalent.
handleUndefined(StringRef name)546 static Symbol *handleUndefined(StringRef name) {
547 Symbol *sym = symtab->find(name);
548 if (!sym)
549 return nullptr;
550
551 // Since symbol S may not be used inside the program, LTO may
552 // eliminate it. Mark the symbol as "used" to prevent it.
553 sym->isUsedInRegularObj = true;
554
555 if (auto *lazySym = dyn_cast<LazySymbol>(sym))
556 lazySym->fetch();
557
558 return sym;
559 }
560
handleLibcall(StringRef name)561 static void handleLibcall(StringRef name) {
562 Symbol *sym = symtab->find(name);
563 if (!sym)
564 return;
565
566 if (auto *lazySym = dyn_cast<LazySymbol>(sym)) {
567 MemoryBufferRef mb = lazySym->getMemberBuffer();
568 if (isBitcode(mb))
569 lazySym->fetch();
570 }
571 }
572
573 static UndefinedGlobal *
createUndefinedGlobal(StringRef name,llvm::wasm::WasmGlobalType * type)574 createUndefinedGlobal(StringRef name, llvm::wasm::WasmGlobalType *type) {
575 auto *sym = cast<UndefinedGlobal>(symtab->addUndefinedGlobal(
576 name, None, None, WASM_SYMBOL_UNDEFINED, nullptr, type));
577 config->allowUndefinedSymbols.insert(sym->getName());
578 sym->isUsedInRegularObj = true;
579 return sym;
580 }
581
createGlobal(StringRef name,bool isMutable)582 static InputGlobal *createGlobal(StringRef name, bool isMutable) {
583 llvm::wasm::WasmGlobal wasmGlobal;
584 bool is64 = config->is64.value_or(false);
585 wasmGlobal.Type = {uint8_t(is64 ? WASM_TYPE_I64 : WASM_TYPE_I32), isMutable};
586 wasmGlobal.InitExpr = intConst(0, is64);
587 wasmGlobal.SymbolName = name;
588 return make<InputGlobal>(wasmGlobal, nullptr);
589 }
590
createGlobalVariable(StringRef name,bool isMutable)591 static GlobalSymbol *createGlobalVariable(StringRef name, bool isMutable) {
592 InputGlobal *g = createGlobal(name, isMutable);
593 return symtab->addSyntheticGlobal(name, WASM_SYMBOL_VISIBILITY_HIDDEN, g);
594 }
595
createOptionalGlobal(StringRef name,bool isMutable)596 static GlobalSymbol *createOptionalGlobal(StringRef name, bool isMutable) {
597 InputGlobal *g = createGlobal(name, isMutable);
598 return symtab->addOptionalGlobalSymbol(name, g);
599 }
600
601 // Create ABI-defined synthetic symbols
createSyntheticSymbols()602 static void createSyntheticSymbols() {
603 if (config->relocatable)
604 return;
605
606 static WasmSignature nullSignature = {{}, {}};
607 static WasmSignature i32ArgSignature = {{}, {ValType::I32}};
608 static WasmSignature i64ArgSignature = {{}, {ValType::I64}};
609 static llvm::wasm::WasmGlobalType globalTypeI32 = {WASM_TYPE_I32, false};
610 static llvm::wasm::WasmGlobalType globalTypeI64 = {WASM_TYPE_I64, false};
611 static llvm::wasm::WasmGlobalType mutableGlobalTypeI32 = {WASM_TYPE_I32,
612 true};
613 static llvm::wasm::WasmGlobalType mutableGlobalTypeI64 = {WASM_TYPE_I64,
614 true};
615 WasmSym::callCtors = symtab->addSyntheticFunction(
616 "__wasm_call_ctors", WASM_SYMBOL_VISIBILITY_HIDDEN,
617 make<SyntheticFunction>(nullSignature, "__wasm_call_ctors"));
618
619 bool is64 = config->is64.value_or(false);
620
621 if (config->isPic) {
622 WasmSym::stackPointer =
623 createUndefinedGlobal("__stack_pointer", config->is64.value_or(false)
624 ? &mutableGlobalTypeI64
625 : &mutableGlobalTypeI32);
626 // For PIC code, we import two global variables (__memory_base and
627 // __table_base) from the environment and use these as the offset at
628 // which to load our static data and function table.
629 // See:
630 // https://github.com/WebAssembly/tool-conventions/blob/main/DynamicLinking.md
631 auto *globalType = is64 ? &globalTypeI64 : &globalTypeI32;
632 WasmSym::memoryBase = createUndefinedGlobal("__memory_base", globalType);
633 WasmSym::tableBase = createUndefinedGlobal("__table_base", globalType);
634 WasmSym::memoryBase->markLive();
635 WasmSym::tableBase->markLive();
636 if (is64) {
637 WasmSym::tableBase32 =
638 createUndefinedGlobal("__table_base32", &globalTypeI32);
639 WasmSym::tableBase32->markLive();
640 } else {
641 WasmSym::tableBase32 = nullptr;
642 }
643 } else {
644 // For non-PIC code
645 WasmSym::stackPointer = createGlobalVariable("__stack_pointer", true);
646 WasmSym::stackPointer->markLive();
647 }
648
649 if (config->sharedMemory) {
650 WasmSym::tlsBase = createGlobalVariable("__tls_base", true);
651 WasmSym::tlsSize = createGlobalVariable("__tls_size", false);
652 WasmSym::tlsAlign = createGlobalVariable("__tls_align", false);
653 WasmSym::initTLS = symtab->addSyntheticFunction(
654 "__wasm_init_tls", WASM_SYMBOL_VISIBILITY_HIDDEN,
655 make<SyntheticFunction>(
656 is64 ? i64ArgSignature : i32ArgSignature,
657 "__wasm_init_tls"));
658 }
659
660 if (config->isPic ||
661 config->unresolvedSymbols == UnresolvedPolicy::ImportDynamic) {
662 // For PIC code, or when dynamically importing addresses, we create
663 // synthetic functions that apply relocations. These get called from
664 // __wasm_call_ctors before the user-level constructors.
665 WasmSym::applyDataRelocs = symtab->addSyntheticFunction(
666 "__wasm_apply_data_relocs",
667 WASM_SYMBOL_VISIBILITY_DEFAULT | WASM_SYMBOL_EXPORTED,
668 make<SyntheticFunction>(nullSignature, "__wasm_apply_data_relocs"));
669 }
670 }
671
createOptionalSymbols()672 static void createOptionalSymbols() {
673 if (config->relocatable)
674 return;
675
676 WasmSym::dsoHandle = symtab->addOptionalDataSymbol("__dso_handle");
677
678 if (!config->shared)
679 WasmSym::dataEnd = symtab->addOptionalDataSymbol("__data_end");
680
681 if (!config->isPic) {
682 WasmSym::globalBase = symtab->addOptionalDataSymbol("__global_base");
683 WasmSym::heapBase = symtab->addOptionalDataSymbol("__heap_base");
684 WasmSym::heapEnd = symtab->addOptionalDataSymbol("__heap_end");
685 WasmSym::definedMemoryBase = symtab->addOptionalDataSymbol("__memory_base");
686 WasmSym::definedTableBase = symtab->addOptionalDataSymbol("__table_base");
687 if (config->is64.value_or(false))
688 WasmSym::definedTableBase32 =
689 symtab->addOptionalDataSymbol("__table_base32");
690 }
691
692 // For non-shared memory programs we still need to define __tls_base since we
693 // allow object files built with TLS to be linked into single threaded
694 // programs, and such object files can contain references to this symbol.
695 //
696 // However, in this case __tls_base is immutable and points directly to the
697 // start of the `.tdata` static segment.
698 //
699 // __tls_size and __tls_align are not needed in this case since they are only
700 // needed for __wasm_init_tls (which we do not create in this case).
701 if (!config->sharedMemory)
702 WasmSym::tlsBase = createOptionalGlobal("__tls_base", false);
703 }
704
705 // Reconstructs command line arguments so that so that you can re-run
706 // the same command with the same inputs. This is for --reproduce.
createResponseFile(const opt::InputArgList & args)707 static std::string createResponseFile(const opt::InputArgList &args) {
708 SmallString<0> data;
709 raw_svector_ostream os(data);
710
711 // Copy the command line to the output while rewriting paths.
712 for (auto *arg : args) {
713 switch (arg->getOption().getID()) {
714 case OPT_reproduce:
715 break;
716 case OPT_INPUT:
717 os << quote(relativeToRoot(arg->getValue())) << "\n";
718 break;
719 case OPT_o:
720 // If -o path contains directories, "lld @response.txt" will likely
721 // fail because the archive we are creating doesn't contain empty
722 // directories for the output path (-o doesn't create directories).
723 // Strip directories to prevent the issue.
724 os << "-o " << quote(sys::path::filename(arg->getValue())) << "\n";
725 break;
726 default:
727 os << toString(*arg) << "\n";
728 }
729 }
730 return std::string(data.str());
731 }
732
733 // The --wrap option is a feature to rename symbols so that you can write
734 // wrappers for existing functions. If you pass `-wrap=foo`, all
735 // occurrences of symbol `foo` are resolved to `wrap_foo` (so, you are
736 // expected to write `wrap_foo` function as a wrapper). The original
737 // symbol becomes accessible as `real_foo`, so you can call that from your
738 // wrapper.
739 //
740 // This data structure is instantiated for each -wrap option.
741 struct WrappedSymbol {
742 Symbol *sym;
743 Symbol *real;
744 Symbol *wrap;
745 };
746
addUndefined(StringRef name)747 static Symbol *addUndefined(StringRef name) {
748 return symtab->addUndefinedFunction(name, None, None, WASM_SYMBOL_UNDEFINED,
749 nullptr, nullptr, false);
750 }
751
752 // Handles -wrap option.
753 //
754 // This function instantiates wrapper symbols. At this point, they seem
755 // like they are not being used at all, so we explicitly set some flags so
756 // that LTO won't eliminate them.
addWrappedSymbols(opt::InputArgList & args)757 static std::vector<WrappedSymbol> addWrappedSymbols(opt::InputArgList &args) {
758 std::vector<WrappedSymbol> v;
759 DenseSet<StringRef> seen;
760
761 for (auto *arg : args.filtered(OPT_wrap)) {
762 StringRef name = arg->getValue();
763 if (!seen.insert(name).second)
764 continue;
765
766 Symbol *sym = symtab->find(name);
767 if (!sym)
768 continue;
769
770 Symbol *real = addUndefined(saver().save("__real_" + name));
771 Symbol *wrap = addUndefined(saver().save("__wrap_" + name));
772 v.push_back({sym, real, wrap});
773
774 // We want to tell LTO not to inline symbols to be overwritten
775 // because LTO doesn't know the final symbol contents after renaming.
776 real->canInline = false;
777 sym->canInline = false;
778
779 // Tell LTO not to eliminate these symbols.
780 sym->isUsedInRegularObj = true;
781 wrap->isUsedInRegularObj = true;
782 real->isUsedInRegularObj = false;
783 }
784 return v;
785 }
786
787 // Do renaming for -wrap by updating pointers to symbols.
788 //
789 // When this function is executed, only InputFiles and symbol table
790 // contain pointers to symbol objects. We visit them to replace pointers,
791 // so that wrapped symbols are swapped as instructed by the command line.
wrapSymbols(ArrayRef<WrappedSymbol> wrapped)792 static void wrapSymbols(ArrayRef<WrappedSymbol> wrapped) {
793 DenseMap<Symbol *, Symbol *> map;
794 for (const WrappedSymbol &w : wrapped) {
795 map[w.sym] = w.wrap;
796 map[w.real] = w.sym;
797 }
798
799 // Update pointers in input files.
800 parallelForEach(symtab->objectFiles, [&](InputFile *file) {
801 MutableArrayRef<Symbol *> syms = file->getMutableSymbols();
802 for (size_t i = 0, e = syms.size(); i != e; ++i)
803 if (Symbol *s = map.lookup(syms[i]))
804 syms[i] = s;
805 });
806
807 // Update pointers in the symbol table.
808 for (const WrappedSymbol &w : wrapped)
809 symtab->wrap(w.sym, w.real, w.wrap);
810 }
811
splitSections()812 static void splitSections() {
813 // splitIntoPieces needs to be called on each MergeInputChunk
814 // before calling finalizeContents().
815 LLVM_DEBUG(llvm::dbgs() << "splitSections\n");
816 parallelForEach(symtab->objectFiles, [](ObjFile *file) {
817 for (InputChunk *seg : file->segments) {
818 if (auto *s = dyn_cast<MergeInputChunk>(seg))
819 s->splitIntoPieces();
820 }
821 for (InputChunk *sec : file->customSections) {
822 if (auto *s = dyn_cast<MergeInputChunk>(sec))
823 s->splitIntoPieces();
824 }
825 });
826 }
827
isKnownZFlag(StringRef s)828 static bool isKnownZFlag(StringRef s) {
829 // For now, we only support a very limited set of -z flags
830 return s.startswith("stack-size=");
831 }
832
833 // Report a warning for an unknown -z option.
checkZOptions(opt::InputArgList & args)834 static void checkZOptions(opt::InputArgList &args) {
835 for (auto *arg : args.filtered(OPT_z))
836 if (!isKnownZFlag(arg->getValue()))
837 warn("unknown -z value: " + StringRef(arg->getValue()));
838 }
839
linkerMain(ArrayRef<const char * > argsArr)840 void LinkerDriver::linkerMain(ArrayRef<const char *> argsArr) {
841 WasmOptTable parser;
842 opt::InputArgList args = parser.parse(argsArr.slice(1));
843
844 // Interpret these flags early because error()/warn() depend on them.
845 errorHandler().errorLimit = args::getInteger(args, OPT_error_limit, 20);
846 errorHandler().fatalWarnings =
847 args.hasFlag(OPT_fatal_warnings, OPT_no_fatal_warnings, false);
848 checkZOptions(args);
849
850 // Handle --help
851 if (args.hasArg(OPT_help)) {
852 parser.printHelp(lld::outs(),
853 (std::string(argsArr[0]) + " [options] file...").c_str(),
854 "LLVM Linker", false);
855 return;
856 }
857
858 // Handle --version
859 if (args.hasArg(OPT_version) || args.hasArg(OPT_v)) {
860 lld::outs() << getLLDVersion() << "\n";
861 return;
862 }
863
864 // Handle --reproduce
865 if (auto *arg = args.getLastArg(OPT_reproduce)) {
866 StringRef path = arg->getValue();
867 Expected<std::unique_ptr<TarWriter>> errOrWriter =
868 TarWriter::create(path, path::stem(path));
869 if (errOrWriter) {
870 tar = std::move(*errOrWriter);
871 tar->append("response.txt", createResponseFile(args));
872 tar->append("version.txt", getLLDVersion() + "\n");
873 } else {
874 error("--reproduce: " + toString(errOrWriter.takeError()));
875 }
876 }
877
878 // Parse and evaluate -mllvm options.
879 std::vector<const char *> v;
880 v.push_back("wasm-ld (LLVM option parsing)");
881 for (auto *arg : args.filtered(OPT_mllvm))
882 v.push_back(arg->getValue());
883 cl::ResetAllOptionOccurrences();
884 cl::ParseCommandLineOptions(v.size(), v.data());
885
886 readConfigs(args);
887
888 createFiles(args);
889 if (errorCount())
890 return;
891
892 setConfigs();
893 checkOptions(args);
894 if (errorCount())
895 return;
896
897 if (auto *arg = args.getLastArg(OPT_allow_undefined_file))
898 readImportFile(arg->getValue());
899
900 // Fail early if the output file or map file is not writable. If a user has a
901 // long link, e.g. due to a large LTO link, they do not wish to run it and
902 // find that it failed because there was a mistake in their command-line.
903 if (auto e = tryCreateFile(config->outputFile))
904 error("cannot open output file " + config->outputFile + ": " + e.message());
905 if (auto e = tryCreateFile(config->mapFile))
906 error("cannot open map file " + config->mapFile + ": " + e.message());
907 if (errorCount())
908 return;
909
910 // Handle --trace-symbol.
911 for (auto *arg : args.filtered(OPT_trace_symbol))
912 symtab->trace(arg->getValue());
913
914 for (auto *arg : args.filtered(OPT_export_if_defined))
915 config->exportedSymbols.insert(arg->getValue());
916
917 for (auto *arg : args.filtered(OPT_export)) {
918 config->exportedSymbols.insert(arg->getValue());
919 config->requiredExports.push_back(arg->getValue());
920 }
921
922 createSyntheticSymbols();
923
924 // Add all files to the symbol table. This will add almost all
925 // symbols that we need to the symbol table.
926 for (InputFile *f : files)
927 symtab->addFile(f);
928 if (errorCount())
929 return;
930
931 // Handle the `--undefined <sym>` options.
932 for (auto *arg : args.filtered(OPT_undefined))
933 handleUndefined(arg->getValue());
934
935 // Handle the `--export <sym>` options
936 // This works like --undefined but also exports the symbol if its found
937 for (auto &iter : config->exportedSymbols)
938 handleUndefined(iter.first());
939
940 Symbol *entrySym = nullptr;
941 if (!config->relocatable && !config->entry.empty()) {
942 entrySym = handleUndefined(config->entry);
943 if (entrySym && entrySym->isDefined())
944 entrySym->forceExport = true;
945 else
946 error("entry symbol not defined (pass --no-entry to suppress): " +
947 config->entry);
948 }
949
950 // If the user code defines a `__wasm_call_dtors` function, remember it so
951 // that we can call it from the command export wrappers. Unlike
952 // `__wasm_call_ctors` which we synthesize, `__wasm_call_dtors` is defined
953 // by libc/etc., because destructors are registered dynamically with
954 // `__cxa_atexit` and friends.
955 if (!config->relocatable && !config->shared &&
956 !WasmSym::callCtors->isUsedInRegularObj &&
957 WasmSym::callCtors->getName() != config->entry &&
958 !config->exportedSymbols.count(WasmSym::callCtors->getName())) {
959 if (Symbol *callDtors = handleUndefined("__wasm_call_dtors")) {
960 if (auto *callDtorsFunc = dyn_cast<DefinedFunction>(callDtors)) {
961 if (callDtorsFunc->signature &&
962 (!callDtorsFunc->signature->Params.empty() ||
963 !callDtorsFunc->signature->Returns.empty())) {
964 error("__wasm_call_dtors must have no argument or return values");
965 }
966 WasmSym::callDtors = callDtorsFunc;
967 } else {
968 error("__wasm_call_dtors must be a function");
969 }
970 }
971 }
972
973 if (errorCount())
974 return;
975
976 // Create wrapped symbols for -wrap option.
977 std::vector<WrappedSymbol> wrapped = addWrappedSymbols(args);
978
979 // If any of our inputs are bitcode files, the LTO code generator may create
980 // references to certain library functions that might not be explicit in the
981 // bitcode file's symbol table. If any of those library functions are defined
982 // in a bitcode file in an archive member, we need to arrange to use LTO to
983 // compile those archive members by adding them to the link beforehand.
984 //
985 // We only need to add libcall symbols to the link before LTO if the symbol's
986 // definition is in bitcode. Any other required libcall symbols will be added
987 // to the link after LTO when we add the LTO object file to the link.
988 if (!symtab->bitcodeFiles.empty())
989 for (auto *s : lto::LTO::getRuntimeLibcallSymbols())
990 handleLibcall(s);
991 if (errorCount())
992 return;
993
994 // Do link-time optimization if given files are LLVM bitcode files.
995 // This compiles bitcode files into real object files.
996 symtab->compileBitcodeFiles();
997 if (errorCount())
998 return;
999
1000 createOptionalSymbols();
1001
1002 // Resolve any variant symbols that were created due to signature
1003 // mismatchs.
1004 symtab->handleSymbolVariants();
1005 if (errorCount())
1006 return;
1007
1008 // Apply symbol renames for -wrap.
1009 if (!wrapped.empty())
1010 wrapSymbols(wrapped);
1011
1012 for (auto &iter : config->exportedSymbols) {
1013 Symbol *sym = symtab->find(iter.first());
1014 if (sym && sym->isDefined())
1015 sym->forceExport = true;
1016 }
1017
1018 if (!config->relocatable && !config->isPic) {
1019 // Add synthetic dummies for weak undefined functions. Must happen
1020 // after LTO otherwise functions may not yet have signatures.
1021 symtab->handleWeakUndefines();
1022 }
1023
1024 if (entrySym)
1025 entrySym->setHidden(false);
1026
1027 if (errorCount())
1028 return;
1029
1030 // Split WASM_SEG_FLAG_STRINGS sections into pieces in preparation for garbage
1031 // collection.
1032 splitSections();
1033
1034 // Do size optimizations: garbage collection
1035 markLive();
1036
1037 // Provide the indirect function table if needed.
1038 WasmSym::indirectFunctionTable =
1039 symtab->resolveIndirectFunctionTable(/*required =*/false);
1040
1041 if (errorCount())
1042 return;
1043
1044 // Write the result to the file.
1045 writeResult();
1046 }
1047
1048 } // namespace wasm
1049 } // namespace lld
1050