//===--------- JITLinkGeneric.cpp - Generic JIT linker utilities ----------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// Generic JITLinker utility class.
//
//===----------------------------------------------------------------------===//
1211c8dfa5SLang Hames 
1311c8dfa5SLang Hames #include "JITLinkGeneric.h"
1411c8dfa5SLang Hames 
1511c8dfa5SLang Hames #include "llvm/Support/BinaryStreamReader.h"
1611c8dfa5SLang Hames #include "llvm/Support/MemoryBuffer.h"
1711c8dfa5SLang Hames 
1811c8dfa5SLang Hames #define DEBUG_TYPE "jitlink"
1911c8dfa5SLang Hames 
2011c8dfa5SLang Hames namespace llvm {
2111c8dfa5SLang Hames namespace jitlink {
2211c8dfa5SLang Hames 
23*3a3cb929SKazu Hirata JITLinkerBase::~JITLinkerBase() = default;
2411c8dfa5SLang Hames 
linkPhase1(std::unique_ptr<JITLinkerBase> Self)2511c8dfa5SLang Hames void JITLinkerBase::linkPhase1(std::unique_ptr<JITLinkerBase> Self) {
2611c8dfa5SLang Hames 
278ce8cee1SLang Hames   LLVM_DEBUG({
2827a79b72SLang Hames     dbgs() << "Starting link phase 1 for graph " << G->getName() << "\n";
2927a79b72SLang Hames   });
3027a79b72SLang Hames 
3111c8dfa5SLang Hames   // Prune and optimize the graph.
324e920e58SLang Hames   if (auto Err = runPasses(Passes.PrePrunePasses))
3311c8dfa5SLang Hames     return Ctx->notifyFailed(std::move(Err));
3411c8dfa5SLang Hames 
3511c8dfa5SLang Hames   LLVM_DEBUG({
364e920e58SLang Hames     dbgs() << "Link graph \"" << G->getName() << "\" pre-pruning:\n";
37ecf6466fSLang Hames     G->dump(dbgs());
3811c8dfa5SLang Hames   });
3911c8dfa5SLang Hames 
4011c8dfa5SLang Hames   prune(*G);
4111c8dfa5SLang Hames 
4211c8dfa5SLang Hames   LLVM_DEBUG({
434e920e58SLang Hames     dbgs() << "Link graph \"" << G->getName() << "\" post-pruning:\n";
44ecf6466fSLang Hames     G->dump(dbgs());
4511c8dfa5SLang Hames   });
4611c8dfa5SLang Hames 
4711c8dfa5SLang Hames   // Run post-pruning passes.
484e920e58SLang Hames   if (auto Err = runPasses(Passes.PostPrunePasses))
4911c8dfa5SLang Hames     return Ctx->notifyFailed(std::move(Err));
5011c8dfa5SLang Hames 
51962a2479SLang Hames   Ctx->getMemoryManager().allocate(
52962a2479SLang Hames       Ctx->getJITLinkDylib(), *G,
53962a2479SLang Hames       [S = std::move(Self)](AllocResult AR) mutable {
54962a2479SLang Hames         auto *TmpSelf = S.get();
55962a2479SLang Hames         TmpSelf->linkPhase2(std::move(S), std::move(AR));
56962a2479SLang Hames       });
57962a2479SLang Hames }
5811c8dfa5SLang Hames 
linkPhase2(std::unique_ptr<JITLinkerBase> Self,AllocResult AR)59962a2479SLang Hames void JITLinkerBase::linkPhase2(std::unique_ptr<JITLinkerBase> Self,
60962a2479SLang Hames                                AllocResult AR) {
61962a2479SLang Hames 
62962a2479SLang Hames   if (AR)
63962a2479SLang Hames     Alloc = std::move(*AR);
64962a2479SLang Hames   else
65962a2479SLang Hames     return Ctx->notifyFailed(AR.takeError());
6611c8dfa5SLang Hames 
67ef50c07bSLang Hames   LLVM_DEBUG({
68ef50c07bSLang Hames     dbgs() << "Link graph \"" << G->getName()
69ef50c07bSLang Hames            << "\" before post-allocation passes:\n";
70ecf6466fSLang Hames     G->dump(dbgs());
71ef50c07bSLang Hames   });
72ef50c07bSLang Hames 
73ef50c07bSLang Hames   // Run post-allocation passes.
74ef50c07bSLang Hames   if (auto Err = runPasses(Passes.PostAllocationPasses))
75ef50c07bSLang Hames     return Ctx->notifyFailed(std::move(Err));
76ef50c07bSLang Hames 
774e920e58SLang Hames   // Notify client that the defined symbols have been assigned addresses.
78602e19edSLang Hames   LLVM_DEBUG(dbgs() << "Resolving symbols defined in " << G->getName() << "\n");
799f1dcdcaSLang Hames 
809f1dcdcaSLang Hames   if (auto Err = Ctx->notifyResolved(*G))
819f1dcdcaSLang Hames     return Ctx->notifyFailed(std::move(Err));
8211c8dfa5SLang Hames 
8311c8dfa5SLang Hames   auto ExternalSymbols = getExternalSymbolNames();
8411c8dfa5SLang Hames 
85962a2479SLang Hames   // If there are no external symbols then proceed immediately with phase 3.
86602e19edSLang Hames   if (ExternalSymbols.empty()) {
87602e19edSLang Hames     LLVM_DEBUG({
88602e19edSLang Hames       dbgs() << "No external symbols for " << G->getName()
89962a2479SLang Hames              << ". Proceeding immediately with link phase 3.\n";
90602e19edSLang Hames     });
91602e19edSLang Hames     // FIXME: Once callee expressions are defined to be sequenced before
92602e19edSLang Hames     //        argument expressions (c++17) we can simplify this. See below.
93602e19edSLang Hames     auto &TmpSelf = *Self;
94962a2479SLang Hames     TmpSelf.linkPhase3(std::move(Self), AsyncLookupResult());
95602e19edSLang Hames     return;
96602e19edSLang Hames   }
97602e19edSLang Hames 
98602e19edSLang Hames   // Otherwise look up the externals.
9927a79b72SLang Hames   LLVM_DEBUG({
10027a79b72SLang Hames     dbgs() << "Issuing lookup for external symbols for " << G->getName()
10127a79b72SLang Hames            << " (may trigger materialization/linking of other graphs)...\n";
10227a79b72SLang Hames   });
10327a79b72SLang Hames 
10411c8dfa5SLang Hames   // We're about to hand off ownership of ourself to the continuation. Grab a
10511c8dfa5SLang Hames   // pointer to the context so that we can call it to initiate the lookup.
10611c8dfa5SLang Hames   //
10711c8dfa5SLang Hames   // FIXME: Once callee expressions are defined to be sequenced before argument
10811c8dfa5SLang Hames   // expressions (c++17) we can simplify all this to:
10911c8dfa5SLang Hames   //
11011c8dfa5SLang Hames   // Ctx->lookup(std::move(UnresolvedExternals),
11111c8dfa5SLang Hames   //             [Self=std::move(Self)](Expected<AsyncLookupResult> Result) {
112962a2479SLang Hames   //               Self->linkPhase3(std::move(Self), std::move(Result));
11311c8dfa5SLang Hames   //             });
114962a2479SLang Hames   Ctx->lookup(std::move(ExternalSymbols),
1154e920e58SLang Hames               createLookupContinuation(
116962a2479SLang Hames                   [S = std::move(Self)](
1174e920e58SLang Hames                       Expected<AsyncLookupResult> LookupResult) mutable {
1184e920e58SLang Hames                     auto &TmpSelf = *S;
119962a2479SLang Hames                     TmpSelf.linkPhase3(std::move(S), std::move(LookupResult));
1204e920e58SLang Hames                   }));
12111c8dfa5SLang Hames }
12211c8dfa5SLang Hames 
linkPhase3(std::unique_ptr<JITLinkerBase> Self,Expected<AsyncLookupResult> LR)123962a2479SLang Hames void JITLinkerBase::linkPhase3(std::unique_ptr<JITLinkerBase> Self,
124962a2479SLang Hames                                Expected<AsyncLookupResult> LR) {
12527a79b72SLang Hames 
12627a79b72SLang Hames   LLVM_DEBUG({
127962a2479SLang Hames     dbgs() << "Starting link phase 3 for graph " << G->getName() << "\n";
12827a79b72SLang Hames   });
12927a79b72SLang Hames 
13011c8dfa5SLang Hames   // If the lookup failed, bail out.
13111c8dfa5SLang Hames   if (!LR)
132962a2479SLang Hames     return abandonAllocAndBailOut(std::move(Self), LR.takeError());
13311c8dfa5SLang Hames 
1344e920e58SLang Hames   // Assign addresses to external addressables.
13511c8dfa5SLang Hames   applyLookupResult(*LR);
13611c8dfa5SLang Hames 
13727a79b72SLang Hames   LLVM_DEBUG({
13827a79b72SLang Hames     dbgs() << "Link graph \"" << G->getName()
139ef50c07bSLang Hames            << "\" before pre-fixup passes:\n";
140ecf6466fSLang Hames     G->dump(dbgs());
14127a79b72SLang Hames   });
14227a79b72SLang Hames 
1437b11f564SLang Hames   if (auto Err = runPasses(Passes.PreFixupPasses))
144962a2479SLang Hames     return abandonAllocAndBailOut(std::move(Self), std::move(Err));
14527a79b72SLang Hames 
14611c8dfa5SLang Hames   LLVM_DEBUG({
1474e920e58SLang Hames     dbgs() << "Link graph \"" << G->getName() << "\" before copy-and-fixup:\n";
148ecf6466fSLang Hames     G->dump(dbgs());
14911c8dfa5SLang Hames   });
15011c8dfa5SLang Hames 
15127a79b72SLang Hames   // Fix up block content.
15227a79b72SLang Hames   if (auto Err = fixUpBlocks(*G))
153962a2479SLang Hames     return abandonAllocAndBailOut(std::move(Self), std::move(Err));
15411c8dfa5SLang Hames 
15511c8dfa5SLang Hames   LLVM_DEBUG({
1564e920e58SLang Hames     dbgs() << "Link graph \"" << G->getName() << "\" after copy-and-fixup:\n";
157ecf6466fSLang Hames     G->dump(dbgs());
15811c8dfa5SLang Hames   });
15911c8dfa5SLang Hames 
1604e920e58SLang Hames   if (auto Err = runPasses(Passes.PostFixupPasses))
161962a2479SLang Hames     return abandonAllocAndBailOut(std::move(Self), std::move(Err));
16211c8dfa5SLang Hames 
163962a2479SLang Hames   Alloc->finalize([S = std::move(Self)](FinalizeResult FR) mutable {
164962a2479SLang Hames     auto *TmpSelf = S.get();
165962a2479SLang Hames     TmpSelf->linkPhase4(std::move(S), std::move(FR));
166962a2479SLang Hames   });
16711c8dfa5SLang Hames }
16811c8dfa5SLang Hames 
linkPhase4(std::unique_ptr<JITLinkerBase> Self,FinalizeResult FR)169962a2479SLang Hames void JITLinkerBase::linkPhase4(std::unique_ptr<JITLinkerBase> Self,
170962a2479SLang Hames                                FinalizeResult FR) {
17127a79b72SLang Hames 
17227a79b72SLang Hames   LLVM_DEBUG({
173962a2479SLang Hames     dbgs() << "Starting link phase 4 for graph " << G->getName() << "\n";
17427a79b72SLang Hames   });
17527a79b72SLang Hames 
176962a2479SLang Hames   if (!FR)
177962a2479SLang Hames     return Ctx->notifyFailed(FR.takeError());
178962a2479SLang Hames 
179962a2479SLang Hames   Ctx->notifyFinalized(std::move(*FR));
18027a79b72SLang Hames 
18127a79b72SLang Hames   LLVM_DEBUG({ dbgs() << "Link of graph " << G->getName() << " complete\n"; });
18211c8dfa5SLang Hames }
18311c8dfa5SLang Hames 
runPasses(LinkGraphPassList & Passes)1844e920e58SLang Hames Error JITLinkerBase::runPasses(LinkGraphPassList &Passes) {
18511c8dfa5SLang Hames   for (auto &P : Passes)
1864e920e58SLang Hames     if (auto Err = P(*G))
18711c8dfa5SLang Hames       return Err;
18811c8dfa5SLang Hames   return Error::success();
18911c8dfa5SLang Hames }
19011c8dfa5SLang Hames 
getExternalSymbolNames() const191674df13bSLang Hames JITLinkContext::LookupMap JITLinkerBase::getExternalSymbolNames() const {
1924e920e58SLang Hames   // Identify unresolved external symbols.
193674df13bSLang Hames   JITLinkContext::LookupMap UnresolvedExternals;
1944e920e58SLang Hames   for (auto *Sym : G->external_symbols()) {
195118e953bSLang Hames     assert(!Sym->getAddress() &&
19611c8dfa5SLang Hames            "External has already been assigned an address");
1974e920e58SLang Hames     assert(Sym->getName() != StringRef() && Sym->getName() != "" &&
19811c8dfa5SLang Hames            "Externals must be named");
199674df13bSLang Hames     SymbolLookupFlags LookupFlags =
200674df13bSLang Hames         Sym->getLinkage() == Linkage::Weak
201674df13bSLang Hames             ? SymbolLookupFlags::WeaklyReferencedSymbol
202674df13bSLang Hames             : SymbolLookupFlags::RequiredSymbol;
203674df13bSLang Hames     UnresolvedExternals[Sym->getName()] = LookupFlags;
20411c8dfa5SLang Hames   }
20511c8dfa5SLang Hames   return UnresolvedExternals;
20611c8dfa5SLang Hames }
20711c8dfa5SLang Hames 
applyLookupResult(AsyncLookupResult Result)20811c8dfa5SLang Hames void JITLinkerBase::applyLookupResult(AsyncLookupResult Result) {
2094e920e58SLang Hames   for (auto *Sym : G->external_symbols()) {
210674df13bSLang Hames     assert(Sym->getOffset() == 0 &&
211674df13bSLang Hames            "External symbol is not at the start of its addressable block");
212118e953bSLang Hames     assert(!Sym->getAddress() && "Symbol already resolved");
2134e920e58SLang Hames     assert(!Sym->isDefined() && "Symbol being resolved is already defined");
214674df13bSLang Hames     auto ResultI = Result.find(Sym->getName());
215674df13bSLang Hames     if (ResultI != Result.end())
216118e953bSLang Hames       Sym->getAddressable().setAddress(
217118e953bSLang Hames           orc::ExecutorAddr(ResultI->second.getAddress()));
218674df13bSLang Hames     else
219674df13bSLang Hames       assert(Sym->getLinkage() == Linkage::Weak &&
220674df13bSLang Hames              "Failed to resolve non-weak reference");
22111c8dfa5SLang Hames   }
22211c8dfa5SLang Hames 
223d407b4b9SLang Hames   LLVM_DEBUG({
224d407b4b9SLang Hames     dbgs() << "Externals after applying lookup result:\n";
2254e920e58SLang Hames     for (auto *Sym : G->external_symbols())
2264e920e58SLang Hames       dbgs() << "  " << Sym->getName() << ": "
227118e953bSLang Hames              << formatv("{0:x16}", Sym->getAddress().getValue()) << "\n";
228d407b4b9SLang Hames   });
22911c8dfa5SLang Hames }
23011c8dfa5SLang Hames 
abandonAllocAndBailOut(std::unique_ptr<JITLinkerBase> Self,Error Err)231962a2479SLang Hames void JITLinkerBase::abandonAllocAndBailOut(std::unique_ptr<JITLinkerBase> Self,
232962a2479SLang Hames                                            Error Err) {
2336641d29bSLang Hames   assert(Err && "Should not be bailing out on success value");
234962a2479SLang Hames   assert(Alloc && "can not call abandonAllocAndBailOut before allocation");
235962a2479SLang Hames   Alloc->abandon([S = std::move(Self), E1 = std::move(Err)](Error E2) mutable {
236962a2479SLang Hames     S->Ctx->notifyFailed(joinErrors(std::move(E1), std::move(E2)));
237962a2479SLang Hames   });
2383181b87cSLang Hames }
2393181b87cSLang Hames 
prune(LinkGraph & G)2404e920e58SLang Hames void prune(LinkGraph &G) {
2414e920e58SLang Hames   std::vector<Symbol *> Worklist;
2424e920e58SLang Hames   DenseSet<Block *> VisitedBlocks;
24311c8dfa5SLang Hames 
2444e920e58SLang Hames   // Build the initial worklist from all symbols initially live.
2454e920e58SLang Hames   for (auto *Sym : G.defined_symbols())
2464e920e58SLang Hames     if (Sym->isLive())
2474e920e58SLang Hames       Worklist.push_back(Sym);
24811c8dfa5SLang Hames 
2494e920e58SLang Hames   // Propagate live flags to all symbols reachable from the initial live set.
25011c8dfa5SLang Hames   while (!Worklist.empty()) {
2514e920e58SLang Hames     auto *Sym = Worklist.back();
25211c8dfa5SLang Hames     Worklist.pop_back();
25311c8dfa5SLang Hames 
2544e920e58SLang Hames     auto &B = Sym->getBlock();
25511c8dfa5SLang Hames 
2564e920e58SLang Hames     // Skip addressables that we've visited before.
2574e920e58SLang Hames     if (VisitedBlocks.count(&B))
25811c8dfa5SLang Hames       continue;
25911c8dfa5SLang Hames 
2604e920e58SLang Hames     VisitedBlocks.insert(&B);
26111c8dfa5SLang Hames 
2624e920e58SLang Hames     for (auto &E : Sym->getBlock().edges()) {
2638ce8cee1SLang Hames       // If the edge target is a defined symbol that is being newly marked live
2648ce8cee1SLang Hames       // then add it to the worklist.
2658ce8cee1SLang Hames       if (E.getTarget().isDefined() && !E.getTarget().isLive())
2664e920e58SLang Hames         Worklist.push_back(&E.getTarget());
2678ce8cee1SLang Hames 
2688ce8cee1SLang Hames       // Mark the target live.
2698ce8cee1SLang Hames       E.getTarget().setLive(true);
27011c8dfa5SLang Hames     }
27111c8dfa5SLang Hames   }
27211c8dfa5SLang Hames 
2738ce8cee1SLang Hames   // Collect all defined symbols to remove, then remove them.
27411c8dfa5SLang Hames   {
2758ce8cee1SLang Hames     LLVM_DEBUG(dbgs() << "Dead-stripping defined symbols:\n");
2764e920e58SLang Hames     std::vector<Symbol *> SymbolsToRemove;
2774e920e58SLang Hames     for (auto *Sym : G.defined_symbols())
2784e920e58SLang Hames       if (!Sym->isLive())
2794e920e58SLang Hames         SymbolsToRemove.push_back(Sym);
2804e920e58SLang Hames     for (auto *Sym : SymbolsToRemove) {
2814e920e58SLang Hames       LLVM_DEBUG(dbgs() << "  " << *Sym << "...\n");
2824e920e58SLang Hames       G.removeDefinedSymbol(*Sym);
2834e920e58SLang Hames     }
2844e920e58SLang Hames   }
2854e920e58SLang Hames 
2864e920e58SLang Hames   // Delete any unused blocks.
2874e920e58SLang Hames   {
2884e920e58SLang Hames     LLVM_DEBUG(dbgs() << "Dead-stripping blocks:\n");
2894e920e58SLang Hames     std::vector<Block *> BlocksToRemove;
2904e920e58SLang Hames     for (auto *B : G.blocks())
2914e920e58SLang Hames       if (!VisitedBlocks.count(B))
2924e920e58SLang Hames         BlocksToRemove.push_back(B);
2934e920e58SLang Hames     for (auto *B : BlocksToRemove) {
2944e920e58SLang Hames       LLVM_DEBUG(dbgs() << "  " << *B << "...\n");
2954e920e58SLang Hames       G.removeBlock(*B);
2964e920e58SLang Hames     }
29711c8dfa5SLang Hames   }
2988ce8cee1SLang Hames 
2998ce8cee1SLang Hames   // Collect all external symbols to remove, then remove them.
3008ce8cee1SLang Hames   {
3018ce8cee1SLang Hames     LLVM_DEBUG(dbgs() << "Removing unused external symbols:\n");
3028ce8cee1SLang Hames     std::vector<Symbol *> SymbolsToRemove;
3038ce8cee1SLang Hames     for (auto *Sym : G.external_symbols())
3048ce8cee1SLang Hames       if (!Sym->isLive())
3058ce8cee1SLang Hames         SymbolsToRemove.push_back(Sym);
3068ce8cee1SLang Hames     for (auto *Sym : SymbolsToRemove) {
3078ce8cee1SLang Hames       LLVM_DEBUG(dbgs() << "  " << *Sym << "...\n");
3088ce8cee1SLang Hames       G.removeExternalSymbol(*Sym);
3098ce8cee1SLang Hames     }
3108ce8cee1SLang Hames   }
31111c8dfa5SLang Hames }
31211c8dfa5SLang Hames 
31311c8dfa5SLang Hames } // end namespace jitlink
31411c8dfa5SLang Hames } // end namespace llvm
315