142418abaSMehdi Amini //===- FunctionImport.cpp - ThinLTO Summary-based Function Import ---------===//
242418abaSMehdi Amini //
342418abaSMehdi Amini //                     The LLVM Compiler Infrastructure
442418abaSMehdi Amini //
542418abaSMehdi Amini // This file is distributed under the University of Illinois Open Source
642418abaSMehdi Amini // License. See LICENSE.TXT for details.
742418abaSMehdi Amini //
842418abaSMehdi Amini //===----------------------------------------------------------------------===//
942418abaSMehdi Amini //
1042418abaSMehdi Amini // This file implements Function import based on summaries.
1142418abaSMehdi Amini //
1242418abaSMehdi Amini //===----------------------------------------------------------------------===//
1342418abaSMehdi Amini 
1442418abaSMehdi Amini #include "llvm/Transforms/IPO/FunctionImport.h"
1542418abaSMehdi Amini 
1601e32130SMehdi Amini #include "llvm/ADT/SmallVector.h"
17d29478f7STeresa Johnson #include "llvm/ADT/Statistic.h"
1842418abaSMehdi Amini #include "llvm/ADT/StringSet.h"
1904c9a2d6STeresa Johnson #include "llvm/ADT/Triple.h"
2042418abaSMehdi Amini #include "llvm/IR/AutoUpgrade.h"
2142418abaSMehdi Amini #include "llvm/IR/DiagnosticPrinter.h"
2242418abaSMehdi Amini #include "llvm/IR/IntrinsicInst.h"
2342418abaSMehdi Amini #include "llvm/IR/Module.h"
24fc06b83eSMehdi Amini #include "llvm/IR/Verifier.h"
2542418abaSMehdi Amini #include "llvm/IRReader/IRReader.h"
2642418abaSMehdi Amini #include "llvm/Linker/Linker.h"
2704c9a2d6STeresa Johnson #include "llvm/Object/IRObjectFile.h"
2826ab5772STeresa Johnson #include "llvm/Object/ModuleSummaryIndexObjectFile.h"
2942418abaSMehdi Amini #include "llvm/Support/CommandLine.h"
3042418abaSMehdi Amini #include "llvm/Support/Debug.h"
3142418abaSMehdi Amini #include "llvm/Support/SourceMgr.h"
3204c9a2d6STeresa Johnson #include "llvm/Transforms/IPO/Internalize.h"
33488a800aSTeresa Johnson #include "llvm/Transforms/Utils/FunctionImportUtils.h"
347e88d0daSMehdi Amini 
3501e32130SMehdi Amini #define DEBUG_TYPE "function-import"
367e88d0daSMehdi Amini 
3742418abaSMehdi Amini using namespace llvm;
3842418abaSMehdi Amini 
396c475a75STeresa Johnson STATISTIC(NumImportedFunctions, "Number of functions imported");
406c475a75STeresa Johnson STATISTIC(NumImportedModules, "Number of modules imported from");
416c475a75STeresa Johnson STATISTIC(NumDeadSymbols, "Number of dead stripped symbols in index");
426c475a75STeresa Johnson STATISTIC(NumLiveSymbols, "Number of live symbols in index");
43d29478f7STeresa Johnson 
4439303619STeresa Johnson /// Limit on instruction count of imported functions.
4539303619STeresa Johnson static cl::opt<unsigned> ImportInstrLimit(
4639303619STeresa Johnson     "import-instr-limit", cl::init(100), cl::Hidden, cl::value_desc("N"),
4739303619STeresa Johnson     cl::desc("Only import functions with less than N instructions"));
4839303619STeresa Johnson 
4940641748SMehdi Amini static cl::opt<float>
5040641748SMehdi Amini     ImportInstrFactor("import-instr-evolution-factor", cl::init(0.7),
5140641748SMehdi Amini                       cl::Hidden, cl::value_desc("x"),
5240641748SMehdi Amini                       cl::desc("As we import functions, multiply the "
5340641748SMehdi Amini                                "`import-instr-limit` threshold by this factor "
5440641748SMehdi Amini                                "before processing newly imported functions"));
55ba72b95fSPiotr Padlewski 
56d2869473SPiotr Padlewski static cl::opt<float> ImportHotInstrFactor(
57d2869473SPiotr Padlewski     "import-hot-evolution-factor", cl::init(1.0), cl::Hidden,
58d2869473SPiotr Padlewski     cl::value_desc("x"),
59d2869473SPiotr Padlewski     cl::desc("As we import functions called from hot callsite, multiply the "
60d2869473SPiotr Padlewski              "`import-instr-limit` threshold by this factor "
61d2869473SPiotr Padlewski              "before processing newly imported functions"));
62d2869473SPiotr Padlewski 
63d9830eb7SPiotr Padlewski static cl::opt<float> ImportHotMultiplier(
64d9830eb7SPiotr Padlewski     "import-hot-multiplier", cl::init(3.0), cl::Hidden, cl::value_desc("x"),
65ba72b95fSPiotr Padlewski     cl::desc("Multiply the `import-instr-limit` threshold for hot callsites"));
66ba72b95fSPiotr Padlewski 
67ba72b95fSPiotr Padlewski // FIXME: This multiplier was not really tuned up.
68ba72b95fSPiotr Padlewski static cl::opt<float> ImportColdMultiplier(
69ba72b95fSPiotr Padlewski     "import-cold-multiplier", cl::init(0), cl::Hidden, cl::value_desc("N"),
70ba72b95fSPiotr Padlewski     cl::desc("Multiply the `import-instr-limit` threshold for cold callsites"));
7140641748SMehdi Amini 
72d29478f7STeresa Johnson static cl::opt<bool> PrintImports("print-imports", cl::init(false), cl::Hidden,
73d29478f7STeresa Johnson                                   cl::desc("Print imported functions"));
74d29478f7STeresa Johnson 
756c475a75STeresa Johnson static cl::opt<bool> ComputeDead("compute-dead", cl::init(true), cl::Hidden,
766c475a75STeresa Johnson                                  cl::desc("Compute dead symbols"));
776c475a75STeresa Johnson 
783b776128SPiotr Padlewski static cl::opt<bool> EnableImportMetadata(
793b776128SPiotr Padlewski     "enable-import-metadata", cl::init(
803b776128SPiotr Padlewski #if !defined(NDEBUG)
813b776128SPiotr Padlewski                                   true /*Enabled with asserts.*/
823b776128SPiotr Padlewski #else
833b776128SPiotr Padlewski                                   false
843b776128SPiotr Padlewski #endif
853b776128SPiotr Padlewski                                   ),
863b776128SPiotr Padlewski     cl::Hidden, cl::desc("Enable import metadata like 'thinlto_src_module'"));
873b776128SPiotr Padlewski 
8842418abaSMehdi Amini // Load lazily a module from \p FileName in \p Context.
8942418abaSMehdi Amini static std::unique_ptr<Module> loadFile(const std::string &FileName,
9042418abaSMehdi Amini                                         LLVMContext &Context) {
9142418abaSMehdi Amini   SMDiagnostic Err;
9242418abaSMehdi Amini   DEBUG(dbgs() << "Loading '" << FileName << "'\n");
936cba37ceSTeresa Johnson   // Metadata isn't loaded until functions are imported, to minimize
946cba37ceSTeresa Johnson   // the memory overhead.
95a1080ee6STeresa Johnson   std::unique_ptr<Module> Result =
96a1080ee6STeresa Johnson       getLazyIRFileModule(FileName, Err, Context,
97a1080ee6STeresa Johnson                           /* ShouldLazyLoadMetadata = */ true);
9842418abaSMehdi Amini   if (!Result) {
9942418abaSMehdi Amini     Err.print("function-import", errs());
100d7ad221cSMehdi Amini     report_fatal_error("Abort");
10142418abaSMehdi Amini   }
10242418abaSMehdi Amini 
10342418abaSMehdi Amini   return Result;
10442418abaSMehdi Amini }
10542418abaSMehdi Amini 
1067e88d0daSMehdi Amini namespace {
10740641748SMehdi Amini 
10801e32130SMehdi Amini /// Given a list of possible callee implementation for a call site, select one
10901e32130SMehdi Amini /// that fits the \p Threshold.
11001e32130SMehdi Amini ///
11101e32130SMehdi Amini /// FIXME: select "best" instead of first that fits. But what is "best"?
11201e32130SMehdi Amini /// - The smallest: more likely to be inlined.
11301e32130SMehdi Amini /// - The one with the least outgoing edges (already well optimized).
11401e32130SMehdi Amini /// - One from a module already being imported from in order to reduce the
11501e32130SMehdi Amini ///   number of source modules parsed/linked.
11601e32130SMehdi Amini /// - One that has PGO data attached.
11701e32130SMehdi Amini /// - [insert you fancy metric here]
1182d28f7aaSMehdi Amini static const GlobalValueSummary *
119b4e1e829SMehdi Amini selectCallee(const ModuleSummaryIndex &Index,
120b4e1e829SMehdi Amini              const GlobalValueSummaryList &CalleeSummaryList,
12183aaf358STeresa Johnson              unsigned Threshold, StringRef CallerModulePath) {
12201e32130SMehdi Amini   auto It = llvm::find_if(
12328e457bcSTeresa Johnson       CalleeSummaryList,
12428e457bcSTeresa Johnson       [&](const std::unique_ptr<GlobalValueSummary> &SummaryPtr) {
12528e457bcSTeresa Johnson         auto *GVSummary = SummaryPtr.get();
126f329be83SRafael Espindola         if (GlobalValue::isInterposableLinkage(GVSummary->linkage()))
1275b85d8d6SMehdi Amini           // There is no point in importing these, we can't inline them
12801e32130SMehdi Amini           return false;
1292c719cc1SMehdi Amini         if (auto *AS = dyn_cast<AliasSummary>(GVSummary)) {
1302c719cc1SMehdi Amini           GVSummary = &AS->getAliasee();
1312c719cc1SMehdi Amini           // Alias can't point to "available_externally". However when we import
1322c719cc1SMehdi Amini           // linkOnceODR the linkage does not change. So we import the alias
1332c719cc1SMehdi Amini           // and aliasee only in this case.
1342c719cc1SMehdi Amini           // FIXME: we should import alias as available_externally *function*,
1352c719cc1SMehdi Amini           // the destination module does need to know it is an alias.
1362c719cc1SMehdi Amini           if (!GlobalValue::isLinkOnceODRLinkage(GVSummary->linkage()))
1372c719cc1SMehdi Amini             return false;
1382c719cc1SMehdi Amini         }
1392c719cc1SMehdi Amini 
1402c719cc1SMehdi Amini         auto *Summary = cast<FunctionSummary>(GVSummary);
1417e88d0daSMehdi Amini 
14283aaf358STeresa Johnson         // If this is a local function, make sure we import the copy
14383aaf358STeresa Johnson         // in the caller's module. The only time a local function can
14483aaf358STeresa Johnson         // share an entry in the index is if there is a local with the same name
14583aaf358STeresa Johnson         // in another module that had the same source file name (in a different
14683aaf358STeresa Johnson         // directory), where each was compiled in their own directory so there
14783aaf358STeresa Johnson         // was not distinguishing path.
14883aaf358STeresa Johnson         // However, do the import from another module if there is only one
14983aaf358STeresa Johnson         // entry in the list - in that case this must be a reference due
15083aaf358STeresa Johnson         // to indirect call profile data, since a function pointer can point to
15183aaf358STeresa Johnson         // a local in another module.
15283aaf358STeresa Johnson         if (GlobalValue::isLocalLinkage(Summary->linkage()) &&
15383aaf358STeresa Johnson             CalleeSummaryList.size() > 1 &&
15483aaf358STeresa Johnson             Summary->modulePath() != CallerModulePath)
15583aaf358STeresa Johnson           return false;
15683aaf358STeresa Johnson 
15701e32130SMehdi Amini         if (Summary->instCount() > Threshold)
15801e32130SMehdi Amini           return false;
1597e88d0daSMehdi Amini 
160519465b9STeresa Johnson         if (Summary->notEligibleToImport())
161b4e1e829SMehdi Amini           return false;
162b4e1e829SMehdi Amini 
16301e32130SMehdi Amini         return true;
16401e32130SMehdi Amini       });
16528e457bcSTeresa Johnson   if (It == CalleeSummaryList.end())
16601e32130SMehdi Amini     return nullptr;
1677e88d0daSMehdi Amini 
16828e457bcSTeresa Johnson   return cast<GlobalValueSummary>(It->get());
169434e9561SRafael Espindola }
1707e88d0daSMehdi Amini 
17101e32130SMehdi Amini /// Return the summary for the function \p GUID that fits the \p Threshold, or
17201e32130SMehdi Amini /// null if there's no match.
1732d28f7aaSMehdi Amini static const GlobalValueSummary *selectCallee(GlobalValue::GUID GUID,
174ad5741b0SMehdi Amini                                               unsigned Threshold,
17583aaf358STeresa Johnson                                               const ModuleSummaryIndex &Index,
17683aaf358STeresa Johnson                                               StringRef CallerModulePath) {
17728e457bcSTeresa Johnson   auto CalleeSummaryList = Index.findGlobalValueSummaryList(GUID);
178b4e1e829SMehdi Amini   if (CalleeSummaryList == Index.end())
17901e32130SMehdi Amini     return nullptr; // This function does not have a summary
18083aaf358STeresa Johnson   return selectCallee(Index, CalleeSummaryList->second, Threshold,
18183aaf358STeresa Johnson                       CallerModulePath);
18201e32130SMehdi Amini }
1837e88d0daSMehdi Amini 
184475b51a7STeresa Johnson using EdgeInfo = std::tuple<const FunctionSummary *, unsigned /* Threshold */,
185475b51a7STeresa Johnson                             GlobalValue::GUID>;
18601e32130SMehdi Amini 
18701e32130SMehdi Amini /// Compute the list of functions to import for a given caller. Mark these
18801e32130SMehdi Amini /// imported functions and the symbols they reference in their source module as
18901e32130SMehdi Amini /// exported from their source module.
19001e32130SMehdi Amini static void computeImportForFunction(
1913255eec1STeresa Johnson     const FunctionSummary &Summary, const ModuleSummaryIndex &Index,
192d9830eb7SPiotr Padlewski     const unsigned Threshold, const GVSummaryMapTy &DefinedGVSummaries,
19301e32130SMehdi Amini     SmallVectorImpl<EdgeInfo> &Worklist,
1949b490f10SMehdi Amini     FunctionImporter::ImportMapTy &ImportList,
195c86af334STeresa Johnson     StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) {
19601e32130SMehdi Amini   for (auto &Edge : Summary.calls()) {
1972d5487cfSTeresa Johnson     auto GUID = Edge.first.getGUID();
19801e32130SMehdi Amini     DEBUG(dbgs() << " edge -> " << GUID << " Threshold:" << Threshold << "\n");
19901e32130SMehdi Amini 
2001aafabf7SMehdi Amini     if (DefinedGVSummaries.count(GUID)) {
20101e32130SMehdi Amini       DEBUG(dbgs() << "ignored! Target already in destination module.\n");
2027e88d0daSMehdi Amini       continue;
203d450da32STeresa Johnson     }
20440641748SMehdi Amini 
205ba72b95fSPiotr Padlewski     auto GetBonusMultiplier = [](CalleeInfo::HotnessType Hotness) -> float {
206ba72b95fSPiotr Padlewski       if (Hotness == CalleeInfo::HotnessType::Hot)
207ba72b95fSPiotr Padlewski         return ImportHotMultiplier;
208ba72b95fSPiotr Padlewski       if (Hotness == CalleeInfo::HotnessType::Cold)
209ba72b95fSPiotr Padlewski         return ImportColdMultiplier;
210ba72b95fSPiotr Padlewski       return 1.0;
211ba72b95fSPiotr Padlewski     };
212ba72b95fSPiotr Padlewski 
213d9830eb7SPiotr Padlewski     const auto NewThreshold =
214ba72b95fSPiotr Padlewski         Threshold * GetBonusMultiplier(Edge.second.Hotness);
215d2869473SPiotr Padlewski 
21683aaf358STeresa Johnson     auto *CalleeSummary =
21783aaf358STeresa Johnson         selectCallee(GUID, NewThreshold, Index, Summary.modulePath());
21801e32130SMehdi Amini     if (!CalleeSummary) {
21901e32130SMehdi Amini       DEBUG(dbgs() << "ignored! No qualifying callee with summary found.\n");
2207e88d0daSMehdi Amini       continue;
2217e88d0daSMehdi Amini     }
2222d28f7aaSMehdi Amini     // "Resolve" the summary, traversing alias,
2232d28f7aaSMehdi Amini     const FunctionSummary *ResolvedCalleeSummary;
2246968ef77SMehdi Amini     if (isa<AliasSummary>(CalleeSummary)) {
2252d28f7aaSMehdi Amini       ResolvedCalleeSummary = cast<FunctionSummary>(
2262d28f7aaSMehdi Amini           &cast<AliasSummary>(CalleeSummary)->getAliasee());
2272c719cc1SMehdi Amini       assert(
2282c719cc1SMehdi Amini           GlobalValue::isLinkOnceODRLinkage(ResolvedCalleeSummary->linkage()) &&
2292c719cc1SMehdi Amini           "Unexpected alias to a non-linkonceODR in import list");
2306968ef77SMehdi Amini     } else
2312d28f7aaSMehdi Amini       ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary);
2322d28f7aaSMehdi Amini 
233d9830eb7SPiotr Padlewski     assert(ResolvedCalleeSummary->instCount() <= NewThreshold &&
23401e32130SMehdi Amini            "selectCallee() didn't honor the threshold");
23501e32130SMehdi Amini 
236d2869473SPiotr Padlewski     auto GetAdjustedThreshold = [](unsigned Threshold, bool IsHotCallsite) {
237d2869473SPiotr Padlewski       // Adjust the threshold for next level of imported functions.
238d2869473SPiotr Padlewski       // The threshold is different for hot callsites because we can then
239d2869473SPiotr Padlewski       // inline chains of hot calls.
240d2869473SPiotr Padlewski       if (IsHotCallsite)
241d2869473SPiotr Padlewski         return Threshold * ImportHotInstrFactor;
242d2869473SPiotr Padlewski       return Threshold * ImportInstrFactor;
243d2869473SPiotr Padlewski     };
244d2869473SPiotr Padlewski 
245d2869473SPiotr Padlewski     bool IsHotCallsite = Edge.second.Hotness == CalleeInfo::HotnessType::Hot;
2461b859a23STeresa Johnson     const auto AdjThreshold = GetAdjustedThreshold(Threshold, IsHotCallsite);
2471b859a23STeresa Johnson 
2481b859a23STeresa Johnson     auto ExportModulePath = ResolvedCalleeSummary->modulePath();
2491b859a23STeresa Johnson     auto &ProcessedThreshold = ImportList[ExportModulePath][GUID];
2501b859a23STeresa Johnson     /// Since the traversal of the call graph is DFS, we can revisit a function
2511b859a23STeresa Johnson     /// a second time with a higher threshold. In this case, it is added back to
2521b859a23STeresa Johnson     /// the worklist with the new threshold.
2531b859a23STeresa Johnson     if (ProcessedThreshold && ProcessedThreshold >= AdjThreshold) {
2541b859a23STeresa Johnson       DEBUG(dbgs() << "ignored! Target was already seen with Threshold "
2551b859a23STeresa Johnson                    << ProcessedThreshold << "\n");
2561b859a23STeresa Johnson       continue;
2571b859a23STeresa Johnson     }
25819f2aa78STeresa Johnson     bool PreviouslyImported = ProcessedThreshold != 0;
2591b859a23STeresa Johnson     // Mark this function as imported in this module, with the current Threshold
2601b859a23STeresa Johnson     ProcessedThreshold = AdjThreshold;
2611b859a23STeresa Johnson 
2621b859a23STeresa Johnson     // Make exports in the source module.
2631b859a23STeresa Johnson     if (ExportLists) {
2641b859a23STeresa Johnson       auto &ExportList = (*ExportLists)[ExportModulePath];
2651b859a23STeresa Johnson       ExportList.insert(GUID);
26619f2aa78STeresa Johnson       if (!PreviouslyImported) {
26719f2aa78STeresa Johnson         // This is the first time this function was exported from its source
26819f2aa78STeresa Johnson         // module, so mark all functions and globals it references as exported
2691b859a23STeresa Johnson         // to the outside if they are defined in the same source module.
270edddca22STeresa Johnson         // For efficiency, we unconditionally add all the referenced GUIDs
271edddca22STeresa Johnson         // to the ExportList for this module, and will prune out any not
272edddca22STeresa Johnson         // defined in the module later in a single pass.
2731b859a23STeresa Johnson         for (auto &Edge : ResolvedCalleeSummary->calls()) {
2741b859a23STeresa Johnson           auto CalleeGUID = Edge.first.getGUID();
275edddca22STeresa Johnson           ExportList.insert(CalleeGUID);
2761b859a23STeresa Johnson         }
2771b859a23STeresa Johnson         for (auto &Ref : ResolvedCalleeSummary->refs()) {
2781b859a23STeresa Johnson           auto GUID = Ref.getGUID();
279edddca22STeresa Johnson           ExportList.insert(GUID);
2801b859a23STeresa Johnson         }
2811b859a23STeresa Johnson       }
28219f2aa78STeresa Johnson     }
283d2869473SPiotr Padlewski 
28401e32130SMehdi Amini     // Insert the newly imported function to the worklist.
285475b51a7STeresa Johnson     Worklist.emplace_back(ResolvedCalleeSummary, AdjThreshold, GUID);
286d450da32STeresa Johnson   }
287d450da32STeresa Johnson }
288d450da32STeresa Johnson 
28901e32130SMehdi Amini /// Given the list of globals defined in a module, compute the list of imports
29001e32130SMehdi Amini /// as well as the list of "exports", i.e. the list of symbols referenced from
29101e32130SMehdi Amini /// another module (that may require promotion).
29201e32130SMehdi Amini static void ComputeImportForModule(
293c851d216STeresa Johnson     const GVSummaryMapTy &DefinedGVSummaries, const ModuleSummaryIndex &Index,
2949b490f10SMehdi Amini     FunctionImporter::ImportMapTy &ImportList,
2956c475a75STeresa Johnson     StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr,
2966c475a75STeresa Johnson     const DenseSet<GlobalValue::GUID> *DeadSymbols = nullptr) {
29701e32130SMehdi Amini   // Worklist contains the list of function imported in this module, for which
29801e32130SMehdi Amini   // we will analyse the callees and may import further down the callgraph.
29901e32130SMehdi Amini   SmallVector<EdgeInfo, 128> Worklist;
30001e32130SMehdi Amini 
30101e32130SMehdi Amini   // Populate the worklist with the import for the functions in the current
30201e32130SMehdi Amini   // module
30328e457bcSTeresa Johnson   for (auto &GVSummary : DefinedGVSummaries) {
3046c475a75STeresa Johnson     if (DeadSymbols && DeadSymbols->count(GVSummary.first)) {
3056c475a75STeresa Johnson       DEBUG(dbgs() << "Ignores Dead GUID: " << GVSummary.first << "\n");
3066c475a75STeresa Johnson       continue;
3076c475a75STeresa Johnson     }
30828e457bcSTeresa Johnson     auto *Summary = GVSummary.second;
3092d28f7aaSMehdi Amini     if (auto *AS = dyn_cast<AliasSummary>(Summary))
3102d28f7aaSMehdi Amini       Summary = &AS->getAliasee();
3111aafabf7SMehdi Amini     auto *FuncSummary = dyn_cast<FunctionSummary>(Summary);
3121aafabf7SMehdi Amini     if (!FuncSummary)
3131aafabf7SMehdi Amini       // Skip import for global variables
3141aafabf7SMehdi Amini       continue;
31528e457bcSTeresa Johnson     DEBUG(dbgs() << "Initalize import for " << GVSummary.first << "\n");
3162d28f7aaSMehdi Amini     computeImportForFunction(*FuncSummary, Index, ImportInstrLimit,
3179b490f10SMehdi Amini                              DefinedGVSummaries, Worklist, ImportList,
31801e32130SMehdi Amini                              ExportLists);
31901e32130SMehdi Amini   }
32001e32130SMehdi Amini 
321d2869473SPiotr Padlewski   // Process the newly imported functions and add callees to the worklist.
32242418abaSMehdi Amini   while (!Worklist.empty()) {
32301e32130SMehdi Amini     auto FuncInfo = Worklist.pop_back_val();
324475b51a7STeresa Johnson     auto *Summary = std::get<0>(FuncInfo);
325475b51a7STeresa Johnson     auto Threshold = std::get<1>(FuncInfo);
326475b51a7STeresa Johnson     auto GUID = std::get<2>(FuncInfo);
327475b51a7STeresa Johnson 
328475b51a7STeresa Johnson     // Check if we later added this summary with a higher threshold.
329475b51a7STeresa Johnson     // If so, skip this entry.
330475b51a7STeresa Johnson     auto ExportModulePath = Summary->modulePath();
331475b51a7STeresa Johnson     auto &LatestProcessedThreshold = ImportList[ExportModulePath][GUID];
332475b51a7STeresa Johnson     if (LatestProcessedThreshold > Threshold)
333475b51a7STeresa Johnson       continue;
33442418abaSMehdi Amini 
3351aafabf7SMehdi Amini     computeImportForFunction(*Summary, Index, Threshold, DefinedGVSummaries,
3369b490f10SMehdi Amini                              Worklist, ImportList, ExportLists);
337c8c55170SMehdi Amini   }
33842418abaSMehdi Amini }
339ffe2e4aaSMehdi Amini 
34001e32130SMehdi Amini } // anonymous namespace
34101e32130SMehdi Amini 
342c86af334STeresa Johnson /// Compute all the import and export for every module using the Index.
34301e32130SMehdi Amini void llvm::ComputeCrossModuleImport(
34401e32130SMehdi Amini     const ModuleSummaryIndex &Index,
345c851d216STeresa Johnson     const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries,
34601e32130SMehdi Amini     StringMap<FunctionImporter::ImportMapTy> &ImportLists,
3476c475a75STeresa Johnson     StringMap<FunctionImporter::ExportSetTy> &ExportLists,
3486c475a75STeresa Johnson     const DenseSet<GlobalValue::GUID> *DeadSymbols) {
34901e32130SMehdi Amini   // For each module that has function defined, compute the import/export lists.
3501aafabf7SMehdi Amini   for (auto &DefinedGVSummaries : ModuleToDefinedGVSummaries) {
3519b490f10SMehdi Amini     auto &ImportList = ImportLists[DefinedGVSummaries.first()];
3521aafabf7SMehdi Amini     DEBUG(dbgs() << "Computing import for Module '"
3531aafabf7SMehdi Amini                  << DefinedGVSummaries.first() << "'\n");
3549b490f10SMehdi Amini     ComputeImportForModule(DefinedGVSummaries.second, Index, ImportList,
3556c475a75STeresa Johnson                            &ExportLists, DeadSymbols);
35601e32130SMehdi Amini   }
35701e32130SMehdi Amini 
358edddca22STeresa Johnson   // When computing imports we added all GUIDs referenced by anything
359edddca22STeresa Johnson   // imported from the module to its ExportList. Now we prune each ExportList
360edddca22STeresa Johnson   // of any not defined in that module. This is more efficient than checking
361edddca22STeresa Johnson   // while computing imports because some of the summary lists may be long
362edddca22STeresa Johnson   // due to linkonce (comdat) copies.
363edddca22STeresa Johnson   for (auto &ELI : ExportLists) {
364edddca22STeresa Johnson     const auto &DefinedGVSummaries =
365edddca22STeresa Johnson         ModuleToDefinedGVSummaries.lookup(ELI.first());
366edddca22STeresa Johnson     for (auto EI = ELI.second.begin(); EI != ELI.second.end();) {
367edddca22STeresa Johnson       if (!DefinedGVSummaries.count(*EI))
368edddca22STeresa Johnson         EI = ELI.second.erase(EI);
369edddca22STeresa Johnson       else
370edddca22STeresa Johnson         ++EI;
371edddca22STeresa Johnson     }
372edddca22STeresa Johnson   }
373edddca22STeresa Johnson 
37401e32130SMehdi Amini #ifndef NDEBUG
37501e32130SMehdi Amini   DEBUG(dbgs() << "Import/Export lists for " << ImportLists.size()
37601e32130SMehdi Amini                << " modules:\n");
37701e32130SMehdi Amini   for (auto &ModuleImports : ImportLists) {
37801e32130SMehdi Amini     auto ModName = ModuleImports.first();
37901e32130SMehdi Amini     auto &Exports = ExportLists[ModName];
38001e32130SMehdi Amini     DEBUG(dbgs() << "* Module " << ModName << " exports " << Exports.size()
38101e32130SMehdi Amini                  << " functions. Imports from " << ModuleImports.second.size()
38201e32130SMehdi Amini                  << " modules.\n");
38301e32130SMehdi Amini     for (auto &Src : ModuleImports.second) {
38401e32130SMehdi Amini       auto SrcModName = Src.first();
38501e32130SMehdi Amini       DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from "
38601e32130SMehdi Amini                    << SrcModName << "\n");
38701e32130SMehdi Amini     }
38801e32130SMehdi Amini   }
38901e32130SMehdi Amini #endif
39001e32130SMehdi Amini }
39101e32130SMehdi Amini 
392c86af334STeresa Johnson /// Compute all the imports for the given module in the Index.
393c86af334STeresa Johnson void llvm::ComputeCrossModuleImportForModule(
394c86af334STeresa Johnson     StringRef ModulePath, const ModuleSummaryIndex &Index,
395c86af334STeresa Johnson     FunctionImporter::ImportMapTy &ImportList) {
396c86af334STeresa Johnson 
397c86af334STeresa Johnson   // Collect the list of functions this module defines.
398c86af334STeresa Johnson   // GUID -> Summary
399c851d216STeresa Johnson   GVSummaryMapTy FunctionSummaryMap;
40028e457bcSTeresa Johnson   Index.collectDefinedFunctionsForModule(ModulePath, FunctionSummaryMap);
401c86af334STeresa Johnson 
402c86af334STeresa Johnson   // Compute the import list for this module.
403c86af334STeresa Johnson   DEBUG(dbgs() << "Computing import for Module '" << ModulePath << "'\n");
40428e457bcSTeresa Johnson   ComputeImportForModule(FunctionSummaryMap, Index, ImportList);
405c86af334STeresa Johnson 
406c86af334STeresa Johnson #ifndef NDEBUG
407c86af334STeresa Johnson   DEBUG(dbgs() << "* Module " << ModulePath << " imports from "
408c86af334STeresa Johnson                << ImportList.size() << " modules.\n");
409c86af334STeresa Johnson   for (auto &Src : ImportList) {
410c86af334STeresa Johnson     auto SrcModName = Src.first();
411c86af334STeresa Johnson     DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from "
412c86af334STeresa Johnson                  << SrcModName << "\n");
413c86af334STeresa Johnson   }
414c86af334STeresa Johnson #endif
415c86af334STeresa Johnson }
416c86af334STeresa Johnson 
4176c475a75STeresa Johnson DenseSet<GlobalValue::GUID> llvm::computeDeadSymbols(
4186c475a75STeresa Johnson     const ModuleSummaryIndex &Index,
4196c475a75STeresa Johnson     const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols) {
4206c475a75STeresa Johnson   if (!ComputeDead)
4216c475a75STeresa Johnson     return DenseSet<GlobalValue::GUID>();
4226c475a75STeresa Johnson   if (GUIDPreservedSymbols.empty())
4236c475a75STeresa Johnson     // Don't do anything when nothing is live, this is friendly with tests.
4246c475a75STeresa Johnson     return DenseSet<GlobalValue::GUID>();
4256c475a75STeresa Johnson   DenseSet<GlobalValue::GUID> LiveSymbols = GUIDPreservedSymbols;
4266c475a75STeresa Johnson   SmallVector<GlobalValue::GUID, 128> Worklist;
4276c475a75STeresa Johnson   Worklist.reserve(LiveSymbols.size() * 2);
4286c475a75STeresa Johnson   for (auto GUID : LiveSymbols) {
4296c475a75STeresa Johnson     DEBUG(dbgs() << "Live root: " << GUID << "\n");
4306c475a75STeresa Johnson     Worklist.push_back(GUID);
4316c475a75STeresa Johnson   }
4326c475a75STeresa Johnson   // Add values flagged in the index as live roots to the worklist.
4336c475a75STeresa Johnson   for (const auto &Entry : Index) {
4346c475a75STeresa Johnson     bool IsLiveRoot = llvm::any_of(
4356c475a75STeresa Johnson         Entry.second,
4366c475a75STeresa Johnson         [&](const std::unique_ptr<llvm::GlobalValueSummary> &Summary) {
4376c475a75STeresa Johnson           return Summary->liveRoot();
4386c475a75STeresa Johnson         });
4396c475a75STeresa Johnson     if (!IsLiveRoot)
4406c475a75STeresa Johnson       continue;
4416c475a75STeresa Johnson     DEBUG(dbgs() << "Live root (summary): " << Entry.first << "\n");
4426c475a75STeresa Johnson     Worklist.push_back(Entry.first);
4436c475a75STeresa Johnson   }
4446c475a75STeresa Johnson 
4456c475a75STeresa Johnson   while (!Worklist.empty()) {
4466c475a75STeresa Johnson     auto GUID = Worklist.pop_back_val();
4476c475a75STeresa Johnson     auto It = Index.findGlobalValueSummaryList(GUID);
4486c475a75STeresa Johnson     if (It == Index.end()) {
4496c475a75STeresa Johnson       DEBUG(dbgs() << "Not in index: " << GUID << "\n");
4506c475a75STeresa Johnson       continue;
4516c475a75STeresa Johnson     }
4526c475a75STeresa Johnson 
4536c475a75STeresa Johnson     // FIXME: we should only make the prevailing copy live here
4546c475a75STeresa Johnson     for (auto &Summary : It->second) {
4556c475a75STeresa Johnson       for (auto Ref : Summary->refs()) {
4566c475a75STeresa Johnson         auto RefGUID = Ref.getGUID();
4576c475a75STeresa Johnson         if (LiveSymbols.insert(RefGUID).second) {
4586c475a75STeresa Johnson           DEBUG(dbgs() << "Marking live (ref): " << RefGUID << "\n");
4596c475a75STeresa Johnson           Worklist.push_back(RefGUID);
4606c475a75STeresa Johnson         }
4616c475a75STeresa Johnson       }
4626c475a75STeresa Johnson       if (auto *FS = dyn_cast<FunctionSummary>(Summary.get())) {
4636c475a75STeresa Johnson         for (auto Call : FS->calls()) {
4646c475a75STeresa Johnson           auto CallGUID = Call.first.getGUID();
4656c475a75STeresa Johnson           if (LiveSymbols.insert(CallGUID).second) {
4666c475a75STeresa Johnson             DEBUG(dbgs() << "Marking live (call): " << CallGUID << "\n");
4676c475a75STeresa Johnson             Worklist.push_back(CallGUID);
4686c475a75STeresa Johnson           }
4696c475a75STeresa Johnson         }
4706c475a75STeresa Johnson       }
4716c475a75STeresa Johnson       if (auto *AS = dyn_cast<AliasSummary>(Summary.get())) {
4726c475a75STeresa Johnson         auto AliaseeGUID = AS->getAliasee().getOriginalName();
4736c475a75STeresa Johnson         if (LiveSymbols.insert(AliaseeGUID).second) {
4746c475a75STeresa Johnson           DEBUG(dbgs() << "Marking live (alias): " << AliaseeGUID << "\n");
4756c475a75STeresa Johnson           Worklist.push_back(AliaseeGUID);
4766c475a75STeresa Johnson         }
4776c475a75STeresa Johnson       }
4786c475a75STeresa Johnson     }
4796c475a75STeresa Johnson   }
4806c475a75STeresa Johnson   DenseSet<GlobalValue::GUID> DeadSymbols;
4816c475a75STeresa Johnson   DeadSymbols.reserve(
4826c475a75STeresa Johnson       std::min(Index.size(), Index.size() - LiveSymbols.size()));
4836c475a75STeresa Johnson   for (auto &Entry : Index) {
4846c475a75STeresa Johnson     auto GUID = Entry.first;
4856c475a75STeresa Johnson     if (!LiveSymbols.count(GUID)) {
4866c475a75STeresa Johnson       DEBUG(dbgs() << "Marking dead: " << GUID << "\n");
4876c475a75STeresa Johnson       DeadSymbols.insert(GUID);
4886c475a75STeresa Johnson     }
4896c475a75STeresa Johnson   }
4906c475a75STeresa Johnson   DEBUG(dbgs() << LiveSymbols.size() << " symbols Live, and "
4916c475a75STeresa Johnson                << DeadSymbols.size() << " symbols Dead \n");
4926c475a75STeresa Johnson   NumDeadSymbols += DeadSymbols.size();
4936c475a75STeresa Johnson   NumLiveSymbols += LiveSymbols.size();
4946c475a75STeresa Johnson   return DeadSymbols;
4956c475a75STeresa Johnson }
4966c475a75STeresa Johnson 
49784174c37STeresa Johnson /// Compute the set of summaries needed for a ThinLTO backend compilation of
49884174c37STeresa Johnson /// \p ModulePath.
49984174c37STeresa Johnson void llvm::gatherImportedSummariesForModule(
50084174c37STeresa Johnson     StringRef ModulePath,
50184174c37STeresa Johnson     const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries,
502cdbcbf74SMehdi Amini     const FunctionImporter::ImportMapTy &ImportList,
50384174c37STeresa Johnson     std::map<std::string, GVSummaryMapTy> &ModuleToSummariesForIndex) {
50484174c37STeresa Johnson   // Include all summaries from the importing module.
50584174c37STeresa Johnson   ModuleToSummariesForIndex[ModulePath] =
50684174c37STeresa Johnson       ModuleToDefinedGVSummaries.lookup(ModulePath);
50784174c37STeresa Johnson   // Include summaries for imports.
50888c491ddSMehdi Amini   for (auto &ILI : ImportList) {
50984174c37STeresa Johnson     auto &SummariesForIndex = ModuleToSummariesForIndex[ILI.first()];
51084174c37STeresa Johnson     const auto &DefinedGVSummaries =
51184174c37STeresa Johnson         ModuleToDefinedGVSummaries.lookup(ILI.first());
51284174c37STeresa Johnson     for (auto &GI : ILI.second) {
51384174c37STeresa Johnson       const auto &DS = DefinedGVSummaries.find(GI.first);
51484174c37STeresa Johnson       assert(DS != DefinedGVSummaries.end() &&
51584174c37STeresa Johnson              "Expected a defined summary for imported global value");
51684174c37STeresa Johnson       SummariesForIndex[GI.first] = DS->second;
51784174c37STeresa Johnson     }
51884174c37STeresa Johnson   }
51984174c37STeresa Johnson }
52084174c37STeresa Johnson 
5218570fe47STeresa Johnson /// Emit the files \p ModulePath will import from into \p OutputFilename.
522cdbcbf74SMehdi Amini std::error_code
523cdbcbf74SMehdi Amini llvm::EmitImportsFiles(StringRef ModulePath, StringRef OutputFilename,
524cdbcbf74SMehdi Amini                        const FunctionImporter::ImportMapTy &ModuleImports) {
5258570fe47STeresa Johnson   std::error_code EC;
5268570fe47STeresa Johnson   raw_fd_ostream ImportsOS(OutputFilename, EC, sys::fs::OpenFlags::F_None);
5278570fe47STeresa Johnson   if (EC)
5288570fe47STeresa Johnson     return EC;
529cdbcbf74SMehdi Amini   for (auto &ILI : ModuleImports)
5308570fe47STeresa Johnson     ImportsOS << ILI.first() << "\n";
5318570fe47STeresa Johnson   return std::error_code();
5328570fe47STeresa Johnson }
5338570fe47STeresa Johnson 
53404c9a2d6STeresa Johnson /// Fixup WeakForLinker linkages in \p TheModule based on summary analysis.
53504c9a2d6STeresa Johnson void llvm::thinLTOResolveWeakForLinkerModule(
53604c9a2d6STeresa Johnson     Module &TheModule, const GVSummaryMapTy &DefinedGlobals) {
5374566c6dbSTeresa Johnson   auto ConvertToDeclaration = [](GlobalValue &GV) {
5384566c6dbSTeresa Johnson     DEBUG(dbgs() << "Converting to a declaration: `" << GV.getName() << "\n");
5394566c6dbSTeresa Johnson     if (Function *F = dyn_cast<Function>(&GV)) {
5404566c6dbSTeresa Johnson       F->deleteBody();
5414566c6dbSTeresa Johnson       F->clearMetadata();
5424566c6dbSTeresa Johnson     } else if (GlobalVariable *V = dyn_cast<GlobalVariable>(&GV)) {
5434566c6dbSTeresa Johnson       V->setInitializer(nullptr);
5444566c6dbSTeresa Johnson       V->setLinkage(GlobalValue::ExternalLinkage);
5454566c6dbSTeresa Johnson       V->clearMetadata();
5464566c6dbSTeresa Johnson     } else
5474566c6dbSTeresa Johnson       // For now we don't resolve or drop aliases. Once we do we'll
5484566c6dbSTeresa Johnson       // need to add support here for creating either a function or
5494566c6dbSTeresa Johnson       // variable declaration, and return the new GlobalValue* for
5504566c6dbSTeresa Johnson       // the caller to use.
5514566c6dbSTeresa Johnson       assert(false && "Expected function or variable");
5524566c6dbSTeresa Johnson   };
5534566c6dbSTeresa Johnson 
55404c9a2d6STeresa Johnson   auto updateLinkage = [&](GlobalValue &GV) {
55504c9a2d6STeresa Johnson     if (!GlobalValue::isWeakForLinker(GV.getLinkage()))
55604c9a2d6STeresa Johnson       return;
55704c9a2d6STeresa Johnson     // See if the global summary analysis computed a new resolved linkage.
55804c9a2d6STeresa Johnson     const auto &GS = DefinedGlobals.find(GV.getGUID());
55904c9a2d6STeresa Johnson     if (GS == DefinedGlobals.end())
56004c9a2d6STeresa Johnson       return;
56104c9a2d6STeresa Johnson     auto NewLinkage = GS->second->linkage();
56204c9a2d6STeresa Johnson     if (NewLinkage == GV.getLinkage())
56304c9a2d6STeresa Johnson       return;
5644566c6dbSTeresa Johnson     // Check for a non-prevailing def that has interposable linkage
5654566c6dbSTeresa Johnson     // (e.g. non-odr weak or linkonce). In that case we can't simply
5664566c6dbSTeresa Johnson     // convert to available_externally, since it would lose the
5674566c6dbSTeresa Johnson     // interposable property and possibly get inlined. Simply drop
5684566c6dbSTeresa Johnson     // the definition in that case.
5694566c6dbSTeresa Johnson     if (GlobalValue::isAvailableExternallyLinkage(NewLinkage) &&
5704566c6dbSTeresa Johnson         GlobalValue::isInterposableLinkage(GV.getLinkage()))
5714566c6dbSTeresa Johnson       ConvertToDeclaration(GV);
5724566c6dbSTeresa Johnson     else {
57304c9a2d6STeresa Johnson       DEBUG(dbgs() << "ODR fixing up linkage for `" << GV.getName() << "` from "
57404c9a2d6STeresa Johnson                    << GV.getLinkage() << " to " << NewLinkage << "\n");
57504c9a2d6STeresa Johnson       GV.setLinkage(NewLinkage);
5764566c6dbSTeresa Johnson     }
5774566c6dbSTeresa Johnson     // Remove declarations from comdats, including available_externally
5786107a419STeresa Johnson     // as this is a declaration for the linker, and will be dropped eventually.
5796107a419STeresa Johnson     // It is illegal for comdats to contain declarations.
5806107a419STeresa Johnson     auto *GO = dyn_cast_or_null<GlobalObject>(&GV);
5814566c6dbSTeresa Johnson     if (GO && GO->isDeclarationForLinker() && GO->hasComdat())
5826107a419STeresa Johnson       GO->setComdat(nullptr);
58304c9a2d6STeresa Johnson   };
58404c9a2d6STeresa Johnson 
58504c9a2d6STeresa Johnson   // Process functions and global now
58604c9a2d6STeresa Johnson   for (auto &GV : TheModule)
58704c9a2d6STeresa Johnson     updateLinkage(GV);
58804c9a2d6STeresa Johnson   for (auto &GV : TheModule.globals())
58904c9a2d6STeresa Johnson     updateLinkage(GV);
59004c9a2d6STeresa Johnson   for (auto &GV : TheModule.aliases())
59104c9a2d6STeresa Johnson     updateLinkage(GV);
59204c9a2d6STeresa Johnson }
59304c9a2d6STeresa Johnson 
59404c9a2d6STeresa Johnson /// Run internalization on \p TheModule based on symmary analysis.
59504c9a2d6STeresa Johnson void llvm::thinLTOInternalizeModule(Module &TheModule,
59604c9a2d6STeresa Johnson                                     const GVSummaryMapTy &DefinedGlobals) {
59704c9a2d6STeresa Johnson   // Parse inline ASM and collect the list of symbols that are not defined in
59804c9a2d6STeresa Johnson   // the current module.
59904c9a2d6STeresa Johnson   StringSet<> AsmUndefinedRefs;
600863cbfbeSPeter Collingbourne   ModuleSymbolTable::CollectAsmSymbols(
601*d8204472STeresa Johnson       TheModule,
60204c9a2d6STeresa Johnson       [&AsmUndefinedRefs](StringRef Name, object::BasicSymbolRef::Flags Flags) {
60304c9a2d6STeresa Johnson         if (Flags & object::BasicSymbolRef::SF_Undefined)
60404c9a2d6STeresa Johnson           AsmUndefinedRefs.insert(Name);
60504c9a2d6STeresa Johnson       });
60604c9a2d6STeresa Johnson 
60704c9a2d6STeresa Johnson   // Declare a callback for the internalize pass that will ask for every
60804c9a2d6STeresa Johnson   // candidate GlobalValue if it can be internalized or not.
60904c9a2d6STeresa Johnson   auto MustPreserveGV = [&](const GlobalValue &GV) -> bool {
61004c9a2d6STeresa Johnson     // Can't be internalized if referenced in inline asm.
61104c9a2d6STeresa Johnson     if (AsmUndefinedRefs.count(GV.getName()))
61204c9a2d6STeresa Johnson       return true;
61304c9a2d6STeresa Johnson 
61404c9a2d6STeresa Johnson     // Lookup the linkage recorded in the summaries during global analysis.
61504c9a2d6STeresa Johnson     const auto &GS = DefinedGlobals.find(GV.getGUID());
61604c9a2d6STeresa Johnson     GlobalValue::LinkageTypes Linkage;
61704c9a2d6STeresa Johnson     if (GS == DefinedGlobals.end()) {
61804c9a2d6STeresa Johnson       // Must have been promoted (possibly conservatively). Find original
61904c9a2d6STeresa Johnson       // name so that we can access the correct summary and see if it can
62004c9a2d6STeresa Johnson       // be internalized again.
62104c9a2d6STeresa Johnson       // FIXME: Eventually we should control promotion instead of promoting
62204c9a2d6STeresa Johnson       // and internalizing again.
62304c9a2d6STeresa Johnson       StringRef OrigName =
62404c9a2d6STeresa Johnson           ModuleSummaryIndex::getOriginalNameBeforePromote(GV.getName());
62504c9a2d6STeresa Johnson       std::string OrigId = GlobalValue::getGlobalIdentifier(
62604c9a2d6STeresa Johnson           OrigName, GlobalValue::InternalLinkage,
62704c9a2d6STeresa Johnson           TheModule.getSourceFileName());
62804c9a2d6STeresa Johnson       const auto &GS = DefinedGlobals.find(GlobalValue::getGUID(OrigId));
6297ab1f692STeresa Johnson       if (GS == DefinedGlobals.end()) {
6307ab1f692STeresa Johnson         // Also check the original non-promoted non-globalized name. In some
6317ab1f692STeresa Johnson         // cases a preempted weak value is linked in as a local copy because
6327ab1f692STeresa Johnson         // it is referenced by an alias (IRLinker::linkGlobalValueProto).
6337ab1f692STeresa Johnson         // In that case, since it was originally not a local value, it was
6347ab1f692STeresa Johnson         // recorded in the index using the original name.
6357ab1f692STeresa Johnson         // FIXME: This may not be needed once PR27866 is fixed.
6367ab1f692STeresa Johnson         const auto &GS = DefinedGlobals.find(GlobalValue::getGUID(OrigName));
63704c9a2d6STeresa Johnson         assert(GS != DefinedGlobals.end());
63804c9a2d6STeresa Johnson         Linkage = GS->second->linkage();
6397ab1f692STeresa Johnson       } else {
6407ab1f692STeresa Johnson         Linkage = GS->second->linkage();
6417ab1f692STeresa Johnson       }
64204c9a2d6STeresa Johnson     } else
64304c9a2d6STeresa Johnson       Linkage = GS->second->linkage();
64404c9a2d6STeresa Johnson     return !GlobalValue::isLocalLinkage(Linkage);
64504c9a2d6STeresa Johnson   };
64604c9a2d6STeresa Johnson 
64704c9a2d6STeresa Johnson   // FIXME: See if we can just internalize directly here via linkage changes
64804c9a2d6STeresa Johnson   // based on the index, rather than invoking internalizeModule.
64904c9a2d6STeresa Johnson   llvm::internalizeModule(TheModule, MustPreserveGV);
65004c9a2d6STeresa Johnson }
65104c9a2d6STeresa Johnson 
652c8c55170SMehdi Amini // Automatically import functions in Module \p DestModule based on the summaries
653c8c55170SMehdi Amini // index.
654c8c55170SMehdi Amini //
6557f00d0a1SPeter Collingbourne Expected<bool> FunctionImporter::importFunctions(
65637e24591SPeter Collingbourne     Module &DestModule, const FunctionImporter::ImportMapTy &ImportList) {
6575411d051SMehdi Amini   DEBUG(dbgs() << "Starting import for Module "
658311fef6eSMehdi Amini                << DestModule.getModuleIdentifier() << "\n");
659c8c55170SMehdi Amini   unsigned ImportedCount = 0;
660c8c55170SMehdi Amini 
6616d8f817fSPeter Collingbourne   IRMover Mover(DestModule);
6627e88d0daSMehdi Amini   // Do the actual import of functions now, one Module at a time
66301e32130SMehdi Amini   std::set<StringRef> ModuleNameOrderedList;
66401e32130SMehdi Amini   for (auto &FunctionsToImportPerModule : ImportList) {
66501e32130SMehdi Amini     ModuleNameOrderedList.insert(FunctionsToImportPerModule.first());
66601e32130SMehdi Amini   }
66701e32130SMehdi Amini   for (auto &Name : ModuleNameOrderedList) {
6687e88d0daSMehdi Amini     // Get the module for the import
66901e32130SMehdi Amini     const auto &FunctionsToImportPerModule = ImportList.find(Name);
67001e32130SMehdi Amini     assert(FunctionsToImportPerModule != ImportList.end());
671d9445c49SPeter Collingbourne     Expected<std::unique_ptr<Module>> SrcModuleOrErr = ModuleLoader(Name);
672d9445c49SPeter Collingbourne     if (!SrcModuleOrErr)
673d9445c49SPeter Collingbourne       return SrcModuleOrErr.takeError();
674d9445c49SPeter Collingbourne     std::unique_ptr<Module> SrcModule = std::move(*SrcModuleOrErr);
6757e88d0daSMehdi Amini     assert(&DestModule.getContext() == &SrcModule->getContext() &&
6767e88d0daSMehdi Amini            "Context mismatch");
6777e88d0daSMehdi Amini 
6786cba37ceSTeresa Johnson     // If modules were created with lazy metadata loading, materialize it
6796cba37ceSTeresa Johnson     // now, before linking it (otherwise this will be a noop).
6807f00d0a1SPeter Collingbourne     if (Error Err = SrcModule->materializeMetadata())
6817f00d0a1SPeter Collingbourne       return std::move(Err);
682e5a61917STeresa Johnson 
68301e32130SMehdi Amini     auto &ImportGUIDs = FunctionsToImportPerModule->second;
68401e32130SMehdi Amini     // Find the globals to import
6856d8f817fSPeter Collingbourne     SetVector<GlobalValue *> GlobalsToImport;
6861f685e01SPiotr Padlewski     for (Function &F : *SrcModule) {
6871f685e01SPiotr Padlewski       if (!F.hasName())
6880beb858eSTeresa Johnson         continue;
6891f685e01SPiotr Padlewski       auto GUID = F.getGUID();
6900beb858eSTeresa Johnson       auto Import = ImportGUIDs.count(GUID);
691aeb1e59bSMehdi Amini       DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing function " << GUID
6921f685e01SPiotr Padlewski                    << " " << F.getName() << " from "
693aeb1e59bSMehdi Amini                    << SrcModule->getSourceFileName() << "\n");
6940beb858eSTeresa Johnson       if (Import) {
6957f00d0a1SPeter Collingbourne         if (Error Err = F.materialize())
6967f00d0a1SPeter Collingbourne           return std::move(Err);
6973b776128SPiotr Padlewski         if (EnableImportMetadata) {
6986deaa6afSPiotr Padlewski           // Add 'thinlto_src_module' metadata for statistics and debugging.
6993b776128SPiotr Padlewski           F.setMetadata(
7003b776128SPiotr Padlewski               "thinlto_src_module",
7013b776128SPiotr Padlewski               llvm::MDNode::get(
7026deaa6afSPiotr Padlewski                   DestModule.getContext(),
7033b776128SPiotr Padlewski                   {llvm::MDString::get(DestModule.getContext(),
7046deaa6afSPiotr Padlewski                                        SrcModule->getSourceFileName())}));
7053b776128SPiotr Padlewski         }
7061f685e01SPiotr Padlewski         GlobalsToImport.insert(&F);
70701e32130SMehdi Amini       }
70801e32130SMehdi Amini     }
7091f685e01SPiotr Padlewski     for (GlobalVariable &GV : SrcModule->globals()) {
7102d28f7aaSMehdi Amini       if (!GV.hasName())
7112d28f7aaSMehdi Amini         continue;
7122d28f7aaSMehdi Amini       auto GUID = GV.getGUID();
7132d28f7aaSMehdi Amini       auto Import = ImportGUIDs.count(GUID);
714aeb1e59bSMehdi Amini       DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing global " << GUID
715aeb1e59bSMehdi Amini                    << " " << GV.getName() << " from "
716aeb1e59bSMehdi Amini                    << SrcModule->getSourceFileName() << "\n");
7172d28f7aaSMehdi Amini       if (Import) {
7187f00d0a1SPeter Collingbourne         if (Error Err = GV.materialize())
7197f00d0a1SPeter Collingbourne           return std::move(Err);
7202d28f7aaSMehdi Amini         GlobalsToImport.insert(&GV);
7212d28f7aaSMehdi Amini       }
7222d28f7aaSMehdi Amini     }
7231f685e01SPiotr Padlewski     for (GlobalAlias &GA : SrcModule->aliases()) {
7246d8f817fSPeter Collingbourne       // FIXME: This should eventually be controlled entirely by the summary.
7256d8f817fSPeter Collingbourne       if (FunctionImportGlobalProcessing::doImportAsDefinition(
7266d8f817fSPeter Collingbourne               &GA, &GlobalsToImport)) {
7276d8f817fSPeter Collingbourne         GlobalsToImport.insert(&GA);
7286d8f817fSPeter Collingbourne         continue;
7296d8f817fSPeter Collingbourne       }
7306d8f817fSPeter Collingbourne 
7311f685e01SPiotr Padlewski       if (!GA.hasName())
73201e32130SMehdi Amini         continue;
7331f685e01SPiotr Padlewski       auto GUID = GA.getGUID();
7340beb858eSTeresa Johnson       auto Import = ImportGUIDs.count(GUID);
735aeb1e59bSMehdi Amini       DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing alias " << GUID
7361f685e01SPiotr Padlewski                    << " " << GA.getName() << " from "
737aeb1e59bSMehdi Amini                    << SrcModule->getSourceFileName() << "\n");
7380beb858eSTeresa Johnson       if (Import) {
73901e32130SMehdi Amini         // Alias can't point to "available_externally". However when we import
7409aae395fSTeresa Johnson         // linkOnceODR the linkage does not change. So we import the alias
7416968ef77SMehdi Amini         // and aliasee only in this case. This has been handled by
7426968ef77SMehdi Amini         // computeImportForFunction()
7431f685e01SPiotr Padlewski         GlobalObject *GO = GA.getBaseObject();
7446968ef77SMehdi Amini         assert(GO->hasLinkOnceODRLinkage() &&
7456968ef77SMehdi Amini                "Unexpected alias to a non-linkonceODR in import list");
7462d28f7aaSMehdi Amini #ifndef NDEBUG
7472d28f7aaSMehdi Amini         if (!GlobalsToImport.count(GO))
7482d28f7aaSMehdi Amini           DEBUG(dbgs() << " alias triggers importing aliasee " << GO->getGUID()
7492d28f7aaSMehdi Amini                        << " " << GO->getName() << " from "
7502d28f7aaSMehdi Amini                        << SrcModule->getSourceFileName() << "\n");
7512d28f7aaSMehdi Amini #endif
7527f00d0a1SPeter Collingbourne         if (Error Err = GO->materialize())
7537f00d0a1SPeter Collingbourne           return std::move(Err);
75401e32130SMehdi Amini         GlobalsToImport.insert(GO);
7557f00d0a1SPeter Collingbourne         if (Error Err = GA.materialize())
7567f00d0a1SPeter Collingbourne           return std::move(Err);
7571f685e01SPiotr Padlewski         GlobalsToImport.insert(&GA);
75801e32130SMehdi Amini       }
75901e32130SMehdi Amini     }
76001e32130SMehdi Amini 
76119ef4fadSMehdi Amini     // Upgrade debug info after we're done materializing all the globals and we
76219ef4fadSMehdi Amini     // have loaded all the required metadata!
76319ef4fadSMehdi Amini     UpgradeDebugInfo(*SrcModule);
76419ef4fadSMehdi Amini 
7657e88d0daSMehdi Amini     // Link in the specified functions.
76601e32130SMehdi Amini     if (renameModuleForThinLTO(*SrcModule, Index, &GlobalsToImport))
7678d05185aSMehdi Amini       return true;
7688d05185aSMehdi Amini 
769d29478f7STeresa Johnson     if (PrintImports) {
770d29478f7STeresa Johnson       for (const auto *GV : GlobalsToImport)
771d29478f7STeresa Johnson         dbgs() << DestModule.getSourceFileName() << ": Import " << GV->getName()
772d29478f7STeresa Johnson                << " from " << SrcModule->getSourceFileName() << "\n";
773d29478f7STeresa Johnson     }
774d29478f7STeresa Johnson 
7756d8f817fSPeter Collingbourne     if (Mover.move(std::move(SrcModule), GlobalsToImport.getArrayRef(),
7766d8f817fSPeter Collingbourne                    [](GlobalValue &, IRMover::ValueAdder) {},
777e6fd9ff9SPeter Collingbourne                    /*IsPerformingImport=*/true))
7787e88d0daSMehdi Amini       report_fatal_error("Function Import: link error");
7797e88d0daSMehdi Amini 
78001e32130SMehdi Amini     ImportedCount += GlobalsToImport.size();
7816c475a75STeresa Johnson     NumImportedModules++;
7827e88d0daSMehdi Amini   }
783e5a61917STeresa Johnson 
7846c475a75STeresa Johnson   NumImportedFunctions += ImportedCount;
785d29478f7STeresa Johnson 
7867e88d0daSMehdi Amini   DEBUG(dbgs() << "Imported " << ImportedCount << " functions for Module "
787c8c55170SMehdi Amini                << DestModule.getModuleIdentifier() << "\n");
788c8c55170SMehdi Amini   return ImportedCount;
78942418abaSMehdi Amini }
79042418abaSMehdi Amini 
79142418abaSMehdi Amini /// Summary file to use for function importing when using -function-import from
79242418abaSMehdi Amini /// the command line.
79342418abaSMehdi Amini static cl::opt<std::string>
79442418abaSMehdi Amini     SummaryFile("summary-file",
79542418abaSMehdi Amini                 cl::desc("The summary file to use for function importing."));
79642418abaSMehdi Amini 
797598bd2a2SPeter Collingbourne static bool doImportingForModule(Module &M) {
798598bd2a2SPeter Collingbourne   if (SummaryFile.empty())
799598bd2a2SPeter Collingbourne     report_fatal_error("error: -function-import requires -summary-file\n");
8006de481a3SPeter Collingbourne   Expected<std::unique_ptr<ModuleSummaryIndex>> IndexPtrOrErr =
8016de481a3SPeter Collingbourne       getModuleSummaryIndexForFile(SummaryFile);
8026de481a3SPeter Collingbourne   if (!IndexPtrOrErr) {
8036de481a3SPeter Collingbourne     logAllUnhandledErrors(IndexPtrOrErr.takeError(), errs(),
8046de481a3SPeter Collingbourne                           "Error loading file '" + SummaryFile + "': ");
80542418abaSMehdi Amini     return false;
80642418abaSMehdi Amini   }
807598bd2a2SPeter Collingbourne   std::unique_ptr<ModuleSummaryIndex> Index = std::move(*IndexPtrOrErr);
80842418abaSMehdi Amini 
809c86af334STeresa Johnson   // First step is collecting the import list.
810c86af334STeresa Johnson   FunctionImporter::ImportMapTy ImportList;
811c86af334STeresa Johnson   ComputeCrossModuleImportForModule(M.getModuleIdentifier(), *Index,
812c86af334STeresa Johnson                                     ImportList);
81301e32130SMehdi Amini 
8144fef68cbSTeresa Johnson   // Conservatively mark all internal values as promoted. This interface is
8154fef68cbSTeresa Johnson   // only used when doing importing via the function importing pass. The pass
8164fef68cbSTeresa Johnson   // is only enabled when testing importing via the 'opt' tool, which does
8174fef68cbSTeresa Johnson   // not do the ThinLink that would normally determine what values to promote.
8184fef68cbSTeresa Johnson   for (auto &I : *Index) {
8194fef68cbSTeresa Johnson     for (auto &S : I.second) {
8204fef68cbSTeresa Johnson       if (GlobalValue::isLocalLinkage(S->linkage()))
8214fef68cbSTeresa Johnson         S->setLinkage(GlobalValue::ExternalLinkage);
8224fef68cbSTeresa Johnson     }
8234fef68cbSTeresa Johnson   }
8244fef68cbSTeresa Johnson 
82501e32130SMehdi Amini   // Next we need to promote to global scope and rename any local values that
8261b00f2d9STeresa Johnson   // are potentially exported to other modules.
82701e32130SMehdi Amini   if (renameModuleForThinLTO(M, *Index, nullptr)) {
8281b00f2d9STeresa Johnson     errs() << "Error renaming module\n";
8291b00f2d9STeresa Johnson     return false;
8301b00f2d9STeresa Johnson   }
8311b00f2d9STeresa Johnson 
83242418abaSMehdi Amini   // Perform the import now.
833d16c8065SMehdi Amini   auto ModuleLoader = [&M](StringRef Identifier) {
834d16c8065SMehdi Amini     return loadFile(Identifier, M.getContext());
835d16c8065SMehdi Amini   };
8369d2bfc48SRafael Espindola   FunctionImporter Importer(*Index, ModuleLoader);
83737e24591SPeter Collingbourne   Expected<bool> Result = Importer.importFunctions(M, ImportList);
8387f00d0a1SPeter Collingbourne 
8397f00d0a1SPeter Collingbourne   // FIXME: Probably need to propagate Errors through the pass manager.
8407f00d0a1SPeter Collingbourne   if (!Result) {
8417f00d0a1SPeter Collingbourne     logAllUnhandledErrors(Result.takeError(), errs(),
8427f00d0a1SPeter Collingbourne                           "Error importing module: ");
8437f00d0a1SPeter Collingbourne     return false;
8447f00d0a1SPeter Collingbourne   }
8457f00d0a1SPeter Collingbourne 
8467f00d0a1SPeter Collingbourne   return *Result;
84721241571STeresa Johnson }
84821241571STeresa Johnson 
84921241571STeresa Johnson namespace {
85021241571STeresa Johnson /// Pass that performs cross-module function import provided a summary file.
85121241571STeresa Johnson class FunctionImportLegacyPass : public ModulePass {
85221241571STeresa Johnson public:
85321241571STeresa Johnson   /// Pass identification, replacement for typeid
85421241571STeresa Johnson   static char ID;
85521241571STeresa Johnson 
85621241571STeresa Johnson   /// Specify pass name for debug output
857117296c0SMehdi Amini   StringRef getPassName() const override { return "Function Importing"; }
85821241571STeresa Johnson 
859598bd2a2SPeter Collingbourne   explicit FunctionImportLegacyPass() : ModulePass(ID) {}
86021241571STeresa Johnson 
86121241571STeresa Johnson   bool runOnModule(Module &M) override {
86221241571STeresa Johnson     if (skipModule(M))
86321241571STeresa Johnson       return false;
86421241571STeresa Johnson 
865598bd2a2SPeter Collingbourne     return doImportingForModule(M);
86642418abaSMehdi Amini   }
86742418abaSMehdi Amini };
868fe2b5415SBenjamin Kramer } // anonymous namespace
86942418abaSMehdi Amini 
87021241571STeresa Johnson PreservedAnalyses FunctionImportPass::run(Module &M,
871fd03ac6aSSean Silva                                           ModuleAnalysisManager &AM) {
872598bd2a2SPeter Collingbourne   if (!doImportingForModule(M))
87321241571STeresa Johnson     return PreservedAnalyses::all();
87421241571STeresa Johnson 
87521241571STeresa Johnson   return PreservedAnalyses::none();
87621241571STeresa Johnson }
87721241571STeresa Johnson 
87821241571STeresa Johnson char FunctionImportLegacyPass::ID = 0;
87921241571STeresa Johnson INITIALIZE_PASS(FunctionImportLegacyPass, "function-import",
88042418abaSMehdi Amini                 "Summary Based Function Import", false, false)
88142418abaSMehdi Amini 
88242418abaSMehdi Amini namespace llvm {
883598bd2a2SPeter Collingbourne Pass *createFunctionImportPass() {
884598bd2a2SPeter Collingbourne   return new FunctionImportLegacyPass();
8855fcbdb71STeresa Johnson }
88642418abaSMehdi Amini }
887