142418abaSMehdi Amini //===- FunctionImport.cpp - ThinLTO Summary-based Function Import ---------===//
242418abaSMehdi Amini //
342418abaSMehdi Amini //                     The LLVM Compiler Infrastructure
442418abaSMehdi Amini //
542418abaSMehdi Amini // This file is distributed under the University of Illinois Open Source
642418abaSMehdi Amini // License. See LICENSE.TXT for details.
742418abaSMehdi Amini //
842418abaSMehdi Amini //===----------------------------------------------------------------------===//
942418abaSMehdi Amini //
1042418abaSMehdi Amini // This file implements Function import based on summaries.
1142418abaSMehdi Amini //
1242418abaSMehdi Amini //===----------------------------------------------------------------------===//
1342418abaSMehdi Amini 
1442418abaSMehdi Amini #include "llvm/Transforms/IPO/FunctionImport.h"
1542418abaSMehdi Amini 
1601e32130SMehdi Amini #include "llvm/ADT/SmallVector.h"
17d29478f7STeresa Johnson #include "llvm/ADT/Statistic.h"
1842418abaSMehdi Amini #include "llvm/ADT/StringSet.h"
1942418abaSMehdi Amini #include "llvm/IR/AutoUpgrade.h"
2042418abaSMehdi Amini #include "llvm/IR/DiagnosticPrinter.h"
2142418abaSMehdi Amini #include "llvm/IR/IntrinsicInst.h"
2242418abaSMehdi Amini #include "llvm/IR/Module.h"
2342418abaSMehdi Amini #include "llvm/IRReader/IRReader.h"
2442418abaSMehdi Amini #include "llvm/Linker/Linker.h"
2526ab5772STeresa Johnson #include "llvm/Object/ModuleSummaryIndexObjectFile.h"
2642418abaSMehdi Amini #include "llvm/Support/CommandLine.h"
2742418abaSMehdi Amini #include "llvm/Support/Debug.h"
2842418abaSMehdi Amini #include "llvm/Support/SourceMgr.h"
29488a800aSTeresa Johnson #include "llvm/Transforms/Utils/FunctionImportUtils.h"
307e88d0daSMehdi Amini 
3101e32130SMehdi Amini #define DEBUG_TYPE "function-import"
327e88d0daSMehdi Amini 
3342418abaSMehdi Amini using namespace llvm;
3442418abaSMehdi Amini 
35d29478f7STeresa Johnson STATISTIC(NumImported, "Number of functions imported");
36d29478f7STeresa Johnson 
3739303619STeresa Johnson /// Limit on instruction count of imported functions.
3839303619STeresa Johnson static cl::opt<unsigned> ImportInstrLimit(
3939303619STeresa Johnson     "import-instr-limit", cl::init(100), cl::Hidden, cl::value_desc("N"),
4039303619STeresa Johnson     cl::desc("Only import functions with less than N instructions"));
4139303619STeresa Johnson 
4240641748SMehdi Amini static cl::opt<float>
4340641748SMehdi Amini     ImportInstrFactor("import-instr-evolution-factor", cl::init(0.7),
4440641748SMehdi Amini                       cl::Hidden, cl::value_desc("x"),
4540641748SMehdi Amini                       cl::desc("As we import functions, multiply the "
4640641748SMehdi Amini                                "`import-instr-limit` threshold by this factor "
4740641748SMehdi Amini                                "before processing newly imported functions"));
4840641748SMehdi Amini 
49d29478f7STeresa Johnson static cl::opt<bool> PrintImports("print-imports", cl::init(false), cl::Hidden,
50d29478f7STeresa Johnson                                   cl::desc("Print imported functions"));
51d29478f7STeresa Johnson 
52bda3c97cSMehdi Amini // Temporary allows the function import pass to disable always linking
53bda3c97cSMehdi Amini // referenced discardable symbols.
54bda3c97cSMehdi Amini static cl::opt<bool>
55bda3c97cSMehdi Amini     DontForceImportReferencedDiscardableSymbols("disable-force-link-odr",
56bda3c97cSMehdi Amini                                                 cl::init(false), cl::Hidden);
57bda3c97cSMehdi Amini 
5842418abaSMehdi Amini // Load lazily a module from \p FileName in \p Context.
5942418abaSMehdi Amini static std::unique_ptr<Module> loadFile(const std::string &FileName,
6042418abaSMehdi Amini                                         LLVMContext &Context) {
6142418abaSMehdi Amini   SMDiagnostic Err;
6242418abaSMehdi Amini   DEBUG(dbgs() << "Loading '" << FileName << "'\n");
636cba37ceSTeresa Johnson   // Metadata isn't loaded until functions are imported, to minimize
646cba37ceSTeresa Johnson   // the memory overhead.
65a1080ee6STeresa Johnson   std::unique_ptr<Module> Result =
66a1080ee6STeresa Johnson       getLazyIRFileModule(FileName, Err, Context,
67a1080ee6STeresa Johnson                           /* ShouldLazyLoadMetadata = */ true);
6842418abaSMehdi Amini   if (!Result) {
6942418abaSMehdi Amini     Err.print("function-import", errs());
70d7ad221cSMehdi Amini     report_fatal_error("Abort");
7142418abaSMehdi Amini   }
7242418abaSMehdi Amini 
7342418abaSMehdi Amini   return Result;
7442418abaSMehdi Amini }
7542418abaSMehdi Amini 
767e88d0daSMehdi Amini namespace {
7740641748SMehdi Amini 
7801e32130SMehdi Amini /// Given a list of possible callee implementation for a call site, select one
7901e32130SMehdi Amini /// that fits the \p Threshold.
8001e32130SMehdi Amini ///
8101e32130SMehdi Amini /// FIXME: select "best" instead of first that fits. But what is "best"?
8201e32130SMehdi Amini /// - The smallest: more likely to be inlined.
8301e32130SMehdi Amini /// - The one with the least outgoing edges (already well optimized).
8401e32130SMehdi Amini /// - One from a module already being imported from in order to reduce the
8501e32130SMehdi Amini ///   number of source modules parsed/linked.
8601e32130SMehdi Amini /// - One that has PGO data attached.
8701e32130SMehdi Amini /// - [insert you fancy metric here]
882d28f7aaSMehdi Amini static const GlobalValueSummary *
8901e32130SMehdi Amini selectCallee(const GlobalValueInfoList &CalleeInfoList, unsigned Threshold) {
9001e32130SMehdi Amini   auto It = llvm::find_if(
9101e32130SMehdi Amini       CalleeInfoList, [&](const std::unique_ptr<GlobalValueInfo> &GlobInfo) {
9201e32130SMehdi Amini         assert(GlobInfo->summary() &&
9301e32130SMehdi Amini                "We should not have a Global Info without summary");
942d28f7aaSMehdi Amini         auto *GVSummary = GlobInfo->summary();
952c719cc1SMehdi Amini         if (GlobalValue::isWeakAnyLinkage(GVSummary->linkage()))
962c719cc1SMehdi Amini           // There is no point in importing weak symbols, we can't inline them
9701e32130SMehdi Amini           return false;
982c719cc1SMehdi Amini         if (auto *AS = dyn_cast<AliasSummary>(GVSummary)) {
992c719cc1SMehdi Amini           GVSummary = &AS->getAliasee();
1002c719cc1SMehdi Amini           // Alias can't point to "available_externally". However when we import
1012c719cc1SMehdi Amini           // linkOnceODR the linkage does not change. So we import the alias
1022c719cc1SMehdi Amini           // and aliasee only in this case.
1032c719cc1SMehdi Amini           // FIXME: we should import alias as available_externally *function*,
1042c719cc1SMehdi Amini           // the destination module does need to know it is an alias.
1052c719cc1SMehdi Amini           if (!GlobalValue::isLinkOnceODRLinkage(GVSummary->linkage()))
1062c719cc1SMehdi Amini             return false;
1072c719cc1SMehdi Amini         }
1082c719cc1SMehdi Amini 
1092c719cc1SMehdi Amini         auto *Summary = cast<FunctionSummary>(GVSummary);
1107e88d0daSMehdi Amini 
11101e32130SMehdi Amini         if (Summary->instCount() > Threshold)
11201e32130SMehdi Amini           return false;
1137e88d0daSMehdi Amini 
11401e32130SMehdi Amini         return true;
11501e32130SMehdi Amini       });
11601e32130SMehdi Amini   if (It == CalleeInfoList.end())
11701e32130SMehdi Amini     return nullptr;
1187e88d0daSMehdi Amini 
1192d28f7aaSMehdi Amini   return cast<GlobalValueSummary>((*It)->summary());
120434e9561SRafael Espindola }
1217e88d0daSMehdi Amini 
12201e32130SMehdi Amini /// Return the summary for the function \p GUID that fits the \p Threshold, or
12301e32130SMehdi Amini /// null if there's no match.
1242d28f7aaSMehdi Amini static const GlobalValueSummary *selectCallee(GlobalValue::GUID GUID,
125ad5741b0SMehdi Amini                                               unsigned Threshold,
12601e32130SMehdi Amini                                               const ModuleSummaryIndex &Index) {
12701e32130SMehdi Amini   auto CalleeInfoList = Index.findGlobalValueInfoList(GUID);
12801e32130SMehdi Amini   if (CalleeInfoList == Index.end()) {
12901e32130SMehdi Amini     return nullptr; // This function does not have a summary
1307e88d0daSMehdi Amini   }
13101e32130SMehdi Amini   return selectCallee(CalleeInfoList->second, Threshold);
13201e32130SMehdi Amini }
1337e88d0daSMehdi Amini 
134*cb87494fSMehdi Amini /// Mark the global \p GUID as export by module \p ExportModulePath if found in
135*cb87494fSMehdi Amini /// this module. If it is a GlobalVariable, we also mark any referenced global
136*cb87494fSMehdi Amini /// in the current module as exported.
137*cb87494fSMehdi Amini static void exportGlobalInModule(const ModuleSummaryIndex &Index,
138ad5741b0SMehdi Amini                                  StringRef ExportModulePath,
139*cb87494fSMehdi Amini                                  GlobalValue::GUID GUID,
140*cb87494fSMehdi Amini                                  FunctionImporter::ExportSetTy &ExportList) {
141*cb87494fSMehdi Amini   auto FindGlobalInfoInModule =
142*cb87494fSMehdi Amini       [&](GlobalValue::GUID GUID) -> GlobalValueInfo *{
143*cb87494fSMehdi Amini         auto InfoList = Index.findGlobalValueInfoList(GUID);
144*cb87494fSMehdi Amini         if (InfoList == Index.end())
14501e32130SMehdi Amini           // This global does not have a summary, it is not part of the ThinLTO
14601e32130SMehdi Amini           // process
147*cb87494fSMehdi Amini           return nullptr;
148*cb87494fSMehdi Amini         auto Info = llvm::find_if(
149*cb87494fSMehdi Amini             InfoList->second,
15001e32130SMehdi Amini             [&](const std::unique_ptr<GlobalValueInfo> &GlobInfo) {
15101e32130SMehdi Amini               auto *Summary = GlobInfo->summary();
15201e32130SMehdi Amini               assert(Summary && "Unexpected GlobalValueInfo without summary");
15301e32130SMehdi Amini               return Summary->modulePath() == ExportModulePath;
15401e32130SMehdi Amini             });
155*cb87494fSMehdi Amini         if (Info == InfoList->second.end())
156*cb87494fSMehdi Amini           return nullptr;
157*cb87494fSMehdi Amini         return Info->get();
158*cb87494fSMehdi Amini       };
159*cb87494fSMehdi Amini 
160*cb87494fSMehdi Amini   auto *GVInfo = FindGlobalInfoInModule(GUID);
161*cb87494fSMehdi Amini   if (!GVInfo)
162*cb87494fSMehdi Amini     return;
163*cb87494fSMehdi Amini   // We found it in the current module, mark as exported
164*cb87494fSMehdi Amini   ExportList.insert(GUID);
165*cb87494fSMehdi Amini 
166*cb87494fSMehdi Amini   auto *Summary = GVInfo->summary();
167*cb87494fSMehdi Amini   auto GVS = dyn_cast<GlobalVarSummary>(Summary);
168*cb87494fSMehdi Amini   if (!GVS)
169*cb87494fSMehdi Amini     return;
170*cb87494fSMehdi Amini   // FunctionImportGlobalProcessing::doPromoteLocalToGlobal() will always
171*cb87494fSMehdi Amini   // trigger importing  the initializer for `constant unnamed addr` globals that
172*cb87494fSMehdi Amini   // are referenced. We conservatively export all the referenced symbols for
173*cb87494fSMehdi Amini   // every global to workaround this, so that the ExportList is accurate.
174*cb87494fSMehdi Amini   // FIXME: with a "isConstant" flag in the summary we could be more targetted.
175*cb87494fSMehdi Amini   for (auto &Ref : GVS->refs()) {
176*cb87494fSMehdi Amini     auto GUID = Ref.getGUID();
177*cb87494fSMehdi Amini     auto *RefInfo = FindGlobalInfoInModule(GUID);
178*cb87494fSMehdi Amini     if (RefInfo)
179*cb87494fSMehdi Amini       // Found a ref in the current module, mark it as exported
180*cb87494fSMehdi Amini       ExportList.insert(GUID);
181*cb87494fSMehdi Amini   }
18201e32130SMehdi Amini }
1837e88d0daSMehdi Amini 
18401e32130SMehdi Amini using EdgeInfo = std::pair<const FunctionSummary *, unsigned /* Threshold */>;
18501e32130SMehdi Amini 
18601e32130SMehdi Amini /// Compute the list of functions to import for a given caller. Mark these
18701e32130SMehdi Amini /// imported functions and the symbols they reference in their source module as
18801e32130SMehdi Amini /// exported from their source module.
18901e32130SMehdi Amini static void computeImportForFunction(
1903255eec1STeresa Johnson     const FunctionSummary &Summary, const ModuleSummaryIndex &Index,
1913255eec1STeresa Johnson     unsigned Threshold,
1921aafabf7SMehdi Amini     const std::map<GlobalValue::GUID, GlobalValueSummary *> &DefinedGVSummaries,
19301e32130SMehdi Amini     SmallVectorImpl<EdgeInfo> &Worklist,
19401e32130SMehdi Amini     FunctionImporter::ImportMapTy &ImportsForModule,
195c86af334STeresa Johnson     StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) {
19601e32130SMehdi Amini   for (auto &Edge : Summary.calls()) {
1972d5487cfSTeresa Johnson     auto GUID = Edge.first.getGUID();
19801e32130SMehdi Amini     DEBUG(dbgs() << " edge -> " << GUID << " Threshold:" << Threshold << "\n");
19901e32130SMehdi Amini 
2001aafabf7SMehdi Amini     if (DefinedGVSummaries.count(GUID)) {
20101e32130SMehdi Amini       DEBUG(dbgs() << "ignored! Target already in destination module.\n");
2027e88d0daSMehdi Amini       continue;
203d450da32STeresa Johnson     }
20440641748SMehdi Amini 
20501e32130SMehdi Amini     auto *CalleeSummary = selectCallee(GUID, Threshold, Index);
20601e32130SMehdi Amini     if (!CalleeSummary) {
20701e32130SMehdi Amini       DEBUG(dbgs() << "ignored! No qualifying callee with summary found.\n");
2087e88d0daSMehdi Amini       continue;
2097e88d0daSMehdi Amini     }
2102d28f7aaSMehdi Amini     // "Resolve" the summary, traversing alias,
2112d28f7aaSMehdi Amini     const FunctionSummary *ResolvedCalleeSummary;
2126968ef77SMehdi Amini     if (isa<AliasSummary>(CalleeSummary)) {
2132d28f7aaSMehdi Amini       ResolvedCalleeSummary = cast<FunctionSummary>(
2142d28f7aaSMehdi Amini           &cast<AliasSummary>(CalleeSummary)->getAliasee());
2152c719cc1SMehdi Amini       assert(
2162c719cc1SMehdi Amini           GlobalValue::isLinkOnceODRLinkage(ResolvedCalleeSummary->linkage()) &&
2172c719cc1SMehdi Amini           "Unexpected alias to a non-linkonceODR in import list");
2186968ef77SMehdi Amini     } else
2192d28f7aaSMehdi Amini       ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary);
2202d28f7aaSMehdi Amini 
2212d28f7aaSMehdi Amini     assert(ResolvedCalleeSummary->instCount() <= Threshold &&
22201e32130SMehdi Amini            "selectCallee() didn't honor the threshold");
22301e32130SMehdi Amini 
2242d28f7aaSMehdi Amini     auto ExportModulePath = ResolvedCalleeSummary->modulePath();
2252d28f7aaSMehdi Amini     auto &ProcessedThreshold = ImportsForModule[ExportModulePath][GUID];
22601e32130SMehdi Amini     /// Since the traversal of the call graph is DFS, we can revisit a function
22701e32130SMehdi Amini     /// a second time with a higher threshold. In this case, it is added back to
22801e32130SMehdi Amini     /// the worklist with the new threshold.
22901e32130SMehdi Amini     if (ProcessedThreshold && ProcessedThreshold > Threshold) {
23001e32130SMehdi Amini       DEBUG(dbgs() << "ignored! Target was already seen with Threshold "
23101e32130SMehdi Amini                    << ProcessedThreshold << "\n");
23201e32130SMehdi Amini       continue;
23301e32130SMehdi Amini     }
23401e32130SMehdi Amini     // Mark this function as imported in this module, with the current Threshold
23501e32130SMehdi Amini     ProcessedThreshold = Threshold;
23601e32130SMehdi Amini 
23701e32130SMehdi Amini     // Make exports in the source module.
238c86af334STeresa Johnson     if (ExportLists) {
239ef7555fbSMehdi Amini       auto &ExportList = (*ExportLists)[ExportModulePath];
24001e32130SMehdi Amini       ExportList.insert(GUID);
241c86af334STeresa Johnson       // Mark all functions and globals referenced by this function as exported
242c86af334STeresa Johnson       // to the outside if they are defined in the same source module.
2432d28f7aaSMehdi Amini       for (auto &Edge : ResolvedCalleeSummary->calls()) {
2442d5487cfSTeresa Johnson         auto CalleeGUID = Edge.first.getGUID();
245*cb87494fSMehdi Amini         exportGlobalInModule(Index, ExportModulePath, CalleeGUID, ExportList);
24601e32130SMehdi Amini       }
2472d28f7aaSMehdi Amini       for (auto &Ref : ResolvedCalleeSummary->refs()) {
2482d5487cfSTeresa Johnson         auto GUID = Ref.getGUID();
249*cb87494fSMehdi Amini         exportGlobalInModule(Index, ExportModulePath, GUID, ExportList);
2507e88d0daSMehdi Amini       }
251c86af334STeresa Johnson     }
2527e88d0daSMehdi Amini 
25301e32130SMehdi Amini     // Insert the newly imported function to the worklist.
2542d28f7aaSMehdi Amini     Worklist.push_back(std::make_pair(ResolvedCalleeSummary, Threshold));
255d450da32STeresa Johnson   }
256d450da32STeresa Johnson }
257d450da32STeresa Johnson 
25801e32130SMehdi Amini /// Given the list of globals defined in a module, compute the list of imports
25901e32130SMehdi Amini /// as well as the list of "exports", i.e. the list of symbols referenced from
26001e32130SMehdi Amini /// another module (that may require promotion).
26101e32130SMehdi Amini static void ComputeImportForModule(
2621aafabf7SMehdi Amini     const std::map<GlobalValue::GUID, GlobalValueSummary *> &DefinedGVSummaries,
26326ab5772STeresa Johnson     const ModuleSummaryIndex &Index,
26401e32130SMehdi Amini     FunctionImporter::ImportMapTy &ImportsForModule,
265c86af334STeresa Johnson     StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) {
26601e32130SMehdi Amini   // Worklist contains the list of function imported in this module, for which
26701e32130SMehdi Amini   // we will analyse the callees and may import further down the callgraph.
26801e32130SMehdi Amini   SmallVector<EdgeInfo, 128> Worklist;
26901e32130SMehdi Amini 
27001e32130SMehdi Amini   // Populate the worklist with the import for the functions in the current
27101e32130SMehdi Amini   // module
2721aafabf7SMehdi Amini   for (auto &GVInfo : DefinedGVSummaries) {
2731aafabf7SMehdi Amini     auto *Summary = GVInfo.second;
2742d28f7aaSMehdi Amini     if (auto *AS = dyn_cast<AliasSummary>(Summary))
2752d28f7aaSMehdi Amini       Summary = &AS->getAliasee();
2761aafabf7SMehdi Amini     auto *FuncSummary = dyn_cast<FunctionSummary>(Summary);
2771aafabf7SMehdi Amini     if (!FuncSummary)
2781aafabf7SMehdi Amini       // Skip import for global variables
2791aafabf7SMehdi Amini       continue;
2801aafabf7SMehdi Amini     DEBUG(dbgs() << "Initalize import for " << GVInfo.first << "\n");
2812d28f7aaSMehdi Amini     computeImportForFunction(*FuncSummary, Index, ImportInstrLimit,
2821aafabf7SMehdi Amini                              DefinedGVSummaries, Worklist, ImportsForModule,
28301e32130SMehdi Amini                              ExportLists);
28401e32130SMehdi Amini   }
28501e32130SMehdi Amini 
28642418abaSMehdi Amini   while (!Worklist.empty()) {
28701e32130SMehdi Amini     auto FuncInfo = Worklist.pop_back_val();
28801e32130SMehdi Amini     auto *Summary = FuncInfo.first;
28901e32130SMehdi Amini     auto Threshold = FuncInfo.second;
29042418abaSMehdi Amini 
2917e88d0daSMehdi Amini     // Process the newly imported functions and add callees to the worklist.
29240641748SMehdi Amini     // Adjust the threshold
29340641748SMehdi Amini     Threshold = Threshold * ImportInstrFactor;
29401e32130SMehdi Amini 
2951aafabf7SMehdi Amini     computeImportForFunction(*Summary, Index, Threshold, DefinedGVSummaries,
2963255eec1STeresa Johnson                              Worklist, ImportsForModule, ExportLists);
297c8c55170SMehdi Amini   }
29842418abaSMehdi Amini }
299ffe2e4aaSMehdi Amini 
30001e32130SMehdi Amini } // anonymous namespace
30101e32130SMehdi Amini 
302c86af334STeresa Johnson /// Compute all the import and export for every module using the Index.
30301e32130SMehdi Amini void llvm::ComputeCrossModuleImport(
30401e32130SMehdi Amini     const ModuleSummaryIndex &Index,
3051aafabf7SMehdi Amini     const StringMap<std::map<GlobalValue::GUID, GlobalValueSummary *>> &
3061aafabf7SMehdi Amini         ModuleToDefinedGVSummaries,
30701e32130SMehdi Amini     StringMap<FunctionImporter::ImportMapTy> &ImportLists,
30801e32130SMehdi Amini     StringMap<FunctionImporter::ExportSetTy> &ExportLists) {
30901e32130SMehdi Amini   // For each module that has function defined, compute the import/export lists.
3101aafabf7SMehdi Amini   for (auto &DefinedGVSummaries : ModuleToDefinedGVSummaries) {
3111aafabf7SMehdi Amini     auto &ImportsForModule = ImportLists[DefinedGVSummaries.first()];
3121aafabf7SMehdi Amini     DEBUG(dbgs() << "Computing import for Module '"
3131aafabf7SMehdi Amini                  << DefinedGVSummaries.first() << "'\n");
3141aafabf7SMehdi Amini     ComputeImportForModule(DefinedGVSummaries.second, Index, ImportsForModule,
315c86af334STeresa Johnson                            &ExportLists);
31601e32130SMehdi Amini   }
31701e32130SMehdi Amini 
31801e32130SMehdi Amini #ifndef NDEBUG
31901e32130SMehdi Amini   DEBUG(dbgs() << "Import/Export lists for " << ImportLists.size()
32001e32130SMehdi Amini                << " modules:\n");
32101e32130SMehdi Amini   for (auto &ModuleImports : ImportLists) {
32201e32130SMehdi Amini     auto ModName = ModuleImports.first();
32301e32130SMehdi Amini     auto &Exports = ExportLists[ModName];
32401e32130SMehdi Amini     DEBUG(dbgs() << "* Module " << ModName << " exports " << Exports.size()
32501e32130SMehdi Amini                  << " functions. Imports from " << ModuleImports.second.size()
32601e32130SMehdi Amini                  << " modules.\n");
32701e32130SMehdi Amini     for (auto &Src : ModuleImports.second) {
32801e32130SMehdi Amini       auto SrcModName = Src.first();
32901e32130SMehdi Amini       DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from "
33001e32130SMehdi Amini                    << SrcModName << "\n");
33101e32130SMehdi Amini     }
33201e32130SMehdi Amini   }
33301e32130SMehdi Amini #endif
33401e32130SMehdi Amini }
33501e32130SMehdi Amini 
336c86af334STeresa Johnson /// Compute all the imports for the given module in the Index.
337c86af334STeresa Johnson void llvm::ComputeCrossModuleImportForModule(
338c86af334STeresa Johnson     StringRef ModulePath, const ModuleSummaryIndex &Index,
339c86af334STeresa Johnson     FunctionImporter::ImportMapTy &ImportList) {
340c86af334STeresa Johnson 
341c86af334STeresa Johnson   // Collect the list of functions this module defines.
342c86af334STeresa Johnson   // GUID -> Summary
3432d28f7aaSMehdi Amini   std::map<GlobalValue::GUID, GlobalValueSummary *> FunctionInfoMap;
344c86af334STeresa Johnson   Index.collectDefinedFunctionsForModule(ModulePath, FunctionInfoMap);
345c86af334STeresa Johnson 
346c86af334STeresa Johnson   // Compute the import list for this module.
347c86af334STeresa Johnson   DEBUG(dbgs() << "Computing import for Module '" << ModulePath << "'\n");
348c86af334STeresa Johnson   ComputeImportForModule(FunctionInfoMap, Index, ImportList);
349c86af334STeresa Johnson 
350c86af334STeresa Johnson #ifndef NDEBUG
351c86af334STeresa Johnson   DEBUG(dbgs() << "* Module " << ModulePath << " imports from "
352c86af334STeresa Johnson                << ImportList.size() << " modules.\n");
353c86af334STeresa Johnson   for (auto &Src : ImportList) {
354c86af334STeresa Johnson     auto SrcModName = Src.first();
355c86af334STeresa Johnson     DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from "
356c86af334STeresa Johnson                  << SrcModName << "\n");
357c86af334STeresa Johnson   }
358c86af334STeresa Johnson #endif
359c86af334STeresa Johnson }
360c86af334STeresa Johnson 
361c8c55170SMehdi Amini // Automatically import functions in Module \p DestModule based on the summaries
362c8c55170SMehdi Amini // index.
363c8c55170SMehdi Amini //
36401e32130SMehdi Amini bool FunctionImporter::importFunctions(
365bda3c97cSMehdi Amini     Module &DestModule, const FunctionImporter::ImportMapTy &ImportList,
366bda3c97cSMehdi Amini     bool ForceImportReferencedDiscardableSymbols) {
3675411d051SMehdi Amini   DEBUG(dbgs() << "Starting import for Module "
368311fef6eSMehdi Amini                << DestModule.getModuleIdentifier() << "\n");
369c8c55170SMehdi Amini   unsigned ImportedCount = 0;
370c8c55170SMehdi Amini 
371c8c55170SMehdi Amini   // Linker that will be used for importing function
3729d2bfc48SRafael Espindola   Linker TheLinker(DestModule);
3737e88d0daSMehdi Amini   // Do the actual import of functions now, one Module at a time
37401e32130SMehdi Amini   std::set<StringRef> ModuleNameOrderedList;
37501e32130SMehdi Amini   for (auto &FunctionsToImportPerModule : ImportList) {
37601e32130SMehdi Amini     ModuleNameOrderedList.insert(FunctionsToImportPerModule.first());
37701e32130SMehdi Amini   }
37801e32130SMehdi Amini   for (auto &Name : ModuleNameOrderedList) {
3797e88d0daSMehdi Amini     // Get the module for the import
38001e32130SMehdi Amini     const auto &FunctionsToImportPerModule = ImportList.find(Name);
38101e32130SMehdi Amini     assert(FunctionsToImportPerModule != ImportList.end());
38201e32130SMehdi Amini     std::unique_ptr<Module> SrcModule = ModuleLoader(Name);
3837e88d0daSMehdi Amini     assert(&DestModule.getContext() == &SrcModule->getContext() &&
3847e88d0daSMehdi Amini            "Context mismatch");
3857e88d0daSMehdi Amini 
3866cba37ceSTeresa Johnson     // If modules were created with lazy metadata loading, materialize it
3876cba37ceSTeresa Johnson     // now, before linking it (otherwise this will be a noop).
3886cba37ceSTeresa Johnson     SrcModule->materializeMetadata();
3896cba37ceSTeresa Johnson     UpgradeDebugInfo(*SrcModule);
390e5a61917STeresa Johnson 
39101e32130SMehdi Amini     auto &ImportGUIDs = FunctionsToImportPerModule->second;
39201e32130SMehdi Amini     // Find the globals to import
39301e32130SMehdi Amini     DenseSet<const GlobalValue *> GlobalsToImport;
39401e32130SMehdi Amini     for (auto &GV : *SrcModule) {
3950beb858eSTeresa Johnson       if (!GV.hasName())
3960beb858eSTeresa Johnson         continue;
3970beb858eSTeresa Johnson       auto GUID = GV.getGUID();
3980beb858eSTeresa Johnson       auto Import = ImportGUIDs.count(GUID);
399aeb1e59bSMehdi Amini       DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing function " << GUID
400aeb1e59bSMehdi Amini                    << " " << GV.getName() << " from "
401aeb1e59bSMehdi Amini                    << SrcModule->getSourceFileName() << "\n");
4020beb858eSTeresa Johnson       if (Import) {
40301e32130SMehdi Amini         GV.materialize();
40401e32130SMehdi Amini         GlobalsToImport.insert(&GV);
40501e32130SMehdi Amini       }
40601e32130SMehdi Amini     }
4072d28f7aaSMehdi Amini     for (auto &GV : SrcModule->globals()) {
4082d28f7aaSMehdi Amini       if (!GV.hasName())
4092d28f7aaSMehdi Amini         continue;
4102d28f7aaSMehdi Amini       auto GUID = GV.getGUID();
4112d28f7aaSMehdi Amini       auto Import = ImportGUIDs.count(GUID);
412aeb1e59bSMehdi Amini       DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing global " << GUID
413aeb1e59bSMehdi Amini                    << " " << GV.getName() << " from "
414aeb1e59bSMehdi Amini                    << SrcModule->getSourceFileName() << "\n");
4152d28f7aaSMehdi Amini       if (Import) {
4162d28f7aaSMehdi Amini         GV.materialize();
4172d28f7aaSMehdi Amini         GlobalsToImport.insert(&GV);
4182d28f7aaSMehdi Amini       }
4192d28f7aaSMehdi Amini     }
42001e32130SMehdi Amini     for (auto &GV : SrcModule->aliases()) {
42101e32130SMehdi Amini       if (!GV.hasName())
42201e32130SMehdi Amini         continue;
42301e32130SMehdi Amini       auto GUID = GV.getGUID();
4240beb858eSTeresa Johnson       auto Import = ImportGUIDs.count(GUID);
425aeb1e59bSMehdi Amini       DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing alias " << GUID
426aeb1e59bSMehdi Amini                    << " " << GV.getName() << " from "
427aeb1e59bSMehdi Amini                    << SrcModule->getSourceFileName() << "\n");
4280beb858eSTeresa Johnson       if (Import) {
42901e32130SMehdi Amini         // Alias can't point to "available_externally". However when we import
4309aae395fSTeresa Johnson         // linkOnceODR the linkage does not change. So we import the alias
4316968ef77SMehdi Amini         // and aliasee only in this case. This has been handled by
4326968ef77SMehdi Amini         // computeImportForFunction()
4332d28f7aaSMehdi Amini         GlobalObject *GO = GV.getBaseObject();
4346968ef77SMehdi Amini         assert(GO->hasLinkOnceODRLinkage() &&
4356968ef77SMehdi Amini                "Unexpected alias to a non-linkonceODR in import list");
4362d28f7aaSMehdi Amini #ifndef NDEBUG
4372d28f7aaSMehdi Amini         if (!GlobalsToImport.count(GO))
4382d28f7aaSMehdi Amini           DEBUG(dbgs() << " alias triggers importing aliasee " << GO->getGUID()
4392d28f7aaSMehdi Amini                        << " " << GO->getName() << " from "
4402d28f7aaSMehdi Amini                        << SrcModule->getSourceFileName() << "\n");
4412d28f7aaSMehdi Amini #endif
4422d28f7aaSMehdi Amini         GO->materialize();
44301e32130SMehdi Amini         GlobalsToImport.insert(GO);
44401e32130SMehdi Amini         GV.materialize();
44501e32130SMehdi Amini         GlobalsToImport.insert(&GV);
44601e32130SMehdi Amini       }
44701e32130SMehdi Amini     }
44801e32130SMehdi Amini 
4497e88d0daSMehdi Amini     // Link in the specified functions.
45001e32130SMehdi Amini     if (renameModuleForThinLTO(*SrcModule, Index, &GlobalsToImport))
4518d05185aSMehdi Amini       return true;
4528d05185aSMehdi Amini 
453d29478f7STeresa Johnson     if (PrintImports) {
454d29478f7STeresa Johnson       for (const auto *GV : GlobalsToImport)
455d29478f7STeresa Johnson         dbgs() << DestModule.getSourceFileName() << ": Import " << GV->getName()
456d29478f7STeresa Johnson                << " from " << SrcModule->getSourceFileName() << "\n";
457d29478f7STeresa Johnson     }
458d29478f7STeresa Johnson 
459bda3c97cSMehdi Amini     // Instruct the linker that the client will take care of linkonce resolution
460bda3c97cSMehdi Amini     unsigned Flags = Linker::Flags::None;
461bda3c97cSMehdi Amini     if (!ForceImportReferencedDiscardableSymbols)
462bda3c97cSMehdi Amini       Flags |= Linker::Flags::DontForceLinkLinkonceODR;
463bda3c97cSMehdi Amini 
464bda3c97cSMehdi Amini     if (TheLinker.linkInModule(std::move(SrcModule), Flags, &GlobalsToImport))
4657e88d0daSMehdi Amini       report_fatal_error("Function Import: link error");
4667e88d0daSMehdi Amini 
46701e32130SMehdi Amini     ImportedCount += GlobalsToImport.size();
4687e88d0daSMehdi Amini   }
469e5a61917STeresa Johnson 
470d29478f7STeresa Johnson   NumImported += ImportedCount;
471d29478f7STeresa Johnson 
4727e88d0daSMehdi Amini   DEBUG(dbgs() << "Imported " << ImportedCount << " functions for Module "
473c8c55170SMehdi Amini                << DestModule.getModuleIdentifier() << "\n");
474c8c55170SMehdi Amini   return ImportedCount;
47542418abaSMehdi Amini }
47642418abaSMehdi Amini 
47742418abaSMehdi Amini /// Summary file to use for function importing when using -function-import from
47842418abaSMehdi Amini /// the command line.
47942418abaSMehdi Amini static cl::opt<std::string>
48042418abaSMehdi Amini     SummaryFile("summary-file",
48142418abaSMehdi Amini                 cl::desc("The summary file to use for function importing."));
48242418abaSMehdi Amini 
48342418abaSMehdi Amini static void diagnosticHandler(const DiagnosticInfo &DI) {
48442418abaSMehdi Amini   raw_ostream &OS = errs();
48542418abaSMehdi Amini   DiagnosticPrinterRawOStream DP(OS);
48642418abaSMehdi Amini   DI.print(DP);
48742418abaSMehdi Amini   OS << '\n';
48842418abaSMehdi Amini }
48942418abaSMehdi Amini 
49026ab5772STeresa Johnson /// Parse the summary index out of an IR file and return the summary
49142418abaSMehdi Amini /// index object if found, or nullptr if not.
49226ab5772STeresa Johnson static std::unique_ptr<ModuleSummaryIndex>
49326ab5772STeresa Johnson getModuleSummaryIndexForFile(StringRef Path, std::string &Error,
49442418abaSMehdi Amini                              DiagnosticHandlerFunction DiagnosticHandler) {
49542418abaSMehdi Amini   std::unique_ptr<MemoryBuffer> Buffer;
49642418abaSMehdi Amini   ErrorOr<std::unique_ptr<MemoryBuffer>> BufferOrErr =
49742418abaSMehdi Amini       MemoryBuffer::getFile(Path);
49842418abaSMehdi Amini   if (std::error_code EC = BufferOrErr.getError()) {
49942418abaSMehdi Amini     Error = EC.message();
50042418abaSMehdi Amini     return nullptr;
50142418abaSMehdi Amini   }
50242418abaSMehdi Amini   Buffer = std::move(BufferOrErr.get());
50326ab5772STeresa Johnson   ErrorOr<std::unique_ptr<object::ModuleSummaryIndexObjectFile>> ObjOrErr =
50426ab5772STeresa Johnson       object::ModuleSummaryIndexObjectFile::create(Buffer->getMemBufferRef(),
50542418abaSMehdi Amini                                                    DiagnosticHandler);
50642418abaSMehdi Amini   if (std::error_code EC = ObjOrErr.getError()) {
50742418abaSMehdi Amini     Error = EC.message();
50842418abaSMehdi Amini     return nullptr;
50942418abaSMehdi Amini   }
51042418abaSMehdi Amini   return (*ObjOrErr)->takeIndex();
51142418abaSMehdi Amini }
51242418abaSMehdi Amini 
513fe2b5415SBenjamin Kramer namespace {
51442418abaSMehdi Amini /// Pass that performs cross-module function import provided a summary file.
51542418abaSMehdi Amini class FunctionImportPass : public ModulePass {
51626ab5772STeresa Johnson   /// Optional module summary index to use for importing, otherwise
5175fcbdb71STeresa Johnson   /// the summary-file option must be specified.
51826ab5772STeresa Johnson   const ModuleSummaryIndex *Index;
51942418abaSMehdi Amini 
52042418abaSMehdi Amini public:
52142418abaSMehdi Amini   /// Pass identification, replacement for typeid
52242418abaSMehdi Amini   static char ID;
52342418abaSMehdi Amini 
5245fcbdb71STeresa Johnson   /// Specify pass name for debug output
5252d28f7aaSMehdi Amini   const char *getPassName() const override { return "Function Importing"; }
5265fcbdb71STeresa Johnson 
52726ab5772STeresa Johnson   explicit FunctionImportPass(const ModuleSummaryIndex *Index = nullptr)
5285fcbdb71STeresa Johnson       : ModulePass(ID), Index(Index) {}
52942418abaSMehdi Amini 
53042418abaSMehdi Amini   bool runOnModule(Module &M) override {
531aa641a51SAndrew Kaylor     if (skipModule(M))
532aa641a51SAndrew Kaylor       return false;
533aa641a51SAndrew Kaylor 
5345fcbdb71STeresa Johnson     if (SummaryFile.empty() && !Index)
5355fcbdb71STeresa Johnson       report_fatal_error("error: -function-import requires -summary-file or "
5365fcbdb71STeresa Johnson                          "file from frontend\n");
53726ab5772STeresa Johnson     std::unique_ptr<ModuleSummaryIndex> IndexPtr;
5385fcbdb71STeresa Johnson     if (!SummaryFile.empty()) {
5395fcbdb71STeresa Johnson       if (Index)
5405fcbdb71STeresa Johnson         report_fatal_error("error: -summary-file and index from frontend\n");
54142418abaSMehdi Amini       std::string Error;
54226ab5772STeresa Johnson       IndexPtr =
54326ab5772STeresa Johnson           getModuleSummaryIndexForFile(SummaryFile, Error, diagnosticHandler);
5445fcbdb71STeresa Johnson       if (!IndexPtr) {
5455fcbdb71STeresa Johnson         errs() << "Error loading file '" << SummaryFile << "': " << Error
5465fcbdb71STeresa Johnson                << "\n";
54742418abaSMehdi Amini         return false;
54842418abaSMehdi Amini       }
5495fcbdb71STeresa Johnson       Index = IndexPtr.get();
5505fcbdb71STeresa Johnson     }
55142418abaSMehdi Amini 
552c86af334STeresa Johnson     // First step is collecting the import list.
553c86af334STeresa Johnson     FunctionImporter::ImportMapTy ImportList;
554c86af334STeresa Johnson     ComputeCrossModuleImportForModule(M.getModuleIdentifier(), *Index,
555c86af334STeresa Johnson                                       ImportList);
55601e32130SMehdi Amini 
55701e32130SMehdi Amini     // Next we need to promote to global scope and rename any local values that
5581b00f2d9STeresa Johnson     // are potentially exported to other modules.
55901e32130SMehdi Amini     if (renameModuleForThinLTO(M, *Index, nullptr)) {
5601b00f2d9STeresa Johnson       errs() << "Error renaming module\n";
5611b00f2d9STeresa Johnson       return false;
5621b00f2d9STeresa Johnson     }
5631b00f2d9STeresa Johnson 
56442418abaSMehdi Amini     // Perform the import now.
565d16c8065SMehdi Amini     auto ModuleLoader = [&M](StringRef Identifier) {
566d16c8065SMehdi Amini       return loadFile(Identifier, M.getContext());
567d16c8065SMehdi Amini     };
5689d2bfc48SRafael Espindola     FunctionImporter Importer(*Index, ModuleLoader);
569bda3c97cSMehdi Amini     return Importer.importFunctions(
570bda3c97cSMehdi Amini         M, ImportList, !DontForceImportReferencedDiscardableSymbols);
57142418abaSMehdi Amini   }
57242418abaSMehdi Amini };
573fe2b5415SBenjamin Kramer } // anonymous namespace
57442418abaSMehdi Amini 
57542418abaSMehdi Amini char FunctionImportPass::ID = 0;
57642418abaSMehdi Amini INITIALIZE_PASS_BEGIN(FunctionImportPass, "function-import",
57742418abaSMehdi Amini                       "Summary Based Function Import", false, false)
57842418abaSMehdi Amini INITIALIZE_PASS_END(FunctionImportPass, "function-import",
57942418abaSMehdi Amini                     "Summary Based Function Import", false, false)
58042418abaSMehdi Amini 
58142418abaSMehdi Amini namespace llvm {
58226ab5772STeresa Johnson Pass *createFunctionImportPass(const ModuleSummaryIndex *Index = nullptr) {
5835fcbdb71STeresa Johnson   return new FunctionImportPass(Index);
5845fcbdb71STeresa Johnson }
58542418abaSMehdi Amini }
586