142418abaSMehdi Amini //===- FunctionImport.cpp - ThinLTO Summary-based Function Import ---------===// 242418abaSMehdi Amini // 342418abaSMehdi Amini // The LLVM Compiler Infrastructure 442418abaSMehdi Amini // 542418abaSMehdi Amini // This file is distributed under the University of Illinois Open Source 642418abaSMehdi Amini // License. See LICENSE.TXT for details. 742418abaSMehdi Amini // 842418abaSMehdi Amini //===----------------------------------------------------------------------===// 942418abaSMehdi Amini // 1042418abaSMehdi Amini // This file implements Function import based on summaries. 1142418abaSMehdi Amini // 1242418abaSMehdi Amini //===----------------------------------------------------------------------===// 1342418abaSMehdi Amini 1442418abaSMehdi Amini #include "llvm/Transforms/IPO/FunctionImport.h" 1542418abaSMehdi Amini 1601e32130SMehdi Amini #include "llvm/ADT/SmallVector.h" 17d29478f7STeresa Johnson #include "llvm/ADT/Statistic.h" 1842418abaSMehdi Amini #include "llvm/ADT/StringSet.h" 1942418abaSMehdi Amini #include "llvm/IR/AutoUpgrade.h" 2042418abaSMehdi Amini #include "llvm/IR/DiagnosticPrinter.h" 2142418abaSMehdi Amini #include "llvm/IR/IntrinsicInst.h" 2242418abaSMehdi Amini #include "llvm/IR/Module.h" 2342418abaSMehdi Amini #include "llvm/IRReader/IRReader.h" 2442418abaSMehdi Amini #include "llvm/Linker/Linker.h" 2526ab5772STeresa Johnson #include "llvm/Object/ModuleSummaryIndexObjectFile.h" 2642418abaSMehdi Amini #include "llvm/Support/CommandLine.h" 2742418abaSMehdi Amini #include "llvm/Support/Debug.h" 2842418abaSMehdi Amini #include "llvm/Support/SourceMgr.h" 29488a800aSTeresa Johnson #include "llvm/Transforms/Utils/FunctionImportUtils.h" 307e88d0daSMehdi Amini 3101e32130SMehdi Amini #define DEBUG_TYPE "function-import" 327e88d0daSMehdi Amini 3342418abaSMehdi Amini using namespace llvm; 3442418abaSMehdi Amini 35d29478f7STeresa Johnson STATISTIC(NumImported, "Number of functions imported"); 36d29478f7STeresa Johnson 3739303619STeresa Johnson /// Limit on instruction count of imported functions. 3839303619STeresa Johnson static cl::opt<unsigned> ImportInstrLimit( 3939303619STeresa Johnson "import-instr-limit", cl::init(100), cl::Hidden, cl::value_desc("N"), 4039303619STeresa Johnson cl::desc("Only import functions with less than N instructions")); 4139303619STeresa Johnson 4240641748SMehdi Amini static cl::opt<float> 4340641748SMehdi Amini ImportInstrFactor("import-instr-evolution-factor", cl::init(0.7), 4440641748SMehdi Amini cl::Hidden, cl::value_desc("x"), 4540641748SMehdi Amini cl::desc("As we import functions, multiply the " 4640641748SMehdi Amini "`import-instr-limit` threshold by this factor " 4740641748SMehdi Amini "before processing newly imported functions")); 4840641748SMehdi Amini 49d29478f7STeresa Johnson static cl::opt<bool> PrintImports("print-imports", cl::init(false), cl::Hidden, 50d29478f7STeresa Johnson cl::desc("Print imported functions")); 51d29478f7STeresa Johnson 52bda3c97cSMehdi Amini // Temporary allows the function import pass to disable always linking 53bda3c97cSMehdi Amini // referenced discardable symbols. 54bda3c97cSMehdi Amini static cl::opt<bool> 55bda3c97cSMehdi Amini DontForceImportReferencedDiscardableSymbols("disable-force-link-odr", 56bda3c97cSMehdi Amini cl::init(false), cl::Hidden); 57bda3c97cSMehdi Amini 5842418abaSMehdi Amini // Load lazily a module from \p FileName in \p Context. 5942418abaSMehdi Amini static std::unique_ptr<Module> loadFile(const std::string &FileName, 6042418abaSMehdi Amini LLVMContext &Context) { 6142418abaSMehdi Amini SMDiagnostic Err; 6242418abaSMehdi Amini DEBUG(dbgs() << "Loading '" << FileName << "'\n"); 636cba37ceSTeresa Johnson // Metadata isn't loaded until functions are imported, to minimize 646cba37ceSTeresa Johnson // the memory overhead. 65a1080ee6STeresa Johnson std::unique_ptr<Module> Result = 66a1080ee6STeresa Johnson getLazyIRFileModule(FileName, Err, Context, 67a1080ee6STeresa Johnson /* ShouldLazyLoadMetadata = */ true); 6842418abaSMehdi Amini if (!Result) { 6942418abaSMehdi Amini Err.print("function-import", errs()); 70d7ad221cSMehdi Amini report_fatal_error("Abort"); 7142418abaSMehdi Amini } 7242418abaSMehdi Amini 7342418abaSMehdi Amini return Result; 7442418abaSMehdi Amini } 7542418abaSMehdi Amini 767e88d0daSMehdi Amini namespace { 7740641748SMehdi Amini 7801e32130SMehdi Amini /// Given a list of possible callee implementation for a call site, select one 7901e32130SMehdi Amini /// that fits the \p Threshold. 8001e32130SMehdi Amini /// 8101e32130SMehdi Amini /// FIXME: select "best" instead of first that fits. But what is "best"? 8201e32130SMehdi Amini /// - The smallest: more likely to be inlined. 8301e32130SMehdi Amini /// - The one with the least outgoing edges (already well optimized). 8401e32130SMehdi Amini /// - One from a module already being imported from in order to reduce the 8501e32130SMehdi Amini /// number of source modules parsed/linked. 8601e32130SMehdi Amini /// - One that has PGO data attached. 8701e32130SMehdi Amini /// - [insert you fancy metric here] 882d28f7aaSMehdi Amini static const GlobalValueSummary * 8901e32130SMehdi Amini selectCallee(const GlobalValueInfoList &CalleeInfoList, unsigned Threshold) { 9001e32130SMehdi Amini auto It = llvm::find_if( 9101e32130SMehdi Amini CalleeInfoList, [&](const std::unique_ptr<GlobalValueInfo> &GlobInfo) { 9201e32130SMehdi Amini assert(GlobInfo->summary() && 9301e32130SMehdi Amini "We should not have a Global Info without summary"); 942d28f7aaSMehdi Amini auto *GVSummary = GlobInfo->summary(); 952c719cc1SMehdi Amini if (GlobalValue::isWeakAnyLinkage(GVSummary->linkage())) 962c719cc1SMehdi Amini // There is no point in importing weak symbols, we can't inline them 9701e32130SMehdi Amini return false; 982c719cc1SMehdi Amini if (auto *AS = dyn_cast<AliasSummary>(GVSummary)) { 992c719cc1SMehdi Amini GVSummary = &AS->getAliasee(); 1002c719cc1SMehdi Amini // Alias can't point to "available_externally". However when we import 1012c719cc1SMehdi Amini // linkOnceODR the linkage does not change. So we import the alias 1022c719cc1SMehdi Amini // and aliasee only in this case. 1032c719cc1SMehdi Amini // FIXME: we should import alias as available_externally *function*, 1042c719cc1SMehdi Amini // the destination module does need to know it is an alias. 1052c719cc1SMehdi Amini if (!GlobalValue::isLinkOnceODRLinkage(GVSummary->linkage())) 1062c719cc1SMehdi Amini return false; 1072c719cc1SMehdi Amini } 1082c719cc1SMehdi Amini 1092c719cc1SMehdi Amini auto *Summary = cast<FunctionSummary>(GVSummary); 1107e88d0daSMehdi Amini 11101e32130SMehdi Amini if (Summary->instCount() > Threshold) 11201e32130SMehdi Amini return false; 1137e88d0daSMehdi Amini 11401e32130SMehdi Amini return true; 11501e32130SMehdi Amini }); 11601e32130SMehdi Amini if (It == CalleeInfoList.end()) 11701e32130SMehdi Amini return nullptr; 1187e88d0daSMehdi Amini 1192d28f7aaSMehdi Amini return cast<GlobalValueSummary>((*It)->summary()); 120434e9561SRafael Espindola } 1217e88d0daSMehdi Amini 12201e32130SMehdi Amini /// Return the summary for the function \p GUID that fits the \p Threshold, or 12301e32130SMehdi Amini /// null if there's no match. 1242d28f7aaSMehdi Amini static const GlobalValueSummary *selectCallee(GlobalValue::GUID GUID, 125ad5741b0SMehdi Amini unsigned Threshold, 12601e32130SMehdi Amini const ModuleSummaryIndex &Index) { 12701e32130SMehdi Amini auto CalleeInfoList = Index.findGlobalValueInfoList(GUID); 12801e32130SMehdi Amini if (CalleeInfoList == Index.end()) { 12901e32130SMehdi Amini return nullptr; // This function does not have a summary 1307e88d0daSMehdi Amini } 13101e32130SMehdi Amini return selectCallee(CalleeInfoList->second, Threshold); 13201e32130SMehdi Amini } 1337e88d0daSMehdi Amini 134*cb87494fSMehdi Amini /// Mark the global \p GUID as export by module \p ExportModulePath if found in 135*cb87494fSMehdi Amini /// this module. If it is a GlobalVariable, we also mark any referenced global 136*cb87494fSMehdi Amini /// in the current module as exported. 137*cb87494fSMehdi Amini static void exportGlobalInModule(const ModuleSummaryIndex &Index, 138ad5741b0SMehdi Amini StringRef ExportModulePath, 139*cb87494fSMehdi Amini GlobalValue::GUID GUID, 140*cb87494fSMehdi Amini FunctionImporter::ExportSetTy &ExportList) { 141*cb87494fSMehdi Amini auto FindGlobalInfoInModule = 142*cb87494fSMehdi Amini [&](GlobalValue::GUID GUID) -> GlobalValueInfo *{ 143*cb87494fSMehdi Amini auto InfoList = Index.findGlobalValueInfoList(GUID); 144*cb87494fSMehdi Amini if (InfoList == Index.end()) 14501e32130SMehdi Amini // This global does not have a summary, it is not part of the ThinLTO 14601e32130SMehdi Amini // process 147*cb87494fSMehdi Amini return nullptr; 148*cb87494fSMehdi Amini auto Info = llvm::find_if( 149*cb87494fSMehdi Amini InfoList->second, 15001e32130SMehdi Amini [&](const std::unique_ptr<GlobalValueInfo> &GlobInfo) { 15101e32130SMehdi Amini auto *Summary = GlobInfo->summary(); 15201e32130SMehdi Amini assert(Summary && "Unexpected GlobalValueInfo without summary"); 15301e32130SMehdi Amini return Summary->modulePath() == ExportModulePath; 15401e32130SMehdi Amini }); 155*cb87494fSMehdi Amini if (Info == InfoList->second.end()) 156*cb87494fSMehdi Amini return nullptr; 157*cb87494fSMehdi Amini return Info->get(); 158*cb87494fSMehdi Amini }; 159*cb87494fSMehdi Amini 160*cb87494fSMehdi Amini auto *GVInfo = FindGlobalInfoInModule(GUID); 161*cb87494fSMehdi Amini if (!GVInfo) 162*cb87494fSMehdi Amini return; 163*cb87494fSMehdi Amini // We found it in the current module, mark as exported 164*cb87494fSMehdi Amini ExportList.insert(GUID); 165*cb87494fSMehdi Amini 166*cb87494fSMehdi Amini auto *Summary = GVInfo->summary(); 167*cb87494fSMehdi Amini auto GVS = dyn_cast<GlobalVarSummary>(Summary); 168*cb87494fSMehdi Amini if (!GVS) 169*cb87494fSMehdi Amini return; 170*cb87494fSMehdi Amini // FunctionImportGlobalProcessing::doPromoteLocalToGlobal() will always 171*cb87494fSMehdi Amini // trigger importing the initializer for `constant unnamed addr` globals that 172*cb87494fSMehdi Amini // are referenced. We conservatively export all the referenced symbols for 173*cb87494fSMehdi Amini // every global to workaround this, so that the ExportList is accurate. 174*cb87494fSMehdi Amini // FIXME: with a "isConstant" flag in the summary we could be more targetted. 175*cb87494fSMehdi Amini for (auto &Ref : GVS->refs()) { 176*cb87494fSMehdi Amini auto GUID = Ref.getGUID(); 177*cb87494fSMehdi Amini auto *RefInfo = FindGlobalInfoInModule(GUID); 178*cb87494fSMehdi Amini if (RefInfo) 179*cb87494fSMehdi Amini // Found a ref in the current module, mark it as exported 180*cb87494fSMehdi Amini ExportList.insert(GUID); 181*cb87494fSMehdi Amini } 18201e32130SMehdi Amini } 1837e88d0daSMehdi Amini 18401e32130SMehdi Amini using EdgeInfo = std::pair<const FunctionSummary *, unsigned /* Threshold */>; 18501e32130SMehdi Amini 18601e32130SMehdi Amini /// Compute the list of functions to import for a given caller. Mark these 18701e32130SMehdi Amini /// imported functions and the symbols they reference in their source module as 18801e32130SMehdi Amini /// exported from their source module. 18901e32130SMehdi Amini static void computeImportForFunction( 1903255eec1STeresa Johnson const FunctionSummary &Summary, const ModuleSummaryIndex &Index, 1913255eec1STeresa Johnson unsigned Threshold, 1921aafabf7SMehdi Amini const std::map<GlobalValue::GUID, GlobalValueSummary *> &DefinedGVSummaries, 19301e32130SMehdi Amini SmallVectorImpl<EdgeInfo> &Worklist, 19401e32130SMehdi Amini FunctionImporter::ImportMapTy &ImportsForModule, 195c86af334STeresa Johnson StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) { 19601e32130SMehdi Amini for (auto &Edge : Summary.calls()) { 1972d5487cfSTeresa Johnson auto GUID = Edge.first.getGUID(); 19801e32130SMehdi Amini DEBUG(dbgs() << " edge -> " << GUID << " Threshold:" << Threshold << "\n"); 19901e32130SMehdi Amini 2001aafabf7SMehdi Amini if (DefinedGVSummaries.count(GUID)) { 20101e32130SMehdi Amini DEBUG(dbgs() << "ignored! Target already in destination module.\n"); 2027e88d0daSMehdi Amini continue; 203d450da32STeresa Johnson } 20440641748SMehdi Amini 20501e32130SMehdi Amini auto *CalleeSummary = selectCallee(GUID, Threshold, Index); 20601e32130SMehdi Amini if (!CalleeSummary) { 20701e32130SMehdi Amini DEBUG(dbgs() << "ignored! No qualifying callee with summary found.\n"); 2087e88d0daSMehdi Amini continue; 2097e88d0daSMehdi Amini } 2102d28f7aaSMehdi Amini // "Resolve" the summary, traversing alias, 2112d28f7aaSMehdi Amini const FunctionSummary *ResolvedCalleeSummary; 2126968ef77SMehdi Amini if (isa<AliasSummary>(CalleeSummary)) { 2132d28f7aaSMehdi Amini ResolvedCalleeSummary = cast<FunctionSummary>( 2142d28f7aaSMehdi Amini &cast<AliasSummary>(CalleeSummary)->getAliasee()); 2152c719cc1SMehdi Amini assert( 2162c719cc1SMehdi Amini GlobalValue::isLinkOnceODRLinkage(ResolvedCalleeSummary->linkage()) && 2172c719cc1SMehdi Amini "Unexpected alias to a non-linkonceODR in import list"); 2186968ef77SMehdi Amini } else 2192d28f7aaSMehdi Amini ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary); 2202d28f7aaSMehdi Amini 2212d28f7aaSMehdi Amini assert(ResolvedCalleeSummary->instCount() <= Threshold && 22201e32130SMehdi Amini "selectCallee() didn't honor the threshold"); 22301e32130SMehdi Amini 2242d28f7aaSMehdi Amini auto ExportModulePath = ResolvedCalleeSummary->modulePath(); 2252d28f7aaSMehdi Amini auto &ProcessedThreshold = ImportsForModule[ExportModulePath][GUID]; 22601e32130SMehdi Amini /// Since the traversal of the call graph is DFS, we can revisit a function 22701e32130SMehdi Amini /// a second time with a higher threshold. In this case, it is added back to 22801e32130SMehdi Amini /// the worklist with the new threshold. 22901e32130SMehdi Amini if (ProcessedThreshold && ProcessedThreshold > Threshold) { 23001e32130SMehdi Amini DEBUG(dbgs() << "ignored! Target was already seen with Threshold " 23101e32130SMehdi Amini << ProcessedThreshold << "\n"); 23201e32130SMehdi Amini continue; 23301e32130SMehdi Amini } 23401e32130SMehdi Amini // Mark this function as imported in this module, with the current Threshold 23501e32130SMehdi Amini ProcessedThreshold = Threshold; 23601e32130SMehdi Amini 23701e32130SMehdi Amini // Make exports in the source module. 238c86af334STeresa Johnson if (ExportLists) { 239ef7555fbSMehdi Amini auto &ExportList = (*ExportLists)[ExportModulePath]; 24001e32130SMehdi Amini ExportList.insert(GUID); 241c86af334STeresa Johnson // Mark all functions and globals referenced by this function as exported 242c86af334STeresa Johnson // to the outside if they are defined in the same source module. 2432d28f7aaSMehdi Amini for (auto &Edge : ResolvedCalleeSummary->calls()) { 2442d5487cfSTeresa Johnson auto CalleeGUID = Edge.first.getGUID(); 245*cb87494fSMehdi Amini exportGlobalInModule(Index, ExportModulePath, CalleeGUID, ExportList); 24601e32130SMehdi Amini } 2472d28f7aaSMehdi Amini for (auto &Ref : ResolvedCalleeSummary->refs()) { 2482d5487cfSTeresa Johnson auto GUID = Ref.getGUID(); 249*cb87494fSMehdi Amini exportGlobalInModule(Index, ExportModulePath, GUID, ExportList); 2507e88d0daSMehdi Amini } 251c86af334STeresa Johnson } 2527e88d0daSMehdi Amini 25301e32130SMehdi Amini // Insert the newly imported function to the worklist. 2542d28f7aaSMehdi Amini Worklist.push_back(std::make_pair(ResolvedCalleeSummary, Threshold)); 255d450da32STeresa Johnson } 256d450da32STeresa Johnson } 257d450da32STeresa Johnson 25801e32130SMehdi Amini /// Given the list of globals defined in a module, compute the list of imports 25901e32130SMehdi Amini /// as well as the list of "exports", i.e. the list of symbols referenced from 26001e32130SMehdi Amini /// another module (that may require promotion). 26101e32130SMehdi Amini static void ComputeImportForModule( 2621aafabf7SMehdi Amini const std::map<GlobalValue::GUID, GlobalValueSummary *> &DefinedGVSummaries, 26326ab5772STeresa Johnson const ModuleSummaryIndex &Index, 26401e32130SMehdi Amini FunctionImporter::ImportMapTy &ImportsForModule, 265c86af334STeresa Johnson StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) { 26601e32130SMehdi Amini // Worklist contains the list of function imported in this module, for which 26701e32130SMehdi Amini // we will analyse the callees and may import further down the callgraph. 26801e32130SMehdi Amini SmallVector<EdgeInfo, 128> Worklist; 26901e32130SMehdi Amini 27001e32130SMehdi Amini // Populate the worklist with the import for the functions in the current 27101e32130SMehdi Amini // module 2721aafabf7SMehdi Amini for (auto &GVInfo : DefinedGVSummaries) { 2731aafabf7SMehdi Amini auto *Summary = GVInfo.second; 2742d28f7aaSMehdi Amini if (auto *AS = dyn_cast<AliasSummary>(Summary)) 2752d28f7aaSMehdi Amini Summary = &AS->getAliasee(); 2761aafabf7SMehdi Amini auto *FuncSummary = dyn_cast<FunctionSummary>(Summary); 2771aafabf7SMehdi Amini if (!FuncSummary) 2781aafabf7SMehdi Amini // Skip import for global variables 2791aafabf7SMehdi Amini continue; 2801aafabf7SMehdi Amini DEBUG(dbgs() << "Initalize import for " << GVInfo.first << "\n"); 2812d28f7aaSMehdi Amini computeImportForFunction(*FuncSummary, Index, ImportInstrLimit, 2821aafabf7SMehdi Amini DefinedGVSummaries, Worklist, ImportsForModule, 28301e32130SMehdi Amini ExportLists); 28401e32130SMehdi Amini } 28501e32130SMehdi Amini 28642418abaSMehdi Amini while (!Worklist.empty()) { 28701e32130SMehdi Amini auto FuncInfo = Worklist.pop_back_val(); 28801e32130SMehdi Amini auto *Summary = FuncInfo.first; 28901e32130SMehdi Amini auto Threshold = FuncInfo.second; 29042418abaSMehdi Amini 2917e88d0daSMehdi Amini // Process the newly imported functions and add callees to the worklist. 29240641748SMehdi Amini // Adjust the threshold 29340641748SMehdi Amini Threshold = Threshold * ImportInstrFactor; 29401e32130SMehdi Amini 2951aafabf7SMehdi Amini computeImportForFunction(*Summary, Index, Threshold, DefinedGVSummaries, 2963255eec1STeresa Johnson Worklist, ImportsForModule, ExportLists); 297c8c55170SMehdi Amini } 29842418abaSMehdi Amini } 299ffe2e4aaSMehdi Amini 30001e32130SMehdi Amini } // anonymous namespace 30101e32130SMehdi Amini 302c86af334STeresa Johnson /// Compute all the import and export for every module using the Index. 30301e32130SMehdi Amini void llvm::ComputeCrossModuleImport( 30401e32130SMehdi Amini const ModuleSummaryIndex &Index, 3051aafabf7SMehdi Amini const StringMap<std::map<GlobalValue::GUID, GlobalValueSummary *>> & 3061aafabf7SMehdi Amini ModuleToDefinedGVSummaries, 30701e32130SMehdi Amini StringMap<FunctionImporter::ImportMapTy> &ImportLists, 30801e32130SMehdi Amini StringMap<FunctionImporter::ExportSetTy> &ExportLists) { 30901e32130SMehdi Amini // For each module that has function defined, compute the import/export lists. 3101aafabf7SMehdi Amini for (auto &DefinedGVSummaries : ModuleToDefinedGVSummaries) { 3111aafabf7SMehdi Amini auto &ImportsForModule = ImportLists[DefinedGVSummaries.first()]; 3121aafabf7SMehdi Amini DEBUG(dbgs() << "Computing import for Module '" 3131aafabf7SMehdi Amini << DefinedGVSummaries.first() << "'\n"); 3141aafabf7SMehdi Amini ComputeImportForModule(DefinedGVSummaries.second, Index, ImportsForModule, 315c86af334STeresa Johnson &ExportLists); 31601e32130SMehdi Amini } 31701e32130SMehdi Amini 31801e32130SMehdi Amini #ifndef NDEBUG 31901e32130SMehdi Amini DEBUG(dbgs() << "Import/Export lists for " << ImportLists.size() 32001e32130SMehdi Amini << " modules:\n"); 32101e32130SMehdi Amini for (auto &ModuleImports : ImportLists) { 32201e32130SMehdi Amini auto ModName = ModuleImports.first(); 32301e32130SMehdi Amini auto &Exports = ExportLists[ModName]; 32401e32130SMehdi Amini DEBUG(dbgs() << "* Module " << ModName << " exports " << Exports.size() 32501e32130SMehdi Amini << " functions. Imports from " << ModuleImports.second.size() 32601e32130SMehdi Amini << " modules.\n"); 32701e32130SMehdi Amini for (auto &Src : ModuleImports.second) { 32801e32130SMehdi Amini auto SrcModName = Src.first(); 32901e32130SMehdi Amini DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from " 33001e32130SMehdi Amini << SrcModName << "\n"); 33101e32130SMehdi Amini } 33201e32130SMehdi Amini } 33301e32130SMehdi Amini #endif 33401e32130SMehdi Amini } 33501e32130SMehdi Amini 336c86af334STeresa Johnson /// Compute all the imports for the given module in the Index. 337c86af334STeresa Johnson void llvm::ComputeCrossModuleImportForModule( 338c86af334STeresa Johnson StringRef ModulePath, const ModuleSummaryIndex &Index, 339c86af334STeresa Johnson FunctionImporter::ImportMapTy &ImportList) { 340c86af334STeresa Johnson 341c86af334STeresa Johnson // Collect the list of functions this module defines. 342c86af334STeresa Johnson // GUID -> Summary 3432d28f7aaSMehdi Amini std::map<GlobalValue::GUID, GlobalValueSummary *> FunctionInfoMap; 344c86af334STeresa Johnson Index.collectDefinedFunctionsForModule(ModulePath, FunctionInfoMap); 345c86af334STeresa Johnson 346c86af334STeresa Johnson // Compute the import list for this module. 347c86af334STeresa Johnson DEBUG(dbgs() << "Computing import for Module '" << ModulePath << "'\n"); 348c86af334STeresa Johnson ComputeImportForModule(FunctionInfoMap, Index, ImportList); 349c86af334STeresa Johnson 350c86af334STeresa Johnson #ifndef NDEBUG 351c86af334STeresa Johnson DEBUG(dbgs() << "* Module " << ModulePath << " imports from " 352c86af334STeresa Johnson << ImportList.size() << " modules.\n"); 353c86af334STeresa Johnson for (auto &Src : ImportList) { 354c86af334STeresa Johnson auto SrcModName = Src.first(); 355c86af334STeresa Johnson DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from " 356c86af334STeresa Johnson << SrcModName << "\n"); 357c86af334STeresa Johnson } 358c86af334STeresa Johnson #endif 359c86af334STeresa Johnson } 360c86af334STeresa Johnson 361c8c55170SMehdi Amini // Automatically import functions in Module \p DestModule based on the summaries 362c8c55170SMehdi Amini // index. 363c8c55170SMehdi Amini // 36401e32130SMehdi Amini bool FunctionImporter::importFunctions( 365bda3c97cSMehdi Amini Module &DestModule, const FunctionImporter::ImportMapTy &ImportList, 366bda3c97cSMehdi Amini bool ForceImportReferencedDiscardableSymbols) { 3675411d051SMehdi Amini DEBUG(dbgs() << "Starting import for Module " 368311fef6eSMehdi Amini << DestModule.getModuleIdentifier() << "\n"); 369c8c55170SMehdi Amini unsigned ImportedCount = 0; 370c8c55170SMehdi Amini 371c8c55170SMehdi Amini // Linker that will be used for importing function 3729d2bfc48SRafael Espindola Linker TheLinker(DestModule); 3737e88d0daSMehdi Amini // Do the actual import of functions now, one Module at a time 37401e32130SMehdi Amini std::set<StringRef> ModuleNameOrderedList; 37501e32130SMehdi Amini for (auto &FunctionsToImportPerModule : ImportList) { 37601e32130SMehdi Amini ModuleNameOrderedList.insert(FunctionsToImportPerModule.first()); 37701e32130SMehdi Amini } 37801e32130SMehdi Amini for (auto &Name : ModuleNameOrderedList) { 3797e88d0daSMehdi Amini // Get the module for the import 38001e32130SMehdi Amini const auto &FunctionsToImportPerModule = ImportList.find(Name); 38101e32130SMehdi Amini assert(FunctionsToImportPerModule != ImportList.end()); 38201e32130SMehdi Amini std::unique_ptr<Module> SrcModule = ModuleLoader(Name); 3837e88d0daSMehdi Amini assert(&DestModule.getContext() == &SrcModule->getContext() && 3847e88d0daSMehdi Amini "Context mismatch"); 3857e88d0daSMehdi Amini 3866cba37ceSTeresa Johnson // If modules were created with lazy metadata loading, materialize it 3876cba37ceSTeresa Johnson // now, before linking it (otherwise this will be a noop). 3886cba37ceSTeresa Johnson SrcModule->materializeMetadata(); 3896cba37ceSTeresa Johnson UpgradeDebugInfo(*SrcModule); 390e5a61917STeresa Johnson 39101e32130SMehdi Amini auto &ImportGUIDs = FunctionsToImportPerModule->second; 39201e32130SMehdi Amini // Find the globals to import 39301e32130SMehdi Amini DenseSet<const GlobalValue *> GlobalsToImport; 39401e32130SMehdi Amini for (auto &GV : *SrcModule) { 3950beb858eSTeresa Johnson if (!GV.hasName()) 3960beb858eSTeresa Johnson continue; 3970beb858eSTeresa Johnson auto GUID = GV.getGUID(); 3980beb858eSTeresa Johnson auto Import = ImportGUIDs.count(GUID); 399aeb1e59bSMehdi Amini DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing function " << GUID 400aeb1e59bSMehdi Amini << " " << GV.getName() << " from " 401aeb1e59bSMehdi Amini << SrcModule->getSourceFileName() << "\n"); 4020beb858eSTeresa Johnson if (Import) { 40301e32130SMehdi Amini GV.materialize(); 40401e32130SMehdi Amini GlobalsToImport.insert(&GV); 40501e32130SMehdi Amini } 40601e32130SMehdi Amini } 4072d28f7aaSMehdi Amini for (auto &GV : SrcModule->globals()) { 4082d28f7aaSMehdi Amini if (!GV.hasName()) 4092d28f7aaSMehdi Amini continue; 4102d28f7aaSMehdi Amini auto GUID = GV.getGUID(); 4112d28f7aaSMehdi Amini auto Import = ImportGUIDs.count(GUID); 412aeb1e59bSMehdi Amini DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing global " << GUID 413aeb1e59bSMehdi Amini << " " << GV.getName() << " from " 414aeb1e59bSMehdi Amini << SrcModule->getSourceFileName() << "\n"); 4152d28f7aaSMehdi Amini if (Import) { 4162d28f7aaSMehdi Amini GV.materialize(); 4172d28f7aaSMehdi Amini GlobalsToImport.insert(&GV); 4182d28f7aaSMehdi Amini } 4192d28f7aaSMehdi Amini } 42001e32130SMehdi Amini for (auto &GV : SrcModule->aliases()) { 42101e32130SMehdi Amini if (!GV.hasName()) 42201e32130SMehdi Amini continue; 42301e32130SMehdi Amini auto GUID = GV.getGUID(); 4240beb858eSTeresa Johnson auto Import = ImportGUIDs.count(GUID); 425aeb1e59bSMehdi Amini DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing alias " << GUID 426aeb1e59bSMehdi Amini << " " << GV.getName() << " from " 427aeb1e59bSMehdi Amini << SrcModule->getSourceFileName() << "\n"); 4280beb858eSTeresa Johnson if (Import) { 42901e32130SMehdi Amini // Alias can't point to "available_externally". However when we import 4309aae395fSTeresa Johnson // linkOnceODR the linkage does not change. So we import the alias 4316968ef77SMehdi Amini // and aliasee only in this case. This has been handled by 4326968ef77SMehdi Amini // computeImportForFunction() 4332d28f7aaSMehdi Amini GlobalObject *GO = GV.getBaseObject(); 4346968ef77SMehdi Amini assert(GO->hasLinkOnceODRLinkage() && 4356968ef77SMehdi Amini "Unexpected alias to a non-linkonceODR in import list"); 4362d28f7aaSMehdi Amini #ifndef NDEBUG 4372d28f7aaSMehdi Amini if (!GlobalsToImport.count(GO)) 4382d28f7aaSMehdi Amini DEBUG(dbgs() << " alias triggers importing aliasee " << GO->getGUID() 4392d28f7aaSMehdi Amini << " " << GO->getName() << " from " 4402d28f7aaSMehdi Amini << SrcModule->getSourceFileName() << "\n"); 4412d28f7aaSMehdi Amini #endif 4422d28f7aaSMehdi Amini GO->materialize(); 44301e32130SMehdi Amini GlobalsToImport.insert(GO); 44401e32130SMehdi Amini GV.materialize(); 44501e32130SMehdi Amini GlobalsToImport.insert(&GV); 44601e32130SMehdi Amini } 44701e32130SMehdi Amini } 44801e32130SMehdi Amini 4497e88d0daSMehdi Amini // Link in the specified functions. 45001e32130SMehdi Amini if (renameModuleForThinLTO(*SrcModule, Index, &GlobalsToImport)) 4518d05185aSMehdi Amini return true; 4528d05185aSMehdi Amini 453d29478f7STeresa Johnson if (PrintImports) { 454d29478f7STeresa Johnson for (const auto *GV : GlobalsToImport) 455d29478f7STeresa Johnson dbgs() << DestModule.getSourceFileName() << ": Import " << GV->getName() 456d29478f7STeresa Johnson << " from " << SrcModule->getSourceFileName() << "\n"; 457d29478f7STeresa Johnson } 458d29478f7STeresa Johnson 459bda3c97cSMehdi Amini // Instruct the linker that the client will take care of linkonce resolution 460bda3c97cSMehdi Amini unsigned Flags = Linker::Flags::None; 461bda3c97cSMehdi Amini if (!ForceImportReferencedDiscardableSymbols) 462bda3c97cSMehdi Amini Flags |= Linker::Flags::DontForceLinkLinkonceODR; 463bda3c97cSMehdi Amini 464bda3c97cSMehdi Amini if (TheLinker.linkInModule(std::move(SrcModule), Flags, &GlobalsToImport)) 4657e88d0daSMehdi Amini report_fatal_error("Function Import: link error"); 4667e88d0daSMehdi Amini 46701e32130SMehdi Amini ImportedCount += GlobalsToImport.size(); 4687e88d0daSMehdi Amini } 469e5a61917STeresa Johnson 470d29478f7STeresa Johnson NumImported += ImportedCount; 471d29478f7STeresa Johnson 4727e88d0daSMehdi Amini DEBUG(dbgs() << "Imported " << ImportedCount << " functions for Module " 473c8c55170SMehdi Amini << DestModule.getModuleIdentifier() << "\n"); 474c8c55170SMehdi Amini return ImportedCount; 47542418abaSMehdi Amini } 47642418abaSMehdi Amini 47742418abaSMehdi Amini /// Summary file to use for function importing when using -function-import from 47842418abaSMehdi Amini /// the command line. 47942418abaSMehdi Amini static cl::opt<std::string> 48042418abaSMehdi Amini SummaryFile("summary-file", 48142418abaSMehdi Amini cl::desc("The summary file to use for function importing.")); 48242418abaSMehdi Amini 48342418abaSMehdi Amini static void diagnosticHandler(const DiagnosticInfo &DI) { 48442418abaSMehdi Amini raw_ostream &OS = errs(); 48542418abaSMehdi Amini DiagnosticPrinterRawOStream DP(OS); 48642418abaSMehdi Amini DI.print(DP); 48742418abaSMehdi Amini OS << '\n'; 48842418abaSMehdi Amini } 48942418abaSMehdi Amini 49026ab5772STeresa Johnson /// Parse the summary index out of an IR file and return the summary 49142418abaSMehdi Amini /// index object if found, or nullptr if not. 49226ab5772STeresa Johnson static std::unique_ptr<ModuleSummaryIndex> 49326ab5772STeresa Johnson getModuleSummaryIndexForFile(StringRef Path, std::string &Error, 49442418abaSMehdi Amini DiagnosticHandlerFunction DiagnosticHandler) { 49542418abaSMehdi Amini std::unique_ptr<MemoryBuffer> Buffer; 49642418abaSMehdi Amini ErrorOr<std::unique_ptr<MemoryBuffer>> BufferOrErr = 49742418abaSMehdi Amini MemoryBuffer::getFile(Path); 49842418abaSMehdi Amini if (std::error_code EC = BufferOrErr.getError()) { 49942418abaSMehdi Amini Error = EC.message(); 50042418abaSMehdi Amini return nullptr; 50142418abaSMehdi Amini } 50242418abaSMehdi Amini Buffer = std::move(BufferOrErr.get()); 50326ab5772STeresa Johnson ErrorOr<std::unique_ptr<object::ModuleSummaryIndexObjectFile>> ObjOrErr = 50426ab5772STeresa Johnson object::ModuleSummaryIndexObjectFile::create(Buffer->getMemBufferRef(), 50542418abaSMehdi Amini DiagnosticHandler); 50642418abaSMehdi Amini if (std::error_code EC = ObjOrErr.getError()) { 50742418abaSMehdi Amini Error = EC.message(); 50842418abaSMehdi Amini return nullptr; 50942418abaSMehdi Amini } 51042418abaSMehdi Amini return (*ObjOrErr)->takeIndex(); 51142418abaSMehdi Amini } 51242418abaSMehdi Amini 513fe2b5415SBenjamin Kramer namespace { 51442418abaSMehdi Amini /// Pass that performs cross-module function import provided a summary file. 51542418abaSMehdi Amini class FunctionImportPass : public ModulePass { 51626ab5772STeresa Johnson /// Optional module summary index to use for importing, otherwise 5175fcbdb71STeresa Johnson /// the summary-file option must be specified. 51826ab5772STeresa Johnson const ModuleSummaryIndex *Index; 51942418abaSMehdi Amini 52042418abaSMehdi Amini public: 52142418abaSMehdi Amini /// Pass identification, replacement for typeid 52242418abaSMehdi Amini static char ID; 52342418abaSMehdi Amini 5245fcbdb71STeresa Johnson /// Specify pass name for debug output 5252d28f7aaSMehdi Amini const char *getPassName() const override { return "Function Importing"; } 5265fcbdb71STeresa Johnson 52726ab5772STeresa Johnson explicit FunctionImportPass(const ModuleSummaryIndex *Index = nullptr) 5285fcbdb71STeresa Johnson : ModulePass(ID), Index(Index) {} 52942418abaSMehdi Amini 53042418abaSMehdi Amini bool runOnModule(Module &M) override { 531aa641a51SAndrew Kaylor if (skipModule(M)) 532aa641a51SAndrew Kaylor return false; 533aa641a51SAndrew Kaylor 5345fcbdb71STeresa Johnson if (SummaryFile.empty() && !Index) 5355fcbdb71STeresa Johnson report_fatal_error("error: -function-import requires -summary-file or " 5365fcbdb71STeresa Johnson "file from frontend\n"); 53726ab5772STeresa Johnson std::unique_ptr<ModuleSummaryIndex> IndexPtr; 5385fcbdb71STeresa Johnson if (!SummaryFile.empty()) { 5395fcbdb71STeresa Johnson if (Index) 5405fcbdb71STeresa Johnson report_fatal_error("error: -summary-file and index from frontend\n"); 54142418abaSMehdi Amini std::string Error; 54226ab5772STeresa Johnson IndexPtr = 54326ab5772STeresa Johnson getModuleSummaryIndexForFile(SummaryFile, Error, diagnosticHandler); 5445fcbdb71STeresa Johnson if (!IndexPtr) { 5455fcbdb71STeresa Johnson errs() << "Error loading file '" << SummaryFile << "': " << Error 5465fcbdb71STeresa Johnson << "\n"; 54742418abaSMehdi Amini return false; 54842418abaSMehdi Amini } 5495fcbdb71STeresa Johnson Index = IndexPtr.get(); 5505fcbdb71STeresa Johnson } 55142418abaSMehdi Amini 552c86af334STeresa Johnson // First step is collecting the import list. 553c86af334STeresa Johnson FunctionImporter::ImportMapTy ImportList; 554c86af334STeresa Johnson ComputeCrossModuleImportForModule(M.getModuleIdentifier(), *Index, 555c86af334STeresa Johnson ImportList); 55601e32130SMehdi Amini 55701e32130SMehdi Amini // Next we need to promote to global scope and rename any local values that 5581b00f2d9STeresa Johnson // are potentially exported to other modules. 55901e32130SMehdi Amini if (renameModuleForThinLTO(M, *Index, nullptr)) { 5601b00f2d9STeresa Johnson errs() << "Error renaming module\n"; 5611b00f2d9STeresa Johnson return false; 5621b00f2d9STeresa Johnson } 5631b00f2d9STeresa Johnson 56442418abaSMehdi Amini // Perform the import now. 565d16c8065SMehdi Amini auto ModuleLoader = [&M](StringRef Identifier) { 566d16c8065SMehdi Amini return loadFile(Identifier, M.getContext()); 567d16c8065SMehdi Amini }; 5689d2bfc48SRafael Espindola FunctionImporter Importer(*Index, ModuleLoader); 569bda3c97cSMehdi Amini return Importer.importFunctions( 570bda3c97cSMehdi Amini M, ImportList, !DontForceImportReferencedDiscardableSymbols); 57142418abaSMehdi Amini } 57242418abaSMehdi Amini }; 573fe2b5415SBenjamin Kramer } // anonymous namespace 57442418abaSMehdi Amini 57542418abaSMehdi Amini char FunctionImportPass::ID = 0; 57642418abaSMehdi Amini INITIALIZE_PASS_BEGIN(FunctionImportPass, "function-import", 57742418abaSMehdi Amini "Summary Based Function Import", false, false) 57842418abaSMehdi Amini INITIALIZE_PASS_END(FunctionImportPass, "function-import", 57942418abaSMehdi Amini "Summary Based Function Import", false, false) 58042418abaSMehdi Amini 58142418abaSMehdi Amini namespace llvm { 58226ab5772STeresa Johnson Pass *createFunctionImportPass(const ModuleSummaryIndex *Index = nullptr) { 5835fcbdb71STeresa Johnson return new FunctionImportPass(Index); 5845fcbdb71STeresa Johnson } 58542418abaSMehdi Amini } 586