142418abaSMehdi Amini //===- FunctionImport.cpp - ThinLTO Summary-based Function Import ---------===// 242418abaSMehdi Amini // 342418abaSMehdi Amini // The LLVM Compiler Infrastructure 442418abaSMehdi Amini // 542418abaSMehdi Amini // This file is distributed under the University of Illinois Open Source 642418abaSMehdi Amini // License. See LICENSE.TXT for details. 742418abaSMehdi Amini // 842418abaSMehdi Amini //===----------------------------------------------------------------------===// 942418abaSMehdi Amini // 1042418abaSMehdi Amini // This file implements Function import based on summaries. 1142418abaSMehdi Amini // 1242418abaSMehdi Amini //===----------------------------------------------------------------------===// 1342418abaSMehdi Amini 1442418abaSMehdi Amini #include "llvm/Transforms/IPO/FunctionImport.h" 1542418abaSMehdi Amini 1601e32130SMehdi Amini #include "llvm/ADT/SmallVector.h" 17d29478f7STeresa Johnson #include "llvm/ADT/Statistic.h" 1842418abaSMehdi Amini #include "llvm/ADT/StringSet.h" 1904c9a2d6STeresa Johnson #include "llvm/ADT/Triple.h" 2042418abaSMehdi Amini #include "llvm/IR/AutoUpgrade.h" 2142418abaSMehdi Amini #include "llvm/IR/DiagnosticPrinter.h" 2242418abaSMehdi Amini #include "llvm/IR/IntrinsicInst.h" 2342418abaSMehdi Amini #include "llvm/IR/Module.h" 24fc06b83eSMehdi Amini #include "llvm/IR/Verifier.h" 2542418abaSMehdi Amini #include "llvm/IRReader/IRReader.h" 2642418abaSMehdi Amini #include "llvm/Linker/Linker.h" 2704c9a2d6STeresa Johnson #include "llvm/Object/IRObjectFile.h" 2826ab5772STeresa Johnson #include "llvm/Object/ModuleSummaryIndexObjectFile.h" 2942418abaSMehdi Amini #include "llvm/Support/CommandLine.h" 3042418abaSMehdi Amini #include "llvm/Support/Debug.h" 3142418abaSMehdi Amini #include "llvm/Support/SourceMgr.h" 3204c9a2d6STeresa Johnson #include "llvm/Transforms/IPO/Internalize.h" 33488a800aSTeresa Johnson #include "llvm/Transforms/Utils/FunctionImportUtils.h" 347e88d0daSMehdi Amini 3501e32130SMehdi Amini #define DEBUG_TYPE "function-import" 367e88d0daSMehdi Amini 3742418abaSMehdi Amini using namespace llvm; 3842418abaSMehdi Amini 396c475a75STeresa Johnson STATISTIC(NumImportedFunctions, "Number of functions imported"); 406c475a75STeresa Johnson STATISTIC(NumImportedModules, "Number of modules imported from"); 416c475a75STeresa Johnson STATISTIC(NumDeadSymbols, "Number of dead stripped symbols in index"); 426c475a75STeresa Johnson STATISTIC(NumLiveSymbols, "Number of live symbols in index"); 43d29478f7STeresa Johnson 4439303619STeresa Johnson /// Limit on instruction count of imported functions. 4539303619STeresa Johnson static cl::opt<unsigned> ImportInstrLimit( 4639303619STeresa Johnson "import-instr-limit", cl::init(100), cl::Hidden, cl::value_desc("N"), 4739303619STeresa Johnson cl::desc("Only import functions with less than N instructions")); 4839303619STeresa Johnson 4940641748SMehdi Amini static cl::opt<float> 5040641748SMehdi Amini ImportInstrFactor("import-instr-evolution-factor", cl::init(0.7), 5140641748SMehdi Amini cl::Hidden, cl::value_desc("x"), 5240641748SMehdi Amini cl::desc("As we import functions, multiply the " 5340641748SMehdi Amini "`import-instr-limit` threshold by this factor " 5440641748SMehdi Amini "before processing newly imported functions")); 55ba72b95fSPiotr Padlewski 56d2869473SPiotr Padlewski static cl::opt<float> ImportHotInstrFactor( 57d2869473SPiotr Padlewski "import-hot-evolution-factor", cl::init(1.0), cl::Hidden, 58d2869473SPiotr Padlewski cl::value_desc("x"), 59d2869473SPiotr Padlewski cl::desc("As we import functions called from hot callsite, multiply the " 60d2869473SPiotr Padlewski "`import-instr-limit` threshold by this factor " 61d2869473SPiotr Padlewski "before processing newly imported functions")); 62d2869473SPiotr Padlewski 63d9830eb7SPiotr Padlewski static cl::opt<float> ImportHotMultiplier( 64d9830eb7SPiotr Padlewski "import-hot-multiplier", cl::init(3.0), cl::Hidden, cl::value_desc("x"), 65ba72b95fSPiotr Padlewski cl::desc("Multiply the `import-instr-limit` threshold for hot callsites")); 66ba72b95fSPiotr Padlewski 67ba72b95fSPiotr Padlewski // FIXME: This multiplier was not really tuned up. 68ba72b95fSPiotr Padlewski static cl::opt<float> ImportColdMultiplier( 69ba72b95fSPiotr Padlewski "import-cold-multiplier", cl::init(0), cl::Hidden, cl::value_desc("N"), 70ba72b95fSPiotr Padlewski cl::desc("Multiply the `import-instr-limit` threshold for cold callsites")); 7140641748SMehdi Amini 72d29478f7STeresa Johnson static cl::opt<bool> PrintImports("print-imports", cl::init(false), cl::Hidden, 73d29478f7STeresa Johnson cl::desc("Print imported functions")); 74d29478f7STeresa Johnson 756c475a75STeresa Johnson static cl::opt<bool> ComputeDead("compute-dead", cl::init(true), cl::Hidden, 766c475a75STeresa Johnson cl::desc("Compute dead symbols")); 776c475a75STeresa Johnson 783b776128SPiotr Padlewski static cl::opt<bool> EnableImportMetadata( 793b776128SPiotr Padlewski "enable-import-metadata", cl::init( 803b776128SPiotr Padlewski #if !defined(NDEBUG) 813b776128SPiotr Padlewski true /*Enabled with asserts.*/ 823b776128SPiotr Padlewski #else 833b776128SPiotr Padlewski false 843b776128SPiotr Padlewski #endif 853b776128SPiotr Padlewski ), 863b776128SPiotr Padlewski cl::Hidden, cl::desc("Enable import metadata like 'thinlto_src_module'")); 873b776128SPiotr Padlewski 8842418abaSMehdi Amini // Load lazily a module from \p FileName in \p Context. 8942418abaSMehdi Amini static std::unique_ptr<Module> loadFile(const std::string &FileName, 9042418abaSMehdi Amini LLVMContext &Context) { 9142418abaSMehdi Amini SMDiagnostic Err; 9242418abaSMehdi Amini DEBUG(dbgs() << "Loading '" << FileName << "'\n"); 936cba37ceSTeresa Johnson // Metadata isn't loaded until functions are imported, to minimize 946cba37ceSTeresa Johnson // the memory overhead. 95a1080ee6STeresa Johnson std::unique_ptr<Module> Result = 96a1080ee6STeresa Johnson getLazyIRFileModule(FileName, Err, Context, 97a1080ee6STeresa Johnson /* ShouldLazyLoadMetadata = */ true); 9842418abaSMehdi Amini if (!Result) { 9942418abaSMehdi Amini Err.print("function-import", errs()); 100d7ad221cSMehdi Amini report_fatal_error("Abort"); 10142418abaSMehdi Amini } 10242418abaSMehdi Amini 10342418abaSMehdi Amini return Result; 10442418abaSMehdi Amini } 10542418abaSMehdi Amini 1067e88d0daSMehdi Amini namespace { 10740641748SMehdi Amini 10801e32130SMehdi Amini /// Given a list of possible callee implementation for a call site, select one 10901e32130SMehdi Amini /// that fits the \p Threshold. 11001e32130SMehdi Amini /// 11101e32130SMehdi Amini /// FIXME: select "best" instead of first that fits. But what is "best"? 11201e32130SMehdi Amini /// - The smallest: more likely to be inlined. 11301e32130SMehdi Amini /// - The one with the least outgoing edges (already well optimized). 11401e32130SMehdi Amini /// - One from a module already being imported from in order to reduce the 11501e32130SMehdi Amini /// number of source modules parsed/linked. 11601e32130SMehdi Amini /// - One that has PGO data attached. 11701e32130SMehdi Amini /// - [insert you fancy metric here] 1182d28f7aaSMehdi Amini static const GlobalValueSummary * 119b4e1e829SMehdi Amini selectCallee(const ModuleSummaryIndex &Index, 120b4e1e829SMehdi Amini const GlobalValueSummaryList &CalleeSummaryList, 12183aaf358STeresa Johnson unsigned Threshold, StringRef CallerModulePath) { 12201e32130SMehdi Amini auto It = llvm::find_if( 12328e457bcSTeresa Johnson CalleeSummaryList, 12428e457bcSTeresa Johnson [&](const std::unique_ptr<GlobalValueSummary> &SummaryPtr) { 12528e457bcSTeresa Johnson auto *GVSummary = SummaryPtr.get(); 126f329be83SRafael Espindola if (GlobalValue::isInterposableLinkage(GVSummary->linkage())) 1275b85d8d6SMehdi Amini // There is no point in importing these, we can't inline them 12801e32130SMehdi Amini return false; 1292c719cc1SMehdi Amini if (auto *AS = dyn_cast<AliasSummary>(GVSummary)) { 1302c719cc1SMehdi Amini GVSummary = &AS->getAliasee(); 1312c719cc1SMehdi Amini // Alias can't point to "available_externally". However when we import 1322c719cc1SMehdi Amini // linkOnceODR the linkage does not change. So we import the alias 1332c719cc1SMehdi Amini // and aliasee only in this case. 1342c719cc1SMehdi Amini // FIXME: we should import alias as available_externally *function*, 1352c719cc1SMehdi Amini // the destination module does need to know it is an alias. 1362c719cc1SMehdi Amini if (!GlobalValue::isLinkOnceODRLinkage(GVSummary->linkage())) 1372c719cc1SMehdi Amini return false; 1382c719cc1SMehdi Amini } 1392c719cc1SMehdi Amini 1402c719cc1SMehdi Amini auto *Summary = cast<FunctionSummary>(GVSummary); 1417e88d0daSMehdi Amini 14283aaf358STeresa Johnson // If this is a local function, make sure we import the copy 14383aaf358STeresa Johnson // in the caller's module. The only time a local function can 14483aaf358STeresa Johnson // share an entry in the index is if there is a local with the same name 14583aaf358STeresa Johnson // in another module that had the same source file name (in a different 14683aaf358STeresa Johnson // directory), where each was compiled in their own directory so there 14783aaf358STeresa Johnson // was not distinguishing path. 14883aaf358STeresa Johnson // However, do the import from another module if there is only one 14983aaf358STeresa Johnson // entry in the list - in that case this must be a reference due 15083aaf358STeresa Johnson // to indirect call profile data, since a function pointer can point to 15183aaf358STeresa Johnson // a local in another module. 15283aaf358STeresa Johnson if (GlobalValue::isLocalLinkage(Summary->linkage()) && 15383aaf358STeresa Johnson CalleeSummaryList.size() > 1 && 15483aaf358STeresa Johnson Summary->modulePath() != CallerModulePath) 15583aaf358STeresa Johnson return false; 15683aaf358STeresa Johnson 15701e32130SMehdi Amini if (Summary->instCount() > Threshold) 15801e32130SMehdi Amini return false; 1597e88d0daSMehdi Amini 160519465b9STeresa Johnson if (Summary->notEligibleToImport()) 161b4e1e829SMehdi Amini return false; 162b4e1e829SMehdi Amini 16301e32130SMehdi Amini return true; 16401e32130SMehdi Amini }); 16528e457bcSTeresa Johnson if (It == CalleeSummaryList.end()) 16601e32130SMehdi Amini return nullptr; 1677e88d0daSMehdi Amini 16828e457bcSTeresa Johnson return cast<GlobalValueSummary>(It->get()); 169434e9561SRafael Espindola } 1707e88d0daSMehdi Amini 17101e32130SMehdi Amini /// Return the summary for the function \p GUID that fits the \p Threshold, or 17201e32130SMehdi Amini /// null if there's no match. 1732d28f7aaSMehdi Amini static const GlobalValueSummary *selectCallee(GlobalValue::GUID GUID, 174ad5741b0SMehdi Amini unsigned Threshold, 17583aaf358STeresa Johnson const ModuleSummaryIndex &Index, 17683aaf358STeresa Johnson StringRef CallerModulePath) { 17728e457bcSTeresa Johnson auto CalleeSummaryList = Index.findGlobalValueSummaryList(GUID); 178b4e1e829SMehdi Amini if (CalleeSummaryList == Index.end()) 17901e32130SMehdi Amini return nullptr; // This function does not have a summary 18083aaf358STeresa Johnson return selectCallee(Index, CalleeSummaryList->second, Threshold, 18183aaf358STeresa Johnson CallerModulePath); 18201e32130SMehdi Amini } 1837e88d0daSMehdi Amini 184475b51a7STeresa Johnson using EdgeInfo = std::tuple<const FunctionSummary *, unsigned /* Threshold */, 185475b51a7STeresa Johnson GlobalValue::GUID>; 18601e32130SMehdi Amini 18701e32130SMehdi Amini /// Compute the list of functions to import for a given caller. Mark these 18801e32130SMehdi Amini /// imported functions and the symbols they reference in their source module as 18901e32130SMehdi Amini /// exported from their source module. 19001e32130SMehdi Amini static void computeImportForFunction( 1913255eec1STeresa Johnson const FunctionSummary &Summary, const ModuleSummaryIndex &Index, 192d9830eb7SPiotr Padlewski const unsigned Threshold, const GVSummaryMapTy &DefinedGVSummaries, 19301e32130SMehdi Amini SmallVectorImpl<EdgeInfo> &Worklist, 1949b490f10SMehdi Amini FunctionImporter::ImportMapTy &ImportList, 195c86af334STeresa Johnson StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) { 19601e32130SMehdi Amini for (auto &Edge : Summary.calls()) { 1972d5487cfSTeresa Johnson auto GUID = Edge.first.getGUID(); 19801e32130SMehdi Amini DEBUG(dbgs() << " edge -> " << GUID << " Threshold:" << Threshold << "\n"); 19901e32130SMehdi Amini 2001aafabf7SMehdi Amini if (DefinedGVSummaries.count(GUID)) { 20101e32130SMehdi Amini DEBUG(dbgs() << "ignored! Target already in destination module.\n"); 2027e88d0daSMehdi Amini continue; 203d450da32STeresa Johnson } 20440641748SMehdi Amini 205ba72b95fSPiotr Padlewski auto GetBonusMultiplier = [](CalleeInfo::HotnessType Hotness) -> float { 206ba72b95fSPiotr Padlewski if (Hotness == CalleeInfo::HotnessType::Hot) 207ba72b95fSPiotr Padlewski return ImportHotMultiplier; 208ba72b95fSPiotr Padlewski if (Hotness == CalleeInfo::HotnessType::Cold) 209ba72b95fSPiotr Padlewski return ImportColdMultiplier; 210ba72b95fSPiotr Padlewski return 1.0; 211ba72b95fSPiotr Padlewski }; 212ba72b95fSPiotr Padlewski 213d9830eb7SPiotr Padlewski const auto NewThreshold = 214ba72b95fSPiotr Padlewski Threshold * GetBonusMultiplier(Edge.second.Hotness); 215d2869473SPiotr Padlewski 21683aaf358STeresa Johnson auto *CalleeSummary = 21783aaf358STeresa Johnson selectCallee(GUID, NewThreshold, Index, Summary.modulePath()); 21801e32130SMehdi Amini if (!CalleeSummary) { 21901e32130SMehdi Amini DEBUG(dbgs() << "ignored! No qualifying callee with summary found.\n"); 2207e88d0daSMehdi Amini continue; 2217e88d0daSMehdi Amini } 2222d28f7aaSMehdi Amini // "Resolve" the summary, traversing alias, 2232d28f7aaSMehdi Amini const FunctionSummary *ResolvedCalleeSummary; 2246968ef77SMehdi Amini if (isa<AliasSummary>(CalleeSummary)) { 2252d28f7aaSMehdi Amini ResolvedCalleeSummary = cast<FunctionSummary>( 2262d28f7aaSMehdi Amini &cast<AliasSummary>(CalleeSummary)->getAliasee()); 2272c719cc1SMehdi Amini assert( 2282c719cc1SMehdi Amini GlobalValue::isLinkOnceODRLinkage(ResolvedCalleeSummary->linkage()) && 2292c719cc1SMehdi Amini "Unexpected alias to a non-linkonceODR in import list"); 2306968ef77SMehdi Amini } else 2312d28f7aaSMehdi Amini ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary); 2322d28f7aaSMehdi Amini 233d9830eb7SPiotr Padlewski assert(ResolvedCalleeSummary->instCount() <= NewThreshold && 23401e32130SMehdi Amini "selectCallee() didn't honor the threshold"); 23501e32130SMehdi Amini 236d2869473SPiotr Padlewski auto GetAdjustedThreshold = [](unsigned Threshold, bool IsHotCallsite) { 237d2869473SPiotr Padlewski // Adjust the threshold for next level of imported functions. 238d2869473SPiotr Padlewski // The threshold is different for hot callsites because we can then 239d2869473SPiotr Padlewski // inline chains of hot calls. 240d2869473SPiotr Padlewski if (IsHotCallsite) 241d2869473SPiotr Padlewski return Threshold * ImportHotInstrFactor; 242d2869473SPiotr Padlewski return Threshold * ImportInstrFactor; 243d2869473SPiotr Padlewski }; 244d2869473SPiotr Padlewski 245d2869473SPiotr Padlewski bool IsHotCallsite = Edge.second.Hotness == CalleeInfo::HotnessType::Hot; 2461b859a23STeresa Johnson const auto AdjThreshold = GetAdjustedThreshold(Threshold, IsHotCallsite); 2471b859a23STeresa Johnson 2481b859a23STeresa Johnson auto ExportModulePath = ResolvedCalleeSummary->modulePath(); 2491b859a23STeresa Johnson auto &ProcessedThreshold = ImportList[ExportModulePath][GUID]; 2501b859a23STeresa Johnson /// Since the traversal of the call graph is DFS, we can revisit a function 2511b859a23STeresa Johnson /// a second time with a higher threshold. In this case, it is added back to 2521b859a23STeresa Johnson /// the worklist with the new threshold. 2531b859a23STeresa Johnson if (ProcessedThreshold && ProcessedThreshold >= AdjThreshold) { 2541b859a23STeresa Johnson DEBUG(dbgs() << "ignored! Target was already seen with Threshold " 2551b859a23STeresa Johnson << ProcessedThreshold << "\n"); 2561b859a23STeresa Johnson continue; 2571b859a23STeresa Johnson } 25819f2aa78STeresa Johnson bool PreviouslyImported = ProcessedThreshold != 0; 2591b859a23STeresa Johnson // Mark this function as imported in this module, with the current Threshold 2601b859a23STeresa Johnson ProcessedThreshold = AdjThreshold; 2611b859a23STeresa Johnson 2621b859a23STeresa Johnson // Make exports in the source module. 2631b859a23STeresa Johnson if (ExportLists) { 2641b859a23STeresa Johnson auto &ExportList = (*ExportLists)[ExportModulePath]; 2651b859a23STeresa Johnson ExportList.insert(GUID); 26619f2aa78STeresa Johnson if (!PreviouslyImported) { 26719f2aa78STeresa Johnson // This is the first time this function was exported from its source 26819f2aa78STeresa Johnson // module, so mark all functions and globals it references as exported 2691b859a23STeresa Johnson // to the outside if they are defined in the same source module. 270edddca22STeresa Johnson // For efficiency, we unconditionally add all the referenced GUIDs 271edddca22STeresa Johnson // to the ExportList for this module, and will prune out any not 272edddca22STeresa Johnson // defined in the module later in a single pass. 2731b859a23STeresa Johnson for (auto &Edge : ResolvedCalleeSummary->calls()) { 2741b859a23STeresa Johnson auto CalleeGUID = Edge.first.getGUID(); 275edddca22STeresa Johnson ExportList.insert(CalleeGUID); 2761b859a23STeresa Johnson } 2771b859a23STeresa Johnson for (auto &Ref : ResolvedCalleeSummary->refs()) { 2781b859a23STeresa Johnson auto GUID = Ref.getGUID(); 279edddca22STeresa Johnson ExportList.insert(GUID); 2801b859a23STeresa Johnson } 2811b859a23STeresa Johnson } 28219f2aa78STeresa Johnson } 283d2869473SPiotr Padlewski 28401e32130SMehdi Amini // Insert the newly imported function to the worklist. 285475b51a7STeresa Johnson Worklist.emplace_back(ResolvedCalleeSummary, AdjThreshold, GUID); 286d450da32STeresa Johnson } 287d450da32STeresa Johnson } 288d450da32STeresa Johnson 28901e32130SMehdi Amini /// Given the list of globals defined in a module, compute the list of imports 29001e32130SMehdi Amini /// as well as the list of "exports", i.e. the list of symbols referenced from 29101e32130SMehdi Amini /// another module (that may require promotion). 29201e32130SMehdi Amini static void ComputeImportForModule( 293c851d216STeresa Johnson const GVSummaryMapTy &DefinedGVSummaries, const ModuleSummaryIndex &Index, 2949b490f10SMehdi Amini FunctionImporter::ImportMapTy &ImportList, 2956c475a75STeresa Johnson StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr, 2966c475a75STeresa Johnson const DenseSet<GlobalValue::GUID> *DeadSymbols = nullptr) { 29701e32130SMehdi Amini // Worklist contains the list of function imported in this module, for which 29801e32130SMehdi Amini // we will analyse the callees and may import further down the callgraph. 29901e32130SMehdi Amini SmallVector<EdgeInfo, 128> Worklist; 30001e32130SMehdi Amini 30101e32130SMehdi Amini // Populate the worklist with the import for the functions in the current 30201e32130SMehdi Amini // module 30328e457bcSTeresa Johnson for (auto &GVSummary : DefinedGVSummaries) { 3046c475a75STeresa Johnson if (DeadSymbols && DeadSymbols->count(GVSummary.first)) { 3056c475a75STeresa Johnson DEBUG(dbgs() << "Ignores Dead GUID: " << GVSummary.first << "\n"); 3066c475a75STeresa Johnson continue; 3076c475a75STeresa Johnson } 30828e457bcSTeresa Johnson auto *Summary = GVSummary.second; 3092d28f7aaSMehdi Amini if (auto *AS = dyn_cast<AliasSummary>(Summary)) 3102d28f7aaSMehdi Amini Summary = &AS->getAliasee(); 3111aafabf7SMehdi Amini auto *FuncSummary = dyn_cast<FunctionSummary>(Summary); 3121aafabf7SMehdi Amini if (!FuncSummary) 3131aafabf7SMehdi Amini // Skip import for global variables 3141aafabf7SMehdi Amini continue; 31528e457bcSTeresa Johnson DEBUG(dbgs() << "Initalize import for " << GVSummary.first << "\n"); 3162d28f7aaSMehdi Amini computeImportForFunction(*FuncSummary, Index, ImportInstrLimit, 3179b490f10SMehdi Amini DefinedGVSummaries, Worklist, ImportList, 31801e32130SMehdi Amini ExportLists); 31901e32130SMehdi Amini } 32001e32130SMehdi Amini 321d2869473SPiotr Padlewski // Process the newly imported functions and add callees to the worklist. 32242418abaSMehdi Amini while (!Worklist.empty()) { 32301e32130SMehdi Amini auto FuncInfo = Worklist.pop_back_val(); 324475b51a7STeresa Johnson auto *Summary = std::get<0>(FuncInfo); 325475b51a7STeresa Johnson auto Threshold = std::get<1>(FuncInfo); 326475b51a7STeresa Johnson auto GUID = std::get<2>(FuncInfo); 327475b51a7STeresa Johnson 328475b51a7STeresa Johnson // Check if we later added this summary with a higher threshold. 329475b51a7STeresa Johnson // If so, skip this entry. 330475b51a7STeresa Johnson auto ExportModulePath = Summary->modulePath(); 331475b51a7STeresa Johnson auto &LatestProcessedThreshold = ImportList[ExportModulePath][GUID]; 332475b51a7STeresa Johnson if (LatestProcessedThreshold > Threshold) 333475b51a7STeresa Johnson continue; 33442418abaSMehdi Amini 3351aafabf7SMehdi Amini computeImportForFunction(*Summary, Index, Threshold, DefinedGVSummaries, 3369b490f10SMehdi Amini Worklist, ImportList, ExportLists); 337c8c55170SMehdi Amini } 33842418abaSMehdi Amini } 339ffe2e4aaSMehdi Amini 34001e32130SMehdi Amini } // anonymous namespace 34101e32130SMehdi Amini 342c86af334STeresa Johnson /// Compute all the import and export for every module using the Index. 34301e32130SMehdi Amini void llvm::ComputeCrossModuleImport( 34401e32130SMehdi Amini const ModuleSummaryIndex &Index, 345c851d216STeresa Johnson const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries, 34601e32130SMehdi Amini StringMap<FunctionImporter::ImportMapTy> &ImportLists, 3476c475a75STeresa Johnson StringMap<FunctionImporter::ExportSetTy> &ExportLists, 3486c475a75STeresa Johnson const DenseSet<GlobalValue::GUID> *DeadSymbols) { 34901e32130SMehdi Amini // For each module that has function defined, compute the import/export lists. 3501aafabf7SMehdi Amini for (auto &DefinedGVSummaries : ModuleToDefinedGVSummaries) { 3519b490f10SMehdi Amini auto &ImportList = ImportLists[DefinedGVSummaries.first()]; 3521aafabf7SMehdi Amini DEBUG(dbgs() << "Computing import for Module '" 3531aafabf7SMehdi Amini << DefinedGVSummaries.first() << "'\n"); 3549b490f10SMehdi Amini ComputeImportForModule(DefinedGVSummaries.second, Index, ImportList, 3556c475a75STeresa Johnson &ExportLists, DeadSymbols); 35601e32130SMehdi Amini } 35701e32130SMehdi Amini 358edddca22STeresa Johnson // When computing imports we added all GUIDs referenced by anything 359edddca22STeresa Johnson // imported from the module to its ExportList. Now we prune each ExportList 360edddca22STeresa Johnson // of any not defined in that module. This is more efficient than checking 361edddca22STeresa Johnson // while computing imports because some of the summary lists may be long 362edddca22STeresa Johnson // due to linkonce (comdat) copies. 363edddca22STeresa Johnson for (auto &ELI : ExportLists) { 364edddca22STeresa Johnson const auto &DefinedGVSummaries = 365edddca22STeresa Johnson ModuleToDefinedGVSummaries.lookup(ELI.first()); 366edddca22STeresa Johnson for (auto EI = ELI.second.begin(); EI != ELI.second.end();) { 367edddca22STeresa Johnson if (!DefinedGVSummaries.count(*EI)) 368edddca22STeresa Johnson EI = ELI.second.erase(EI); 369edddca22STeresa Johnson else 370edddca22STeresa Johnson ++EI; 371edddca22STeresa Johnson } 372edddca22STeresa Johnson } 373edddca22STeresa Johnson 37401e32130SMehdi Amini #ifndef NDEBUG 37501e32130SMehdi Amini DEBUG(dbgs() << "Import/Export lists for " << ImportLists.size() 37601e32130SMehdi Amini << " modules:\n"); 37701e32130SMehdi Amini for (auto &ModuleImports : ImportLists) { 37801e32130SMehdi Amini auto ModName = ModuleImports.first(); 37901e32130SMehdi Amini auto &Exports = ExportLists[ModName]; 38001e32130SMehdi Amini DEBUG(dbgs() << "* Module " << ModName << " exports " << Exports.size() 38101e32130SMehdi Amini << " functions. Imports from " << ModuleImports.second.size() 38201e32130SMehdi Amini << " modules.\n"); 38301e32130SMehdi Amini for (auto &Src : ModuleImports.second) { 38401e32130SMehdi Amini auto SrcModName = Src.first(); 38501e32130SMehdi Amini DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from " 38601e32130SMehdi Amini << SrcModName << "\n"); 38701e32130SMehdi Amini } 38801e32130SMehdi Amini } 38901e32130SMehdi Amini #endif 39001e32130SMehdi Amini } 39101e32130SMehdi Amini 392c86af334STeresa Johnson /// Compute all the imports for the given module in the Index. 393c86af334STeresa Johnson void llvm::ComputeCrossModuleImportForModule( 394c86af334STeresa Johnson StringRef ModulePath, const ModuleSummaryIndex &Index, 395c86af334STeresa Johnson FunctionImporter::ImportMapTy &ImportList) { 396c86af334STeresa Johnson 397c86af334STeresa Johnson // Collect the list of functions this module defines. 398c86af334STeresa Johnson // GUID -> Summary 399c851d216STeresa Johnson GVSummaryMapTy FunctionSummaryMap; 40028e457bcSTeresa Johnson Index.collectDefinedFunctionsForModule(ModulePath, FunctionSummaryMap); 401c86af334STeresa Johnson 402c86af334STeresa Johnson // Compute the import list for this module. 403c86af334STeresa Johnson DEBUG(dbgs() << "Computing import for Module '" << ModulePath << "'\n"); 40428e457bcSTeresa Johnson ComputeImportForModule(FunctionSummaryMap, Index, ImportList); 405c86af334STeresa Johnson 406c86af334STeresa Johnson #ifndef NDEBUG 407c86af334STeresa Johnson DEBUG(dbgs() << "* Module " << ModulePath << " imports from " 408c86af334STeresa Johnson << ImportList.size() << " modules.\n"); 409c86af334STeresa Johnson for (auto &Src : ImportList) { 410c86af334STeresa Johnson auto SrcModName = Src.first(); 411c86af334STeresa Johnson DEBUG(dbgs() << " - " << Src.second.size() << " functions imported from " 412c86af334STeresa Johnson << SrcModName << "\n"); 413c86af334STeresa Johnson } 414c86af334STeresa Johnson #endif 415c86af334STeresa Johnson } 416c86af334STeresa Johnson 4176c475a75STeresa Johnson DenseSet<GlobalValue::GUID> llvm::computeDeadSymbols( 4186c475a75STeresa Johnson const ModuleSummaryIndex &Index, 4196c475a75STeresa Johnson const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols) { 4206c475a75STeresa Johnson if (!ComputeDead) 4216c475a75STeresa Johnson return DenseSet<GlobalValue::GUID>(); 4226c475a75STeresa Johnson if (GUIDPreservedSymbols.empty()) 4236c475a75STeresa Johnson // Don't do anything when nothing is live, this is friendly with tests. 4246c475a75STeresa Johnson return DenseSet<GlobalValue::GUID>(); 4256c475a75STeresa Johnson DenseSet<GlobalValue::GUID> LiveSymbols = GUIDPreservedSymbols; 4266c475a75STeresa Johnson SmallVector<GlobalValue::GUID, 128> Worklist; 4276c475a75STeresa Johnson Worklist.reserve(LiveSymbols.size() * 2); 4286c475a75STeresa Johnson for (auto GUID : LiveSymbols) { 4296c475a75STeresa Johnson DEBUG(dbgs() << "Live root: " << GUID << "\n"); 4306c475a75STeresa Johnson Worklist.push_back(GUID); 4316c475a75STeresa Johnson } 4326c475a75STeresa Johnson // Add values flagged in the index as live roots to the worklist. 4336c475a75STeresa Johnson for (const auto &Entry : Index) { 4346c475a75STeresa Johnson bool IsLiveRoot = llvm::any_of( 4356c475a75STeresa Johnson Entry.second, 4366c475a75STeresa Johnson [&](const std::unique_ptr<llvm::GlobalValueSummary> &Summary) { 4376c475a75STeresa Johnson return Summary->liveRoot(); 4386c475a75STeresa Johnson }); 4396c475a75STeresa Johnson if (!IsLiveRoot) 4406c475a75STeresa Johnson continue; 4416c475a75STeresa Johnson DEBUG(dbgs() << "Live root (summary): " << Entry.first << "\n"); 4426c475a75STeresa Johnson Worklist.push_back(Entry.first); 4436c475a75STeresa Johnson } 4446c475a75STeresa Johnson 4456c475a75STeresa Johnson while (!Worklist.empty()) { 4466c475a75STeresa Johnson auto GUID = Worklist.pop_back_val(); 4476c475a75STeresa Johnson auto It = Index.findGlobalValueSummaryList(GUID); 4486c475a75STeresa Johnson if (It == Index.end()) { 4496c475a75STeresa Johnson DEBUG(dbgs() << "Not in index: " << GUID << "\n"); 4506c475a75STeresa Johnson continue; 4516c475a75STeresa Johnson } 4526c475a75STeresa Johnson 4536c475a75STeresa Johnson // FIXME: we should only make the prevailing copy live here 4546c475a75STeresa Johnson for (auto &Summary : It->second) { 4556c475a75STeresa Johnson for (auto Ref : Summary->refs()) { 4566c475a75STeresa Johnson auto RefGUID = Ref.getGUID(); 4576c475a75STeresa Johnson if (LiveSymbols.insert(RefGUID).second) { 4586c475a75STeresa Johnson DEBUG(dbgs() << "Marking live (ref): " << RefGUID << "\n"); 4596c475a75STeresa Johnson Worklist.push_back(RefGUID); 4606c475a75STeresa Johnson } 4616c475a75STeresa Johnson } 4626c475a75STeresa Johnson if (auto *FS = dyn_cast<FunctionSummary>(Summary.get())) { 4636c475a75STeresa Johnson for (auto Call : FS->calls()) { 4646c475a75STeresa Johnson auto CallGUID = Call.first.getGUID(); 4656c475a75STeresa Johnson if (LiveSymbols.insert(CallGUID).second) { 4666c475a75STeresa Johnson DEBUG(dbgs() << "Marking live (call): " << CallGUID << "\n"); 4676c475a75STeresa Johnson Worklist.push_back(CallGUID); 4686c475a75STeresa Johnson } 4696c475a75STeresa Johnson } 4706c475a75STeresa Johnson } 4716c475a75STeresa Johnson if (auto *AS = dyn_cast<AliasSummary>(Summary.get())) { 4726c475a75STeresa Johnson auto AliaseeGUID = AS->getAliasee().getOriginalName(); 4736c475a75STeresa Johnson if (LiveSymbols.insert(AliaseeGUID).second) { 4746c475a75STeresa Johnson DEBUG(dbgs() << "Marking live (alias): " << AliaseeGUID << "\n"); 4756c475a75STeresa Johnson Worklist.push_back(AliaseeGUID); 4766c475a75STeresa Johnson } 4776c475a75STeresa Johnson } 4786c475a75STeresa Johnson } 4796c475a75STeresa Johnson } 4806c475a75STeresa Johnson DenseSet<GlobalValue::GUID> DeadSymbols; 4816c475a75STeresa Johnson DeadSymbols.reserve( 4826c475a75STeresa Johnson std::min(Index.size(), Index.size() - LiveSymbols.size())); 4836c475a75STeresa Johnson for (auto &Entry : Index) { 4846c475a75STeresa Johnson auto GUID = Entry.first; 4856c475a75STeresa Johnson if (!LiveSymbols.count(GUID)) { 4866c475a75STeresa Johnson DEBUG(dbgs() << "Marking dead: " << GUID << "\n"); 4876c475a75STeresa Johnson DeadSymbols.insert(GUID); 4886c475a75STeresa Johnson } 4896c475a75STeresa Johnson } 4906c475a75STeresa Johnson DEBUG(dbgs() << LiveSymbols.size() << " symbols Live, and " 4916c475a75STeresa Johnson << DeadSymbols.size() << " symbols Dead \n"); 4926c475a75STeresa Johnson NumDeadSymbols += DeadSymbols.size(); 4936c475a75STeresa Johnson NumLiveSymbols += LiveSymbols.size(); 4946c475a75STeresa Johnson return DeadSymbols; 4956c475a75STeresa Johnson } 4966c475a75STeresa Johnson 49784174c37STeresa Johnson /// Compute the set of summaries needed for a ThinLTO backend compilation of 49884174c37STeresa Johnson /// \p ModulePath. 49984174c37STeresa Johnson void llvm::gatherImportedSummariesForModule( 50084174c37STeresa Johnson StringRef ModulePath, 50184174c37STeresa Johnson const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries, 502cdbcbf74SMehdi Amini const FunctionImporter::ImportMapTy &ImportList, 50384174c37STeresa Johnson std::map<std::string, GVSummaryMapTy> &ModuleToSummariesForIndex) { 50484174c37STeresa Johnson // Include all summaries from the importing module. 50584174c37STeresa Johnson ModuleToSummariesForIndex[ModulePath] = 50684174c37STeresa Johnson ModuleToDefinedGVSummaries.lookup(ModulePath); 50784174c37STeresa Johnson // Include summaries for imports. 50888c491ddSMehdi Amini for (auto &ILI : ImportList) { 50984174c37STeresa Johnson auto &SummariesForIndex = ModuleToSummariesForIndex[ILI.first()]; 51084174c37STeresa Johnson const auto &DefinedGVSummaries = 51184174c37STeresa Johnson ModuleToDefinedGVSummaries.lookup(ILI.first()); 51284174c37STeresa Johnson for (auto &GI : ILI.second) { 51384174c37STeresa Johnson const auto &DS = DefinedGVSummaries.find(GI.first); 51484174c37STeresa Johnson assert(DS != DefinedGVSummaries.end() && 51584174c37STeresa Johnson "Expected a defined summary for imported global value"); 51684174c37STeresa Johnson SummariesForIndex[GI.first] = DS->second; 51784174c37STeresa Johnson } 51884174c37STeresa Johnson } 51984174c37STeresa Johnson } 52084174c37STeresa Johnson 5218570fe47STeresa Johnson /// Emit the files \p ModulePath will import from into \p OutputFilename. 522cdbcbf74SMehdi Amini std::error_code 523cdbcbf74SMehdi Amini llvm::EmitImportsFiles(StringRef ModulePath, StringRef OutputFilename, 524cdbcbf74SMehdi Amini const FunctionImporter::ImportMapTy &ModuleImports) { 5258570fe47STeresa Johnson std::error_code EC; 5268570fe47STeresa Johnson raw_fd_ostream ImportsOS(OutputFilename, EC, sys::fs::OpenFlags::F_None); 5278570fe47STeresa Johnson if (EC) 5288570fe47STeresa Johnson return EC; 529cdbcbf74SMehdi Amini for (auto &ILI : ModuleImports) 5308570fe47STeresa Johnson ImportsOS << ILI.first() << "\n"; 5318570fe47STeresa Johnson return std::error_code(); 5328570fe47STeresa Johnson } 5338570fe47STeresa Johnson 53404c9a2d6STeresa Johnson /// Fixup WeakForLinker linkages in \p TheModule based on summary analysis. 53504c9a2d6STeresa Johnson void llvm::thinLTOResolveWeakForLinkerModule( 53604c9a2d6STeresa Johnson Module &TheModule, const GVSummaryMapTy &DefinedGlobals) { 5374566c6dbSTeresa Johnson auto ConvertToDeclaration = [](GlobalValue &GV) { 5384566c6dbSTeresa Johnson DEBUG(dbgs() << "Converting to a declaration: `" << GV.getName() << "\n"); 5394566c6dbSTeresa Johnson if (Function *F = dyn_cast<Function>(&GV)) { 5404566c6dbSTeresa Johnson F->deleteBody(); 5414566c6dbSTeresa Johnson F->clearMetadata(); 5424566c6dbSTeresa Johnson } else if (GlobalVariable *V = dyn_cast<GlobalVariable>(&GV)) { 5434566c6dbSTeresa Johnson V->setInitializer(nullptr); 5444566c6dbSTeresa Johnson V->setLinkage(GlobalValue::ExternalLinkage); 5454566c6dbSTeresa Johnson V->clearMetadata(); 5464566c6dbSTeresa Johnson } else 5474566c6dbSTeresa Johnson // For now we don't resolve or drop aliases. Once we do we'll 5484566c6dbSTeresa Johnson // need to add support here for creating either a function or 5494566c6dbSTeresa Johnson // variable declaration, and return the new GlobalValue* for 5504566c6dbSTeresa Johnson // the caller to use. 5514566c6dbSTeresa Johnson assert(false && "Expected function or variable"); 5524566c6dbSTeresa Johnson }; 5534566c6dbSTeresa Johnson 55404c9a2d6STeresa Johnson auto updateLinkage = [&](GlobalValue &GV) { 55504c9a2d6STeresa Johnson if (!GlobalValue::isWeakForLinker(GV.getLinkage())) 55604c9a2d6STeresa Johnson return; 55704c9a2d6STeresa Johnson // See if the global summary analysis computed a new resolved linkage. 55804c9a2d6STeresa Johnson const auto &GS = DefinedGlobals.find(GV.getGUID()); 55904c9a2d6STeresa Johnson if (GS == DefinedGlobals.end()) 56004c9a2d6STeresa Johnson return; 56104c9a2d6STeresa Johnson auto NewLinkage = GS->second->linkage(); 56204c9a2d6STeresa Johnson if (NewLinkage == GV.getLinkage()) 56304c9a2d6STeresa Johnson return; 5644566c6dbSTeresa Johnson // Check for a non-prevailing def that has interposable linkage 5654566c6dbSTeresa Johnson // (e.g. non-odr weak or linkonce). In that case we can't simply 5664566c6dbSTeresa Johnson // convert to available_externally, since it would lose the 5674566c6dbSTeresa Johnson // interposable property and possibly get inlined. Simply drop 5684566c6dbSTeresa Johnson // the definition in that case. 5694566c6dbSTeresa Johnson if (GlobalValue::isAvailableExternallyLinkage(NewLinkage) && 5704566c6dbSTeresa Johnson GlobalValue::isInterposableLinkage(GV.getLinkage())) 5714566c6dbSTeresa Johnson ConvertToDeclaration(GV); 5724566c6dbSTeresa Johnson else { 57304c9a2d6STeresa Johnson DEBUG(dbgs() << "ODR fixing up linkage for `" << GV.getName() << "` from " 57404c9a2d6STeresa Johnson << GV.getLinkage() << " to " << NewLinkage << "\n"); 57504c9a2d6STeresa Johnson GV.setLinkage(NewLinkage); 5764566c6dbSTeresa Johnson } 5774566c6dbSTeresa Johnson // Remove declarations from comdats, including available_externally 5786107a419STeresa Johnson // as this is a declaration for the linker, and will be dropped eventually. 5796107a419STeresa Johnson // It is illegal for comdats to contain declarations. 5806107a419STeresa Johnson auto *GO = dyn_cast_or_null<GlobalObject>(&GV); 5814566c6dbSTeresa Johnson if (GO && GO->isDeclarationForLinker() && GO->hasComdat()) 5826107a419STeresa Johnson GO->setComdat(nullptr); 58304c9a2d6STeresa Johnson }; 58404c9a2d6STeresa Johnson 58504c9a2d6STeresa Johnson // Process functions and global now 58604c9a2d6STeresa Johnson for (auto &GV : TheModule) 58704c9a2d6STeresa Johnson updateLinkage(GV); 58804c9a2d6STeresa Johnson for (auto &GV : TheModule.globals()) 58904c9a2d6STeresa Johnson updateLinkage(GV); 59004c9a2d6STeresa Johnson for (auto &GV : TheModule.aliases()) 59104c9a2d6STeresa Johnson updateLinkage(GV); 59204c9a2d6STeresa Johnson } 59304c9a2d6STeresa Johnson 59404c9a2d6STeresa Johnson /// Run internalization on \p TheModule based on symmary analysis. 59504c9a2d6STeresa Johnson void llvm::thinLTOInternalizeModule(Module &TheModule, 59604c9a2d6STeresa Johnson const GVSummaryMapTy &DefinedGlobals) { 59704c9a2d6STeresa Johnson // Parse inline ASM and collect the list of symbols that are not defined in 59804c9a2d6STeresa Johnson // the current module. 59904c9a2d6STeresa Johnson StringSet<> AsmUndefinedRefs; 600863cbfbeSPeter Collingbourne ModuleSymbolTable::CollectAsmSymbols( 601*d8204472STeresa Johnson TheModule, 60204c9a2d6STeresa Johnson [&AsmUndefinedRefs](StringRef Name, object::BasicSymbolRef::Flags Flags) { 60304c9a2d6STeresa Johnson if (Flags & object::BasicSymbolRef::SF_Undefined) 60404c9a2d6STeresa Johnson AsmUndefinedRefs.insert(Name); 60504c9a2d6STeresa Johnson }); 60604c9a2d6STeresa Johnson 60704c9a2d6STeresa Johnson // Declare a callback for the internalize pass that will ask for every 60804c9a2d6STeresa Johnson // candidate GlobalValue if it can be internalized or not. 60904c9a2d6STeresa Johnson auto MustPreserveGV = [&](const GlobalValue &GV) -> bool { 61004c9a2d6STeresa Johnson // Can't be internalized if referenced in inline asm. 61104c9a2d6STeresa Johnson if (AsmUndefinedRefs.count(GV.getName())) 61204c9a2d6STeresa Johnson return true; 61304c9a2d6STeresa Johnson 61404c9a2d6STeresa Johnson // Lookup the linkage recorded in the summaries during global analysis. 61504c9a2d6STeresa Johnson const auto &GS = DefinedGlobals.find(GV.getGUID()); 61604c9a2d6STeresa Johnson GlobalValue::LinkageTypes Linkage; 61704c9a2d6STeresa Johnson if (GS == DefinedGlobals.end()) { 61804c9a2d6STeresa Johnson // Must have been promoted (possibly conservatively). Find original 61904c9a2d6STeresa Johnson // name so that we can access the correct summary and see if it can 62004c9a2d6STeresa Johnson // be internalized again. 62104c9a2d6STeresa Johnson // FIXME: Eventually we should control promotion instead of promoting 62204c9a2d6STeresa Johnson // and internalizing again. 62304c9a2d6STeresa Johnson StringRef OrigName = 62404c9a2d6STeresa Johnson ModuleSummaryIndex::getOriginalNameBeforePromote(GV.getName()); 62504c9a2d6STeresa Johnson std::string OrigId = GlobalValue::getGlobalIdentifier( 62604c9a2d6STeresa Johnson OrigName, GlobalValue::InternalLinkage, 62704c9a2d6STeresa Johnson TheModule.getSourceFileName()); 62804c9a2d6STeresa Johnson const auto &GS = DefinedGlobals.find(GlobalValue::getGUID(OrigId)); 6297ab1f692STeresa Johnson if (GS == DefinedGlobals.end()) { 6307ab1f692STeresa Johnson // Also check the original non-promoted non-globalized name. In some 6317ab1f692STeresa Johnson // cases a preempted weak value is linked in as a local copy because 6327ab1f692STeresa Johnson // it is referenced by an alias (IRLinker::linkGlobalValueProto). 6337ab1f692STeresa Johnson // In that case, since it was originally not a local value, it was 6347ab1f692STeresa Johnson // recorded in the index using the original name. 6357ab1f692STeresa Johnson // FIXME: This may not be needed once PR27866 is fixed. 6367ab1f692STeresa Johnson const auto &GS = DefinedGlobals.find(GlobalValue::getGUID(OrigName)); 63704c9a2d6STeresa Johnson assert(GS != DefinedGlobals.end()); 63804c9a2d6STeresa Johnson Linkage = GS->second->linkage(); 6397ab1f692STeresa Johnson } else { 6407ab1f692STeresa Johnson Linkage = GS->second->linkage(); 6417ab1f692STeresa Johnson } 64204c9a2d6STeresa Johnson } else 64304c9a2d6STeresa Johnson Linkage = GS->second->linkage(); 64404c9a2d6STeresa Johnson return !GlobalValue::isLocalLinkage(Linkage); 64504c9a2d6STeresa Johnson }; 64604c9a2d6STeresa Johnson 64704c9a2d6STeresa Johnson // FIXME: See if we can just internalize directly here via linkage changes 64804c9a2d6STeresa Johnson // based on the index, rather than invoking internalizeModule. 64904c9a2d6STeresa Johnson llvm::internalizeModule(TheModule, MustPreserveGV); 65004c9a2d6STeresa Johnson } 65104c9a2d6STeresa Johnson 652c8c55170SMehdi Amini // Automatically import functions in Module \p DestModule based on the summaries 653c8c55170SMehdi Amini // index. 654c8c55170SMehdi Amini // 6557f00d0a1SPeter Collingbourne Expected<bool> FunctionImporter::importFunctions( 65637e24591SPeter Collingbourne Module &DestModule, const FunctionImporter::ImportMapTy &ImportList) { 6575411d051SMehdi Amini DEBUG(dbgs() << "Starting import for Module " 658311fef6eSMehdi Amini << DestModule.getModuleIdentifier() << "\n"); 659c8c55170SMehdi Amini unsigned ImportedCount = 0; 660c8c55170SMehdi Amini 6616d8f817fSPeter Collingbourne IRMover Mover(DestModule); 6627e88d0daSMehdi Amini // Do the actual import of functions now, one Module at a time 66301e32130SMehdi Amini std::set<StringRef> ModuleNameOrderedList; 66401e32130SMehdi Amini for (auto &FunctionsToImportPerModule : ImportList) { 66501e32130SMehdi Amini ModuleNameOrderedList.insert(FunctionsToImportPerModule.first()); 66601e32130SMehdi Amini } 66701e32130SMehdi Amini for (auto &Name : ModuleNameOrderedList) { 6687e88d0daSMehdi Amini // Get the module for the import 66901e32130SMehdi Amini const auto &FunctionsToImportPerModule = ImportList.find(Name); 67001e32130SMehdi Amini assert(FunctionsToImportPerModule != ImportList.end()); 671d9445c49SPeter Collingbourne Expected<std::unique_ptr<Module>> SrcModuleOrErr = ModuleLoader(Name); 672d9445c49SPeter Collingbourne if (!SrcModuleOrErr) 673d9445c49SPeter Collingbourne return SrcModuleOrErr.takeError(); 674d9445c49SPeter Collingbourne std::unique_ptr<Module> SrcModule = std::move(*SrcModuleOrErr); 6757e88d0daSMehdi Amini assert(&DestModule.getContext() == &SrcModule->getContext() && 6767e88d0daSMehdi Amini "Context mismatch"); 6777e88d0daSMehdi Amini 6786cba37ceSTeresa Johnson // If modules were created with lazy metadata loading, materialize it 6796cba37ceSTeresa Johnson // now, before linking it (otherwise this will be a noop). 6807f00d0a1SPeter Collingbourne if (Error Err = SrcModule->materializeMetadata()) 6817f00d0a1SPeter Collingbourne return std::move(Err); 682e5a61917STeresa Johnson 68301e32130SMehdi Amini auto &ImportGUIDs = FunctionsToImportPerModule->second; 68401e32130SMehdi Amini // Find the globals to import 6856d8f817fSPeter Collingbourne SetVector<GlobalValue *> GlobalsToImport; 6861f685e01SPiotr Padlewski for (Function &F : *SrcModule) { 6871f685e01SPiotr Padlewski if (!F.hasName()) 6880beb858eSTeresa Johnson continue; 6891f685e01SPiotr Padlewski auto GUID = F.getGUID(); 6900beb858eSTeresa Johnson auto Import = ImportGUIDs.count(GUID); 691aeb1e59bSMehdi Amini DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing function " << GUID 6921f685e01SPiotr Padlewski << " " << F.getName() << " from " 693aeb1e59bSMehdi Amini << SrcModule->getSourceFileName() << "\n"); 6940beb858eSTeresa Johnson if (Import) { 6957f00d0a1SPeter Collingbourne if (Error Err = F.materialize()) 6967f00d0a1SPeter Collingbourne return std::move(Err); 6973b776128SPiotr Padlewski if (EnableImportMetadata) { 6986deaa6afSPiotr Padlewski // Add 'thinlto_src_module' metadata for statistics and debugging. 6993b776128SPiotr Padlewski F.setMetadata( 7003b776128SPiotr Padlewski "thinlto_src_module", 7013b776128SPiotr Padlewski llvm::MDNode::get( 7026deaa6afSPiotr Padlewski DestModule.getContext(), 7033b776128SPiotr Padlewski {llvm::MDString::get(DestModule.getContext(), 7046deaa6afSPiotr Padlewski SrcModule->getSourceFileName())})); 7053b776128SPiotr Padlewski } 7061f685e01SPiotr Padlewski GlobalsToImport.insert(&F); 70701e32130SMehdi Amini } 70801e32130SMehdi Amini } 7091f685e01SPiotr Padlewski for (GlobalVariable &GV : SrcModule->globals()) { 7102d28f7aaSMehdi Amini if (!GV.hasName()) 7112d28f7aaSMehdi Amini continue; 7122d28f7aaSMehdi Amini auto GUID = GV.getGUID(); 7132d28f7aaSMehdi Amini auto Import = ImportGUIDs.count(GUID); 714aeb1e59bSMehdi Amini DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing global " << GUID 715aeb1e59bSMehdi Amini << " " << GV.getName() << " from " 716aeb1e59bSMehdi Amini << SrcModule->getSourceFileName() << "\n"); 7172d28f7aaSMehdi Amini if (Import) { 7187f00d0a1SPeter Collingbourne if (Error Err = GV.materialize()) 7197f00d0a1SPeter Collingbourne return std::move(Err); 7202d28f7aaSMehdi Amini GlobalsToImport.insert(&GV); 7212d28f7aaSMehdi Amini } 7222d28f7aaSMehdi Amini } 7231f685e01SPiotr Padlewski for (GlobalAlias &GA : SrcModule->aliases()) { 7246d8f817fSPeter Collingbourne // FIXME: This should eventually be controlled entirely by the summary. 7256d8f817fSPeter Collingbourne if (FunctionImportGlobalProcessing::doImportAsDefinition( 7266d8f817fSPeter Collingbourne &GA, &GlobalsToImport)) { 7276d8f817fSPeter Collingbourne GlobalsToImport.insert(&GA); 7286d8f817fSPeter Collingbourne continue; 7296d8f817fSPeter Collingbourne } 7306d8f817fSPeter Collingbourne 7311f685e01SPiotr Padlewski if (!GA.hasName()) 73201e32130SMehdi Amini continue; 7331f685e01SPiotr Padlewski auto GUID = GA.getGUID(); 7340beb858eSTeresa Johnson auto Import = ImportGUIDs.count(GUID); 735aeb1e59bSMehdi Amini DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing alias " << GUID 7361f685e01SPiotr Padlewski << " " << GA.getName() << " from " 737aeb1e59bSMehdi Amini << SrcModule->getSourceFileName() << "\n"); 7380beb858eSTeresa Johnson if (Import) { 73901e32130SMehdi Amini // Alias can't point to "available_externally". However when we import 7409aae395fSTeresa Johnson // linkOnceODR the linkage does not change. So we import the alias 7416968ef77SMehdi Amini // and aliasee only in this case. This has been handled by 7426968ef77SMehdi Amini // computeImportForFunction() 7431f685e01SPiotr Padlewski GlobalObject *GO = GA.getBaseObject(); 7446968ef77SMehdi Amini assert(GO->hasLinkOnceODRLinkage() && 7456968ef77SMehdi Amini "Unexpected alias to a non-linkonceODR in import list"); 7462d28f7aaSMehdi Amini #ifndef NDEBUG 7472d28f7aaSMehdi Amini if (!GlobalsToImport.count(GO)) 7482d28f7aaSMehdi Amini DEBUG(dbgs() << " alias triggers importing aliasee " << GO->getGUID() 7492d28f7aaSMehdi Amini << " " << GO->getName() << " from " 7502d28f7aaSMehdi Amini << SrcModule->getSourceFileName() << "\n"); 7512d28f7aaSMehdi Amini #endif 7527f00d0a1SPeter Collingbourne if (Error Err = GO->materialize()) 7537f00d0a1SPeter Collingbourne return std::move(Err); 75401e32130SMehdi Amini GlobalsToImport.insert(GO); 7557f00d0a1SPeter Collingbourne if (Error Err = GA.materialize()) 7567f00d0a1SPeter Collingbourne return std::move(Err); 7571f685e01SPiotr Padlewski GlobalsToImport.insert(&GA); 75801e32130SMehdi Amini } 75901e32130SMehdi Amini } 76001e32130SMehdi Amini 76119ef4fadSMehdi Amini // Upgrade debug info after we're done materializing all the globals and we 76219ef4fadSMehdi Amini // have loaded all the required metadata! 76319ef4fadSMehdi Amini UpgradeDebugInfo(*SrcModule); 76419ef4fadSMehdi Amini 7657e88d0daSMehdi Amini // Link in the specified functions. 76601e32130SMehdi Amini if (renameModuleForThinLTO(*SrcModule, Index, &GlobalsToImport)) 7678d05185aSMehdi Amini return true; 7688d05185aSMehdi Amini 769d29478f7STeresa Johnson if (PrintImports) { 770d29478f7STeresa Johnson for (const auto *GV : GlobalsToImport) 771d29478f7STeresa Johnson dbgs() << DestModule.getSourceFileName() << ": Import " << GV->getName() 772d29478f7STeresa Johnson << " from " << SrcModule->getSourceFileName() << "\n"; 773d29478f7STeresa Johnson } 774d29478f7STeresa Johnson 7756d8f817fSPeter Collingbourne if (Mover.move(std::move(SrcModule), GlobalsToImport.getArrayRef(), 7766d8f817fSPeter Collingbourne [](GlobalValue &, IRMover::ValueAdder) {}, 777e6fd9ff9SPeter Collingbourne /*IsPerformingImport=*/true)) 7787e88d0daSMehdi Amini report_fatal_error("Function Import: link error"); 7797e88d0daSMehdi Amini 78001e32130SMehdi Amini ImportedCount += GlobalsToImport.size(); 7816c475a75STeresa Johnson NumImportedModules++; 7827e88d0daSMehdi Amini } 783e5a61917STeresa Johnson 7846c475a75STeresa Johnson NumImportedFunctions += ImportedCount; 785d29478f7STeresa Johnson 7867e88d0daSMehdi Amini DEBUG(dbgs() << "Imported " << ImportedCount << " functions for Module " 787c8c55170SMehdi Amini << DestModule.getModuleIdentifier() << "\n"); 788c8c55170SMehdi Amini return ImportedCount; 78942418abaSMehdi Amini } 79042418abaSMehdi Amini 79142418abaSMehdi Amini /// Summary file to use for function importing when using -function-import from 79242418abaSMehdi Amini /// the command line. 79342418abaSMehdi Amini static cl::opt<std::string> 79442418abaSMehdi Amini SummaryFile("summary-file", 79542418abaSMehdi Amini cl::desc("The summary file to use for function importing.")); 79642418abaSMehdi Amini 797598bd2a2SPeter Collingbourne static bool doImportingForModule(Module &M) { 798598bd2a2SPeter Collingbourne if (SummaryFile.empty()) 799598bd2a2SPeter Collingbourne report_fatal_error("error: -function-import requires -summary-file\n"); 8006de481a3SPeter Collingbourne Expected<std::unique_ptr<ModuleSummaryIndex>> IndexPtrOrErr = 8016de481a3SPeter Collingbourne getModuleSummaryIndexForFile(SummaryFile); 8026de481a3SPeter Collingbourne if (!IndexPtrOrErr) { 8036de481a3SPeter Collingbourne logAllUnhandledErrors(IndexPtrOrErr.takeError(), errs(), 8046de481a3SPeter Collingbourne "Error loading file '" + SummaryFile + "': "); 80542418abaSMehdi Amini return false; 80642418abaSMehdi Amini } 807598bd2a2SPeter Collingbourne std::unique_ptr<ModuleSummaryIndex> Index = std::move(*IndexPtrOrErr); 80842418abaSMehdi Amini 809c86af334STeresa Johnson // First step is collecting the import list. 810c86af334STeresa Johnson FunctionImporter::ImportMapTy ImportList; 811c86af334STeresa Johnson ComputeCrossModuleImportForModule(M.getModuleIdentifier(), *Index, 812c86af334STeresa Johnson ImportList); 81301e32130SMehdi Amini 8144fef68cbSTeresa Johnson // Conservatively mark all internal values as promoted. This interface is 8154fef68cbSTeresa Johnson // only used when doing importing via the function importing pass. The pass 8164fef68cbSTeresa Johnson // is only enabled when testing importing via the 'opt' tool, which does 8174fef68cbSTeresa Johnson // not do the ThinLink that would normally determine what values to promote. 8184fef68cbSTeresa Johnson for (auto &I : *Index) { 8194fef68cbSTeresa Johnson for (auto &S : I.second) { 8204fef68cbSTeresa Johnson if (GlobalValue::isLocalLinkage(S->linkage())) 8214fef68cbSTeresa Johnson S->setLinkage(GlobalValue::ExternalLinkage); 8224fef68cbSTeresa Johnson } 8234fef68cbSTeresa Johnson } 8244fef68cbSTeresa Johnson 82501e32130SMehdi Amini // Next we need to promote to global scope and rename any local values that 8261b00f2d9STeresa Johnson // are potentially exported to other modules. 82701e32130SMehdi Amini if (renameModuleForThinLTO(M, *Index, nullptr)) { 8281b00f2d9STeresa Johnson errs() << "Error renaming module\n"; 8291b00f2d9STeresa Johnson return false; 8301b00f2d9STeresa Johnson } 8311b00f2d9STeresa Johnson 83242418abaSMehdi Amini // Perform the import now. 833d16c8065SMehdi Amini auto ModuleLoader = [&M](StringRef Identifier) { 834d16c8065SMehdi Amini return loadFile(Identifier, M.getContext()); 835d16c8065SMehdi Amini }; 8369d2bfc48SRafael Espindola FunctionImporter Importer(*Index, ModuleLoader); 83737e24591SPeter Collingbourne Expected<bool> Result = Importer.importFunctions(M, ImportList); 8387f00d0a1SPeter Collingbourne 8397f00d0a1SPeter Collingbourne // FIXME: Probably need to propagate Errors through the pass manager. 8407f00d0a1SPeter Collingbourne if (!Result) { 8417f00d0a1SPeter Collingbourne logAllUnhandledErrors(Result.takeError(), errs(), 8427f00d0a1SPeter Collingbourne "Error importing module: "); 8437f00d0a1SPeter Collingbourne return false; 8447f00d0a1SPeter Collingbourne } 8457f00d0a1SPeter Collingbourne 8467f00d0a1SPeter Collingbourne return *Result; 84721241571STeresa Johnson } 84821241571STeresa Johnson 84921241571STeresa Johnson namespace { 85021241571STeresa Johnson /// Pass that performs cross-module function import provided a summary file. 85121241571STeresa Johnson class FunctionImportLegacyPass : public ModulePass { 85221241571STeresa Johnson public: 85321241571STeresa Johnson /// Pass identification, replacement for typeid 85421241571STeresa Johnson static char ID; 85521241571STeresa Johnson 85621241571STeresa Johnson /// Specify pass name for debug output 857117296c0SMehdi Amini StringRef getPassName() const override { return "Function Importing"; } 85821241571STeresa Johnson 859598bd2a2SPeter Collingbourne explicit FunctionImportLegacyPass() : ModulePass(ID) {} 86021241571STeresa Johnson 86121241571STeresa Johnson bool runOnModule(Module &M) override { 86221241571STeresa Johnson if (skipModule(M)) 86321241571STeresa Johnson return false; 86421241571STeresa Johnson 865598bd2a2SPeter Collingbourne return doImportingForModule(M); 86642418abaSMehdi Amini } 86742418abaSMehdi Amini }; 868fe2b5415SBenjamin Kramer } // anonymous namespace 86942418abaSMehdi Amini 87021241571STeresa Johnson PreservedAnalyses FunctionImportPass::run(Module &M, 871fd03ac6aSSean Silva ModuleAnalysisManager &AM) { 872598bd2a2SPeter Collingbourne if (!doImportingForModule(M)) 87321241571STeresa Johnson return PreservedAnalyses::all(); 87421241571STeresa Johnson 87521241571STeresa Johnson return PreservedAnalyses::none(); 87621241571STeresa Johnson } 87721241571STeresa Johnson 87821241571STeresa Johnson char FunctionImportLegacyPass::ID = 0; 87921241571STeresa Johnson INITIALIZE_PASS(FunctionImportLegacyPass, "function-import", 88042418abaSMehdi Amini "Summary Based Function Import", false, false) 88142418abaSMehdi Amini 88242418abaSMehdi Amini namespace llvm { 883598bd2a2SPeter Collingbourne Pass *createFunctionImportPass() { 884598bd2a2SPeter Collingbourne return new FunctionImportLegacyPass(); 8855fcbdb71STeresa Johnson } 88642418abaSMehdi Amini } 887