1384ca190SMehdi Amini //===- ModuleSummaryAnalysis.cpp - Module summary index builder -----------===// 2384ca190SMehdi Amini // 3384ca190SMehdi Amini // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4384ca190SMehdi Amini // See https://llvm.org/LICENSE.txt for license information. 5384ca190SMehdi Amini // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6384ca190SMehdi Amini // 7384ca190SMehdi Amini //===----------------------------------------------------------------------===// 8384ca190SMehdi Amini // 9384ca190SMehdi Amini // This pass builds a ModuleSummaryIndex object for the module, to be written 10384ca190SMehdi Amini // to bitcode or LLVM assembly. 11384ca190SMehdi Amini // 12384ca190SMehdi Amini //===----------------------------------------------------------------------===// 13384ca190SMehdi Amini 14384ca190SMehdi Amini #include "llvm/Analysis/ModuleSummaryAnalysis.h" 15384ca190SMehdi Amini #include "llvm/ADT/ArrayRef.h" 16384ca190SMehdi Amini #include "llvm/ADT/DenseSet.h" 17384ca190SMehdi Amini #include "llvm/ADT/MapVector.h" 18384ca190SMehdi Amini #include "llvm/ADT/STLExtras.h" 19384ca190SMehdi Amini #include "llvm/ADT/SetVector.h" 20384ca190SMehdi Amini #include "llvm/ADT/SmallPtrSet.h" 21384ca190SMehdi Amini #include "llvm/ADT/SmallVector.h" 22384ca190SMehdi Amini #include "llvm/ADT/StringRef.h" 23384ca190SMehdi Amini #include "llvm/Analysis/BlockFrequencyInfo.h" 24384ca190SMehdi Amini #include "llvm/Analysis/BranchProbabilityInfo.h" 25384ca190SMehdi Amini #include "llvm/Analysis/IndirectCallPromotionAnalysis.h" 26384ca190SMehdi Amini #include "llvm/Analysis/LoopInfo.h" 27384ca190SMehdi Amini #include "llvm/Analysis/ProfileSummaryInfo.h" 284666953cSVitaly Buka #include "llvm/Analysis/StackSafetyAnalysis.h" 29384ca190SMehdi Amini #include "llvm/Analysis/TypeMetadataUtils.h" 30384ca190SMehdi Amini #include "llvm/IR/Attributes.h" 31384ca190SMehdi Amini #include "llvm/IR/BasicBlock.h" 32384ca190SMehdi Amini #include "llvm/IR/Constant.h" 33384ca190SMehdi Amini #include "llvm/IR/Constants.h" 34384ca190SMehdi Amini #include "llvm/IR/Dominators.h" 35384ca190SMehdi Amini #include "llvm/IR/Function.h" 36384ca190SMehdi Amini #include "llvm/IR/GlobalAlias.h" 37384ca190SMehdi Amini #include "llvm/IR/GlobalValue.h" 38384ca190SMehdi Amini #include "llvm/IR/GlobalVariable.h" 39384ca190SMehdi Amini #include "llvm/IR/Instructions.h" 40384ca190SMehdi Amini #include "llvm/IR/IntrinsicInst.h" 41384ca190SMehdi Amini #include "llvm/IR/Intrinsics.h" 42384ca190SMehdi Amini #include "llvm/IR/Metadata.h" 43384ca190SMehdi Amini #include "llvm/IR/Module.h" 44384ca190SMehdi Amini #include "llvm/IR/ModuleSummaryIndex.h" 45384ca190SMehdi Amini #include "llvm/IR/Use.h" 46384ca190SMehdi Amini #include "llvm/IR/User.h" 47384ca190SMehdi Amini #include "llvm/InitializePasses.h" 48384ca190SMehdi Amini #include "llvm/Object/ModuleSymbolTable.h" 49384ca190SMehdi Amini #include "llvm/Object/SymbolicFile.h" 50384ca190SMehdi Amini #include "llvm/Pass.h" 51384ca190SMehdi Amini #include "llvm/Support/Casting.h" 52384ca190SMehdi Amini #include "llvm/Support/CommandLine.h" 53ba7a92c0SNico Weber #include "llvm/Support/FileSystem.h" 54384ca190SMehdi Amini #include <algorithm> 55384ca190SMehdi Amini #include <cassert> 56384ca190SMehdi Amini #include <cstdint> 57384ca190SMehdi Amini #include <vector> 58384ca190SMehdi Amini 59384ca190SMehdi Amini using namespace llvm; 60384ca190SMehdi Amini 61384ca190SMehdi Amini #define DEBUG_TYPE "module-summary-analysis" 62384ca190SMehdi Amini 63384ca190SMehdi Amini // Option to force edges cold which will block importing when the 64384ca190SMehdi Amini // -import-cold-multiplier is set to 0. Useful for debugging. 65384ca190SMehdi Amini FunctionSummary::ForceSummaryHotnessType ForceSummaryEdgesCold = 66384ca190SMehdi Amini FunctionSummary::FSHT_None; 67384ca190SMehdi Amini cl::opt<FunctionSummary::ForceSummaryHotnessType, true> FSEC( 68384ca190SMehdi Amini "force-summary-edges-cold", cl::Hidden, cl::location(ForceSummaryEdgesCold), 69384ca190SMehdi Amini cl::desc("Force all edges in the function summary to cold"), 70384ca190SMehdi Amini cl::values(clEnumValN(FunctionSummary::FSHT_None, "none", "None."), 71384ca190SMehdi Amini clEnumValN(FunctionSummary::FSHT_AllNonCritical, 72384ca190SMehdi Amini "all-non-critical", "All non-critical edges."), 73384ca190SMehdi Amini clEnumValN(FunctionSummary::FSHT_All, "all", "All edges."))); 74384ca190SMehdi Amini 75384ca190SMehdi Amini cl::opt<std::string> ModuleSummaryDotFile( 76384ca190SMehdi Amini "module-summary-dot-file", cl::init(""), cl::Hidden, 77384ca190SMehdi Amini cl::value_desc("filename"), 78384ca190SMehdi Amini cl::desc("File to emit dot graph of new summary into.")); 79384ca190SMehdi Amini 80384ca190SMehdi Amini // Walk through the operands of a given User via worklist iteration and populate 81384ca190SMehdi Amini // the set of GlobalValue references encountered. Invoked either on an 82384ca190SMehdi Amini // Instruction or a GlobalVariable (which walks its initializer). 83384ca190SMehdi Amini // Return true if any of the operands contains blockaddress. This is important 84384ca190SMehdi Amini // to know when computing summary for global var, because if global variable 85384ca190SMehdi Amini // references basic block address we can't import it separately from function 86384ca190SMehdi Amini // containing that basic block. For simplicity we currently don't import such 87384ca190SMehdi Amini // global vars at all. When importing function we aren't interested if any 88384ca190SMehdi Amini // instruction in it takes an address of any basic block, because instruction 89384ca190SMehdi Amini // can only take an address of basic block located in the same function. 90384ca190SMehdi Amini static bool findRefEdges(ModuleSummaryIndex &Index, const User *CurUser, 91384ca190SMehdi Amini SetVector<ValueInfo> &RefEdges, 92384ca190SMehdi Amini SmallPtrSet<const User *, 8> &Visited) { 93384ca190SMehdi Amini bool HasBlockAddress = false; 94384ca190SMehdi Amini SmallVector<const User *, 32> Worklist; 95e6a10446SFangrui Song if (Visited.insert(CurUser).second) 96384ca190SMehdi Amini Worklist.push_back(CurUser); 97384ca190SMehdi Amini 98384ca190SMehdi Amini while (!Worklist.empty()) { 99384ca190SMehdi Amini const User *U = Worklist.pop_back_val(); 100cea6f4d5SMircea Trofin const auto *CB = dyn_cast<CallBase>(U); 101384ca190SMehdi Amini 102384ca190SMehdi Amini for (const auto &OI : U->operands()) { 103384ca190SMehdi Amini const User *Operand = dyn_cast<User>(OI); 104384ca190SMehdi Amini if (!Operand) 105384ca190SMehdi Amini continue; 106384ca190SMehdi Amini if (isa<BlockAddress>(Operand)) { 107384ca190SMehdi Amini HasBlockAddress = true; 108384ca190SMehdi Amini continue; 109384ca190SMehdi Amini } 110384ca190SMehdi Amini if (auto *GV = dyn_cast<GlobalValue>(Operand)) { 111384ca190SMehdi Amini // We have a reference to a global value. This should be added to 112384ca190SMehdi Amini // the reference set unless it is a callee. Callees are handled 113384ca190SMehdi Amini // specially by WriteFunction and are added to a separate list. 114cea6f4d5SMircea Trofin if (!(CB && CB->isCallee(&OI))) 115384ca190SMehdi Amini RefEdges.insert(Index.getOrInsertValueInfo(GV)); 116384ca190SMehdi Amini continue; 117384ca190SMehdi Amini } 118e6a10446SFangrui Song if (Visited.insert(Operand).second) 119384ca190SMehdi Amini Worklist.push_back(Operand); 120384ca190SMehdi Amini } 121384ca190SMehdi Amini } 122384ca190SMehdi Amini return HasBlockAddress; 123384ca190SMehdi Amini } 124384ca190SMehdi Amini 125384ca190SMehdi Amini static CalleeInfo::HotnessType getHotness(uint64_t ProfileCount, 126384ca190SMehdi Amini ProfileSummaryInfo *PSI) { 127384ca190SMehdi Amini if (!PSI) 128384ca190SMehdi Amini return CalleeInfo::HotnessType::Unknown; 129384ca190SMehdi Amini if (PSI->isHotCount(ProfileCount)) 130384ca190SMehdi Amini return CalleeInfo::HotnessType::Hot; 131384ca190SMehdi Amini if (PSI->isColdCount(ProfileCount)) 132384ca190SMehdi Amini return CalleeInfo::HotnessType::Cold; 133384ca190SMehdi Amini return CalleeInfo::HotnessType::None; 134384ca190SMehdi Amini } 135384ca190SMehdi Amini 136384ca190SMehdi Amini static bool isNonRenamableLocal(const GlobalValue &GV) { 137384ca190SMehdi Amini return GV.hasSection() && GV.hasLocalLinkage(); 138384ca190SMehdi Amini } 139384ca190SMehdi Amini 140384ca190SMehdi Amini /// Determine whether this call has all constant integer arguments (excluding 141384ca190SMehdi Amini /// "this") and summarize it to VCalls or ConstVCalls as appropriate. 142384ca190SMehdi Amini static void addVCallToSet(DevirtCallSite Call, GlobalValue::GUID Guid, 143384ca190SMehdi Amini SetVector<FunctionSummary::VFuncId> &VCalls, 144384ca190SMehdi Amini SetVector<FunctionSummary::ConstVCall> &ConstVCalls) { 145384ca190SMehdi Amini std::vector<uint64_t> Args; 146384ca190SMehdi Amini // Start from the second argument to skip the "this" pointer. 14723b0ab2aSKazu Hirata for (auto &Arg : drop_begin(Call.CB.args())) { 148384ca190SMehdi Amini auto *CI = dyn_cast<ConstantInt>(Arg); 149384ca190SMehdi Amini if (!CI || CI->getBitWidth() > 64) { 150384ca190SMehdi Amini VCalls.insert({Guid, Call.Offset}); 151384ca190SMehdi Amini return; 152384ca190SMehdi Amini } 153384ca190SMehdi Amini Args.push_back(CI->getZExtValue()); 154384ca190SMehdi Amini } 155384ca190SMehdi Amini ConstVCalls.insert({{Guid, Call.Offset}, std::move(Args)}); 156384ca190SMehdi Amini } 157384ca190SMehdi Amini 158384ca190SMehdi Amini /// If this intrinsic call requires that we add information to the function 159384ca190SMehdi Amini /// summary, do so via the non-constant reference arguments. 160384ca190SMehdi Amini static void addIntrinsicToSummary( 161384ca190SMehdi Amini const CallInst *CI, SetVector<GlobalValue::GUID> &TypeTests, 162384ca190SMehdi Amini SetVector<FunctionSummary::VFuncId> &TypeTestAssumeVCalls, 163384ca190SMehdi Amini SetVector<FunctionSummary::VFuncId> &TypeCheckedLoadVCalls, 164384ca190SMehdi Amini SetVector<FunctionSummary::ConstVCall> &TypeTestAssumeConstVCalls, 165384ca190SMehdi Amini SetVector<FunctionSummary::ConstVCall> &TypeCheckedLoadConstVCalls, 166384ca190SMehdi Amini DominatorTree &DT) { 167384ca190SMehdi Amini switch (CI->getCalledFunction()->getIntrinsicID()) { 168384ca190SMehdi Amini case Intrinsic::type_test: { 169384ca190SMehdi Amini auto *TypeMDVal = cast<MetadataAsValue>(CI->getArgOperand(1)); 170384ca190SMehdi Amini auto *TypeId = dyn_cast<MDString>(TypeMDVal->getMetadata()); 171384ca190SMehdi Amini if (!TypeId) 172384ca190SMehdi Amini break; 173384ca190SMehdi Amini GlobalValue::GUID Guid = GlobalValue::getGUID(TypeId->getString()); 174384ca190SMehdi Amini 175384ca190SMehdi Amini // Produce a summary from type.test intrinsics. We only summarize type.test 176384ca190SMehdi Amini // intrinsics that are used other than by an llvm.assume intrinsic. 177384ca190SMehdi Amini // Intrinsics that are assumed are relevant only to the devirtualization 178384ca190SMehdi Amini // pass, not the type test lowering pass. 179384ca190SMehdi Amini bool HasNonAssumeUses = llvm::any_of(CI->uses(), [](const Use &CIU) { 180908215b3SPhilip Reames return !isa<AssumeInst>(CIU.getUser()); 181384ca190SMehdi Amini }); 182384ca190SMehdi Amini if (HasNonAssumeUses) 183384ca190SMehdi Amini TypeTests.insert(Guid); 184384ca190SMehdi Amini 185384ca190SMehdi Amini SmallVector<DevirtCallSite, 4> DevirtCalls; 186384ca190SMehdi Amini SmallVector<CallInst *, 4> Assumes; 187384ca190SMehdi Amini findDevirtualizableCallsForTypeTest(DevirtCalls, Assumes, CI, DT); 188384ca190SMehdi Amini for (auto &Call : DevirtCalls) 189384ca190SMehdi Amini addVCallToSet(Call, Guid, TypeTestAssumeVCalls, 190384ca190SMehdi Amini TypeTestAssumeConstVCalls); 191384ca190SMehdi Amini 192384ca190SMehdi Amini break; 193384ca190SMehdi Amini } 194384ca190SMehdi Amini 195384ca190SMehdi Amini case Intrinsic::type_checked_load: { 196384ca190SMehdi Amini auto *TypeMDVal = cast<MetadataAsValue>(CI->getArgOperand(2)); 197384ca190SMehdi Amini auto *TypeId = dyn_cast<MDString>(TypeMDVal->getMetadata()); 198384ca190SMehdi Amini if (!TypeId) 199384ca190SMehdi Amini break; 200384ca190SMehdi Amini GlobalValue::GUID Guid = GlobalValue::getGUID(TypeId->getString()); 201384ca190SMehdi Amini 202384ca190SMehdi Amini SmallVector<DevirtCallSite, 4> DevirtCalls; 203384ca190SMehdi Amini SmallVector<Instruction *, 4> LoadedPtrs; 204384ca190SMehdi Amini SmallVector<Instruction *, 4> Preds; 205384ca190SMehdi Amini bool HasNonCallUses = false; 206384ca190SMehdi Amini findDevirtualizableCallsForTypeCheckedLoad(DevirtCalls, LoadedPtrs, Preds, 207384ca190SMehdi Amini HasNonCallUses, CI, DT); 208384ca190SMehdi Amini // Any non-call uses of the result of llvm.type.checked.load will 209384ca190SMehdi Amini // prevent us from optimizing away the llvm.type.test. 210384ca190SMehdi Amini if (HasNonCallUses) 211384ca190SMehdi Amini TypeTests.insert(Guid); 212384ca190SMehdi Amini for (auto &Call : DevirtCalls) 213384ca190SMehdi Amini addVCallToSet(Call, Guid, TypeCheckedLoadVCalls, 214384ca190SMehdi Amini TypeCheckedLoadConstVCalls); 215384ca190SMehdi Amini 216384ca190SMehdi Amini break; 217384ca190SMehdi Amini } 218384ca190SMehdi Amini default: 219384ca190SMehdi Amini break; 220384ca190SMehdi Amini } 221384ca190SMehdi Amini } 222384ca190SMehdi Amini 223384ca190SMehdi Amini static bool isNonVolatileLoad(const Instruction *I) { 224384ca190SMehdi Amini if (const auto *LI = dyn_cast<LoadInst>(I)) 225384ca190SMehdi Amini return !LI->isVolatile(); 226384ca190SMehdi Amini 227384ca190SMehdi Amini return false; 228384ca190SMehdi Amini } 229384ca190SMehdi Amini 230384ca190SMehdi Amini static bool isNonVolatileStore(const Instruction *I) { 231384ca190SMehdi Amini if (const auto *SI = dyn_cast<StoreInst>(I)) 232384ca190SMehdi Amini return !SI->isVolatile(); 233384ca190SMehdi Amini 234384ca190SMehdi Amini return false; 235384ca190SMehdi Amini } 236384ca190SMehdi Amini 237*cf9e61a9SFangrui Song // Returns true if the function definition must be unreachable. 23809a704c5SMingming Liu // 23909a704c5SMingming Liu // Note if this helper function returns true, `F` is guaranteed 24009a704c5SMingming Liu // to be unreachable; if it returns false, `F` might still 24109a704c5SMingming Liu // be unreachable but not covered by this helper function. 24209a704c5SMingming Liu static bool mustBeUnreachableFunction(const Function &F) { 243*cf9e61a9SFangrui Song // A function must be unreachable if its entry block ends with an 244*cf9e61a9SFangrui Song // 'unreachable'. 245*cf9e61a9SFangrui Song assert(!F.isDeclaration()); 246*cf9e61a9SFangrui Song return isa<UnreachableInst>(F.getEntryBlock().getTerminator()); 24709a704c5SMingming Liu } 24809a704c5SMingming Liu 2494666953cSVitaly Buka static void computeFunctionSummary( 2504666953cSVitaly Buka ModuleSummaryIndex &Index, const Module &M, const Function &F, 2514666953cSVitaly Buka BlockFrequencyInfo *BFI, ProfileSummaryInfo *PSI, DominatorTree &DT, 2524666953cSVitaly Buka bool HasLocalsInUsedOrAsm, DenseSet<GlobalValue::GUID> &CantBePromoted, 2534666953cSVitaly Buka bool IsThinLTO, 2544666953cSVitaly Buka std::function<const StackSafetyInfo *(const Function &F)> GetSSICallback) { 255384ca190SMehdi Amini // Summary not currently supported for anonymous functions, they should 256384ca190SMehdi Amini // have been named. 257384ca190SMehdi Amini assert(F.hasName()); 258384ca190SMehdi Amini 259384ca190SMehdi Amini unsigned NumInsts = 0; 260384ca190SMehdi Amini // Map from callee ValueId to profile count. Used to accumulate profile 261384ca190SMehdi Amini // counts for all static calls to a given callee. 262384ca190SMehdi Amini MapVector<ValueInfo, CalleeInfo> CallGraphEdges; 263384ca190SMehdi Amini SetVector<ValueInfo> RefEdges, LoadRefEdges, StoreRefEdges; 264384ca190SMehdi Amini SetVector<GlobalValue::GUID> TypeTests; 265384ca190SMehdi Amini SetVector<FunctionSummary::VFuncId> TypeTestAssumeVCalls, 266384ca190SMehdi Amini TypeCheckedLoadVCalls; 267384ca190SMehdi Amini SetVector<FunctionSummary::ConstVCall> TypeTestAssumeConstVCalls, 268384ca190SMehdi Amini TypeCheckedLoadConstVCalls; 269384ca190SMehdi Amini ICallPromotionAnalysis ICallAnalysis; 270384ca190SMehdi Amini SmallPtrSet<const User *, 8> Visited; 271384ca190SMehdi Amini 272384ca190SMehdi Amini // Add personality function, prefix data and prologue data to function's ref 273384ca190SMehdi Amini // list. 274384ca190SMehdi Amini findRefEdges(Index, &F, RefEdges, Visited); 275384ca190SMehdi Amini std::vector<const Instruction *> NonVolatileLoads; 276384ca190SMehdi Amini std::vector<const Instruction *> NonVolatileStores; 277384ca190SMehdi Amini 278384ca190SMehdi Amini bool HasInlineAsmMaybeReferencingInternal = false; 2791a8087adSWenlei He bool HasIndirBranchToBlockAddress = false; 28020faf789Smodimo bool HasUnknownCall = false; 28120faf789Smodimo bool MayThrow = false; 2821a8087adSWenlei He for (const BasicBlock &BB : F) { 2831a8087adSWenlei He // We don't allow inlining of function with indirect branch to blockaddress. 2841a8087adSWenlei He // If the blockaddress escapes the function, e.g., via a global variable, 2851a8087adSWenlei He // inlining may lead to an invalid cross-function reference. So we shouldn't 2861a8087adSWenlei He // import such function either. 2871a8087adSWenlei He if (BB.hasAddressTaken()) { 2881a8087adSWenlei He for (User *U : BlockAddress::get(const_cast<BasicBlock *>(&BB))->users()) 2891a8087adSWenlei He if (!isa<CallBrInst>(*U)) { 2901a8087adSWenlei He HasIndirBranchToBlockAddress = true; 2911a8087adSWenlei He break; 2921a8087adSWenlei He } 2931a8087adSWenlei He } 2941a8087adSWenlei He 295384ca190SMehdi Amini for (const Instruction &I : BB) { 296c5fafc1eSHongtao Yu if (I.isDebugOrPseudoInst()) 297384ca190SMehdi Amini continue; 298384ca190SMehdi Amini ++NumInsts; 29920faf789Smodimo 300384ca190SMehdi Amini // Regular LTO module doesn't participate in ThinLTO import, 301384ca190SMehdi Amini // so no reference from it can be read/writeonly, since this 302384ca190SMehdi Amini // would require importing variable as local copy 303384ca190SMehdi Amini if (IsThinLTO) { 304384ca190SMehdi Amini if (isNonVolatileLoad(&I)) { 305384ca190SMehdi Amini // Postpone processing of non-volatile load instructions 306384ca190SMehdi Amini // See comments below 307384ca190SMehdi Amini Visited.insert(&I); 308384ca190SMehdi Amini NonVolatileLoads.push_back(&I); 309384ca190SMehdi Amini continue; 310384ca190SMehdi Amini } else if (isNonVolatileStore(&I)) { 311384ca190SMehdi Amini Visited.insert(&I); 312384ca190SMehdi Amini NonVolatileStores.push_back(&I); 313384ca190SMehdi Amini // All references from second operand of store (destination address) 314384ca190SMehdi Amini // can be considered write-only if they're not referenced by any 315384ca190SMehdi Amini // non-store instruction. References from first operand of store 316384ca190SMehdi Amini // (stored value) can't be treated either as read- or as write-only 317384ca190SMehdi Amini // so we add them to RefEdges as we do with all other instructions 318384ca190SMehdi Amini // except non-volatile load. 319384ca190SMehdi Amini Value *Stored = I.getOperand(0); 320384ca190SMehdi Amini if (auto *GV = dyn_cast<GlobalValue>(Stored)) 321384ca190SMehdi Amini // findRefEdges will try to examine GV operands, so instead 322384ca190SMehdi Amini // of calling it we should add GV to RefEdges directly. 323384ca190SMehdi Amini RefEdges.insert(Index.getOrInsertValueInfo(GV)); 324384ca190SMehdi Amini else if (auto *U = dyn_cast<User>(Stored)) 325384ca190SMehdi Amini findRefEdges(Index, U, RefEdges, Visited); 326384ca190SMehdi Amini continue; 327384ca190SMehdi Amini } 328384ca190SMehdi Amini } 329384ca190SMehdi Amini findRefEdges(Index, &I, RefEdges, Visited); 330cea6f4d5SMircea Trofin const auto *CB = dyn_cast<CallBase>(&I); 33120faf789Smodimo if (!CB) { 33220faf789Smodimo if (I.mayThrow()) 33320faf789Smodimo MayThrow = true; 334384ca190SMehdi Amini continue; 33520faf789Smodimo } 336384ca190SMehdi Amini 337384ca190SMehdi Amini const auto *CI = dyn_cast<CallInst>(&I); 338384ca190SMehdi Amini // Since we don't know exactly which local values are referenced in inline 339384ca190SMehdi Amini // assembly, conservatively mark the function as possibly referencing 340384ca190SMehdi Amini // a local value from inline assembly to ensure we don't export a 341384ca190SMehdi Amini // reference (which would require renaming and promotion of the 342384ca190SMehdi Amini // referenced value). 343384ca190SMehdi Amini if (HasLocalsInUsedOrAsm && CI && CI->isInlineAsm()) 344384ca190SMehdi Amini HasInlineAsmMaybeReferencingInternal = true; 345384ca190SMehdi Amini 346a58b62b4SCraig Topper auto *CalledValue = CB->getCalledOperand(); 347cea6f4d5SMircea Trofin auto *CalledFunction = CB->getCalledFunction(); 348384ca190SMehdi Amini if (CalledValue && !CalledFunction) { 349384ca190SMehdi Amini CalledValue = CalledValue->stripPointerCasts(); 350384ca190SMehdi Amini // Stripping pointer casts can reveal a called function. 351384ca190SMehdi Amini CalledFunction = dyn_cast<Function>(CalledValue); 352384ca190SMehdi Amini } 353384ca190SMehdi Amini // Check if this is an alias to a function. If so, get the 354384ca190SMehdi Amini // called aliasee for the checks below. 355384ca190SMehdi Amini if (auto *GA = dyn_cast<GlobalAlias>(CalledValue)) { 356384ca190SMehdi Amini assert(!CalledFunction && "Expected null called function in callsite for alias"); 35740ec1c0fSItay Bookstein CalledFunction = dyn_cast<Function>(GA->getAliaseeObject()); 358384ca190SMehdi Amini } 359384ca190SMehdi Amini // Check if this is a direct call to a known function or a known 360384ca190SMehdi Amini // intrinsic, or an indirect call with profile data. 361384ca190SMehdi Amini if (CalledFunction) { 362384ca190SMehdi Amini if (CI && CalledFunction->isIntrinsic()) { 363384ca190SMehdi Amini addIntrinsicToSummary( 364384ca190SMehdi Amini CI, TypeTests, TypeTestAssumeVCalls, TypeCheckedLoadVCalls, 365384ca190SMehdi Amini TypeTestAssumeConstVCalls, TypeCheckedLoadConstVCalls, DT); 366384ca190SMehdi Amini continue; 367384ca190SMehdi Amini } 368384ca190SMehdi Amini // We should have named any anonymous globals 369384ca190SMehdi Amini assert(CalledFunction->hasName()); 370cb56e9b9SMircea Trofin auto ScaledCount = PSI->getProfileCount(*CB, BFI); 371384ca190SMehdi Amini auto Hotness = ScaledCount ? getHotness(ScaledCount.getValue(), PSI) 372384ca190SMehdi Amini : CalleeInfo::HotnessType::Unknown; 373384ca190SMehdi Amini if (ForceSummaryEdgesCold != FunctionSummary::FSHT_None) 374384ca190SMehdi Amini Hotness = CalleeInfo::HotnessType::Cold; 375384ca190SMehdi Amini 376384ca190SMehdi Amini // Use the original CalledValue, in case it was an alias. We want 377384ca190SMehdi Amini // to record the call edge to the alias in that case. Eventually 378384ca190SMehdi Amini // an alias summary will be created to associate the alias and 379384ca190SMehdi Amini // aliasee. 380384ca190SMehdi Amini auto &ValueInfo = CallGraphEdges[Index.getOrInsertValueInfo( 381384ca190SMehdi Amini cast<GlobalValue>(CalledValue))]; 382384ca190SMehdi Amini ValueInfo.updateHotness(Hotness); 383384ca190SMehdi Amini // Add the relative block frequency to CalleeInfo if there is no profile 384384ca190SMehdi Amini // information. 385384ca190SMehdi Amini if (BFI != nullptr && Hotness == CalleeInfo::HotnessType::Unknown) { 386384ca190SMehdi Amini uint64_t BBFreq = BFI->getBlockFreq(&BB).getFrequency(); 387384ca190SMehdi Amini uint64_t EntryFreq = BFI->getEntryFreq(); 388384ca190SMehdi Amini ValueInfo.updateRelBlockFreq(BBFreq, EntryFreq); 389384ca190SMehdi Amini } 390384ca190SMehdi Amini } else { 39120faf789Smodimo HasUnknownCall = true; 392384ca190SMehdi Amini // Skip inline assembly calls. 393384ca190SMehdi Amini if (CI && CI->isInlineAsm()) 394384ca190SMehdi Amini continue; 395384ca190SMehdi Amini // Skip direct calls. 396384ca190SMehdi Amini if (!CalledValue || isa<Constant>(CalledValue)) 397384ca190SMehdi Amini continue; 398384ca190SMehdi Amini 399384ca190SMehdi Amini // Check if the instruction has a callees metadata. If so, add callees 400384ca190SMehdi Amini // to CallGraphEdges to reflect the references from the metadata, and 401384ca190SMehdi Amini // to enable importing for subsequent indirect call promotion and 402384ca190SMehdi Amini // inlining. 403384ca190SMehdi Amini if (auto *MD = I.getMetadata(LLVMContext::MD_callees)) { 404384ca190SMehdi Amini for (auto &Op : MD->operands()) { 405384ca190SMehdi Amini Function *Callee = mdconst::extract_or_null<Function>(Op); 406384ca190SMehdi Amini if (Callee) 407384ca190SMehdi Amini CallGraphEdges[Index.getOrInsertValueInfo(Callee)]; 408384ca190SMehdi Amini } 409384ca190SMehdi Amini } 410384ca190SMehdi Amini 411384ca190SMehdi Amini uint32_t NumVals, NumCandidates; 412384ca190SMehdi Amini uint64_t TotalCount; 413384ca190SMehdi Amini auto CandidateProfileData = 414384ca190SMehdi Amini ICallAnalysis.getPromotionCandidatesForInstruction( 415384ca190SMehdi Amini &I, NumVals, TotalCount, NumCandidates); 416384ca190SMehdi Amini for (auto &Candidate : CandidateProfileData) 417384ca190SMehdi Amini CallGraphEdges[Index.getOrInsertValueInfo(Candidate.Value)] 418384ca190SMehdi Amini .updateHotness(getHotness(Candidate.Count, PSI)); 419384ca190SMehdi Amini } 420384ca190SMehdi Amini } 4211a8087adSWenlei He } 422a7fa35a6SHiroshi Yamauchi Index.addBlockCount(F.size()); 423384ca190SMehdi Amini 424384ca190SMehdi Amini std::vector<ValueInfo> Refs; 425384ca190SMehdi Amini if (IsThinLTO) { 426384ca190SMehdi Amini auto AddRefEdges = [&](const std::vector<const Instruction *> &Instrs, 427384ca190SMehdi Amini SetVector<ValueInfo> &Edges, 428384ca190SMehdi Amini SmallPtrSet<const User *, 8> &Cache) { 429384ca190SMehdi Amini for (const auto *I : Instrs) { 430384ca190SMehdi Amini Cache.erase(I); 431384ca190SMehdi Amini findRefEdges(Index, I, Edges, Cache); 432384ca190SMehdi Amini } 433384ca190SMehdi Amini }; 434384ca190SMehdi Amini 435384ca190SMehdi Amini // By now we processed all instructions in a function, except 436384ca190SMehdi Amini // non-volatile loads and non-volatile value stores. Let's find 437384ca190SMehdi Amini // ref edges for both of instruction sets 438384ca190SMehdi Amini AddRefEdges(NonVolatileLoads, LoadRefEdges, Visited); 439384ca190SMehdi Amini // We can add some values to the Visited set when processing load 440384ca190SMehdi Amini // instructions which are also used by stores in NonVolatileStores. 441384ca190SMehdi Amini // For example this can happen if we have following code: 442384ca190SMehdi Amini // 443384ca190SMehdi Amini // store %Derived* @foo, %Derived** bitcast (%Base** @bar to %Derived**) 444384ca190SMehdi Amini // %42 = load %Derived*, %Derived** bitcast (%Base** @bar to %Derived**) 445384ca190SMehdi Amini // 446384ca190SMehdi Amini // After processing loads we'll add bitcast to the Visited set, and if 447384ca190SMehdi Amini // we use the same set while processing stores, we'll never see store 448384ca190SMehdi Amini // to @bar and @bar will be mistakenly treated as readonly. 449384ca190SMehdi Amini SmallPtrSet<const llvm::User *, 8> StoreCache; 450384ca190SMehdi Amini AddRefEdges(NonVolatileStores, StoreRefEdges, StoreCache); 451384ca190SMehdi Amini 452384ca190SMehdi Amini // If both load and store instruction reference the same variable 453384ca190SMehdi Amini // we won't be able to optimize it. Add all such reference edges 454384ca190SMehdi Amini // to RefEdges set. 455384ca190SMehdi Amini for (auto &VI : StoreRefEdges) 456384ca190SMehdi Amini if (LoadRefEdges.remove(VI)) 457384ca190SMehdi Amini RefEdges.insert(VI); 458384ca190SMehdi Amini 459384ca190SMehdi Amini unsigned RefCnt = RefEdges.size(); 460384ca190SMehdi Amini // All new reference edges inserted in two loops below are either 461384ca190SMehdi Amini // read or write only. They will be grouped in the end of RefEdges 462384ca190SMehdi Amini // vector, so we can use a single integer value to identify them. 463384ca190SMehdi Amini for (auto &VI : LoadRefEdges) 464384ca190SMehdi Amini RefEdges.insert(VI); 465384ca190SMehdi Amini 466384ca190SMehdi Amini unsigned FirstWORef = RefEdges.size(); 467384ca190SMehdi Amini for (auto &VI : StoreRefEdges) 468384ca190SMehdi Amini RefEdges.insert(VI); 469384ca190SMehdi Amini 470384ca190SMehdi Amini Refs = RefEdges.takeVector(); 471384ca190SMehdi Amini for (; RefCnt < FirstWORef; ++RefCnt) 472384ca190SMehdi Amini Refs[RefCnt].setReadOnly(); 473384ca190SMehdi Amini 474384ca190SMehdi Amini for (; RefCnt < Refs.size(); ++RefCnt) 475384ca190SMehdi Amini Refs[RefCnt].setWriteOnly(); 476384ca190SMehdi Amini } else { 477384ca190SMehdi Amini Refs = RefEdges.takeVector(); 478384ca190SMehdi Amini } 479384ca190SMehdi Amini // Explicit add hot edges to enforce importing for designated GUIDs for 480384ca190SMehdi Amini // sample PGO, to enable the same inlines as the profiled optimized binary. 481384ca190SMehdi Amini for (auto &I : F.getImportGUIDs()) 482384ca190SMehdi Amini CallGraphEdges[Index.getOrInsertValueInfo(I)].updateHotness( 483384ca190SMehdi Amini ForceSummaryEdgesCold == FunctionSummary::FSHT_All 484384ca190SMehdi Amini ? CalleeInfo::HotnessType::Cold 485384ca190SMehdi Amini : CalleeInfo::HotnessType::Critical); 486384ca190SMehdi Amini 487384ca190SMehdi Amini bool NonRenamableLocal = isNonRenamableLocal(F); 4881a8087adSWenlei He bool NotEligibleForImport = NonRenamableLocal || 4891a8087adSWenlei He HasInlineAsmMaybeReferencingInternal || 4901a8087adSWenlei He HasIndirBranchToBlockAddress; 49154fb3ca9SFangrui Song GlobalValueSummary::GVFlags Flags( 49254fb3ca9SFangrui Song F.getLinkage(), F.getVisibility(), NotEligibleForImport, 493384ca190SMehdi Amini /* Live = */ false, F.isDSOLocal(), 494384ca190SMehdi Amini F.hasLinkOnceODRLinkage() && F.hasGlobalUnnamedAddr()); 495384ca190SMehdi Amini FunctionSummary::FFlags FunFlags{ 496384ca190SMehdi Amini F.hasFnAttribute(Attribute::ReadNone), 497384ca190SMehdi Amini F.hasFnAttribute(Attribute::ReadOnly), 498384ca190SMehdi Amini F.hasFnAttribute(Attribute::NoRecurse), F.returnDoesNotAlias(), 499384ca190SMehdi Amini // FIXME: refactor this to use the same code that inliner is using. 500384ca190SMehdi Amini // Don't try to import functions with noinline attribute. 50192ce6db9SArthur Eubanks F.getAttributes().hasFnAttr(Attribute::NoInline), 50220faf789Smodimo F.hasFnAttribute(Attribute::AlwaysInline), 50309a704c5SMingming Liu F.hasFnAttribute(Attribute::NoUnwind), MayThrow, HasUnknownCall, 50409a704c5SMingming Liu mustBeUnreachableFunction(F)}; 5054666953cSVitaly Buka std::vector<FunctionSummary::ParamAccess> ParamAccesses; 5064666953cSVitaly Buka if (auto *SSI = GetSSICallback(F)) 507fc4fd898SVitaly Buka ParamAccesses = SSI->getParamAccesses(Index); 508384ca190SMehdi Amini auto FuncSummary = std::make_unique<FunctionSummary>( 509384ca190SMehdi Amini Flags, NumInsts, FunFlags, /*EntryCount=*/0, std::move(Refs), 510384ca190SMehdi Amini CallGraphEdges.takeVector(), TypeTests.takeVector(), 511384ca190SMehdi Amini TypeTestAssumeVCalls.takeVector(), TypeCheckedLoadVCalls.takeVector(), 512384ca190SMehdi Amini TypeTestAssumeConstVCalls.takeVector(), 5134666953cSVitaly Buka TypeCheckedLoadConstVCalls.takeVector(), std::move(ParamAccesses)); 514384ca190SMehdi Amini if (NonRenamableLocal) 515384ca190SMehdi Amini CantBePromoted.insert(F.getGUID()); 516384ca190SMehdi Amini Index.addGlobalValueSummary(F, std::move(FuncSummary)); 517384ca190SMehdi Amini } 518384ca190SMehdi Amini 519384ca190SMehdi Amini /// Find function pointers referenced within the given vtable initializer 520384ca190SMehdi Amini /// (or subset of an initializer) \p I. The starting offset of \p I within 521384ca190SMehdi Amini /// the vtable initializer is \p StartingOffset. Any discovered function 522384ca190SMehdi Amini /// pointers are added to \p VTableFuncs along with their cumulative offset 523384ca190SMehdi Amini /// within the initializer. 524384ca190SMehdi Amini static void findFuncPointers(const Constant *I, uint64_t StartingOffset, 525384ca190SMehdi Amini const Module &M, ModuleSummaryIndex &Index, 526384ca190SMehdi Amini VTableFuncList &VTableFuncs) { 527384ca190SMehdi Amini // First check if this is a function pointer. 528384ca190SMehdi Amini if (I->getType()->isPointerTy()) { 529384ca190SMehdi Amini auto Fn = dyn_cast<Function>(I->stripPointerCasts()); 530384ca190SMehdi Amini // We can disregard __cxa_pure_virtual as a possible call target, as 531384ca190SMehdi Amini // calls to pure virtuals are UB. 532384ca190SMehdi Amini if (Fn && Fn->getName() != "__cxa_pure_virtual") 533384ca190SMehdi Amini VTableFuncs.push_back({Index.getOrInsertValueInfo(Fn), StartingOffset}); 534384ca190SMehdi Amini return; 535384ca190SMehdi Amini } 536384ca190SMehdi Amini 537384ca190SMehdi Amini // Walk through the elements in the constant struct or array and recursively 538384ca190SMehdi Amini // look for virtual function pointers. 539384ca190SMehdi Amini const DataLayout &DL = M.getDataLayout(); 540384ca190SMehdi Amini if (auto *C = dyn_cast<ConstantStruct>(I)) { 541384ca190SMehdi Amini StructType *STy = dyn_cast<StructType>(C->getType()); 542384ca190SMehdi Amini assert(STy); 543384ca190SMehdi Amini const StructLayout *SL = DL.getStructLayout(C->getType()); 544384ca190SMehdi Amini 545896d0e1aSKazu Hirata for (auto EI : llvm::enumerate(STy->elements())) { 546896d0e1aSKazu Hirata auto Offset = SL->getElementOffset(EI.index()); 547384ca190SMehdi Amini unsigned Op = SL->getElementContainingOffset(Offset); 548384ca190SMehdi Amini findFuncPointers(cast<Constant>(I->getOperand(Op)), 549384ca190SMehdi Amini StartingOffset + Offset, M, Index, VTableFuncs); 550384ca190SMehdi Amini } 551384ca190SMehdi Amini } else if (auto *C = dyn_cast<ConstantArray>(I)) { 552384ca190SMehdi Amini ArrayType *ATy = C->getType(); 553384ca190SMehdi Amini Type *EltTy = ATy->getElementType(); 554384ca190SMehdi Amini uint64_t EltSize = DL.getTypeAllocSize(EltTy); 555384ca190SMehdi Amini for (unsigned i = 0, e = ATy->getNumElements(); i != e; ++i) { 556384ca190SMehdi Amini findFuncPointers(cast<Constant>(I->getOperand(i)), 557384ca190SMehdi Amini StartingOffset + i * EltSize, M, Index, VTableFuncs); 558384ca190SMehdi Amini } 559384ca190SMehdi Amini } 560384ca190SMehdi Amini } 561384ca190SMehdi Amini 562384ca190SMehdi Amini // Identify the function pointers referenced by vtable definition \p V. 563384ca190SMehdi Amini static void computeVTableFuncs(ModuleSummaryIndex &Index, 564384ca190SMehdi Amini const GlobalVariable &V, const Module &M, 565384ca190SMehdi Amini VTableFuncList &VTableFuncs) { 566384ca190SMehdi Amini if (!V.isConstant()) 567384ca190SMehdi Amini return; 568384ca190SMehdi Amini 569384ca190SMehdi Amini findFuncPointers(V.getInitializer(), /*StartingOffset=*/0, M, Index, 570384ca190SMehdi Amini VTableFuncs); 571384ca190SMehdi Amini 572384ca190SMehdi Amini #ifndef NDEBUG 573384ca190SMehdi Amini // Validate that the VTableFuncs list is ordered by offset. 574384ca190SMehdi Amini uint64_t PrevOffset = 0; 575384ca190SMehdi Amini for (auto &P : VTableFuncs) { 576384ca190SMehdi Amini // The findVFuncPointers traversal should have encountered the 577384ca190SMehdi Amini // functions in offset order. We need to use ">=" since PrevOffset 578384ca190SMehdi Amini // starts at 0. 579384ca190SMehdi Amini assert(P.VTableOffset >= PrevOffset); 580384ca190SMehdi Amini PrevOffset = P.VTableOffset; 581384ca190SMehdi Amini } 582384ca190SMehdi Amini #endif 583384ca190SMehdi Amini } 584384ca190SMehdi Amini 585384ca190SMehdi Amini /// Record vtable definition \p V for each type metadata it references. 586384ca190SMehdi Amini static void 587384ca190SMehdi Amini recordTypeIdCompatibleVtableReferences(ModuleSummaryIndex &Index, 588384ca190SMehdi Amini const GlobalVariable &V, 589384ca190SMehdi Amini SmallVectorImpl<MDNode *> &Types) { 590384ca190SMehdi Amini for (MDNode *Type : Types) { 591384ca190SMehdi Amini auto TypeID = Type->getOperand(1).get(); 592384ca190SMehdi Amini 593384ca190SMehdi Amini uint64_t Offset = 594384ca190SMehdi Amini cast<ConstantInt>( 595384ca190SMehdi Amini cast<ConstantAsMetadata>(Type->getOperand(0))->getValue()) 596384ca190SMehdi Amini ->getZExtValue(); 597384ca190SMehdi Amini 598384ca190SMehdi Amini if (auto *TypeId = dyn_cast<MDString>(TypeID)) 599384ca190SMehdi Amini Index.getOrInsertTypeIdCompatibleVtableSummary(TypeId->getString()) 600384ca190SMehdi Amini .push_back({Offset, Index.getOrInsertValueInfo(&V)}); 601384ca190SMehdi Amini } 602384ca190SMehdi Amini } 603384ca190SMehdi Amini 604384ca190SMehdi Amini static void computeVariableSummary(ModuleSummaryIndex &Index, 605384ca190SMehdi Amini const GlobalVariable &V, 606384ca190SMehdi Amini DenseSet<GlobalValue::GUID> &CantBePromoted, 607384ca190SMehdi Amini const Module &M, 608384ca190SMehdi Amini SmallVectorImpl<MDNode *> &Types) { 609384ca190SMehdi Amini SetVector<ValueInfo> RefEdges; 610384ca190SMehdi Amini SmallPtrSet<const User *, 8> Visited; 611384ca190SMehdi Amini bool HasBlockAddress = findRefEdges(Index, &V, RefEdges, Visited); 612384ca190SMehdi Amini bool NonRenamableLocal = isNonRenamableLocal(V); 61354fb3ca9SFangrui Song GlobalValueSummary::GVFlags Flags( 61454fb3ca9SFangrui Song V.getLinkage(), V.getVisibility(), NonRenamableLocal, 615384ca190SMehdi Amini /* Live = */ false, V.isDSOLocal(), 616384ca190SMehdi Amini V.hasLinkOnceODRLinkage() && V.hasGlobalUnnamedAddr()); 617384ca190SMehdi Amini 618384ca190SMehdi Amini VTableFuncList VTableFuncs; 619384ca190SMehdi Amini // If splitting is not enabled, then we compute the summary information 620384ca190SMehdi Amini // necessary for index-based whole program devirtualization. 621384ca190SMehdi Amini if (!Index.enableSplitLTOUnit()) { 622384ca190SMehdi Amini Types.clear(); 623384ca190SMehdi Amini V.getMetadata(LLVMContext::MD_type, Types); 624384ca190SMehdi Amini if (!Types.empty()) { 625384ca190SMehdi Amini // Identify the function pointers referenced by this vtable definition. 626384ca190SMehdi Amini computeVTableFuncs(Index, V, M, VTableFuncs); 627384ca190SMehdi Amini 628384ca190SMehdi Amini // Record this vtable definition for each type metadata it references. 629384ca190SMehdi Amini recordTypeIdCompatibleVtableReferences(Index, V, Types); 630384ca190SMehdi Amini } 631384ca190SMehdi Amini } 632384ca190SMehdi Amini 633384ca190SMehdi Amini // Don't mark variables we won't be able to internalize as read/write-only. 634384ca190SMehdi Amini bool CanBeInternalized = 635384ca190SMehdi Amini !V.hasComdat() && !V.hasAppendingLinkage() && !V.isInterposable() && 636384ca190SMehdi Amini !V.hasAvailableExternallyLinkage() && !V.hasDLLExportStorageClass(); 637384ca190SMehdi Amini bool Constant = V.isConstant(); 638384ca190SMehdi Amini GlobalVarSummary::GVarFlags VarFlags(CanBeInternalized, 639384ca190SMehdi Amini Constant ? false : CanBeInternalized, 640384ca190SMehdi Amini Constant, V.getVCallVisibility()); 641384ca190SMehdi Amini auto GVarSummary = std::make_unique<GlobalVarSummary>(Flags, VarFlags, 642384ca190SMehdi Amini RefEdges.takeVector()); 643384ca190SMehdi Amini if (NonRenamableLocal) 644384ca190SMehdi Amini CantBePromoted.insert(V.getGUID()); 645384ca190SMehdi Amini if (HasBlockAddress) 646384ca190SMehdi Amini GVarSummary->setNotEligibleToImport(); 647384ca190SMehdi Amini if (!VTableFuncs.empty()) 648384ca190SMehdi Amini GVarSummary->setVTableFuncs(VTableFuncs); 649384ca190SMehdi Amini Index.addGlobalValueSummary(V, std::move(GVarSummary)); 650384ca190SMehdi Amini } 651384ca190SMehdi Amini 652384ca190SMehdi Amini static void 653384ca190SMehdi Amini computeAliasSummary(ModuleSummaryIndex &Index, const GlobalAlias &A, 654384ca190SMehdi Amini DenseSet<GlobalValue::GUID> &CantBePromoted) { 655384ca190SMehdi Amini bool NonRenamableLocal = isNonRenamableLocal(A); 65654fb3ca9SFangrui Song GlobalValueSummary::GVFlags Flags( 65754fb3ca9SFangrui Song A.getLinkage(), A.getVisibility(), NonRenamableLocal, 658384ca190SMehdi Amini /* Live = */ false, A.isDSOLocal(), 659384ca190SMehdi Amini A.hasLinkOnceODRLinkage() && A.hasGlobalUnnamedAddr()); 660384ca190SMehdi Amini auto AS = std::make_unique<AliasSummary>(Flags); 66140ec1c0fSItay Bookstein auto *Aliasee = A.getAliaseeObject(); 662384ca190SMehdi Amini auto AliaseeVI = Index.getValueInfo(Aliasee->getGUID()); 663384ca190SMehdi Amini assert(AliaseeVI && "Alias expects aliasee summary to be available"); 664384ca190SMehdi Amini assert(AliaseeVI.getSummaryList().size() == 1 && 665384ca190SMehdi Amini "Expected a single entry per aliasee in per-module index"); 666384ca190SMehdi Amini AS->setAliasee(AliaseeVI, AliaseeVI.getSummaryList()[0].get()); 667384ca190SMehdi Amini if (NonRenamableLocal) 668384ca190SMehdi Amini CantBePromoted.insert(A.getGUID()); 669384ca190SMehdi Amini Index.addGlobalValueSummary(A, std::move(AS)); 670384ca190SMehdi Amini } 671384ca190SMehdi Amini 672384ca190SMehdi Amini // Set LiveRoot flag on entries matching the given value name. 673384ca190SMehdi Amini static void setLiveRoot(ModuleSummaryIndex &Index, StringRef Name) { 674384ca190SMehdi Amini if (ValueInfo VI = Index.getValueInfo(GlobalValue::getGUID(Name))) 675384ca190SMehdi Amini for (auto &Summary : VI.getSummaryList()) 676384ca190SMehdi Amini Summary->setLive(true); 677384ca190SMehdi Amini } 678384ca190SMehdi Amini 679384ca190SMehdi Amini ModuleSummaryIndex llvm::buildModuleSummaryIndex( 680384ca190SMehdi Amini const Module &M, 681384ca190SMehdi Amini std::function<BlockFrequencyInfo *(const Function &F)> GetBFICallback, 6824666953cSVitaly Buka ProfileSummaryInfo *PSI, 6834666953cSVitaly Buka std::function<const StackSafetyInfo *(const Function &F)> GetSSICallback) { 684384ca190SMehdi Amini assert(PSI); 685384ca190SMehdi Amini bool EnableSplitLTOUnit = false; 686384ca190SMehdi Amini if (auto *MD = mdconst::extract_or_null<ConstantInt>( 687384ca190SMehdi Amini M.getModuleFlag("EnableSplitLTOUnit"))) 688384ca190SMehdi Amini EnableSplitLTOUnit = MD->getZExtValue(); 689384ca190SMehdi Amini ModuleSummaryIndex Index(/*HaveGVs=*/true, EnableSplitLTOUnit); 690384ca190SMehdi Amini 691384ca190SMehdi Amini // Identify the local values in the llvm.used and llvm.compiler.used sets, 692384ca190SMehdi Amini // which should not be exported as they would then require renaming and 693384ca190SMehdi Amini // promotion, but we may have opaque uses e.g. in inline asm. We collect them 694384ca190SMehdi Amini // here because we use this information to mark functions containing inline 695384ca190SMehdi Amini // assembly calls as not importable. 696ef312951SFangrui Song SmallPtrSet<GlobalValue *, 4> LocalsUsed; 697ef312951SFangrui Song SmallVector<GlobalValue *, 4> Used; 698384ca190SMehdi Amini // First collect those in the llvm.used set. 699ef312951SFangrui Song collectUsedGlobalVariables(M, Used, /*CompilerUsed=*/false); 700384ca190SMehdi Amini // Next collect those in the llvm.compiler.used set. 701ef312951SFangrui Song collectUsedGlobalVariables(M, Used, /*CompilerUsed=*/true); 702384ca190SMehdi Amini DenseSet<GlobalValue::GUID> CantBePromoted; 703384ca190SMehdi Amini for (auto *V : Used) { 704384ca190SMehdi Amini if (V->hasLocalLinkage()) { 705384ca190SMehdi Amini LocalsUsed.insert(V); 706384ca190SMehdi Amini CantBePromoted.insert(V->getGUID()); 707384ca190SMehdi Amini } 708384ca190SMehdi Amini } 709384ca190SMehdi Amini 710384ca190SMehdi Amini bool HasLocalInlineAsmSymbol = false; 711384ca190SMehdi Amini if (!M.getModuleInlineAsm().empty()) { 712384ca190SMehdi Amini // Collect the local values defined by module level asm, and set up 713384ca190SMehdi Amini // summaries for these symbols so that they can be marked as NoRename, 714384ca190SMehdi Amini // to prevent export of any use of them in regular IR that would require 715384ca190SMehdi Amini // renaming within the module level asm. Note we don't need to create a 716384ca190SMehdi Amini // summary for weak or global defs, as they don't need to be flagged as 717384ca190SMehdi Amini // NoRename, and defs in module level asm can't be imported anyway. 718384ca190SMehdi Amini // Also, any values used but not defined within module level asm should 719384ca190SMehdi Amini // be listed on the llvm.used or llvm.compiler.used global and marked as 720384ca190SMehdi Amini // referenced from there. 721384ca190SMehdi Amini ModuleSymbolTable::CollectAsmSymbols( 722384ca190SMehdi Amini M, [&](StringRef Name, object::BasicSymbolRef::Flags Flags) { 723384ca190SMehdi Amini // Symbols not marked as Weak or Global are local definitions. 724384ca190SMehdi Amini if (Flags & (object::BasicSymbolRef::SF_Weak | 725384ca190SMehdi Amini object::BasicSymbolRef::SF_Global)) 726384ca190SMehdi Amini return; 727384ca190SMehdi Amini HasLocalInlineAsmSymbol = true; 728384ca190SMehdi Amini GlobalValue *GV = M.getNamedValue(Name); 729384ca190SMehdi Amini if (!GV) 730384ca190SMehdi Amini return; 731384ca190SMehdi Amini assert(GV->isDeclaration() && "Def in module asm already has definition"); 73254fb3ca9SFangrui Song GlobalValueSummary::GVFlags GVFlags( 73354fb3ca9SFangrui Song GlobalValue::InternalLinkage, GlobalValue::DefaultVisibility, 734384ca190SMehdi Amini /* NotEligibleToImport = */ true, 735384ca190SMehdi Amini /* Live = */ true, 736384ca190SMehdi Amini /* Local */ GV->isDSOLocal(), 737384ca190SMehdi Amini GV->hasLinkOnceODRLinkage() && GV->hasGlobalUnnamedAddr()); 738384ca190SMehdi Amini CantBePromoted.insert(GV->getGUID()); 739384ca190SMehdi Amini // Create the appropriate summary type. 740384ca190SMehdi Amini if (Function *F = dyn_cast<Function>(GV)) { 741384ca190SMehdi Amini std::unique_ptr<FunctionSummary> Summary = 742384ca190SMehdi Amini std::make_unique<FunctionSummary>( 743384ca190SMehdi Amini GVFlags, /*InstCount=*/0, 744384ca190SMehdi Amini FunctionSummary::FFlags{ 745384ca190SMehdi Amini F->hasFnAttribute(Attribute::ReadNone), 746384ca190SMehdi Amini F->hasFnAttribute(Attribute::ReadOnly), 747384ca190SMehdi Amini F->hasFnAttribute(Attribute::NoRecurse), 748384ca190SMehdi Amini F->returnDoesNotAlias(), 749384ca190SMehdi Amini /* NoInline = */ false, 75020faf789Smodimo F->hasFnAttribute(Attribute::AlwaysInline), 75120faf789Smodimo F->hasFnAttribute(Attribute::NoUnwind), 75220faf789Smodimo /* MayThrow */ true, 75309a704c5SMingming Liu /* HasUnknownCall */ true, 75409a704c5SMingming Liu /* MustBeUnreachable */ false}, 755384ca190SMehdi Amini /*EntryCount=*/0, ArrayRef<ValueInfo>{}, 756384ca190SMehdi Amini ArrayRef<FunctionSummary::EdgeTy>{}, 757384ca190SMehdi Amini ArrayRef<GlobalValue::GUID>{}, 758384ca190SMehdi Amini ArrayRef<FunctionSummary::VFuncId>{}, 759384ca190SMehdi Amini ArrayRef<FunctionSummary::VFuncId>{}, 760384ca190SMehdi Amini ArrayRef<FunctionSummary::ConstVCall>{}, 7614666953cSVitaly Buka ArrayRef<FunctionSummary::ConstVCall>{}, 7624666953cSVitaly Buka ArrayRef<FunctionSummary::ParamAccess>{}); 763384ca190SMehdi Amini Index.addGlobalValueSummary(*GV, std::move(Summary)); 764384ca190SMehdi Amini } else { 765384ca190SMehdi Amini std::unique_ptr<GlobalVarSummary> Summary = 766384ca190SMehdi Amini std::make_unique<GlobalVarSummary>( 767384ca190SMehdi Amini GVFlags, 768384ca190SMehdi Amini GlobalVarSummary::GVarFlags( 769384ca190SMehdi Amini false, false, cast<GlobalVariable>(GV)->isConstant(), 770384ca190SMehdi Amini GlobalObject::VCallVisibilityPublic), 771384ca190SMehdi Amini ArrayRef<ValueInfo>{}); 772384ca190SMehdi Amini Index.addGlobalValueSummary(*GV, std::move(Summary)); 773384ca190SMehdi Amini } 774384ca190SMehdi Amini }); 775384ca190SMehdi Amini } 776384ca190SMehdi Amini 777384ca190SMehdi Amini bool IsThinLTO = true; 778384ca190SMehdi Amini if (auto *MD = 779384ca190SMehdi Amini mdconst::extract_or_null<ConstantInt>(M.getModuleFlag("ThinLTO"))) 780384ca190SMehdi Amini IsThinLTO = MD->getZExtValue(); 781384ca190SMehdi Amini 782384ca190SMehdi Amini // Compute summaries for all functions defined in module, and save in the 783384ca190SMehdi Amini // index. 784384ca190SMehdi Amini for (auto &F : M) { 785384ca190SMehdi Amini if (F.isDeclaration()) 786384ca190SMehdi Amini continue; 787384ca190SMehdi Amini 788384ca190SMehdi Amini DominatorTree DT(const_cast<Function &>(F)); 789384ca190SMehdi Amini BlockFrequencyInfo *BFI = nullptr; 790384ca190SMehdi Amini std::unique_ptr<BlockFrequencyInfo> BFIPtr; 791384ca190SMehdi Amini if (GetBFICallback) 792384ca190SMehdi Amini BFI = GetBFICallback(F); 793384ca190SMehdi Amini else if (F.hasProfileData()) { 794384ca190SMehdi Amini LoopInfo LI{DT}; 795384ca190SMehdi Amini BranchProbabilityInfo BPI{F, LI}; 796384ca190SMehdi Amini BFIPtr = std::make_unique<BlockFrequencyInfo>(F, BPI, LI); 797384ca190SMehdi Amini BFI = BFIPtr.get(); 798384ca190SMehdi Amini } 799384ca190SMehdi Amini 800384ca190SMehdi Amini computeFunctionSummary(Index, M, F, BFI, PSI, DT, 801384ca190SMehdi Amini !LocalsUsed.empty() || HasLocalInlineAsmSymbol, 8024666953cSVitaly Buka CantBePromoted, IsThinLTO, GetSSICallback); 803384ca190SMehdi Amini } 804384ca190SMehdi Amini 805384ca190SMehdi Amini // Compute summaries for all variables defined in module, and save in the 806384ca190SMehdi Amini // index. 807384ca190SMehdi Amini SmallVector<MDNode *, 2> Types; 808384ca190SMehdi Amini for (const GlobalVariable &G : M.globals()) { 809384ca190SMehdi Amini if (G.isDeclaration()) 810384ca190SMehdi Amini continue; 811384ca190SMehdi Amini computeVariableSummary(Index, G, CantBePromoted, M, Types); 812384ca190SMehdi Amini } 813384ca190SMehdi Amini 814384ca190SMehdi Amini // Compute summaries for all aliases defined in module, and save in the 815384ca190SMehdi Amini // index. 816384ca190SMehdi Amini for (const GlobalAlias &A : M.aliases()) 817384ca190SMehdi Amini computeAliasSummary(Index, A, CantBePromoted); 818384ca190SMehdi Amini 819384ca190SMehdi Amini for (auto *V : LocalsUsed) { 820384ca190SMehdi Amini auto *Summary = Index.getGlobalValueSummary(*V); 821384ca190SMehdi Amini assert(Summary && "Missing summary for global value"); 822384ca190SMehdi Amini Summary->setNotEligibleToImport(); 823384ca190SMehdi Amini } 824384ca190SMehdi Amini 825384ca190SMehdi Amini // The linker doesn't know about these LLVM produced values, so we need 826384ca190SMehdi Amini // to flag them as live in the index to ensure index-based dead value 827384ca190SMehdi Amini // analysis treats them as live roots of the analysis. 828384ca190SMehdi Amini setLiveRoot(Index, "llvm.used"); 829384ca190SMehdi Amini setLiveRoot(Index, "llvm.compiler.used"); 830384ca190SMehdi Amini setLiveRoot(Index, "llvm.global_ctors"); 831384ca190SMehdi Amini setLiveRoot(Index, "llvm.global_dtors"); 832384ca190SMehdi Amini setLiveRoot(Index, "llvm.global.annotations"); 833384ca190SMehdi Amini 834384ca190SMehdi Amini for (auto &GlobalList : Index) { 835384ca190SMehdi Amini // Ignore entries for references that are undefined in the current module. 836384ca190SMehdi Amini if (GlobalList.second.SummaryList.empty()) 837384ca190SMehdi Amini continue; 838384ca190SMehdi Amini 839384ca190SMehdi Amini assert(GlobalList.second.SummaryList.size() == 1 && 840384ca190SMehdi Amini "Expected module's index to have one summary per GUID"); 841384ca190SMehdi Amini auto &Summary = GlobalList.second.SummaryList[0]; 842384ca190SMehdi Amini if (!IsThinLTO) { 843384ca190SMehdi Amini Summary->setNotEligibleToImport(); 844384ca190SMehdi Amini continue; 845384ca190SMehdi Amini } 846384ca190SMehdi Amini 847384ca190SMehdi Amini bool AllRefsCanBeExternallyReferenced = 848384ca190SMehdi Amini llvm::all_of(Summary->refs(), [&](const ValueInfo &VI) { 849384ca190SMehdi Amini return !CantBePromoted.count(VI.getGUID()); 850384ca190SMehdi Amini }); 851384ca190SMehdi Amini if (!AllRefsCanBeExternallyReferenced) { 852384ca190SMehdi Amini Summary->setNotEligibleToImport(); 853384ca190SMehdi Amini continue; 854384ca190SMehdi Amini } 855384ca190SMehdi Amini 856384ca190SMehdi Amini if (auto *FuncSummary = dyn_cast<FunctionSummary>(Summary.get())) { 857384ca190SMehdi Amini bool AllCallsCanBeExternallyReferenced = llvm::all_of( 858384ca190SMehdi Amini FuncSummary->calls(), [&](const FunctionSummary::EdgeTy &Edge) { 859384ca190SMehdi Amini return !CantBePromoted.count(Edge.first.getGUID()); 860384ca190SMehdi Amini }); 861384ca190SMehdi Amini if (!AllCallsCanBeExternallyReferenced) 862384ca190SMehdi Amini Summary->setNotEligibleToImport(); 863384ca190SMehdi Amini } 864384ca190SMehdi Amini } 865384ca190SMehdi Amini 866384ca190SMehdi Amini if (!ModuleSummaryDotFile.empty()) { 867384ca190SMehdi Amini std::error_code EC; 868384ca190SMehdi Amini raw_fd_ostream OSDot(ModuleSummaryDotFile, EC, sys::fs::OpenFlags::OF_None); 869384ca190SMehdi Amini if (EC) 870384ca190SMehdi Amini report_fatal_error(Twine("Failed to open dot file ") + 871384ca190SMehdi Amini ModuleSummaryDotFile + ": " + EC.message() + "\n"); 872384ca190SMehdi Amini Index.exportToDot(OSDot, {}); 873384ca190SMehdi Amini } 874384ca190SMehdi Amini 875384ca190SMehdi Amini return Index; 876384ca190SMehdi Amini } 877384ca190SMehdi Amini 878384ca190SMehdi Amini AnalysisKey ModuleSummaryIndexAnalysis::Key; 879384ca190SMehdi Amini 880384ca190SMehdi Amini ModuleSummaryIndex 881384ca190SMehdi Amini ModuleSummaryIndexAnalysis::run(Module &M, ModuleAnalysisManager &AM) { 882384ca190SMehdi Amini ProfileSummaryInfo &PSI = AM.getResult<ProfileSummaryAnalysis>(M); 883384ca190SMehdi Amini auto &FAM = AM.getResult<FunctionAnalysisManagerModuleProxy>(M).getManager(); 8844666953cSVitaly Buka bool NeedSSI = needsParamAccessSummary(M); 885384ca190SMehdi Amini return buildModuleSummaryIndex( 886384ca190SMehdi Amini M, 887384ca190SMehdi Amini [&FAM](const Function &F) { 888384ca190SMehdi Amini return &FAM.getResult<BlockFrequencyAnalysis>( 889384ca190SMehdi Amini *const_cast<Function *>(&F)); 890384ca190SMehdi Amini }, 8914666953cSVitaly Buka &PSI, 8924666953cSVitaly Buka [&FAM, NeedSSI](const Function &F) -> const StackSafetyInfo * { 8934666953cSVitaly Buka return NeedSSI ? &FAM.getResult<StackSafetyAnalysis>( 8944666953cSVitaly Buka const_cast<Function &>(F)) 8954666953cSVitaly Buka : nullptr; 8964666953cSVitaly Buka }); 897384ca190SMehdi Amini } 898384ca190SMehdi Amini 899384ca190SMehdi Amini char ModuleSummaryIndexWrapperPass::ID = 0; 900384ca190SMehdi Amini 901384ca190SMehdi Amini INITIALIZE_PASS_BEGIN(ModuleSummaryIndexWrapperPass, "module-summary-analysis", 902384ca190SMehdi Amini "Module Summary Analysis", false, true) 903384ca190SMehdi Amini INITIALIZE_PASS_DEPENDENCY(BlockFrequencyInfoWrapperPass) 904384ca190SMehdi Amini INITIALIZE_PASS_DEPENDENCY(ProfileSummaryInfoWrapperPass) 9054666953cSVitaly Buka INITIALIZE_PASS_DEPENDENCY(StackSafetyInfoWrapperPass) 906384ca190SMehdi Amini INITIALIZE_PASS_END(ModuleSummaryIndexWrapperPass, "module-summary-analysis", 907384ca190SMehdi Amini "Module Summary Analysis", false, true) 908384ca190SMehdi Amini 909384ca190SMehdi Amini ModulePass *llvm::createModuleSummaryIndexWrapperPass() { 910384ca190SMehdi Amini return new ModuleSummaryIndexWrapperPass(); 911384ca190SMehdi Amini } 912384ca190SMehdi Amini 913384ca190SMehdi Amini ModuleSummaryIndexWrapperPass::ModuleSummaryIndexWrapperPass() 914384ca190SMehdi Amini : ModulePass(ID) { 915384ca190SMehdi Amini initializeModuleSummaryIndexWrapperPassPass(*PassRegistry::getPassRegistry()); 916384ca190SMehdi Amini } 917384ca190SMehdi Amini 918384ca190SMehdi Amini bool ModuleSummaryIndexWrapperPass::runOnModule(Module &M) { 919384ca190SMehdi Amini auto *PSI = &getAnalysis<ProfileSummaryInfoWrapperPass>().getPSI(); 9204666953cSVitaly Buka bool NeedSSI = needsParamAccessSummary(M); 921384ca190SMehdi Amini Index.emplace(buildModuleSummaryIndex( 922384ca190SMehdi Amini M, 923384ca190SMehdi Amini [this](const Function &F) { 924384ca190SMehdi Amini return &(this->getAnalysis<BlockFrequencyInfoWrapperPass>( 925384ca190SMehdi Amini *const_cast<Function *>(&F)) 926384ca190SMehdi Amini .getBFI()); 927384ca190SMehdi Amini }, 9284666953cSVitaly Buka PSI, 9294666953cSVitaly Buka [&](const Function &F) -> const StackSafetyInfo * { 9304666953cSVitaly Buka return NeedSSI ? &getAnalysis<StackSafetyInfoWrapperPass>( 9314666953cSVitaly Buka const_cast<Function &>(F)) 9324666953cSVitaly Buka .getResult() 9334666953cSVitaly Buka : nullptr; 9344666953cSVitaly Buka })); 935384ca190SMehdi Amini return false; 936384ca190SMehdi Amini } 937384ca190SMehdi Amini 938384ca190SMehdi Amini bool ModuleSummaryIndexWrapperPass::doFinalization(Module &M) { 939384ca190SMehdi Amini Index.reset(); 940384ca190SMehdi Amini return false; 941384ca190SMehdi Amini } 942384ca190SMehdi Amini 943384ca190SMehdi Amini void ModuleSummaryIndexWrapperPass::getAnalysisUsage(AnalysisUsage &AU) const { 944384ca190SMehdi Amini AU.setPreservesAll(); 945384ca190SMehdi Amini AU.addRequired<BlockFrequencyInfoWrapperPass>(); 946384ca190SMehdi Amini AU.addRequired<ProfileSummaryInfoWrapperPass>(); 9474666953cSVitaly Buka AU.addRequired<StackSafetyInfoWrapperPass>(); 948384ca190SMehdi Amini } 9495b1c70a4SVitaly Buka 9505b1c70a4SVitaly Buka char ImmutableModuleSummaryIndexWrapperPass::ID = 0; 9515b1c70a4SVitaly Buka 9525b1c70a4SVitaly Buka ImmutableModuleSummaryIndexWrapperPass::ImmutableModuleSummaryIndexWrapperPass( 9535b1c70a4SVitaly Buka const ModuleSummaryIndex *Index) 9545b1c70a4SVitaly Buka : ImmutablePass(ID), Index(Index) { 9555b1c70a4SVitaly Buka initializeImmutableModuleSummaryIndexWrapperPassPass( 9565b1c70a4SVitaly Buka *PassRegistry::getPassRegistry()); 9575b1c70a4SVitaly Buka } 9585b1c70a4SVitaly Buka 9595b1c70a4SVitaly Buka void ImmutableModuleSummaryIndexWrapperPass::getAnalysisUsage( 9605b1c70a4SVitaly Buka AnalysisUsage &AU) const { 9615b1c70a4SVitaly Buka AU.setPreservesAll(); 9625b1c70a4SVitaly Buka } 9635b1c70a4SVitaly Buka 9645b1c70a4SVitaly Buka ImmutablePass *llvm::createImmutableModuleSummaryIndexWrapperPass( 9655b1c70a4SVitaly Buka const ModuleSummaryIndex *Index) { 9665b1c70a4SVitaly Buka return new ImmutableModuleSummaryIndexWrapperPass(Index); 9675b1c70a4SVitaly Buka } 9685b1c70a4SVitaly Buka 9695b1c70a4SVitaly Buka INITIALIZE_PASS(ImmutableModuleSummaryIndexWrapperPass, "module-summary-info", 9705b1c70a4SVitaly Buka "Module summary info", false, true) 971