1bdceefe9SMircea Trofin //===- MLInlineAdvisor.cpp - machine learned InlineAdvisor ----------------===//
2bdceefe9SMircea Trofin //
3bdceefe9SMircea Trofin // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4bdceefe9SMircea Trofin // See https://llvm.org/LICENSE.txt for license information.
5bdceefe9SMircea Trofin // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6bdceefe9SMircea Trofin //
7bdceefe9SMircea Trofin //===----------------------------------------------------------------------===//
8bdceefe9SMircea Trofin //
9bdceefe9SMircea Trofin // This file implements the interface between the inliner and a learned model.
10bdceefe9SMircea Trofin // It delegates model evaluation to either the AOT compiled model (the
11bdceefe9SMircea Trofin // 'release' mode) or a runtime-loaded model (the 'development' case).
12bdceefe9SMircea Trofin //
13bdceefe9SMircea Trofin //===----------------------------------------------------------------------===//
14f29256a6SMircea Trofin #include "llvm/Analysis/MLInlineAdvisor.h"
15bdceefe9SMircea Trofin #include "llvm/ADT/SCCIterator.h"
1671c3a551Sserge-sans-paille #include "llvm/Analysis/AssumptionCache.h"
17bdceefe9SMircea Trofin #include "llvm/Analysis/CallGraph.h"
18418121c3STarindu Jayatilaka #include "llvm/Analysis/FunctionPropertiesAnalysis.h"
19bdceefe9SMircea Trofin #include "llvm/Analysis/InlineCost.h"
20f29256a6SMircea Trofin #include "llvm/Analysis/InlineModelFeatureMaps.h"
21248d55afSMircea Trofin #include "llvm/Analysis/LazyCallGraph.h"
22f46dd19bSMircea Trofin #include "llvm/Analysis/LoopInfo.h"
23bdceefe9SMircea Trofin #include "llvm/Analysis/MLModelRunner.h"
24bdceefe9SMircea Trofin #include "llvm/Analysis/OptimizationRemarkEmitter.h"
25bdceefe9SMircea Trofin #include "llvm/Analysis/TargetTransformInfo.h"
2622a1f998SMircea Trofin #include "llvm/IR/Dominators.h"
27bdceefe9SMircea Trofin #include "llvm/IR/InstIterator.h"
28bdceefe9SMircea Trofin #include "llvm/IR/PassManager.h"
29bdceefe9SMircea Trofin #include "llvm/Support/CommandLine.h"
30f29256a6SMircea Trofin
31bdceefe9SMircea Trofin using namespace llvm;
32bdceefe9SMircea Trofin
33b1af01feSMircea Trofin #if defined(LLVM_HAVE_TF_AOT_INLINERSIZEMODEL)
3426141927SMircea Trofin #include "llvm/Analysis/ReleaseModeModelRunner.h"
35db5aceb9SMircea Trofin // codegen-ed file
36db5aceb9SMircea Trofin #include "InlinerSizeModel.h" // NOLINT
37db5aceb9SMircea Trofin
38db5aceb9SMircea Trofin std::unique_ptr<InlineAdvisor>
getReleaseModeAdvisor(Module & M,ModuleAnalysisManager & MAM)39db5aceb9SMircea Trofin llvm::getReleaseModeAdvisor(Module &M, ModuleAnalysisManager &MAM) {
40db5aceb9SMircea Trofin auto AOTRunner =
41db5aceb9SMircea Trofin std::make_unique<ReleaseModeModelRunner<llvm::InlinerSizeModel>>(
42c35ad9eeSMircea Trofin M.getContext(), FeatureMap, DecisionName);
43db5aceb9SMircea Trofin return std::make_unique<MLInlineAdvisor>(M, MAM, std::move(AOTRunner));
44db5aceb9SMircea Trofin }
45db5aceb9SMircea Trofin #endif
46db5aceb9SMircea Trofin
47bdceefe9SMircea Trofin #define DEBUG_TYPE "inline-ml"
48bdceefe9SMircea Trofin
49bdceefe9SMircea Trofin static cl::opt<float> SizeIncreaseThreshold(
50bdceefe9SMircea Trofin "ml-advisor-size-increase-threshold", cl::Hidden,
51bdceefe9SMircea Trofin cl::desc("Maximum factor by which expected native size may increase before "
52bdceefe9SMircea Trofin "blocking any further inlining."),
53bdceefe9SMircea Trofin cl::init(2.0));
54bdceefe9SMircea Trofin
557e7021caSMircea Trofin static cl::opt<bool> KeepFPICache(
567e7021caSMircea Trofin "ml-advisor-keep-fpi-cache", cl::Hidden,
577e7021caSMircea Trofin cl::desc(
587e7021caSMircea Trofin "For test - keep the ML Inline advisor's FunctionPropertiesInfo cache"),
597e7021caSMircea Trofin cl::init(false));
607e7021caSMircea Trofin
6199f00635SJacob Hegna // clang-format off
62c35ad9eeSMircea Trofin const std::array<TensorSpec, NumberOfFeatures> llvm::FeatureMap{
63c35ad9eeSMircea Trofin #define POPULATE_NAMES(_, NAME) TensorSpec::createSpec<int64_t>(NAME, {1} ),
6499f00635SJacob Hegna // InlineCost features - these must come first
6599f00635SJacob Hegna INLINE_COST_FEATURE_ITERATOR(POPULATE_NAMES)
6699f00635SJacob Hegna #undef POPULATE_NAMES
6799f00635SJacob Hegna
6899f00635SJacob Hegna // Non-cost features
69c35ad9eeSMircea Trofin #define POPULATE_NAMES(_, NAME, __) TensorSpec::createSpec<int64_t>(NAME, {1} ),
70bdceefe9SMircea Trofin INLINE_FEATURE_ITERATOR(POPULATE_NAMES)
71bdceefe9SMircea Trofin #undef POPULATE_NAMES
72bdceefe9SMircea Trofin };
7399f00635SJacob Hegna // clang-format on
74bdceefe9SMircea Trofin
75bdceefe9SMircea Trofin const char *const llvm::DecisionName = "inlining_decision";
76bdceefe9SMircea Trofin const char *const llvm::DefaultDecisionName = "inlining_default";
77bdceefe9SMircea Trofin const char *const llvm::RewardName = "delta_size";
78bdceefe9SMircea Trofin
getInlinableCS(Instruction & I)79bdceefe9SMircea Trofin CallBase *getInlinableCS(Instruction &I) {
80bdceefe9SMircea Trofin if (auto *CS = dyn_cast<CallBase>(&I))
81bdceefe9SMircea Trofin if (Function *Callee = CS->getCalledFunction()) {
82bdceefe9SMircea Trofin if (!Callee->isDeclaration()) {
83bdceefe9SMircea Trofin return CS;
84bdceefe9SMircea Trofin }
85bdceefe9SMircea Trofin }
86bdceefe9SMircea Trofin return nullptr;
87bdceefe9SMircea Trofin }
88bdceefe9SMircea Trofin
MLInlineAdvisor(Module & M,ModuleAnalysisManager & MAM,std::unique_ptr<MLModelRunner> Runner)89bdceefe9SMircea Trofin MLInlineAdvisor::MLInlineAdvisor(Module &M, ModuleAnalysisManager &MAM,
90bdceefe9SMircea Trofin std::unique_ptr<MLModelRunner> Runner)
91bdceefe9SMircea Trofin : InlineAdvisor(
92ccec2cf1SMircea Trofin M, MAM.getResult<FunctionAnalysisManagerModuleProxy>(M).getManager()),
93248d55afSMircea Trofin ModelRunner(std::move(Runner)),
94248d55afSMircea Trofin CG(MAM.getResult<LazyCallGraphAnalysis>(M)),
95bdceefe9SMircea Trofin InitialIRSize(getModuleIRSize()), CurrentIRSize(InitialIRSize) {
96bdceefe9SMircea Trofin assert(ModelRunner);
97bdceefe9SMircea Trofin
98bdceefe9SMircea Trofin // Extract the 'call site height' feature - the position of a call site
99bdceefe9SMircea Trofin // relative to the farthest statically reachable SCC node. We don't mutate
100bdceefe9SMircea Trofin // this value while inlining happens. Empirically, this feature proved
101bdceefe9SMircea Trofin // critical in behavioral cloning - i.e. training a model to mimic the manual
102bdceefe9SMircea Trofin // heuristic's decisions - and, thus, equally important for training for
103bdceefe9SMircea Trofin // improvement.
104248d55afSMircea Trofin CallGraph CGraph(M);
105248d55afSMircea Trofin for (auto I = scc_begin(&CGraph); !I.isAtEnd(); ++I) {
106bdceefe9SMircea Trofin const std::vector<CallGraphNode *> &CGNodes = *I;
107bdceefe9SMircea Trofin unsigned Level = 0;
108bdceefe9SMircea Trofin for (auto *CGNode : CGNodes) {
109bdceefe9SMircea Trofin Function *F = CGNode->getFunction();
110bdceefe9SMircea Trofin if (!F || F->isDeclaration())
111bdceefe9SMircea Trofin continue;
112bdceefe9SMircea Trofin for (auto &I : instructions(F)) {
113bdceefe9SMircea Trofin if (auto *CS = getInlinableCS(I)) {
114bdceefe9SMircea Trofin auto *Called = CS->getCalledFunction();
115248d55afSMircea Trofin auto Pos = FunctionLevels.find(&CG.get(*Called));
116bdceefe9SMircea Trofin // In bottom up traversal, an inlinable callee is either in the
117bdceefe9SMircea Trofin // same SCC, or to a function in a visited SCC. So not finding its
118bdceefe9SMircea Trofin // level means we haven't visited it yet, meaning it's in this SCC.
119bdceefe9SMircea Trofin if (Pos == FunctionLevels.end())
120bdceefe9SMircea Trofin continue;
121bdceefe9SMircea Trofin Level = std::max(Level, Pos->second + 1);
122bdceefe9SMircea Trofin }
123bdceefe9SMircea Trofin }
124bdceefe9SMircea Trofin }
125bdceefe9SMircea Trofin for (auto *CGNode : CGNodes) {
126bdceefe9SMircea Trofin Function *F = CGNode->getFunction();
127bdceefe9SMircea Trofin if (F && !F->isDeclaration())
128248d55afSMircea Trofin FunctionLevels[&CG.get(*F)] = Level;
129bdceefe9SMircea Trofin }
130bdceefe9SMircea Trofin }
1313e8553aaSMircea Trofin for (auto KVP : FunctionLevels) {
1323e8553aaSMircea Trofin AllNodes.insert(KVP.first);
1333e8553aaSMircea Trofin EdgeCount += getLocalCalls(KVP.first->getFunction());
1343e8553aaSMircea Trofin }
1353e8553aaSMircea Trofin NodeCount = AllNodes.size();
136bdceefe9SMircea Trofin }
137bdceefe9SMircea Trofin
getInitialFunctionLevel(const Function & F) const138248d55afSMircea Trofin unsigned MLInlineAdvisor::getInitialFunctionLevel(const Function &F) const {
139248d55afSMircea Trofin return CG.lookup(F) ? FunctionLevels.at(CG.lookup(F)) : 0;
140248d55afSMircea Trofin }
141248d55afSMircea Trofin
onPassEntry(LazyCallGraph::SCC * LastSCC)142aaff3fb6SJin Xin Ng void MLInlineAdvisor::onPassEntry(LazyCallGraph::SCC *LastSCC) {
143aaff3fb6SJin Xin Ng if (!LastSCC || ForceStop)
144a3a7826dSJin Xin Ng return;
145f46dd19bSMircea Trofin FPICache.clear();
146bdceefe9SMircea Trofin // Function passes executed between InlinerPass runs may have changed the
147bdceefe9SMircea Trofin // module-wide features.
1483e8553aaSMircea Trofin // The cgscc pass manager rules are such that:
1493e8553aaSMircea Trofin // - if a pass leads to merging SCCs, then the pipeline is restarted on the
1503e8553aaSMircea Trofin // merged SCC
1513e8553aaSMircea Trofin // - if a pass leads to splitting the SCC, then we continue with one of the
1523e8553aaSMircea Trofin // splits
1533e8553aaSMircea Trofin // This means that the NodesInLastSCC is a superset (not strict) of the nodes
1543e8553aaSMircea Trofin // that subsequent passes would have processed
1553e8553aaSMircea Trofin // - in addition, if new Nodes were created by a pass (e.g. CoroSplit),
1563e8553aaSMircea Trofin // they'd be adjacent to Nodes in the last SCC. So we just need to check the
1573e8553aaSMircea Trofin // boundary of Nodes in NodesInLastSCC for Nodes we haven't seen. We don't
1583e8553aaSMircea Trofin // care about the nature of the Edge (call or ref).
1593e8553aaSMircea Trofin NodeCount -= static_cast<int64_t>(NodesInLastSCC.size());
1603e8553aaSMircea Trofin while (!NodesInLastSCC.empty()) {
161aaff3fb6SJin Xin Ng const auto *N = *NodesInLastSCC.begin();
162aaff3fb6SJin Xin Ng NodesInLastSCC.erase(N);
1633e8553aaSMircea Trofin // The Function wrapped by N could have been deleted since we last saw it.
1643e8553aaSMircea Trofin if (N->isDead()) {
1653e8553aaSMircea Trofin assert(!N->getFunction().isDeclaration());
1663e8553aaSMircea Trofin continue;
167bdceefe9SMircea Trofin }
1683e8553aaSMircea Trofin ++NodeCount;
1693e8553aaSMircea Trofin EdgeCount += getLocalCalls(N->getFunction());
1703e8553aaSMircea Trofin for (const auto &E : *(*N)) {
1713e8553aaSMircea Trofin const auto *AdjNode = &E.getNode();
1723e8553aaSMircea Trofin assert(!AdjNode->isDead() && !AdjNode->getFunction().isDeclaration());
1733e8553aaSMircea Trofin auto I = AllNodes.insert(AdjNode);
1743e8553aaSMircea Trofin if (I.second)
175aaff3fb6SJin Xin Ng NodesInLastSCC.insert(AdjNode);
1763e8553aaSMircea Trofin }
1773e8553aaSMircea Trofin }
1783e8553aaSMircea Trofin
1793e8553aaSMircea Trofin EdgeCount -= EdgesOfLastSeenNodes;
1803e8553aaSMircea Trofin EdgesOfLastSeenNodes = 0;
181aaff3fb6SJin Xin Ng
182aaff3fb6SJin Xin Ng // (Re)use NodesInLastSCC to remember the nodes in the SCC right now,
183aaff3fb6SJin Xin Ng // in case the SCC is split before onPassExit and some nodes are split out
184aaff3fb6SJin Xin Ng assert(NodesInLastSCC.empty());
185aaff3fb6SJin Xin Ng for (const auto &N : *LastSCC)
186aaff3fb6SJin Xin Ng NodesInLastSCC.insert(&N);
1873e8553aaSMircea Trofin }
1883e8553aaSMircea Trofin
onPassExit(LazyCallGraph::SCC * LastSCC)1893e8553aaSMircea Trofin void MLInlineAdvisor::onPassExit(LazyCallGraph::SCC *LastSCC) {
190f46dd19bSMircea Trofin // No need to keep this around - function passes will invalidate it.
1917e7021caSMircea Trofin if (!KeepFPICache)
192f46dd19bSMircea Trofin FPICache.clear();
193a3a7826dSJin Xin Ng if (!LastSCC || ForceStop)
1943e8553aaSMircea Trofin return;
1953e8553aaSMircea Trofin // Keep track of the nodes and edges we last saw. Then, in onPassEntry,
1963e8553aaSMircea Trofin // we update the node count and edge count from the subset of these nodes that
1973e8553aaSMircea Trofin // survived.
1983e8553aaSMircea Trofin EdgesOfLastSeenNodes = 0;
199aaff3fb6SJin Xin Ng
200aaff3fb6SJin Xin Ng // Check on nodes that were in SCC onPassEntry
201aaff3fb6SJin Xin Ng for (auto I = NodesInLastSCC.begin(); I != NodesInLastSCC.end();) {
202aaff3fb6SJin Xin Ng if ((*I)->isDead())
203aaff3fb6SJin Xin Ng NodesInLastSCC.erase(*I++);
204aaff3fb6SJin Xin Ng else
205aaff3fb6SJin Xin Ng EdgesOfLastSeenNodes += getLocalCalls((*I++)->getFunction());
206aaff3fb6SJin Xin Ng }
207aaff3fb6SJin Xin Ng
208aaff3fb6SJin Xin Ng // Check on nodes that may have got added to SCC
2093e8553aaSMircea Trofin for (const auto &N : *LastSCC) {
2103e8553aaSMircea Trofin assert(!N.isDead());
211aaff3fb6SJin Xin Ng auto I = NodesInLastSCC.insert(&N);
212aaff3fb6SJin Xin Ng if (I.second)
2133e8553aaSMircea Trofin EdgesOfLastSeenNodes += getLocalCalls(N.getFunction());
2143e8553aaSMircea Trofin }
215aaff3fb6SJin Xin Ng assert(NodeCount >= NodesInLastSCC.size());
2163e8553aaSMircea Trofin assert(EdgeCount >= EdgesOfLastSeenNodes);
217bdceefe9SMircea Trofin }
218bdceefe9SMircea Trofin
getLocalCalls(Function & F)219bdceefe9SMircea Trofin int64_t MLInlineAdvisor::getLocalCalls(Function &F) {
220f46dd19bSMircea Trofin return getCachedFPI(F).DirectCallsToDefinedFunctions;
221bdceefe9SMircea Trofin }
222bdceefe9SMircea Trofin
223bdceefe9SMircea Trofin // Update the internal state of the advisor, and force invalidate feature
224bdceefe9SMircea Trofin // analysis. Currently, we maintain minimal (and very simple) global state - the
225bdceefe9SMircea Trofin // number of functions and the number of static calls. We also keep track of the
226bdceefe9SMircea Trofin // total IR size in this module, to stop misbehaving policies at a certain bloat
227bdceefe9SMircea Trofin // factor (SizeIncreaseThreshold)
onSuccessfulInlining(const MLInlineAdvice & Advice,bool CalleeWasDeleted)228bdceefe9SMircea Trofin void MLInlineAdvisor::onSuccessfulInlining(const MLInlineAdvice &Advice,
229bdceefe9SMircea Trofin bool CalleeWasDeleted) {
230bdceefe9SMircea Trofin assert(!ForceStop);
231bdceefe9SMircea Trofin Function *Caller = Advice.getCaller();
232bdceefe9SMircea Trofin Function *Callee = Advice.getCallee();
233bdceefe9SMircea Trofin // The caller features aren't valid anymore.
2340d06b14fSMircea Trofin {
235*7ae92a69SMircea Trofin PreservedAnalyses PA = PreservedAnalyses::all();
236*7ae92a69SMircea Trofin PA.abandon<FunctionPropertiesAnalysis>();
237*7ae92a69SMircea Trofin PA.abandon<DominatorTreeAnalysis>();
238*7ae92a69SMircea Trofin PA.abandon<LoopAnalysis>();
2390d06b14fSMircea Trofin FAM.invalidate(*Caller, PA);
2400d06b14fSMircea Trofin }
24122a1f998SMircea Trofin Advice.updateCachedCallerFPI(FAM);
242bdceefe9SMircea Trofin int64_t IRSizeAfter =
243bdceefe9SMircea Trofin getIRSize(*Caller) + (CalleeWasDeleted ? 0 : Advice.CalleeIRSize);
244bdceefe9SMircea Trofin CurrentIRSize += IRSizeAfter - (Advice.CallerIRSize + Advice.CalleeIRSize);
245bdceefe9SMircea Trofin if (CurrentIRSize > SizeIncreaseThreshold * InitialIRSize)
246bdceefe9SMircea Trofin ForceStop = true;
247bdceefe9SMircea Trofin
248bdceefe9SMircea Trofin // We can delta-update module-wide features. We know the inlining only changed
249bdceefe9SMircea Trofin // the caller, and maybe the callee (by deleting the latter).
250bdceefe9SMircea Trofin // Nodes are simple to update.
251bdceefe9SMircea Trofin // For edges, we 'forget' the edges that the caller and callee used to have
252bdceefe9SMircea Trofin // before inlining, and add back what they currently have together.
253bdceefe9SMircea Trofin int64_t NewCallerAndCalleeEdges =
254f46dd19bSMircea Trofin getCachedFPI(*Caller).DirectCallsToDefinedFunctions;
255bdceefe9SMircea Trofin
256bdceefe9SMircea Trofin if (CalleeWasDeleted)
257bdceefe9SMircea Trofin --NodeCount;
258bdceefe9SMircea Trofin else
259418121c3STarindu Jayatilaka NewCallerAndCalleeEdges +=
260f46dd19bSMircea Trofin getCachedFPI(*Callee).DirectCallsToDefinedFunctions;
261bdceefe9SMircea Trofin EdgeCount += (NewCallerAndCalleeEdges - Advice.CallerAndCalleeEdges);
262bdceefe9SMircea Trofin assert(CurrentIRSize >= 0 && EdgeCount >= 0 && NodeCount >= 0);
263bdceefe9SMircea Trofin }
264bdceefe9SMircea Trofin
getModuleIRSize() const265bdceefe9SMircea Trofin int64_t MLInlineAdvisor::getModuleIRSize() const {
266bdceefe9SMircea Trofin int64_t Ret = 0;
267248d55afSMircea Trofin for (auto &F : M)
268bdceefe9SMircea Trofin if (!F.isDeclaration())
269bdceefe9SMircea Trofin Ret += getIRSize(F);
270bdceefe9SMircea Trofin return Ret;
271bdceefe9SMircea Trofin }
272bdceefe9SMircea Trofin
getCachedFPI(Function & F) const273f46dd19bSMircea Trofin FunctionPropertiesInfo &MLInlineAdvisor::getCachedFPI(Function &F) const {
274f46dd19bSMircea Trofin auto InsertPair =
275f46dd19bSMircea Trofin FPICache.insert(std::make_pair(&F, FunctionPropertiesInfo()));
276f46dd19bSMircea Trofin if (!InsertPair.second)
277f46dd19bSMircea Trofin return InsertPair.first->second;
278f46dd19bSMircea Trofin InsertPair.first->second = FAM.getResult<FunctionPropertiesAnalysis>(F);
279f46dd19bSMircea Trofin return InsertPair.first->second;
280f46dd19bSMircea Trofin }
281f46dd19bSMircea Trofin
getAdviceImpl(CallBase & CB)282e8049dc3SMircea Trofin std::unique_ptr<InlineAdvice> MLInlineAdvisor::getAdviceImpl(CallBase &CB) {
2837f24e574SMircea Trofin if (auto Skip = getSkipAdviceIfUnreachableCallsite(CB))
2847f24e574SMircea Trofin return Skip;
2857f24e574SMircea Trofin
286bdceefe9SMircea Trofin auto &Caller = *CB.getCaller();
287bdceefe9SMircea Trofin auto &Callee = *CB.getCalledFunction();
288bdceefe9SMircea Trofin
289bdceefe9SMircea Trofin auto GetAssumptionCache = [&](Function &F) -> AssumptionCache & {
290bdceefe9SMircea Trofin return FAM.getResult<AssumptionAnalysis>(F);
291bdceefe9SMircea Trofin };
292bdceefe9SMircea Trofin auto &TIR = FAM.getResult<TargetIRAnalysis>(Callee);
293bdceefe9SMircea Trofin auto &ORE = FAM.getResult<OptimizationRemarkEmitterAnalysis>(Caller);
294bdceefe9SMircea Trofin
295e8049dc3SMircea Trofin auto MandatoryKind = InlineAdvisor::getMandatoryKind(CB, FAM, ORE);
296bdceefe9SMircea Trofin // If this is a "never inline" case, there won't be any changes to internal
297bdceefe9SMircea Trofin // state we need to track, so we can just return the base InlineAdvice, which
298bdceefe9SMircea Trofin // will do nothing interesting.
299bdceefe9SMircea Trofin // Same thing if this is a recursive case.
300e8049dc3SMircea Trofin if (MandatoryKind == InlineAdvisor::MandatoryInliningKind::Never ||
301bdceefe9SMircea Trofin &Caller == &Callee)
302e8049dc3SMircea Trofin return getMandatoryAdvice(CB, false);
303bdceefe9SMircea Trofin
3045fe10263SMircea Trofin bool Mandatory =
305e8049dc3SMircea Trofin MandatoryKind == InlineAdvisor::MandatoryInliningKind::Always;
306bdceefe9SMircea Trofin
307bdceefe9SMircea Trofin // If we need to stop, we won't want to track anymore any state changes, so
308bdceefe9SMircea Trofin // we just return the base InlineAdvice, which acts as a noop.
309bdceefe9SMircea Trofin if (ForceStop) {
310bdceefe9SMircea Trofin ORE.emit([&] {
311bdceefe9SMircea Trofin return OptimizationRemarkMissed(DEBUG_TYPE, "ForceStop", &CB)
312bdceefe9SMircea Trofin << "Won't attempt inlining because module size grew too much.";
313bdceefe9SMircea Trofin });
314bdceefe9SMircea Trofin return std::make_unique<InlineAdvice>(this, CB, ORE, Mandatory);
315bdceefe9SMircea Trofin }
316bdceefe9SMircea Trofin
317bdceefe9SMircea Trofin int CostEstimate = 0;
318bdceefe9SMircea Trofin if (!Mandatory) {
319bdceefe9SMircea Trofin auto IsCallSiteInlinable =
320bdceefe9SMircea Trofin llvm::getInliningCostEstimate(CB, TIR, GetAssumptionCache);
321bdceefe9SMircea Trofin if (!IsCallSiteInlinable) {
322bdceefe9SMircea Trofin // We can't inline this for correctness reasons, so return the base
323bdceefe9SMircea Trofin // InlineAdvice, as we don't care about tracking any state changes (which
324bdceefe9SMircea Trofin // won't happen).
325bdceefe9SMircea Trofin return std::make_unique<InlineAdvice>(this, CB, ORE, false);
326bdceefe9SMircea Trofin }
327bdceefe9SMircea Trofin CostEstimate = *IsCallSiteInlinable;
328bdceefe9SMircea Trofin }
329bdceefe9SMircea Trofin
33099f00635SJacob Hegna const auto CostFeatures =
33199f00635SJacob Hegna llvm::getInliningCostFeatures(CB, TIR, GetAssumptionCache);
33299f00635SJacob Hegna if (!CostFeatures) {
33399f00635SJacob Hegna return std::make_unique<InlineAdvice>(this, CB, ORE, false);
33499f00635SJacob Hegna }
33599f00635SJacob Hegna
336bdceefe9SMircea Trofin if (Mandatory)
337e8049dc3SMircea Trofin return getMandatoryAdvice(CB, true);
338bdceefe9SMircea Trofin
339bdceefe9SMircea Trofin auto NrCtantParams = 0;
340bdceefe9SMircea Trofin for (auto I = CB.arg_begin(), E = CB.arg_end(); I != E; ++I) {
341bdceefe9SMircea Trofin NrCtantParams += (isa<Constant>(*I));
342bdceefe9SMircea Trofin }
343bdceefe9SMircea Trofin
344f46dd19bSMircea Trofin auto &CallerBefore = getCachedFPI(Caller);
345f46dd19bSMircea Trofin auto &CalleeBefore = getCachedFPI(Callee);
346bdceefe9SMircea Trofin
347059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(FeatureIndex::CalleeBasicBlockCount) =
348059e0347SMircea Trofin CalleeBefore.BasicBlockCount;
349059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(FeatureIndex::CallSiteHeight) =
350248d55afSMircea Trofin getInitialFunctionLevel(Caller);
351059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(FeatureIndex::NodeCount) = NodeCount;
352059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(FeatureIndex::NrCtantParams) = NrCtantParams;
353059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(FeatureIndex::EdgeCount) = EdgeCount;
354059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(FeatureIndex::CallerUsers) =
355059e0347SMircea Trofin CallerBefore.Uses;
356059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(
357059e0347SMircea Trofin FeatureIndex::CallerConditionallyExecutedBlocks) =
358059e0347SMircea Trofin CallerBefore.BlocksReachedFromConditionalInstruction;
359059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(FeatureIndex::CallerBasicBlockCount) =
360059e0347SMircea Trofin CallerBefore.BasicBlockCount;
361059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(
362059e0347SMircea Trofin FeatureIndex::CalleeConditionallyExecutedBlocks) =
363059e0347SMircea Trofin CalleeBefore.BlocksReachedFromConditionalInstruction;
364059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(FeatureIndex::CalleeUsers) =
365059e0347SMircea Trofin CalleeBefore.Uses;
366059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(FeatureIndex::CostEstimate) = CostEstimate;
36799f00635SJacob Hegna
36899f00635SJacob Hegna // Add the cost features
36999f00635SJacob Hegna for (size_t I = 0;
37099f00635SJacob Hegna I < static_cast<size_t>(InlineCostFeatureIndex::NumberOfFeatures); ++I) {
371059e0347SMircea Trofin *ModelRunner->getTensor<int64_t>(inlineCostFeatureToMlFeature(
372059e0347SMircea Trofin static_cast<InlineCostFeatureIndex>(I))) = CostFeatures->at(I);
37399f00635SJacob Hegna }
37499f00635SJacob Hegna
375bdceefe9SMircea Trofin return getAdviceFromModel(CB, ORE);
376bdceefe9SMircea Trofin }
377bdceefe9SMircea Trofin
378bdceefe9SMircea Trofin std::unique_ptr<MLInlineAdvice>
getAdviceFromModel(CallBase & CB,OptimizationRemarkEmitter & ORE)379bdceefe9SMircea Trofin MLInlineAdvisor::getAdviceFromModel(CallBase &CB,
380bdceefe9SMircea Trofin OptimizationRemarkEmitter &ORE) {
381059e0347SMircea Trofin return std::make_unique<MLInlineAdvice>(
382059e0347SMircea Trofin this, CB, ORE, static_cast<bool>(ModelRunner->evaluate<int64_t>()));
383bdceefe9SMircea Trofin }
384bdceefe9SMircea Trofin
3857f24e574SMircea Trofin std::unique_ptr<InlineAdvice>
getSkipAdviceIfUnreachableCallsite(CallBase & CB)3867f24e574SMircea Trofin MLInlineAdvisor::getSkipAdviceIfUnreachableCallsite(CallBase &CB) {
3877f24e574SMircea Trofin if (!FAM.getResult<DominatorTreeAnalysis>(*CB.getCaller())
3887f24e574SMircea Trofin .isReachableFromEntry(CB.getParent()))
3897f24e574SMircea Trofin return std::make_unique<InlineAdvice>(this, CB, getCallerORE(CB), false);
3907f24e574SMircea Trofin return nullptr;
3917f24e574SMircea Trofin }
3927f24e574SMircea Trofin
getMandatoryAdvice(CallBase & CB,bool Advice)393e8049dc3SMircea Trofin std::unique_ptr<InlineAdvice> MLInlineAdvisor::getMandatoryAdvice(CallBase &CB,
394e8049dc3SMircea Trofin bool Advice) {
395e8049dc3SMircea Trofin // Make sure we track inlinings in all cases - mandatory or not.
3967f24e574SMircea Trofin if (auto Skip = getSkipAdviceIfUnreachableCallsite(CB))
3977f24e574SMircea Trofin return Skip;
398e8049dc3SMircea Trofin if (Advice && !ForceStop)
399e8049dc3SMircea Trofin return getMandatoryAdviceImpl(CB);
400e8049dc3SMircea Trofin
401e8049dc3SMircea Trofin // If this is a "never inline" case, there won't be any changes to internal
402e8049dc3SMircea Trofin // state we need to track, so we can just return the base InlineAdvice, which
403e8049dc3SMircea Trofin // will do nothing interesting.
404e8049dc3SMircea Trofin // Same if we are forced to stop - we don't track anymore.
405e8049dc3SMircea Trofin return std::make_unique<InlineAdvice>(this, CB, getCallerORE(CB), Advice);
406e8049dc3SMircea Trofin }
407e8049dc3SMircea Trofin
408bdceefe9SMircea Trofin std::unique_ptr<MLInlineAdvice>
getMandatoryAdviceImpl(CallBase & CB)409e8049dc3SMircea Trofin MLInlineAdvisor::getMandatoryAdviceImpl(CallBase &CB) {
410e8049dc3SMircea Trofin return std::make_unique<MLInlineAdvice>(this, CB, getCallerORE(CB), true);
411bdceefe9SMircea Trofin }
412bdceefe9SMircea Trofin
print(raw_ostream & OS) const4137e7021caSMircea Trofin void MLInlineAdvisor::print(raw_ostream &OS) const {
4147e7021caSMircea Trofin OS << "[MLInlineAdvisor] Nodes: " << NodeCount << " Edges: " << EdgeCount
415aaff3fb6SJin Xin Ng << " EdgesOfLastSeenNodes: " << EdgesOfLastSeenNodes << "\n";
4167e7021caSMircea Trofin OS << "[MLInlineAdvisor] FPI:\n";
4177e7021caSMircea Trofin for (auto I : FPICache) {
4187e7021caSMircea Trofin OS << I.getFirst()->getName() << ":\n";
4197e7021caSMircea Trofin I.getSecond().print(OS);
4207e7021caSMircea Trofin OS << "\n";
4217e7021caSMircea Trofin }
4227e7021caSMircea Trofin OS << "\n";
4237e7021caSMircea Trofin }
4247e7021caSMircea Trofin
MLInlineAdvice(MLInlineAdvisor * Advisor,CallBase & CB,OptimizationRemarkEmitter & ORE,bool Recommendation)425f46dd19bSMircea Trofin MLInlineAdvice::MLInlineAdvice(MLInlineAdvisor *Advisor, CallBase &CB,
426f46dd19bSMircea Trofin OptimizationRemarkEmitter &ORE,
427f46dd19bSMircea Trofin bool Recommendation)
428f46dd19bSMircea Trofin : InlineAdvice(Advisor, CB, ORE, Recommendation),
429f46dd19bSMircea Trofin CallerIRSize(Advisor->isForcedToStop() ? 0 : Advisor->getIRSize(*Caller)),
430f46dd19bSMircea Trofin CalleeIRSize(Advisor->isForcedToStop() ? 0 : Advisor->getIRSize(*Callee)),
431f46dd19bSMircea Trofin CallerAndCalleeEdges(Advisor->isForcedToStop()
432f46dd19bSMircea Trofin ? 0
433f46dd19bSMircea Trofin : (Advisor->getLocalCalls(*Caller) +
434f46dd19bSMircea Trofin Advisor->getLocalCalls(*Callee))),
435f46dd19bSMircea Trofin PreInlineCallerFPI(Advisor->getCachedFPI(*Caller)) {
436f46dd19bSMircea Trofin if (Recommendation)
437f46dd19bSMircea Trofin FPU.emplace(Advisor->getCachedFPI(*getCaller()), CB);
438f46dd19bSMircea Trofin }
439f46dd19bSMircea Trofin
reportContextForRemark(DiagnosticInfoOptimizationBase & OR)440bdceefe9SMircea Trofin void MLInlineAdvice::reportContextForRemark(
441bdceefe9SMircea Trofin DiagnosticInfoOptimizationBase &OR) {
442bdceefe9SMircea Trofin using namespace ore;
443bdceefe9SMircea Trofin OR << NV("Callee", Callee->getName());
444bdceefe9SMircea Trofin for (size_t I = 0; I < NumberOfFeatures; ++I)
445c35ad9eeSMircea Trofin OR << NV(FeatureMap[I].name(),
446059e0347SMircea Trofin *getAdvisor()->getModelRunner().getTensor<int64_t>(I));
447bdceefe9SMircea Trofin OR << NV("ShouldInline", isInliningRecommended());
448bdceefe9SMircea Trofin }
449bdceefe9SMircea Trofin
updateCachedCallerFPI(FunctionAnalysisManager & FAM) const45022a1f998SMircea Trofin void MLInlineAdvice::updateCachedCallerFPI(FunctionAnalysisManager &FAM) const {
45122a1f998SMircea Trofin FPU->finish(FAM);
452f46dd19bSMircea Trofin }
453f46dd19bSMircea Trofin
recordInliningImpl()454bdceefe9SMircea Trofin void MLInlineAdvice::recordInliningImpl() {
455bdceefe9SMircea Trofin ORE.emit([&]() {
456bdceefe9SMircea Trofin OptimizationRemark R(DEBUG_TYPE, "InliningSuccess", DLoc, Block);
457bdceefe9SMircea Trofin reportContextForRemark(R);
458bdceefe9SMircea Trofin return R;
459bdceefe9SMircea Trofin });
460bdceefe9SMircea Trofin getAdvisor()->onSuccessfulInlining(*this, /*CalleeWasDeleted*/ false);
461bdceefe9SMircea Trofin }
462bdceefe9SMircea Trofin
recordInliningWithCalleeDeletedImpl()463bdceefe9SMircea Trofin void MLInlineAdvice::recordInliningWithCalleeDeletedImpl() {
464bdceefe9SMircea Trofin ORE.emit([&]() {
465bdceefe9SMircea Trofin OptimizationRemark R(DEBUG_TYPE, "InliningSuccessWithCalleeDeleted", DLoc,
466bdceefe9SMircea Trofin Block);
467bdceefe9SMircea Trofin reportContextForRemark(R);
468bdceefe9SMircea Trofin return R;
469bdceefe9SMircea Trofin });
470bdceefe9SMircea Trofin getAdvisor()->onSuccessfulInlining(*this, /*CalleeWasDeleted*/ true);
471bdceefe9SMircea Trofin }
472bdceefe9SMircea Trofin
recordUnsuccessfulInliningImpl(const InlineResult & Result)473bdceefe9SMircea Trofin void MLInlineAdvice::recordUnsuccessfulInliningImpl(
474bdceefe9SMircea Trofin const InlineResult &Result) {
475f46dd19bSMircea Trofin getAdvisor()->getCachedFPI(*Caller) = PreInlineCallerFPI;
476bdceefe9SMircea Trofin ORE.emit([&]() {
477bdceefe9SMircea Trofin OptimizationRemarkMissed R(DEBUG_TYPE, "InliningAttemptedAndUnsuccessful",
478bdceefe9SMircea Trofin DLoc, Block);
479bdceefe9SMircea Trofin reportContextForRemark(R);
480bdceefe9SMircea Trofin return R;
481bdceefe9SMircea Trofin });
482bdceefe9SMircea Trofin }
recordUnattemptedInliningImpl()483bdceefe9SMircea Trofin void MLInlineAdvice::recordUnattemptedInliningImpl() {
484f46dd19bSMircea Trofin assert(!FPU);
485bdceefe9SMircea Trofin ORE.emit([&]() {
486bdceefe9SMircea Trofin OptimizationRemarkMissed R(DEBUG_TYPE, "IniningNotAttempted", DLoc, Block);
487bdceefe9SMircea Trofin reportContextForRemark(R);
488bdceefe9SMircea Trofin return R;
489bdceefe9SMircea Trofin });
490bdceefe9SMircea Trofin }
491