//===- FunctionPropertiesAnalysis.cpp - Function Properties Analysis ------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file defines the FunctionPropertiesInfo and FunctionPropertiesAnalysis
// classes used to extract function properties.
//
//===----------------------------------------------------------------------===//
13418121c3STarindu Jayatilaka 
#include "llvm/Analysis/FunctionPropertiesAnalysis.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/ADT/SetVector.h"
#include "llvm/Analysis/LoopInfo.h"
#include "llvm/IR/CFG.h"
#include "llvm/IR/Dominators.h"
#include "llvm/IR/Instructions.h"
#include <algorithm>
#include <cassert>
#include <cstdint>
#include <deque>

using namespace llvm;
24418121c3STarindu Jayatilaka 
25f46dd19bSMircea Trofin namespace {
getNrBlocksFromCond(const BasicBlock & BB)26f46dd19bSMircea Trofin int64_t getNrBlocksFromCond(const BasicBlock &BB) {
27f46dd19bSMircea Trofin   int64_t Ret = 0;
28f46dd19bSMircea Trofin   if (const auto *BI = dyn_cast<BranchInst>(BB.getTerminator())) {
29f46dd19bSMircea Trofin     if (BI->isConditional())
30f46dd19bSMircea Trofin       Ret += BI->getNumSuccessors();
31f46dd19bSMircea Trofin   } else if (const auto *SI = dyn_cast<SwitchInst>(BB.getTerminator())) {
32f46dd19bSMircea Trofin     Ret += (SI->getNumCases() + (nullptr != SI->getDefaultDest()));
33f46dd19bSMircea Trofin   }
34f46dd19bSMircea Trofin   return Ret;
35f46dd19bSMircea Trofin }
36f46dd19bSMircea Trofin 
getUses(const Function & F)37f46dd19bSMircea Trofin int64_t getUses(const Function &F) {
38f46dd19bSMircea Trofin   return ((!F.hasLocalLinkage()) ? 1 : 0) + F.getNumUses();
39f46dd19bSMircea Trofin }
40f46dd19bSMircea Trofin } // namespace
41f46dd19bSMircea Trofin 
reIncludeBB(const BasicBlock & BB)4222a1f998SMircea Trofin void FunctionPropertiesInfo::reIncludeBB(const BasicBlock &BB) {
43f46dd19bSMircea Trofin   updateForBB(BB, +1);
44f46dd19bSMircea Trofin }
45f46dd19bSMircea Trofin 
updateForBB(const BasicBlock & BB,int64_t Direction)46f46dd19bSMircea Trofin void FunctionPropertiesInfo::updateForBB(const BasicBlock &BB,
47f46dd19bSMircea Trofin                                          int64_t Direction) {
48f46dd19bSMircea Trofin   assert(Direction == 1 || Direction == -1);
49f46dd19bSMircea Trofin   BasicBlockCount += Direction;
50f46dd19bSMircea Trofin   BlocksReachedFromConditionalInstruction +=
51f46dd19bSMircea Trofin       (Direction * getNrBlocksFromCond(BB));
52f46dd19bSMircea Trofin   for (const auto &I : BB) {
53f46dd19bSMircea Trofin     if (auto *CS = dyn_cast<CallBase>(&I)) {
54f46dd19bSMircea Trofin       const auto *Callee = CS->getCalledFunction();
55f46dd19bSMircea Trofin       if (Callee && !Callee->isIntrinsic() && !Callee->isDeclaration())
56f46dd19bSMircea Trofin         DirectCallsToDefinedFunctions += Direction;
57f46dd19bSMircea Trofin     }
58f46dd19bSMircea Trofin     if (I.getOpcode() == Instruction::Load) {
59f46dd19bSMircea Trofin       LoadInstCount += Direction;
60f46dd19bSMircea Trofin     } else if (I.getOpcode() == Instruction::Store) {
61f46dd19bSMircea Trofin       StoreInstCount += Direction;
62f46dd19bSMircea Trofin     }
63f46dd19bSMircea Trofin   }
64f46dd19bSMircea Trofin   TotalInstructionCount += Direction * BB.sizeWithoutDebug();
65f46dd19bSMircea Trofin }
66f46dd19bSMircea Trofin 
updateAggregateStats(const Function & F,const LoopInfo & LI)67f46dd19bSMircea Trofin void FunctionPropertiesInfo::updateAggregateStats(const Function &F,
68f46dd19bSMircea Trofin                                                   const LoopInfo &LI) {
69f46dd19bSMircea Trofin 
70f46dd19bSMircea Trofin   Uses = getUses(F);
71f46dd19bSMircea Trofin   TopLevelLoopCount = llvm::size(LI);
7222a1f998SMircea Trofin   MaxLoopDepth = 0;
7322a1f998SMircea Trofin   std::deque<const Loop *> Worklist;
7422a1f998SMircea Trofin   llvm::append_range(Worklist, LI);
7522a1f998SMircea Trofin   while (!Worklist.empty()) {
7622a1f998SMircea Trofin     const auto *L = Worklist.front();
7722a1f998SMircea Trofin     MaxLoopDepth =
7822a1f998SMircea Trofin         std::max(MaxLoopDepth, static_cast<int64_t>(L->getLoopDepth()));
7922a1f998SMircea Trofin     Worklist.pop_front();
8022a1f998SMircea Trofin     llvm::append_range(Worklist, L->getSubLoops());
8122a1f998SMircea Trofin   }
82f46dd19bSMircea Trofin }
83f46dd19bSMircea Trofin 
getFunctionPropertiesInfo(const Function & F,FunctionAnalysisManager & FAM)8422a1f998SMircea Trofin FunctionPropertiesInfo FunctionPropertiesInfo::getFunctionPropertiesInfo(
8522a1f998SMircea Trofin     const Function &F, FunctionAnalysisManager &FAM) {
86418121c3STarindu Jayatilaka 
872f56046dSTarindu Jayatilaka   FunctionPropertiesInfo FPI;
8822a1f998SMircea Trofin   // The const casts are due to the getResult API - there's no mutation of F.
8922a1f998SMircea Trofin   const auto &LI = FAM.getResult<LoopAnalysis>(const_cast<Function &>(F));
9022a1f998SMircea Trofin   const auto &DT =
9122a1f998SMircea Trofin       FAM.getResult<DominatorTreeAnalysis>(const_cast<Function &>(F));
92f46dd19bSMircea Trofin   for (const auto &BB : F)
9322a1f998SMircea Trofin     if (DT.isReachableFromEntry(&BB))
9422a1f998SMircea Trofin       FPI.reIncludeBB(BB);
95f46dd19bSMircea Trofin   FPI.updateAggregateStats(F, LI);
962f56046dSTarindu Jayatilaka   return FPI;
972f56046dSTarindu Jayatilaka }
982f56046dSTarindu Jayatilaka 
print(raw_ostream & OS) const99ee6f0e10STarindu Jayatilaka void FunctionPropertiesInfo::print(raw_ostream &OS) const {
100ee6f0e10STarindu Jayatilaka   OS << "BasicBlockCount: " << BasicBlockCount << "\n"
101ee6f0e10STarindu Jayatilaka      << "BlocksReachedFromConditionalInstruction: "
102ee6f0e10STarindu Jayatilaka      << BlocksReachedFromConditionalInstruction << "\n"
103ee6f0e10STarindu Jayatilaka      << "Uses: " << Uses << "\n"
104ee6f0e10STarindu Jayatilaka      << "DirectCallsToDefinedFunctions: " << DirectCallsToDefinedFunctions
10506283661STarindu Jayatilaka      << "\n"
10606283661STarindu Jayatilaka      << "LoadInstCount: " << LoadInstCount << "\n"
10706283661STarindu Jayatilaka      << "StoreInstCount: " << StoreInstCount << "\n"
10806283661STarindu Jayatilaka      << "MaxLoopDepth: " << MaxLoopDepth << "\n"
109f46dd19bSMircea Trofin      << "TopLevelLoopCount: " << TopLevelLoopCount << "\n"
110f46dd19bSMircea Trofin      << "TotalInstructionCount: " << TotalInstructionCount << "\n\n";
111ee6f0e10STarindu Jayatilaka }
112ee6f0e10STarindu Jayatilaka 
1132f56046dSTarindu Jayatilaka AnalysisKey FunctionPropertiesAnalysis::Key;
1142f56046dSTarindu Jayatilaka 
11549942d59SMircea Trofin FunctionPropertiesInfo
run(Function & F,FunctionAnalysisManager & FAM)1162f56046dSTarindu Jayatilaka FunctionPropertiesAnalysis::run(Function &F, FunctionAnalysisManager &FAM) {
11722a1f998SMircea Trofin   return FunctionPropertiesInfo::getFunctionPropertiesInfo(F, FAM);
118418121c3STarindu Jayatilaka }
119ee6f0e10STarindu Jayatilaka 
120ee6f0e10STarindu Jayatilaka PreservedAnalyses
run(Function & F,FunctionAnalysisManager & AM)121ee6f0e10STarindu Jayatilaka FunctionPropertiesPrinterPass::run(Function &F, FunctionAnalysisManager &AM) {
122ee6f0e10STarindu Jayatilaka   OS << "Printing analysis results of CFA for function "
123ee6f0e10STarindu Jayatilaka      << "'" << F.getName() << "':"
124ee6f0e10STarindu Jayatilaka      << "\n";
125ee6f0e10STarindu Jayatilaka   AM.getResult<FunctionPropertiesAnalysis>(F).print(OS);
126ee6f0e10STarindu Jayatilaka   return PreservedAnalyses::all();
127ee6f0e10STarindu Jayatilaka }
128f46dd19bSMircea Trofin 
FunctionPropertiesUpdater(FunctionPropertiesInfo & FPI,const CallBase & CB)129f46dd19bSMircea Trofin FunctionPropertiesUpdater::FunctionPropertiesUpdater(
130f46dd19bSMircea Trofin     FunctionPropertiesInfo &FPI, const CallBase &CB)
131f46dd19bSMircea Trofin     : FPI(FPI), CallSiteBB(*CB.getParent()), Caller(*CallSiteBB.getParent()) {
132*3f8e4169SMircea Trofin   assert(isa<CallInst>(CB) || isa<InvokeInst>(CB));
133f46dd19bSMircea Trofin   // For BBs that are likely to change, we subtract from feature totals their
134f46dd19bSMircea Trofin   // contribution. Some features, like max loop counts or depths, are left
135f46dd19bSMircea Trofin   // invalid, as they will be updated post-inlining.
136f46dd19bSMircea Trofin   SmallPtrSet<const BasicBlock *, 4> LikelyToChangeBBs;
137f46dd19bSMircea Trofin   // The CB BB will change - it'll either be split or the callee's body (single
138f46dd19bSMircea Trofin   // BB) will be pasted in.
139f46dd19bSMircea Trofin   LikelyToChangeBBs.insert(&CallSiteBB);
140f46dd19bSMircea Trofin 
141f46dd19bSMircea Trofin   // The caller's entry BB may change due to new alloca instructions.
142f46dd19bSMircea Trofin   LikelyToChangeBBs.insert(&*Caller.begin());
143f46dd19bSMircea Trofin 
144f46dd19bSMircea Trofin   // The successors may become unreachable in the case of `invoke` inlining.
145f46dd19bSMircea Trofin   // We track successors separately, too, because they form a boundary, together
146f46dd19bSMircea Trofin   // with the CB BB ('Entry') between which the inlined callee will be pasted.
147f46dd19bSMircea Trofin   Successors.insert(succ_begin(&CallSiteBB), succ_end(&CallSiteBB));
148b8c39eb2SMircea Trofin 
149*3f8e4169SMircea Trofin   // Inlining only handles invoke and calls. If this is an invoke, and inlining
150*3f8e4169SMircea Trofin   // it pulls another invoke, the original landing pad may get split, so as to
151*3f8e4169SMircea Trofin   // share its content with other potential users. So the edge up to which we
152*3f8e4169SMircea Trofin   // need to invalidate and then re-account BB data is the successors of the
153*3f8e4169SMircea Trofin   // current landing pad. We can leave the current lp, too - if it doesn't get
154*3f8e4169SMircea Trofin   // split, then it will be the place traversal stops. Either way, the
155*3f8e4169SMircea Trofin   // discounted BBs will be checked if reachable and re-added.
156*3f8e4169SMircea Trofin   if (const auto *II = dyn_cast<InvokeInst>(&CB)) {
157*3f8e4169SMircea Trofin     const auto *UnwindDest = II->getUnwindDest();
158*3f8e4169SMircea Trofin     Successors.insert(succ_begin(UnwindDest), succ_end(UnwindDest));
159*3f8e4169SMircea Trofin   }
160*3f8e4169SMircea Trofin 
161b8c39eb2SMircea Trofin   // Exclude the CallSiteBB, if it happens to be its own successor (1-BB loop).
162b8c39eb2SMircea Trofin   // We are only interested in BBs the graph moves past the callsite BB to
163b8c39eb2SMircea Trofin   // define the frontier past which we don't want to re-process BBs. Including
164b8c39eb2SMircea Trofin   // the callsite BB in this case would prematurely stop the traversal in
165b8c39eb2SMircea Trofin   // finish().
166b8c39eb2SMircea Trofin   Successors.erase(&CallSiteBB);
167b8c39eb2SMircea Trofin 
168f46dd19bSMircea Trofin   for (const auto *BB : Successors)
169f46dd19bSMircea Trofin     LikelyToChangeBBs.insert(BB);
170f46dd19bSMircea Trofin 
171f46dd19bSMircea Trofin   // Commit the change. While some of the BBs accounted for above may play dual
172f46dd19bSMircea Trofin   // role - e.g. caller's entry BB may be the same as the callsite BB - set
173f46dd19bSMircea Trofin   // insertion semantics make sure we account them once. This needs to be
174f46dd19bSMircea Trofin   // followed in `finish`, too.
175f46dd19bSMircea Trofin   for (const auto *BB : LikelyToChangeBBs)
176f46dd19bSMircea Trofin     FPI.updateForBB(*BB, -1);
177f46dd19bSMircea Trofin }
178f46dd19bSMircea Trofin 
finish(FunctionAnalysisManager & FAM) const17922a1f998SMircea Trofin void FunctionPropertiesUpdater::finish(FunctionAnalysisManager &FAM) const {
180f46dd19bSMircea Trofin   // Update feature values from the BBs that were copied from the callee, or
181f46dd19bSMircea Trofin   // might have been modified because of inlining. The latter have been
182f46dd19bSMircea Trofin   // subtracted in the FunctionPropertiesUpdater ctor.
18322a1f998SMircea Trofin   // There could be successors that were reached before but now are only
18422a1f998SMircea Trofin   // reachable from elsewhere in the CFG.
185*3f8e4169SMircea Trofin   // One example is the following diamond CFG (lines are arrows pointing down):
18622a1f998SMircea Trofin   //    A
18722a1f998SMircea Trofin   //  /   \
18822a1f998SMircea Trofin   // B     C
189*3f8e4169SMircea Trofin   // |     |
190*3f8e4169SMircea Trofin   // |     D
191*3f8e4169SMircea Trofin   // |     |
192*3f8e4169SMircea Trofin   // |     E
19322a1f998SMircea Trofin   //  \   /
194*3f8e4169SMircea Trofin   //    F
19522a1f998SMircea Trofin   // There's a call site in C that is inlined. Upon doing that, it turns out
19622a1f998SMircea Trofin   // it expands to
19722a1f998SMircea Trofin   //   call void @llvm.trap()
19822a1f998SMircea Trofin   //   unreachable
199*3f8e4169SMircea Trofin   // F isn't reachable from C anymore, but we did discount it when we set up
20022a1f998SMircea Trofin   // FunctionPropertiesUpdater, so we need to re-include it here.
201*3f8e4169SMircea Trofin   // At the same time, D and E were reachable before, but now are not anymore,
202*3f8e4169SMircea Trofin   // so we need to leave D out (we discounted it at setup), and explicitly
203*3f8e4169SMircea Trofin   // remove E.
204*3f8e4169SMircea Trofin   SetVector<const BasicBlock *> Reinclude;
205*3f8e4169SMircea Trofin   SetVector<const BasicBlock *> Unreachable;
20622a1f998SMircea Trofin   const auto &DT =
20722a1f998SMircea Trofin       FAM.getResult<DominatorTreeAnalysis>(const_cast<Function &>(Caller));
20822a1f998SMircea Trofin 
209*3f8e4169SMircea Trofin   if (&CallSiteBB != &*Caller.begin())
210*3f8e4169SMircea Trofin     Reinclude.insert(&*Caller.begin());
211*3f8e4169SMircea Trofin 
212*3f8e4169SMircea Trofin   // Distribute the successors to the 2 buckets.
213*3f8e4169SMircea Trofin   for (const auto *Succ : Successors)
214*3f8e4169SMircea Trofin     if (DT.isReachableFromEntry(Succ))
215*3f8e4169SMircea Trofin       Reinclude.insert(Succ);
216*3f8e4169SMircea Trofin     else
217*3f8e4169SMircea Trofin       Unreachable.insert(Succ);
218*3f8e4169SMircea Trofin 
219*3f8e4169SMircea Trofin   // For reinclusion, we want to stop at the reachable successors, who are at
220*3f8e4169SMircea Trofin   // the beginning of the worklist; but, starting from the callsite bb and
221*3f8e4169SMircea Trofin   // ending at those successors, we also want to perform a traversal.
222*3f8e4169SMircea Trofin   // IncludeSuccessorsMark is the index after which we include successors.
223*3f8e4169SMircea Trofin   const auto IncludeSuccessorsMark = Reinclude.size();
224*3f8e4169SMircea Trofin   bool CSInsertion = Reinclude.insert(&CallSiteBB);
22522a1f998SMircea Trofin   (void)CSInsertion;
22622a1f998SMircea Trofin   assert(CSInsertion);
227*3f8e4169SMircea Trofin   for (size_t I = 0; I < Reinclude.size(); ++I) {
228*3f8e4169SMircea Trofin     const auto *BB = Reinclude[I];
22922a1f998SMircea Trofin     FPI.reIncludeBB(*BB);
230*3f8e4169SMircea Trofin     if (I >= IncludeSuccessorsMark)
231*3f8e4169SMircea Trofin       Reinclude.insert(succ_begin(BB), succ_end(BB));
232*3f8e4169SMircea Trofin   }
233*3f8e4169SMircea Trofin 
234*3f8e4169SMircea Trofin   // For exclusion, we don't need to exclude the set of BBs that were successors
235*3f8e4169SMircea Trofin   // before and are now unreachable, because we already did that at setup. For
236*3f8e4169SMircea Trofin   // the rest, as long as a successor is unreachable, we want to explicitly
237*3f8e4169SMircea Trofin   // exclude it.
238*3f8e4169SMircea Trofin   const auto AlreadyExcludedMark = Unreachable.size();
239*3f8e4169SMircea Trofin   for (size_t I = 0; I < Unreachable.size(); ++I) {
240*3f8e4169SMircea Trofin     const auto *U = Unreachable[I];
241*3f8e4169SMircea Trofin     if (I >= AlreadyExcludedMark)
242*3f8e4169SMircea Trofin       FPI.updateForBB(*U, -1);
243*3f8e4169SMircea Trofin     for (const auto *Succ : successors(U))
244*3f8e4169SMircea Trofin       if (!DT.isReachableFromEntry(Succ))
245*3f8e4169SMircea Trofin         Unreachable.insert(Succ);
246f46dd19bSMircea Trofin   }
24722a1f998SMircea Trofin 
24822a1f998SMircea Trofin   const auto &LI = FAM.getResult<LoopAnalysis>(const_cast<Function &>(Caller));
249f46dd19bSMircea Trofin   FPI.updateAggregateStats(Caller, LI);
25022a1f998SMircea Trofin   assert(FPI == FunctionPropertiesInfo::getFunctionPropertiesInfo(Caller, FAM));
251f46dd19bSMircea Trofin }
252