12cab237bSDimitry Andric //===- IfConversion.cpp - Machine code if conversion pass -----------------===//
2f22ef01cSRoman Divacky //
3f22ef01cSRoman Divacky // The LLVM Compiler Infrastructure
4f22ef01cSRoman Divacky //
5f22ef01cSRoman Divacky // This file is distributed under the University of Illinois Open Source
6f22ef01cSRoman Divacky // License. See LICENSE.TXT for details.
7f22ef01cSRoman Divacky //
8f22ef01cSRoman Divacky //===----------------------------------------------------------------------===//
9f22ef01cSRoman Divacky //
103ca95b02SDimitry Andric // This file implements the machine instruction level if-conversion pass, which
113ca95b02SDimitry Andric // tries to convert conditional branches into predicated instructions.
12f22ef01cSRoman Divacky //
13f22ef01cSRoman Divacky //===----------------------------------------------------------------------===//
14f22ef01cSRoman Divacky
15139f7f9bSDimitry Andric #include "BranchFolding.h"
16139f7f9bSDimitry Andric #include "llvm/ADT/STLExtras.h"
17d88c1a5aSDimitry Andric #include "llvm/ADT/ScopeExit.h"
18139f7f9bSDimitry Andric #include "llvm/ADT/SmallSet.h"
192cab237bSDimitry Andric #include "llvm/ADT/SmallVector.h"
202cab237bSDimitry Andric #include "llvm/ADT/SparseSet.h"
21139f7f9bSDimitry Andric #include "llvm/ADT/Statistic.h"
222cab237bSDimitry Andric #include "llvm/ADT/iterator_range.h"
2391bc56edSDimitry Andric #include "llvm/CodeGen/LivePhysRegs.h"
242cab237bSDimitry Andric #include "llvm/CodeGen/MachineBasicBlock.h"
2539d628a0SDimitry Andric #include "llvm/CodeGen/MachineBlockFrequencyInfo.h"
266122f3e6SDimitry Andric #include "llvm/CodeGen/MachineBranchProbabilityInfo.h"
272cab237bSDimitry Andric #include "llvm/CodeGen/MachineFunction.h"
28f22ef01cSRoman Divacky #include "llvm/CodeGen/MachineFunctionPass.h"
292cab237bSDimitry Andric #include "llvm/CodeGen/MachineInstr.h"
30139f7f9bSDimitry Andric #include "llvm/CodeGen/MachineInstrBuilder.h"
31139f7f9bSDimitry Andric #include "llvm/CodeGen/MachineModuleInfo.h"
322cab237bSDimitry Andric #include "llvm/CodeGen/MachineOperand.h"
337ae0e2c9SDimitry Andric #include "llvm/CodeGen/MachineRegisterInfo.h"
342cab237bSDimitry Andric #include "llvm/CodeGen/TargetInstrInfo.h"
352cab237bSDimitry Andric #include "llvm/CodeGen/TargetLowering.h"
362cab237bSDimitry Andric #include "llvm/CodeGen/TargetRegisterInfo.h"
37f785676fSDimitry Andric #include "llvm/CodeGen/TargetSchedule.h"
382cab237bSDimitry Andric #include "llvm/CodeGen/TargetSubtargetInfo.h"
392cab237bSDimitry Andric #include "llvm/IR/DebugLoc.h"
402cab237bSDimitry Andric #include "llvm/MC/MCRegisterInfo.h"
412cab237bSDimitry Andric #include "llvm/Pass.h"
422cab237bSDimitry Andric #include "llvm/Support/BranchProbability.h"
43f22ef01cSRoman Divacky #include "llvm/Support/CommandLine.h"
44f22ef01cSRoman Divacky #include "llvm/Support/Debug.h"
45f22ef01cSRoman Divacky #include "llvm/Support/ErrorHandling.h"
46f22ef01cSRoman Divacky #include "llvm/Support/raw_ostream.h"
477d523365SDimitry Andric #include <algorithm>
482cab237bSDimitry Andric #include <cassert>
492cab237bSDimitry Andric #include <functional>
502cab237bSDimitry Andric #include <iterator>
512cab237bSDimitry Andric #include <memory>
523ca95b02SDimitry Andric #include <utility>
532cab237bSDimitry Andric #include <vector>
54f785676fSDimitry Andric
55f22ef01cSRoman Divacky using namespace llvm;
56f22ef01cSRoman Divacky
57302affcbSDimitry Andric #define DEBUG_TYPE "if-converter"
5891bc56edSDimitry Andric
59f22ef01cSRoman Divacky // Hidden options for help debugging.
60f22ef01cSRoman Divacky static cl::opt<int> IfCvtFnStart("ifcvt-fn-start", cl::init(-1), cl::Hidden);
61f22ef01cSRoman Divacky static cl::opt<int> IfCvtFnStop("ifcvt-fn-stop", cl::init(-1), cl::Hidden);
62f22ef01cSRoman Divacky static cl::opt<int> IfCvtLimit("ifcvt-limit", cl::init(-1), cl::Hidden);
63f22ef01cSRoman Divacky static cl::opt<bool> DisableSimple("disable-ifcvt-simple",
64f22ef01cSRoman Divacky cl::init(false), cl::Hidden);
65f22ef01cSRoman Divacky static cl::opt<bool> DisableSimpleF("disable-ifcvt-simple-false",
66f22ef01cSRoman Divacky cl::init(false), cl::Hidden);
67f22ef01cSRoman Divacky static cl::opt<bool> DisableTriangle("disable-ifcvt-triangle",
68f22ef01cSRoman Divacky cl::init(false), cl::Hidden);
69f22ef01cSRoman Divacky static cl::opt<bool> DisableTriangleR("disable-ifcvt-triangle-rev",
70f22ef01cSRoman Divacky cl::init(false), cl::Hidden);
71f22ef01cSRoman Divacky static cl::opt<bool> DisableTriangleF("disable-ifcvt-triangle-false",
72f22ef01cSRoman Divacky cl::init(false), cl::Hidden);
73f22ef01cSRoman Divacky static cl::opt<bool> DisableTriangleFR("disable-ifcvt-triangle-false-rev",
74f22ef01cSRoman Divacky cl::init(false), cl::Hidden);
75f22ef01cSRoman Divacky static cl::opt<bool> DisableDiamond("disable-ifcvt-diamond",
76f22ef01cSRoman Divacky cl::init(false), cl::Hidden);
77d88c1a5aSDimitry Andric static cl::opt<bool> DisableForkedDiamond("disable-ifcvt-forked-diamond",
78d88c1a5aSDimitry Andric cl::init(false), cl::Hidden);
79ffd1746dSEd Schouten static cl::opt<bool> IfCvtBranchFold("ifcvt-branch-fold",
80ffd1746dSEd Schouten cl::init(true), cl::Hidden);
81f22ef01cSRoman Divacky
82f22ef01cSRoman Divacky STATISTIC(NumSimple, "Number of simple if-conversions performed");
83f22ef01cSRoman Divacky STATISTIC(NumSimpleFalse, "Number of simple (F) if-conversions performed");
84f22ef01cSRoman Divacky STATISTIC(NumTriangle, "Number of triangle if-conversions performed");
85f22ef01cSRoman Divacky STATISTIC(NumTriangleRev, "Number of triangle (R) if-conversions performed");
86f22ef01cSRoman Divacky STATISTIC(NumTriangleFalse,"Number of triangle (F) if-conversions performed");
87f22ef01cSRoman Divacky STATISTIC(NumTriangleFRev, "Number of triangle (F/R) if-conversions performed");
88f22ef01cSRoman Divacky STATISTIC(NumDiamonds, "Number of diamond if-conversions performed");
89d88c1a5aSDimitry Andric STATISTIC(NumForkedDiamonds, "Number of forked-diamond if-conversions performed");
90f22ef01cSRoman Divacky STATISTIC(NumIfConvBBs, "Number of if-converted blocks");
91f22ef01cSRoman Divacky STATISTIC(NumDupBBs, "Number of duplicated blocks");
92dff0c46cSDimitry Andric STATISTIC(NumUnpred, "Number of true blocks of diamonds unpredicated");
93f22ef01cSRoman Divacky
94f22ef01cSRoman Divacky namespace {
952cab237bSDimitry Andric
96f22ef01cSRoman Divacky class IfConverter : public MachineFunctionPass {
97f22ef01cSRoman Divacky enum IfcvtKind {
98f22ef01cSRoman Divacky ICNotClassfied, // BB data valid, but not classified.
99f22ef01cSRoman Divacky ICSimpleFalse, // Same as ICSimple, but on the false path.
100f22ef01cSRoman Divacky ICSimple, // BB is entry of an one split, no rejoin sub-CFG.
101f22ef01cSRoman Divacky ICTriangleFRev, // Same as ICTriangleFalse, but false path rev condition.
102f22ef01cSRoman Divacky ICTriangleRev, // Same as ICTriangle, but true path rev condition.
103f22ef01cSRoman Divacky ICTriangleFalse, // Same as ICTriangle, but on the false path.
104f22ef01cSRoman Divacky ICTriangle, // BB is entry of a triangle sub-CFG.
105d88c1a5aSDimitry Andric ICDiamond, // BB is entry of a diamond sub-CFG.
106d88c1a5aSDimitry Andric ICForkedDiamond // BB is entry of an almost diamond sub-CFG, with a
107d88c1a5aSDimitry Andric // common tail that can be shared.
108f22ef01cSRoman Divacky };
109f22ef01cSRoman Divacky
110d88c1a5aSDimitry Andric /// One per MachineBasicBlock, this is used to cache the result
111f22ef01cSRoman Divacky /// if-conversion feasibility analysis. This includes results from
1123ca95b02SDimitry Andric /// TargetInstrInfo::analyzeBranch() (i.e. TBB, FBB, and Cond), and its
113f22ef01cSRoman Divacky /// classification, and common tail block of its successors (if it's a
114f22ef01cSRoman Divacky /// diamond shape), its size, whether it's predicable, and whether any
115f22ef01cSRoman Divacky /// instruction can clobber the 'would-be' predicate.
116f22ef01cSRoman Divacky ///
117f22ef01cSRoman Divacky /// IsDone - True if BB is not to be considered for ifcvt.
118f22ef01cSRoman Divacky /// IsBeingAnalyzed - True if BB is currently being analyzed.
119f22ef01cSRoman Divacky /// IsAnalyzed - True if BB has been analyzed (info is still valid).
120f22ef01cSRoman Divacky /// IsEnqueued - True if BB has been enqueued to be ifcvt'ed.
1213ca95b02SDimitry Andric /// IsBrAnalyzable - True if analyzeBranch() returns false.
122f22ef01cSRoman Divacky /// HasFallThrough - True if BB may fallthrough to the following BB.
123f22ef01cSRoman Divacky /// IsUnpredicable - True if BB is known to be unpredicable.
124f22ef01cSRoman Divacky /// ClobbersPred - True if BB could modify predicates (e.g. has
125f22ef01cSRoman Divacky /// cmp, call, etc.)
126f22ef01cSRoman Divacky /// NonPredSize - Number of non-predicated instructions.
1272754fe60SDimitry Andric /// ExtraCost - Extra cost for multi-cycle instructions.
1282754fe60SDimitry Andric /// ExtraCost2 - Some instructions are slower when predicated
129f22ef01cSRoman Divacky /// BB - Corresponding MachineBasicBlock.
1303ca95b02SDimitry Andric /// TrueBB / FalseBB- See analyzeBranch().
131f22ef01cSRoman Divacky /// BrCond - Conditions for end of block conditional branches.
132f22ef01cSRoman Divacky /// Predicate - Predicate used in the BB.
133f22ef01cSRoman Divacky struct BBInfo {
134f22ef01cSRoman Divacky bool IsDone : 1;
135f22ef01cSRoman Divacky bool IsBeingAnalyzed : 1;
136f22ef01cSRoman Divacky bool IsAnalyzed : 1;
137f22ef01cSRoman Divacky bool IsEnqueued : 1;
138f22ef01cSRoman Divacky bool IsBrAnalyzable : 1;
139d88c1a5aSDimitry Andric bool IsBrReversible : 1;
140f22ef01cSRoman Divacky bool HasFallThrough : 1;
141f22ef01cSRoman Divacky bool IsUnpredicable : 1;
142f22ef01cSRoman Divacky bool CannotBeCopied : 1;
143f22ef01cSRoman Divacky bool ClobbersPred : 1;
1442cab237bSDimitry Andric unsigned NonPredSize = 0;
1452cab237bSDimitry Andric unsigned ExtraCost = 0;
1462cab237bSDimitry Andric unsigned ExtraCost2 = 0;
1472cab237bSDimitry Andric MachineBasicBlock *BB = nullptr;
1482cab237bSDimitry Andric MachineBasicBlock *TrueBB = nullptr;
1492cab237bSDimitry Andric MachineBasicBlock *FalseBB = nullptr;
150f22ef01cSRoman Divacky SmallVector<MachineOperand, 4> BrCond;
151f22ef01cSRoman Divacky SmallVector<MachineOperand, 4> Predicate;
1522cab237bSDimitry Andric
BBInfo__anon6ebe8f0e0111::IfConverter::BBInfo153f22ef01cSRoman Divacky BBInfo() : IsDone(false), IsBeingAnalyzed(false),
154f22ef01cSRoman Divacky IsAnalyzed(false), IsEnqueued(false), IsBrAnalyzable(false),
155d88c1a5aSDimitry Andric IsBrReversible(false), HasFallThrough(false),
156d88c1a5aSDimitry Andric IsUnpredicable(false), CannotBeCopied(false),
1572cab237bSDimitry Andric ClobbersPred(false) {}
158f22ef01cSRoman Divacky };
159f22ef01cSRoman Divacky
160d88c1a5aSDimitry Andric /// Record information about pending if-conversions to attempt:
161f22ef01cSRoman Divacky /// BBI - Corresponding BBInfo.
162f22ef01cSRoman Divacky /// Kind - Type of block. See IfcvtKind.
163f22ef01cSRoman Divacky /// NeedSubsumption - True if the to-be-predicated BB has already been
164f22ef01cSRoman Divacky /// predicated.
165f22ef01cSRoman Divacky /// NumDups - Number of instructions that would be duplicated due
166f22ef01cSRoman Divacky /// to this if-conversion. (For diamonds, the number of
167f22ef01cSRoman Divacky /// identical instructions at the beginnings of both
168f22ef01cSRoman Divacky /// paths).
169f22ef01cSRoman Divacky /// NumDups2 - For diamonds, the number of identical instructions
170f22ef01cSRoman Divacky /// at the ends of both paths.
171f22ef01cSRoman Divacky struct IfcvtToken {
172f22ef01cSRoman Divacky BBInfo &BBI;
173f22ef01cSRoman Divacky IfcvtKind Kind;
174f22ef01cSRoman Divacky unsigned NumDups;
175f22ef01cSRoman Divacky unsigned NumDups2;
176d88c1a5aSDimitry Andric bool NeedSubsumption : 1;
177d88c1a5aSDimitry Andric bool TClobbersPred : 1;
178d88c1a5aSDimitry Andric bool FClobbersPred : 1;
1792cab237bSDimitry Andric
IfcvtToken__anon6ebe8f0e0111::IfConverter::IfcvtToken180d88c1a5aSDimitry Andric IfcvtToken(BBInfo &b, IfcvtKind k, bool s, unsigned d, unsigned d2 = 0,
181d88c1a5aSDimitry Andric bool tc = false, bool fc = false)
182d88c1a5aSDimitry Andric : BBI(b), Kind(k), NumDups(d), NumDups2(d2), NeedSubsumption(s),
183d88c1a5aSDimitry Andric TClobbersPred(tc), FClobbersPred(fc) {}
184f22ef01cSRoman Divacky };
185f22ef01cSRoman Divacky
186d88c1a5aSDimitry Andric /// Results of if-conversion feasibility analysis indexed by basic block
187d88c1a5aSDimitry Andric /// number.
188f22ef01cSRoman Divacky std::vector<BBInfo> BBAnalysis;
189f785676fSDimitry Andric TargetSchedModel SchedModel;
190f22ef01cSRoman Divacky
191139f7f9bSDimitry Andric const TargetLoweringBase *TLI;
192f22ef01cSRoman Divacky const TargetInstrInfo *TII;
193ffd1746dSEd Schouten const TargetRegisterInfo *TRI;
1946122f3e6SDimitry Andric const MachineBranchProbabilityInfo *MBPI;
1957ae0e2c9SDimitry Andric MachineRegisterInfo *MRI;
1966122f3e6SDimitry Andric
19791bc56edSDimitry Andric LivePhysRegs Redefs;
198f785676fSDimitry Andric
1997ae0e2c9SDimitry Andric bool PreRegAlloc;
200f22ef01cSRoman Divacky bool MadeChange;
2012cab237bSDimitry Andric int FnNum = -1;
202d88c1a5aSDimitry Andric std::function<bool(const MachineFunction &)> PredicateFtor;
20397bc6c73SDimitry Andric
204f22ef01cSRoman Divacky public:
205f22ef01cSRoman Divacky static char ID;
2062cab237bSDimitry Andric
IfConverter(std::function<bool (const MachineFunction &)> Ftor=nullptr)207d88c1a5aSDimitry Andric IfConverter(std::function<bool(const MachineFunction &)> Ftor = nullptr)
2082cab237bSDimitry Andric : MachineFunctionPass(ID), PredicateFtor(std::move(Ftor)) {
2092754fe60SDimitry Andric initializeIfConverterPass(*PassRegistry::getPassRegistry());
2102754fe60SDimitry Andric }
2112754fe60SDimitry Andric
getAnalysisUsage(AnalysisUsage & AU) const21291bc56edSDimitry Andric void getAnalysisUsage(AnalysisUsage &AU) const override {
21339d628a0SDimitry Andric AU.addRequired<MachineBlockFrequencyInfo>();
2146122f3e6SDimitry Andric AU.addRequired<MachineBranchProbabilityInfo>();
2152754fe60SDimitry Andric MachineFunctionPass::getAnalysisUsage(AU);
2162754fe60SDimitry Andric }
217f22ef01cSRoman Divacky
21891bc56edSDimitry Andric bool runOnMachineFunction(MachineFunction &MF) override;
219f22ef01cSRoman Divacky
getRequiredProperties() const2203ca95b02SDimitry Andric MachineFunctionProperties getRequiredProperties() const override {
2213ca95b02SDimitry Andric return MachineFunctionProperties().set(
222d88c1a5aSDimitry Andric MachineFunctionProperties::Property::NoVRegs);
2233ca95b02SDimitry Andric }
2243ca95b02SDimitry Andric
225f22ef01cSRoman Divacky private:
226d88c1a5aSDimitry Andric bool reverseBranchCondition(BBInfo &BBI) const;
2272754fe60SDimitry Andric bool ValidSimple(BBInfo &TrueBBI, unsigned &Dups,
2287d523365SDimitry Andric BranchProbability Prediction) const;
229f22ef01cSRoman Divacky bool ValidTriangle(BBInfo &TrueBBI, BBInfo &FalseBBI,
2302754fe60SDimitry Andric bool FalseBranch, unsigned &Dups,
2317d523365SDimitry Andric BranchProbability Prediction) const;
232d88c1a5aSDimitry Andric bool CountDuplicatedInstructions(
233d88c1a5aSDimitry Andric MachineBasicBlock::iterator &TIB, MachineBasicBlock::iterator &FIB,
234d88c1a5aSDimitry Andric MachineBasicBlock::iterator &TIE, MachineBasicBlock::iterator &FIE,
235d88c1a5aSDimitry Andric unsigned &Dups1, unsigned &Dups2,
236d88c1a5aSDimitry Andric MachineBasicBlock &TBB, MachineBasicBlock &FBB,
237d88c1a5aSDimitry Andric bool SkipUnconditionalBranches) const;
238f22ef01cSRoman Divacky bool ValidDiamond(BBInfo &TrueBBI, BBInfo &FalseBBI,
239d88c1a5aSDimitry Andric unsigned &Dups1, unsigned &Dups2,
240d88c1a5aSDimitry Andric BBInfo &TrueBBICalc, BBInfo &FalseBBICalc) const;
241d88c1a5aSDimitry Andric bool ValidForkedDiamond(BBInfo &TrueBBI, BBInfo &FalseBBI,
242d88c1a5aSDimitry Andric unsigned &Dups1, unsigned &Dups2,
243d88c1a5aSDimitry Andric BBInfo &TrueBBICalc, BBInfo &FalseBBICalc) const;
244d88c1a5aSDimitry Andric void AnalyzeBranches(BBInfo &BBI);
245d88c1a5aSDimitry Andric void ScanInstructions(BBInfo &BBI,
246d88c1a5aSDimitry Andric MachineBasicBlock::iterator &Begin,
247d88c1a5aSDimitry Andric MachineBasicBlock::iterator &End,
248d88c1a5aSDimitry Andric bool BranchUnpredicable = false) const;
249d88c1a5aSDimitry Andric bool RescanInstructions(
250d88c1a5aSDimitry Andric MachineBasicBlock::iterator &TIB, MachineBasicBlock::iterator &FIB,
251d88c1a5aSDimitry Andric MachineBasicBlock::iterator &TIE, MachineBasicBlock::iterator &FIE,
252d88c1a5aSDimitry Andric BBInfo &TrueBBI, BBInfo &FalseBBI) const;
253d88c1a5aSDimitry Andric void AnalyzeBlock(MachineBasicBlock &MBB,
2543ca95b02SDimitry Andric std::vector<std::unique_ptr<IfcvtToken>> &Tokens);
2554ba319b5SDimitry Andric bool FeasibilityAnalysis(BBInfo &BBI, SmallVectorImpl<MachineOperand> &Pred,
256d88c1a5aSDimitry Andric bool isTriangle = false, bool RevBranch = false,
257d88c1a5aSDimitry Andric bool hasCommonTail = false);
2583ca95b02SDimitry Andric void AnalyzeBlocks(MachineFunction &MF,
2593ca95b02SDimitry Andric std::vector<std::unique_ptr<IfcvtToken>> &Tokens);
260d88c1a5aSDimitry Andric void InvalidatePreds(MachineBasicBlock &MBB);
261f22ef01cSRoman Divacky bool IfConvertSimple(BBInfo &BBI, IfcvtKind Kind);
262f22ef01cSRoman Divacky bool IfConvertTriangle(BBInfo &BBI, IfcvtKind Kind);
263d88c1a5aSDimitry Andric bool IfConvertDiamondCommon(BBInfo &BBI, BBInfo &TrueBBI, BBInfo &FalseBBI,
264d88c1a5aSDimitry Andric unsigned NumDups1, unsigned NumDups2,
265d88c1a5aSDimitry Andric bool TClobbersPred, bool FClobbersPred,
266d88c1a5aSDimitry Andric bool RemoveBranch, bool MergeAddEdges);
267f22ef01cSRoman Divacky bool IfConvertDiamond(BBInfo &BBI, IfcvtKind Kind,
268d88c1a5aSDimitry Andric unsigned NumDups1, unsigned NumDups2,
269d88c1a5aSDimitry Andric bool TClobbers, bool FClobbers);
270d88c1a5aSDimitry Andric bool IfConvertForkedDiamond(BBInfo &BBI, IfcvtKind Kind,
271d88c1a5aSDimitry Andric unsigned NumDups1, unsigned NumDups2,
272d88c1a5aSDimitry Andric bool TClobbers, bool FClobbers);
273f22ef01cSRoman Divacky void PredicateBlock(BBInfo &BBI,
274f22ef01cSRoman Divacky MachineBasicBlock::iterator E,
275ffd1746dSEd Schouten SmallVectorImpl<MachineOperand> &Cond,
276b5893f02SDimitry Andric SmallSet<MCPhysReg, 4> *LaterRedefs = nullptr);
277f22ef01cSRoman Divacky void CopyAndPredicateBlock(BBInfo &ToBBI, BBInfo &FromBBI,
278f22ef01cSRoman Divacky SmallVectorImpl<MachineOperand> &Cond,
279f22ef01cSRoman Divacky bool IgnoreBr = false);
280ffd1746dSEd Schouten void MergeBlocks(BBInfo &ToBBI, BBInfo &FromBBI, bool AddEdges = true);
281f22ef01cSRoman Divacky
MeetIfcvtSizeLimit(MachineBasicBlock & BB,unsigned Cycle,unsigned Extra,BranchProbability Prediction) const2822754fe60SDimitry Andric bool MeetIfcvtSizeLimit(MachineBasicBlock &BB,
2832754fe60SDimitry Andric unsigned Cycle, unsigned Extra,
2847d523365SDimitry Andric BranchProbability Prediction) const {
2852754fe60SDimitry Andric return Cycle > 0 && TII->isProfitableToIfCvt(BB, Cycle, Extra,
28617a519f9SDimitry Andric Prediction);
287ffd1746dSEd Schouten }
288ffd1746dSEd Schouten
MeetIfcvtSizeLimit(MachineBasicBlock & TBB,unsigned TCycle,unsigned TExtra,MachineBasicBlock & FBB,unsigned FCycle,unsigned FExtra,BranchProbability Prediction) const2892754fe60SDimitry Andric bool MeetIfcvtSizeLimit(MachineBasicBlock &TBB,
2902754fe60SDimitry Andric unsigned TCycle, unsigned TExtra,
2912754fe60SDimitry Andric MachineBasicBlock &FBB,
2922754fe60SDimitry Andric unsigned FCycle, unsigned FExtra,
2937d523365SDimitry Andric BranchProbability Prediction) const {
2942754fe60SDimitry Andric return TCycle > 0 && FCycle > 0 &&
2952754fe60SDimitry Andric TII->isProfitableToIfCvt(TBB, TCycle, TExtra, FBB, FCycle, FExtra,
29617a519f9SDimitry Andric Prediction);
297f22ef01cSRoman Divacky }
298f22ef01cSRoman Divacky
299d88c1a5aSDimitry Andric /// Returns true if Block ends without a terminator.
blockAlwaysFallThrough(BBInfo & BBI) const300f22ef01cSRoman Divacky bool blockAlwaysFallThrough(BBInfo &BBI) const {
30191bc56edSDimitry Andric return BBI.IsBrAnalyzable && BBI.TrueBB == nullptr;
302f22ef01cSRoman Divacky }
303f22ef01cSRoman Divacky
304d88c1a5aSDimitry Andric /// Used to sort if-conversion candidates.
IfcvtTokenCmp(const std::unique_ptr<IfcvtToken> & C1,const std::unique_ptr<IfcvtToken> & C2)3053ca95b02SDimitry Andric static bool IfcvtTokenCmp(const std::unique_ptr<IfcvtToken> &C1,
3063ca95b02SDimitry Andric const std::unique_ptr<IfcvtToken> &C2) {
307f22ef01cSRoman Divacky int Incr1 = (C1->Kind == ICDiamond)
308f22ef01cSRoman Divacky ? -(int)(C1->NumDups + C1->NumDups2) : (int)C1->NumDups;
309f22ef01cSRoman Divacky int Incr2 = (C2->Kind == ICDiamond)
310f22ef01cSRoman Divacky ? -(int)(C2->NumDups + C2->NumDups2) : (int)C2->NumDups;
311f22ef01cSRoman Divacky if (Incr1 > Incr2)
312f22ef01cSRoman Divacky return true;
313f22ef01cSRoman Divacky else if (Incr1 == Incr2) {
314f22ef01cSRoman Divacky // Favors subsumption.
315ff0cc061SDimitry Andric if (!C1->NeedSubsumption && C2->NeedSubsumption)
316f22ef01cSRoman Divacky return true;
317f22ef01cSRoman Divacky else if (C1->NeedSubsumption == C2->NeedSubsumption) {
318f22ef01cSRoman Divacky // Favors diamond over triangle, etc.
319f22ef01cSRoman Divacky if ((unsigned)C1->Kind < (unsigned)C2->Kind)
320f22ef01cSRoman Divacky return true;
321f22ef01cSRoman Divacky else if (C1->Kind == C2->Kind)
322f22ef01cSRoman Divacky return C1->BBI.BB->getNumber() < C2->BBI.BB->getNumber();
323f22ef01cSRoman Divacky }
324f22ef01cSRoman Divacky }
325f22ef01cSRoman Divacky return false;
326f22ef01cSRoman Divacky }
327f22ef01cSRoman Divacky };
328f22ef01cSRoman Divacky
3292cab237bSDimitry Andric } // end anonymous namespace
3302cab237bSDimitry Andric
331f22ef01cSRoman Divacky char IfConverter::ID = 0;
332f22ef01cSRoman Divacky
333dff0c46cSDimitry Andric char &llvm::IfConverterID = IfConverter::ID;
334dff0c46cSDimitry Andric
335302affcbSDimitry Andric INITIALIZE_PASS_BEGIN(IfConverter, DEBUG_TYPE, "If Converter", false, false)
INITIALIZE_PASS_DEPENDENCY(MachineBranchProbabilityInfo)3366122f3e6SDimitry Andric INITIALIZE_PASS_DEPENDENCY(MachineBranchProbabilityInfo)
337302affcbSDimitry Andric INITIALIZE_PASS_END(IfConverter, DEBUG_TYPE, "If Converter", false, false)
338f22ef01cSRoman Divacky
339f22ef01cSRoman Divacky bool IfConverter::runOnMachineFunction(MachineFunction &MF) {
3402cab237bSDimitry Andric if (skipFunction(MF.getFunction()) || (PredicateFtor && !PredicateFtor(MF)))
34197bc6c73SDimitry Andric return false;
34297bc6c73SDimitry Andric
343ff0cc061SDimitry Andric const TargetSubtargetInfo &ST = MF.getSubtarget();
344ff0cc061SDimitry Andric TLI = ST.getTargetLowering();
345ff0cc061SDimitry Andric TII = ST.getInstrInfo();
346ff0cc061SDimitry Andric TRI = ST.getRegisterInfo();
3473ca95b02SDimitry Andric BranchFolder::MBFIWrapper MBFI(getAnalysis<MachineBlockFrequencyInfo>());
3486122f3e6SDimitry Andric MBPI = &getAnalysis<MachineBranchProbabilityInfo>();
3497ae0e2c9SDimitry Andric MRI = &MF.getRegInfo();
3504ba319b5SDimitry Andric SchedModel.init(&ST);
351f785676fSDimitry Andric
352f22ef01cSRoman Divacky if (!TII) return false;
353f22ef01cSRoman Divacky
3547ae0e2c9SDimitry Andric PreRegAlloc = MRI->isSSA();
3557ae0e2c9SDimitry Andric
3567ae0e2c9SDimitry Andric bool BFChange = false;
3577ae0e2c9SDimitry Andric if (!PreRegAlloc) {
358ffd1746dSEd Schouten // Tail merge tend to expose more if-conversion opportunities.
3593ca95b02SDimitry Andric BranchFolder BF(true, false, MBFI, *MBPI);
360ff0cc061SDimitry Andric BFChange = BF.OptimizeFunction(MF, TII, ST.getRegisterInfo(),
361ffd1746dSEd Schouten getAnalysisIfAvailable<MachineModuleInfo>());
3627ae0e2c9SDimitry Andric }
363ffd1746dSEd Schouten
3644ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << "\nIfcvt: function (" << ++FnNum << ") \'"
3653861d79fSDimitry Andric << MF.getName() << "\'");
366f22ef01cSRoman Divacky
367f22ef01cSRoman Divacky if (FnNum < IfCvtFnStart || (IfCvtFnStop != -1 && FnNum > IfCvtFnStop)) {
3684ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << " skipped\n");
369f22ef01cSRoman Divacky return false;
370f22ef01cSRoman Divacky }
3714ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << "\n");
372f22ef01cSRoman Divacky
373f22ef01cSRoman Divacky MF.RenumberBlocks();
374f22ef01cSRoman Divacky BBAnalysis.resize(MF.getNumBlockIDs());
375f22ef01cSRoman Divacky
3763ca95b02SDimitry Andric std::vector<std::unique_ptr<IfcvtToken>> Tokens;
377f22ef01cSRoman Divacky MadeChange = false;
378f22ef01cSRoman Divacky unsigned NumIfCvts = NumSimple + NumSimpleFalse + NumTriangle +
379f22ef01cSRoman Divacky NumTriangleRev + NumTriangleFalse + NumTriangleFRev + NumDiamonds;
380f22ef01cSRoman Divacky while (IfCvtLimit == -1 || (int)NumIfCvts < IfCvtLimit) {
381f22ef01cSRoman Divacky // Do an initial analysis for each basic block and find all the potential
382f22ef01cSRoman Divacky // candidates to perform if-conversion.
383ffd1746dSEd Schouten bool Change = false;
384ffd1746dSEd Schouten AnalyzeBlocks(MF, Tokens);
385f22ef01cSRoman Divacky while (!Tokens.empty()) {
3863ca95b02SDimitry Andric std::unique_ptr<IfcvtToken> Token = std::move(Tokens.back());
387f22ef01cSRoman Divacky Tokens.pop_back();
388f22ef01cSRoman Divacky BBInfo &BBI = Token->BBI;
389f22ef01cSRoman Divacky IfcvtKind Kind = Token->Kind;
390f22ef01cSRoman Divacky unsigned NumDups = Token->NumDups;
391f22ef01cSRoman Divacky unsigned NumDups2 = Token->NumDups2;
392f22ef01cSRoman Divacky
393f22ef01cSRoman Divacky // If the block has been evicted out of the queue or it has already been
394f22ef01cSRoman Divacky // marked dead (due to it being predicated), then skip it.
395f22ef01cSRoman Divacky if (BBI.IsDone)
396f22ef01cSRoman Divacky BBI.IsEnqueued = false;
397f22ef01cSRoman Divacky if (!BBI.IsEnqueued)
398f22ef01cSRoman Divacky continue;
399f22ef01cSRoman Divacky
400f22ef01cSRoman Divacky BBI.IsEnqueued = false;
401f22ef01cSRoman Divacky
402f22ef01cSRoman Divacky bool RetVal = false;
403f22ef01cSRoman Divacky switch (Kind) {
404dff0c46cSDimitry Andric default: llvm_unreachable("Unexpected!");
405f22ef01cSRoman Divacky case ICSimple:
406f22ef01cSRoman Divacky case ICSimpleFalse: {
407f22ef01cSRoman Divacky bool isFalse = Kind == ICSimpleFalse;
408f22ef01cSRoman Divacky if ((isFalse && DisableSimpleF) || (!isFalse && DisableSimple)) break;
4094ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << "Ifcvt (Simple"
4102cab237bSDimitry Andric << (Kind == ICSimpleFalse ? " false" : "")
4112cab237bSDimitry Andric << "): " << printMBBReference(*BBI.BB) << " ("
4122cab237bSDimitry Andric << ((Kind == ICSimpleFalse) ? BBI.FalseBB->getNumber()
4132cab237bSDimitry Andric : BBI.TrueBB->getNumber())
4142cab237bSDimitry Andric << ") ");
415f22ef01cSRoman Divacky RetVal = IfConvertSimple(BBI, Kind);
4164ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << (RetVal ? "succeeded!" : "failed!") << "\n");
417f22ef01cSRoman Divacky if (RetVal) {
418ffd1746dSEd Schouten if (isFalse) ++NumSimpleFalse;
419ffd1746dSEd Schouten else ++NumSimple;
420f22ef01cSRoman Divacky }
421f22ef01cSRoman Divacky break;
422f22ef01cSRoman Divacky }
423f22ef01cSRoman Divacky case ICTriangle:
424f22ef01cSRoman Divacky case ICTriangleRev:
425f22ef01cSRoman Divacky case ICTriangleFalse:
426f22ef01cSRoman Divacky case ICTriangleFRev: {
427f22ef01cSRoman Divacky bool isFalse = Kind == ICTriangleFalse;
428f22ef01cSRoman Divacky bool isRev = (Kind == ICTriangleRev || Kind == ICTriangleFRev);
429f22ef01cSRoman Divacky if (DisableTriangle && !isFalse && !isRev) break;
430f22ef01cSRoman Divacky if (DisableTriangleR && !isFalse && isRev) break;
431f22ef01cSRoman Divacky if (DisableTriangleF && isFalse && !isRev) break;
432f22ef01cSRoman Divacky if (DisableTriangleFR && isFalse && isRev) break;
4334ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << "Ifcvt (Triangle");
434f22ef01cSRoman Divacky if (isFalse)
4354ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << " false");
436f22ef01cSRoman Divacky if (isRev)
4374ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << " rev");
4384ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << "): " << printMBBReference(*BBI.BB)
4392cab237bSDimitry Andric << " (T:" << BBI.TrueBB->getNumber()
4402cab237bSDimitry Andric << ",F:" << BBI.FalseBB->getNumber() << ") ");
441f22ef01cSRoman Divacky RetVal = IfConvertTriangle(BBI, Kind);
4424ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << (RetVal ? "succeeded!" : "failed!") << "\n");
443f22ef01cSRoman Divacky if (RetVal) {
444f22ef01cSRoman Divacky if (isFalse) {
445ffd1746dSEd Schouten if (isRev) ++NumTriangleFRev;
446ffd1746dSEd Schouten else ++NumTriangleFalse;
447f22ef01cSRoman Divacky } else {
448ffd1746dSEd Schouten if (isRev) ++NumTriangleRev;
449ffd1746dSEd Schouten else ++NumTriangle;
450f22ef01cSRoman Divacky }
451f22ef01cSRoman Divacky }
452f22ef01cSRoman Divacky break;
453f22ef01cSRoman Divacky }
4542cab237bSDimitry Andric case ICDiamond:
455f22ef01cSRoman Divacky if (DisableDiamond) break;
4564ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << "Ifcvt (Diamond): " << printMBBReference(*BBI.BB)
4572cab237bSDimitry Andric << " (T:" << BBI.TrueBB->getNumber()
4582cab237bSDimitry Andric << ",F:" << BBI.FalseBB->getNumber() << ") ");
459d88c1a5aSDimitry Andric RetVal = IfConvertDiamond(BBI, Kind, NumDups, NumDups2,
460d88c1a5aSDimitry Andric Token->TClobbersPred,
461d88c1a5aSDimitry Andric Token->FClobbersPred);
4624ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << (RetVal ? "succeeded!" : "failed!") << "\n");
463ffd1746dSEd Schouten if (RetVal) ++NumDiamonds;
464f22ef01cSRoman Divacky break;
4652cab237bSDimitry Andric case ICForkedDiamond:
466d88c1a5aSDimitry Andric if (DisableForkedDiamond) break;
4674ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << "Ifcvt (Forked Diamond): "
4684ba319b5SDimitry Andric << printMBBReference(*BBI.BB)
4692cab237bSDimitry Andric << " (T:" << BBI.TrueBB->getNumber()
4702cab237bSDimitry Andric << ",F:" << BBI.FalseBB->getNumber() << ") ");
471d88c1a5aSDimitry Andric RetVal = IfConvertForkedDiamond(BBI, Kind, NumDups, NumDups2,
472d88c1a5aSDimitry Andric Token->TClobbersPred,
473d88c1a5aSDimitry Andric Token->FClobbersPred);
4744ba319b5SDimitry Andric LLVM_DEBUG(dbgs() << (RetVal ? "succeeded!" : "failed!") << "\n");
475d88c1a5aSDimitry Andric if (RetVal) ++NumForkedDiamonds;
476d88c1a5aSDimitry Andric break;
477d88c1a5aSDimitry Andric }
4782cab237bSDimitry Andric
4792cab237bSDimitry Andric if (RetVal && MRI->tracksLiveness())
4802cab237bSDimitry Andric recomputeLivenessFlags(*BBI.BB);
481f22ef01cSRoman Divacky
482f22ef01cSRoman Divacky Change |= RetVal;
483f22ef01cSRoman Divacky
484f22ef01cSRoman Divacky NumIfCvts = NumSimple + NumSimpleFalse + NumTriangle + NumTriangleRev +
485f22ef01cSRoman Divacky NumTriangleFalse + NumTriangleFRev + NumDiamonds;
486f22ef01cSRoman Divacky if (IfCvtLimit != -1 && (int)NumIfCvts >= IfCvtLimit)
487f22ef01cSRoman Divacky break;
488f22ef01cSRoman Divacky }
489f22ef01cSRoman Divacky
490f22ef01cSRoman Divacky if (!Change)
491f22ef01cSRoman Divacky break;
492f22ef01cSRoman Divacky MadeChange |= Change;
493f22ef01cSRoman Divacky }
494f22ef01cSRoman Divacky
495f22ef01cSRoman Divacky Tokens.clear();
496f22ef01cSRoman Divacky BBAnalysis.clear();
497f22ef01cSRoman Divacky
498ffd1746dSEd Schouten if (MadeChange && IfCvtBranchFold) {
4993ca95b02SDimitry Andric BranchFolder BF(false, false, MBFI, *MBPI);
50039d628a0SDimitry Andric BF.OptimizeFunction(MF, TII, MF.getSubtarget().getRegisterInfo(),
501f22ef01cSRoman Divacky getAnalysisIfAvailable<MachineModuleInfo>());
502f22ef01cSRoman Divacky }
503f22ef01cSRoman Divacky
504ffd1746dSEd Schouten MadeChange |= BFChange;
505f22ef01cSRoman Divacky return MadeChange;
506f22ef01cSRoman Divacky }
507f22ef01cSRoman Divacky
508d88c1a5aSDimitry Andric /// BB has a fallthrough. Find its 'false' successor given its 'true' successor.
findFalseBlock(MachineBasicBlock * BB,MachineBasicBlock * TrueBB)509f22ef01cSRoman Divacky static MachineBasicBlock *findFalseBlock(MachineBasicBlock *BB,
510f22ef01cSRoman Divacky MachineBasicBlock *TrueBB) {
511d88c1a5aSDimitry Andric for (MachineBasicBlock *SuccBB : BB->successors()) {
512f22ef01cSRoman Divacky if (SuccBB != TrueBB)
513f22ef01cSRoman Divacky return SuccBB;
514f22ef01cSRoman Divacky }
51591bc56edSDimitry Andric return nullptr;
516f22ef01cSRoman Divacky }
517f22ef01cSRoman Divacky
518d88c1a5aSDimitry Andric /// Reverse the condition of the end of the block branch. Swap block's 'true'
519d88c1a5aSDimitry Andric /// and 'false' successors.
reverseBranchCondition(BBInfo & BBI) const520d88c1a5aSDimitry Andric bool IfConverter::reverseBranchCondition(BBInfo &BBI) const {
521ffd1746dSEd Schouten DebugLoc dl; // FIXME: this is nowhere
522d88c1a5aSDimitry Andric if (!TII->reverseBranchCondition(BBI.BrCond)) {
523d88c1a5aSDimitry Andric TII->removeBranch(*BBI.BB);
524d88c1a5aSDimitry Andric TII->insertBranch(*BBI.BB, BBI.FalseBB, BBI.TrueBB, BBI.BrCond, dl);
525f22ef01cSRoman Divacky std::swap(BBI.TrueBB, BBI.FalseBB);
526f22ef01cSRoman Divacky return true;
527f22ef01cSRoman Divacky }
528f22ef01cSRoman Divacky return false;
529f22ef01cSRoman Divacky }
530f22ef01cSRoman Divacky
531d88c1a5aSDimitry Andric /// Returns the next block in the function blocks ordering. If it is the end,
532d88c1a5aSDimitry Andric /// returns NULL.
getNextBlock(MachineBasicBlock & MBB)533d88c1a5aSDimitry Andric static inline MachineBasicBlock *getNextBlock(MachineBasicBlock &MBB) {
534d88c1a5aSDimitry Andric MachineFunction::iterator I = MBB.getIterator();
535d88c1a5aSDimitry Andric MachineFunction::iterator E = MBB.getParent()->end();
536f22ef01cSRoman Divacky if (++I == E)
53791bc56edSDimitry Andric return nullptr;
5387d523365SDimitry Andric return &*I;
539f22ef01cSRoman Divacky }
540f22ef01cSRoman Divacky
541d88c1a5aSDimitry Andric /// Returns true if the 'true' block (along with its predecessor) forms a valid
542d88c1a5aSDimitry Andric /// simple shape for ifcvt. It also returns the number of instructions that the
543d88c1a5aSDimitry Andric /// ifcvt would need to duplicate if performed in Dups.
ValidSimple(BBInfo & TrueBBI,unsigned & Dups,BranchProbability Prediction) const5442754fe60SDimitry Andric bool IfConverter::ValidSimple(BBInfo &TrueBBI, unsigned &Dups,
5457d523365SDimitry Andric BranchProbability Prediction) const {
546f22ef01cSRoman Divacky Dups = 0;
547f22ef01cSRoman Divacky if (TrueBBI.IsBeingAnalyzed || TrueBBI.IsDone)
548f22ef01cSRoman Divacky return false;
549f22ef01cSRoman Divacky
550f22ef01cSRoman Divacky if (TrueBBI.IsBrAnalyzable)
551f22ef01cSRoman Divacky return false;
552f22ef01cSRoman Divacky
553f22ef01cSRoman Divacky if (TrueBBI.BB->pred_size() > 1) {
554f22ef01cSRoman Divacky if (TrueBBI.CannotBeCopied ||
5552754fe60SDimitry Andric !TII->isProfitableToDupForIfCvt(*TrueBBI.BB, TrueBBI.NonPredSize,
55617a519f9SDimitry Andric Prediction))
557f22ef01cSRoman Divacky return false;
558f22ef01cSRoman Divacky Dups = TrueBBI.NonPredSize;
559f22ef01cSRoman Divacky }
560f22ef01cSRoman Divacky
561f22ef01cSRoman Divacky return true;
562f22ef01cSRoman Divacky }
563f22ef01cSRoman Divacky
564d88c1a5aSDimitry Andric /// Returns true if the 'true' and 'false' blocks (along with their common
565d88c1a5aSDimitry Andric /// predecessor) forms a valid triangle shape for ifcvt. If 'FalseBranch' is
566d88c1a5aSDimitry Andric /// true, it checks if 'true' block's false branch branches to the 'false' block
567d88c1a5aSDimitry Andric /// rather than the other way around. It also returns the number of instructions
568d88c1a5aSDimitry Andric /// that the ifcvt would need to duplicate if performed in 'Dups'.
ValidTriangle(BBInfo & TrueBBI,BBInfo & FalseBBI,bool FalseBranch,unsigned & Dups,BranchProbability Prediction) const569f22ef01cSRoman Divacky bool IfConverter::ValidTriangle(BBInfo &TrueBBI, BBInfo &FalseBBI,
5702754fe60SDimitry Andric bool FalseBranch, unsigned &Dups,
5717d523365SDimitry Andric BranchProbability Prediction) const {
572f22ef01cSRoman Divacky Dups = 0;
573f22ef01cSRoman Divacky if (TrueBBI.IsBeingAnalyzed || TrueBBI.IsDone)
574f22ef01cSRoman Divacky return false;
575f22ef01cSRoman Divacky
576f22ef01cSRoman Divacky if (TrueBBI.BB->pred_size() > 1) {
577f22ef01cSRoman Divacky if (TrueBBI.CannotBeCopied)
578f22ef01cSRoman Divacky return false;
579f22ef01cSRoman Divacky
580f22ef01cSRoman Divacky unsigned Size = TrueBBI.NonPredSize;
581f22ef01cSRoman Divacky if (TrueBBI.IsBrAnalyzable) {
582f22ef01cSRoman Divacky if (TrueBBI.TrueBB && TrueBBI.BrCond.empty())
583f22ef01cSRoman Divacky // Ends with an unconditional branch. It will be removed.
584f22ef01cSRoman Divacky --Size;
585f22ef01cSRoman Divacky else {
586f22ef01cSRoman Divacky MachineBasicBlock *FExit = FalseBranch
587f22ef01cSRoman Divacky ? TrueBBI.TrueBB : TrueBBI.FalseBB;
588f22ef01cSRoman Divacky if (FExit)
589f22ef01cSRoman Divacky // Require a conditional branch
590f22ef01cSRoman Divacky ++Size;
591f22ef01cSRoman Divacky }
592f22ef01cSRoman Divacky }
59317a519f9SDimitry Andric if (!TII->isProfitableToDupForIfCvt(*TrueBBI.BB, Size, Prediction))
594f22ef01cSRoman Divacky return false;
595f22ef01cSRoman Divacky Dups = Size;
596f22ef01cSRoman Divacky }
597f22ef01cSRoman Divacky
598f22ef01cSRoman Divacky MachineBasicBlock *TExit = FalseBranch ? TrueBBI.FalseBB : TrueBBI.TrueBB;
599f22ef01cSRoman Divacky if (!TExit && blockAlwaysFallThrough(TrueBBI)) {
6007d523365SDimitry Andric MachineFunction::iterator I = TrueBBI.BB->getIterator();
601f22ef01cSRoman Divacky if (++I == TrueBBI.BB->getParent()->end())
602f22ef01cSRoman Divacky return false;
6037d523365SDimitry Andric TExit = &*I;
604f22ef01cSRoman Divacky }
605f22ef01cSRoman Divacky return TExit && TExit == FalseBBI.BB;
606f22ef01cSRoman Divacky }
607f22ef01cSRoman Divacky
608d88c1a5aSDimitry Andric /// Count duplicated instructions and move the iterators to show where they
609d88c1a5aSDimitry Andric /// are.
610d88c1a5aSDimitry Andric /// @param TIB True Iterator Begin
611d88c1a5aSDimitry Andric /// @param FIB False Iterator Begin
612d88c1a5aSDimitry Andric /// These two iterators initially point to the first instruction of the two
613d88c1a5aSDimitry Andric /// blocks, and finally point to the first non-shared instruction.
614d88c1a5aSDimitry Andric /// @param TIE True Iterator End
615d88c1a5aSDimitry Andric /// @param FIE False Iterator End
616d88c1a5aSDimitry Andric /// These two iterators initially point to End() for the two blocks() and
617d88c1a5aSDimitry Andric /// finally point to the first shared instruction in the tail.
618d88c1a5aSDimitry Andric /// Upon return [TIB, TIE), and [FIB, FIE) mark the un-duplicated portions of
619d88c1a5aSDimitry Andric /// two blocks.
620d88c1a5aSDimitry Andric /// @param Dups1 count of duplicated instructions at the beginning of the 2
621d88c1a5aSDimitry Andric /// blocks.
622d88c1a5aSDimitry Andric /// @param Dups2 count of duplicated instructions at the end of the 2 blocks.
623d88c1a5aSDimitry Andric /// @param SkipUnconditionalBranches if true, Don't make sure that
624d88c1a5aSDimitry Andric /// unconditional branches at the end of the blocks are the same. True is
625d88c1a5aSDimitry Andric /// passed when the blocks are analyzable to allow for fallthrough to be
626d88c1a5aSDimitry Andric /// handled.
627d88c1a5aSDimitry Andric /// @return false if the shared portion prevents if conversion.
CountDuplicatedInstructions(MachineBasicBlock::iterator & TIB,MachineBasicBlock::iterator & FIB,MachineBasicBlock::iterator & TIE,MachineBasicBlock::iterator & FIE,unsigned & Dups1,unsigned & Dups2,MachineBasicBlock & TBB,MachineBasicBlock & FBB,bool SkipUnconditionalBranches) const628d88c1a5aSDimitry Andric bool IfConverter::CountDuplicatedInstructions(
629d88c1a5aSDimitry Andric MachineBasicBlock::iterator &TIB,
630d88c1a5aSDimitry Andric MachineBasicBlock::iterator &FIB,
631d88c1a5aSDimitry Andric MachineBasicBlock::iterator &TIE,
632d88c1a5aSDimitry Andric MachineBasicBlock::iterator &FIE,
633d88c1a5aSDimitry Andric unsigned &Dups1, unsigned &Dups2,
634d88c1a5aSDimitry Andric MachineBasicBlock &TBB, MachineBasicBlock &FBB,
635d88c1a5aSDimitry Andric bool SkipUnconditionalBranches) const {
636d88c1a5aSDimitry Andric while (TIB != TIE && FIB != FIE) {
637d88c1a5aSDimitry Andric // Skip dbg_value instructions. These do not count.
638d88c1a5aSDimitry Andric TIB = skipDebugInstructionsForward(TIB, TIE);
639d88c1a5aSDimitry Andric FIB = skipDebugInstructionsForward(FIB, FIE);
6407a7e6055SDimitry Andric if (TIB == TIE || FIB == FIE)
641d88c1a5aSDimitry Andric break;
642d88c1a5aSDimitry Andric if (!TIB->isIdenticalTo(*FIB))
643d88c1a5aSDimitry Andric break;
644d88c1a5aSDimitry Andric // A pred-clobbering instruction in the shared portion prevents
645d88c1a5aSDimitry Andric // if-conversion.
646d88c1a5aSDimitry Andric std::vector<MachineOperand> PredDefs;
647d88c1a5aSDimitry Andric if (TII->DefinesPredicate(*TIB, PredDefs))
648d88c1a5aSDimitry Andric return false;
649d88c1a5aSDimitry Andric // If we get all the way to the branch instructions, don't count them.
650d88c1a5aSDimitry Andric if (!TIB->isBranch())
651d88c1a5aSDimitry Andric ++Dups1;
652d88c1a5aSDimitry Andric ++TIB;
653d88c1a5aSDimitry Andric ++FIB;
654d88c1a5aSDimitry Andric }
655d88c1a5aSDimitry Andric
656d88c1a5aSDimitry Andric // Check for already containing all of the block.
657d88c1a5aSDimitry Andric if (TIB == TIE || FIB == FIE)
658d88c1a5aSDimitry Andric return true;
659d88c1a5aSDimitry Andric // Now, in preparation for counting duplicate instructions at the ends of the
6607a7e6055SDimitry Andric // blocks, switch to reverse_iterators. Note that getReverse() returns an
6617a7e6055SDimitry Andric // iterator that points to the same instruction, unlike std::reverse_iterator.
6627a7e6055SDimitry Andric // We have to do our own shifting so that we get the same range.
6637a7e6055SDimitry Andric MachineBasicBlock::reverse_iterator RTIE = std::next(TIE.getReverse());
6647a7e6055SDimitry Andric MachineBasicBlock::reverse_iterator RFIE = std::next(FIE.getReverse());
6657a7e6055SDimitry Andric const MachineBasicBlock::reverse_iterator RTIB = std::next(TIB.getReverse());
6667a7e6055SDimitry Andric const MachineBasicBlock::reverse_iterator RFIB = std::next(FIB.getReverse());
667d88c1a5aSDimitry Andric
668d88c1a5aSDimitry Andric if (!TBB.succ_empty() || !FBB.succ_empty()) {
669d88c1a5aSDimitry Andric if (SkipUnconditionalBranches) {
6707a7e6055SDimitry Andric while (RTIE != RTIB && RTIE->isUnconditionalBranch())
6717a7e6055SDimitry Andric ++RTIE;
6727a7e6055SDimitry Andric while (RFIE != RFIB && RFIE->isUnconditionalBranch())
6737a7e6055SDimitry Andric ++RFIE;
674d88c1a5aSDimitry Andric }
675d88c1a5aSDimitry Andric }
676d88c1a5aSDimitry Andric
677d88c1a5aSDimitry Andric // Count duplicate instructions at the ends of the blocks.
6787a7e6055SDimitry Andric while (RTIE != RTIB && RFIE != RFIB) {
679d88c1a5aSDimitry Andric // Skip dbg_value instructions. These do not count.
6807a7e6055SDimitry Andric // Note that these are reverse iterators going forward.
6817a7e6055SDimitry Andric RTIE = skipDebugInstructionsForward(RTIE, RTIB);
6827a7e6055SDimitry Andric RFIE = skipDebugInstructionsForward(RFIE, RFIB);
6837a7e6055SDimitry Andric if (RTIE == RTIB || RFIE == RFIB)
684d88c1a5aSDimitry Andric break;
6857a7e6055SDimitry Andric if (!RTIE->isIdenticalTo(*RFIE))
686d88c1a5aSDimitry Andric break;
687d88c1a5aSDimitry Andric // We have to verify that any branch instructions are the same, and then we
688d88c1a5aSDimitry Andric // don't count them toward the # of duplicate instructions.
6897a7e6055SDimitry Andric if (!RTIE->isBranch())
690d88c1a5aSDimitry Andric ++Dups2;
6917a7e6055SDimitry Andric ++RTIE;
6927a7e6055SDimitry Andric ++RFIE;
693d88c1a5aSDimitry Andric }
6947a7e6055SDimitry Andric TIE = std::next(RTIE.getReverse());
6957a7e6055SDimitry Andric FIE = std::next(RFIE.getReverse());
696d88c1a5aSDimitry Andric return true;
697d88c1a5aSDimitry Andric }
698d88c1a5aSDimitry Andric
699d88c1a5aSDimitry Andric /// RescanInstructions - Run ScanInstructions on a pair of blocks.
700d88c1a5aSDimitry Andric /// @param TIB - True Iterator Begin, points to first non-shared instruction
701d88c1a5aSDimitry Andric /// @param FIB - False Iterator Begin, points to first non-shared instruction
702d88c1a5aSDimitry Andric /// @param TIE - True Iterator End, points past last non-shared instruction
703d88c1a5aSDimitry Andric /// @param FIE - False Iterator End, points past last non-shared instruction
704d88c1a5aSDimitry Andric /// @param TrueBBI - BBInfo to update for the true block.
705d88c1a5aSDimitry Andric /// @param FalseBBI - BBInfo to update for the false block.
706d88c1a5aSDimitry Andric /// @returns - false if either block cannot be predicated or if both blocks end
707d88c1a5aSDimitry Andric /// with a predicate-clobbering instruction.
RescanInstructions(MachineBasicBlock::iterator & TIB,MachineBasicBlock::iterator & FIB,MachineBasicBlock::iterator & TIE,MachineBasicBlock::iterator & FIE,BBInfo & TrueBBI,BBInfo & FalseBBI) const708d88c1a5aSDimitry Andric bool IfConverter::RescanInstructions(
709d88c1a5aSDimitry Andric MachineBasicBlock::iterator &TIB, MachineBasicBlock::iterator &FIB,
710d88c1a5aSDimitry Andric MachineBasicBlock::iterator &TIE, MachineBasicBlock::iterator &FIE,
711d88c1a5aSDimitry Andric BBInfo &TrueBBI, BBInfo &FalseBBI) const {
712d88c1a5aSDimitry Andric bool BranchUnpredicable = true;
713d88c1a5aSDimitry Andric TrueBBI.IsUnpredicable = FalseBBI.IsUnpredicable = false;
714d88c1a5aSDimitry Andric ScanInstructions(TrueBBI, TIB, TIE, BranchUnpredicable);
715d88c1a5aSDimitry Andric if (TrueBBI.IsUnpredicable)
716d88c1a5aSDimitry Andric return false;
717d88c1a5aSDimitry Andric ScanInstructions(FalseBBI, FIB, FIE, BranchUnpredicable);
718d88c1a5aSDimitry Andric if (FalseBBI.IsUnpredicable)
719d88c1a5aSDimitry Andric return false;
720d88c1a5aSDimitry Andric if (TrueBBI.ClobbersPred && FalseBBI.ClobbersPred)
721d88c1a5aSDimitry Andric return false;
722d88c1a5aSDimitry Andric return true;
723d88c1a5aSDimitry Andric }
724d88c1a5aSDimitry Andric
725d88c1a5aSDimitry Andric #ifndef NDEBUG
verifySameBranchInstructions(MachineBasicBlock * MBB1,MachineBasicBlock * MBB2)726d88c1a5aSDimitry Andric static void verifySameBranchInstructions(
727d88c1a5aSDimitry Andric MachineBasicBlock *MBB1,
728d88c1a5aSDimitry Andric MachineBasicBlock *MBB2) {
7297a7e6055SDimitry Andric const MachineBasicBlock::reverse_iterator B1 = MBB1->rend();
7307a7e6055SDimitry Andric const MachineBasicBlock::reverse_iterator B2 = MBB2->rend();
7317a7e6055SDimitry Andric MachineBasicBlock::reverse_iterator E1 = MBB1->rbegin();
7327a7e6055SDimitry Andric MachineBasicBlock::reverse_iterator E2 = MBB2->rbegin();
7337a7e6055SDimitry Andric while (E1 != B1 && E2 != B2) {
7347a7e6055SDimitry Andric skipDebugInstructionsForward(E1, B1);
7357a7e6055SDimitry Andric skipDebugInstructionsForward(E2, B2);
7367a7e6055SDimitry Andric if (E1 == B1 && E2 == B2)
737d88c1a5aSDimitry Andric break;
738d88c1a5aSDimitry Andric
7397a7e6055SDimitry Andric if (E1 == B1) {
740d88c1a5aSDimitry Andric assert(!E2->isBranch() && "Branch mis-match, one block is empty.");
741d88c1a5aSDimitry Andric break;
742d88c1a5aSDimitry Andric }
7437a7e6055SDimitry Andric if (E2 == B2) {
744d88c1a5aSDimitry Andric assert(!E1->isBranch() && "Branch mis-match, one block is empty.");
745d88c1a5aSDimitry Andric break;
746d88c1a5aSDimitry Andric }
747d88c1a5aSDimitry Andric
748d88c1a5aSDimitry Andric if (E1->isBranch() || E2->isBranch())
749d88c1a5aSDimitry Andric assert(E1->isIdenticalTo(*E2) &&
750d88c1a5aSDimitry Andric "Branch mis-match, branch instructions don't match.");
751d88c1a5aSDimitry Andric else
752d88c1a5aSDimitry Andric break;
7537a7e6055SDimitry Andric ++E1;
7547a7e6055SDimitry Andric ++E2;
755d88c1a5aSDimitry Andric }
756d88c1a5aSDimitry Andric }
757d88c1a5aSDimitry Andric #endif
758d88c1a5aSDimitry Andric
759d88c1a5aSDimitry Andric /// ValidForkedDiamond - Returns true if the 'true' and 'false' blocks (along
760d88c1a5aSDimitry Andric /// with their common predecessor) form a diamond if a common tail block is
761d88c1a5aSDimitry Andric /// extracted.
762d88c1a5aSDimitry Andric /// While not strictly a diamond, this pattern would form a diamond if
763d88c1a5aSDimitry Andric /// tail-merging had merged the shared tails.
764d88c1a5aSDimitry Andric /// EBB
765d88c1a5aSDimitry Andric /// _/ \_
766d88c1a5aSDimitry Andric /// | |
767d88c1a5aSDimitry Andric /// TBB FBB
768d88c1a5aSDimitry Andric /// / \ / \
769d88c1a5aSDimitry Andric /// FalseBB TrueBB FalseBB
770d88c1a5aSDimitry Andric /// Currently only handles analyzable branches.
771d88c1a5aSDimitry Andric /// Specifically excludes actual diamonds to avoid overlap.
ValidForkedDiamond(BBInfo & TrueBBI,BBInfo & FalseBBI,unsigned & Dups1,unsigned & Dups2,BBInfo & TrueBBICalc,BBInfo & FalseBBICalc) const772d88c1a5aSDimitry Andric bool IfConverter::ValidForkedDiamond(
773d88c1a5aSDimitry Andric BBInfo &TrueBBI, BBInfo &FalseBBI,
774d88c1a5aSDimitry Andric unsigned &Dups1, unsigned &Dups2,
775d88c1a5aSDimitry Andric BBInfo &TrueBBICalc, BBInfo &FalseBBICalc) const {
776d88c1a5aSDimitry Andric Dups1 = Dups2 = 0;
777d88c1a5aSDimitry Andric if (TrueBBI.IsBeingAnalyzed || TrueBBI.IsDone ||
778d88c1a5aSDimitry Andric FalseBBI.IsBeingAnalyzed || FalseBBI.IsDone)
779d88c1a5aSDimitry Andric return false;
780d88c1a5aSDimitry Andric
781d88c1a5aSDimitry Andric if (!TrueBBI.IsBrAnalyzable || !FalseBBI.IsBrAnalyzable)
782d88c1a5aSDimitry Andric return false;
783d88c1a5aSDimitry Andric // Don't IfConvert blocks that can't be folded into their predecessor.
784d88c1a5aSDimitry Andric if (TrueBBI.BB->pred_size() > 1 || FalseBBI.BB->pred_size() > 1)
785d88c1a5aSDimitry Andric return false;
786d88c1a5aSDimitry Andric
787d88c1a5aSDimitry Andric // This function is specifically looking for conditional tails, as
788d88c1a5aSDimitry Andric // unconditional tails are already handled by the standard diamond case.
789d88c1a5aSDimitry Andric if (TrueBBI.BrCond.size() == 0 ||
790d88c1a5aSDimitry Andric FalseBBI.BrCond.size() == 0)
791d88c1a5aSDimitry Andric return false;
792d88c1a5aSDimitry Andric
793d88c1a5aSDimitry Andric MachineBasicBlock *TT = TrueBBI.TrueBB;
794d88c1a5aSDimitry Andric MachineBasicBlock *TF = TrueBBI.FalseBB;
795d88c1a5aSDimitry Andric MachineBasicBlock *FT = FalseBBI.TrueBB;
796d88c1a5aSDimitry Andric MachineBasicBlock *FF = FalseBBI.FalseBB;
797d88c1a5aSDimitry Andric
798d88c1a5aSDimitry Andric if (!TT)
799d88c1a5aSDimitry Andric TT = getNextBlock(*TrueBBI.BB);
800d88c1a5aSDimitry Andric if (!TF)
801d88c1a5aSDimitry Andric TF = getNextBlock(*TrueBBI.BB);
802d88c1a5aSDimitry Andric if (!FT)
803d88c1a5aSDimitry Andric FT = getNextBlock(*FalseBBI.BB);
804d88c1a5aSDimitry Andric if (!FF)
805d88c1a5aSDimitry Andric FF = getNextBlock(*FalseBBI.BB);
806d88c1a5aSDimitry Andric
807d88c1a5aSDimitry Andric if (!TT || !TF)
808d88c1a5aSDimitry Andric return false;
809d88c1a5aSDimitry Andric
810d88c1a5aSDimitry Andric // Check successors. If they don't match, bail.
811d88c1a5aSDimitry Andric if (!((TT == FT && TF == FF) || (TF == FT && TT == FF)))
812d88c1a5aSDimitry Andric return false;
813d88c1a5aSDimitry Andric
814d88c1a5aSDimitry Andric bool FalseReversed = false;
815d88c1a5aSDimitry Andric if (TF == FT && TT == FF) {
816d88c1a5aSDimitry Andric // If the branches are opposing, but we can't reverse, don't do it.
817d88c1a5aSDimitry Andric if (!FalseBBI.IsBrReversible)
818d88c1a5aSDimitry Andric return false;
819d88c1a5aSDimitry Andric FalseReversed = true;
820d88c1a5aSDimitry Andric reverseBranchCondition(FalseBBI);
821d88c1a5aSDimitry Andric }
822d88c1a5aSDimitry Andric auto UnReverseOnExit = make_scope_exit([&]() {
823d88c1a5aSDimitry Andric if (FalseReversed)
824d88c1a5aSDimitry Andric reverseBranchCondition(FalseBBI);
825d88c1a5aSDimitry Andric });
826d88c1a5aSDimitry Andric
827d88c1a5aSDimitry Andric // Count duplicate instructions at the beginning of the true and false blocks.
828d88c1a5aSDimitry Andric MachineBasicBlock::iterator TIB = TrueBBI.BB->begin();
829d88c1a5aSDimitry Andric MachineBasicBlock::iterator FIB = FalseBBI.BB->begin();
830d88c1a5aSDimitry Andric MachineBasicBlock::iterator TIE = TrueBBI.BB->end();
831d88c1a5aSDimitry Andric MachineBasicBlock::iterator FIE = FalseBBI.BB->end();
832d88c1a5aSDimitry Andric if(!CountDuplicatedInstructions(TIB, FIB, TIE, FIE, Dups1, Dups2,
833d88c1a5aSDimitry Andric *TrueBBI.BB, *FalseBBI.BB,
834d88c1a5aSDimitry Andric /* SkipUnconditionalBranches */ true))
835d88c1a5aSDimitry Andric return false;
836d88c1a5aSDimitry Andric
837d88c1a5aSDimitry Andric TrueBBICalc.BB = TrueBBI.BB;
838d88c1a5aSDimitry Andric FalseBBICalc.BB = FalseBBI.BB;
839d88c1a5aSDimitry Andric if (!RescanInstructions(TIB, FIB, TIE, FIE, TrueBBICalc, FalseBBICalc))
840d88c1a5aSDimitry Andric return false;
841d88c1a5aSDimitry Andric
842d88c1a5aSDimitry Andric // The size is used to decide whether to if-convert, and the shared portions
843d88c1a5aSDimitry Andric // are subtracted off. Because of the subtraction, we just use the size that
844d88c1a5aSDimitry Andric // was calculated by the original ScanInstructions, as it is correct.
845d88c1a5aSDimitry Andric TrueBBICalc.NonPredSize = TrueBBI.NonPredSize;
846d88c1a5aSDimitry Andric FalseBBICalc.NonPredSize = FalseBBI.NonPredSize;
847d88c1a5aSDimitry Andric return true;
848d88c1a5aSDimitry Andric }
849d88c1a5aSDimitry Andric
850f22ef01cSRoman Divacky /// ValidDiamond - Returns true if the 'true' and 'false' blocks (along
851f22ef01cSRoman Divacky /// with their common predecessor) forms a valid diamond shape for ifcvt.
ValidDiamond(BBInfo & TrueBBI,BBInfo & FalseBBI,unsigned & Dups1,unsigned & Dups2,BBInfo & TrueBBICalc,BBInfo & FalseBBICalc) const852d88c1a5aSDimitry Andric bool IfConverter::ValidDiamond(
853d88c1a5aSDimitry Andric BBInfo &TrueBBI, BBInfo &FalseBBI,
854d88c1a5aSDimitry Andric unsigned &Dups1, unsigned &Dups2,
855d88c1a5aSDimitry Andric BBInfo &TrueBBICalc, BBInfo &FalseBBICalc) const {
856f22ef01cSRoman Divacky Dups1 = Dups2 = 0;
857f22ef01cSRoman Divacky if (TrueBBI.IsBeingAnalyzed || TrueBBI.IsDone ||
858f22ef01cSRoman Divacky FalseBBI.IsBeingAnalyzed || FalseBBI.IsDone)
859f22ef01cSRoman Divacky return false;
860f22ef01cSRoman Divacky
861f22ef01cSRoman Divacky MachineBasicBlock *TT = TrueBBI.TrueBB;
862f22ef01cSRoman Divacky MachineBasicBlock *FT = FalseBBI.TrueBB;
863f22ef01cSRoman Divacky
864f22ef01cSRoman Divacky if (!TT && blockAlwaysFallThrough(TrueBBI))
865d88c1a5aSDimitry Andric TT = getNextBlock(*TrueBBI.BB);
866f22ef01cSRoman Divacky if (!FT && blockAlwaysFallThrough(FalseBBI))
867d88c1a5aSDimitry Andric FT = getNextBlock(*FalseBBI.BB);
868f22ef01cSRoman Divacky if (TT != FT)
869f22ef01cSRoman Divacky return false;
87091bc56edSDimitry Andric if (!TT && (TrueBBI.IsBrAnalyzable || FalseBBI.IsBrAnalyzable))
871f22ef01cSRoman Divacky return false;
872f22ef01cSRoman Divacky if (TrueBBI.BB->pred_size() > 1 || FalseBBI.BB->pred_size() > 1)
873f22ef01cSRoman Divacky return false;
874f22ef01cSRoman Divacky
875f22ef01cSRoman Divacky // FIXME: Allow true block to have an early exit?
876d88c1a5aSDimitry Andric if (TrueBBI.FalseBB || FalseBBI.FalseBB)
877f22ef01cSRoman Divacky return false;
878f22ef01cSRoman Divacky
879d88c1a5aSDimitry Andric // Count duplicate instructions at the beginning and end of the true and
880d88c1a5aSDimitry Andric // false blocks.
881d88c1a5aSDimitry Andric // Skip unconditional branches only if we are considering an analyzable
882d88c1a5aSDimitry Andric // diamond. Otherwise the branches must be the same.
883d88c1a5aSDimitry Andric bool SkipUnconditionalBranches =
884d88c1a5aSDimitry Andric TrueBBI.IsBrAnalyzable && FalseBBI.IsBrAnalyzable;
885ffd1746dSEd Schouten MachineBasicBlock::iterator TIB = TrueBBI.BB->begin();
886ffd1746dSEd Schouten MachineBasicBlock::iterator FIB = FalseBBI.BB->begin();
8872754fe60SDimitry Andric MachineBasicBlock::iterator TIE = TrueBBI.BB->end();
8882754fe60SDimitry Andric MachineBasicBlock::iterator FIE = FalseBBI.BB->end();
889d88c1a5aSDimitry Andric if(!CountDuplicatedInstructions(TIB, FIB, TIE, FIE, Dups1, Dups2,
890d88c1a5aSDimitry Andric *TrueBBI.BB, *FalseBBI.BB,
891d88c1a5aSDimitry Andric SkipUnconditionalBranches))
892d88c1a5aSDimitry Andric return false;
8932754fe60SDimitry Andric
894d88c1a5aSDimitry Andric TrueBBICalc.BB = TrueBBI.BB;
895d88c1a5aSDimitry Andric FalseBBICalc.BB = FalseBBI.BB;
896d88c1a5aSDimitry Andric if (!RescanInstructions(TIB, FIB, TIE, FIE, TrueBBICalc, FalseBBICalc))
897d88c1a5aSDimitry Andric return false;
898d88c1a5aSDimitry Andric // The size is used to decide whether to if-convert, and the shared portions
899d88c1a5aSDimitry Andric // are subtracted off. Because of the subtraction, we just use the size that
900d88c1a5aSDimitry Andric // was calculated by the original ScanInstructions, as it is correct.
901d88c1a5aSDimitry Andric TrueBBICalc.NonPredSize = TrueBBI.NonPredSize;
902d88c1a5aSDimitry Andric FalseBBICalc.NonPredSize = FalseBBI.NonPredSize;
903f22ef01cSRoman Divacky return true;
904f22ef01cSRoman Divacky }
905f22ef01cSRoman Divacky
906d88c1a5aSDimitry Andric /// AnalyzeBranches - Look at the branches at the end of a block to determine if
907d88c1a5aSDimitry Andric /// the block is predicable.
AnalyzeBranches(BBInfo & BBI)908d88c1a5aSDimitry Andric void IfConverter::AnalyzeBranches(BBInfo &BBI) {
909f22ef01cSRoman Divacky if (BBI.IsDone)
910f22ef01cSRoman Divacky return;
911f22ef01cSRoman Divacky
91291bc56edSDimitry Andric BBI.TrueBB = BBI.FalseBB = nullptr;
913f22ef01cSRoman Divacky BBI.BrCond.clear();
914f22ef01cSRoman Divacky BBI.IsBrAnalyzable =
9153ca95b02SDimitry Andric !TII->analyzeBranch(*BBI.BB, BBI.TrueBB, BBI.FalseBB, BBI.BrCond);
916d88c1a5aSDimitry Andric SmallVector<MachineOperand, 4> RevCond(BBI.BrCond.begin(), BBI.BrCond.end());
917d88c1a5aSDimitry Andric BBI.IsBrReversible = (RevCond.size() == 0) ||
918d88c1a5aSDimitry Andric !TII->reverseBranchCondition(RevCond);
91991bc56edSDimitry Andric BBI.HasFallThrough = BBI.IsBrAnalyzable && BBI.FalseBB == nullptr;
920f22ef01cSRoman Divacky
921f22ef01cSRoman Divacky if (BBI.BrCond.size()) {
922f22ef01cSRoman Divacky // No false branch. This BB must end with a conditional branch and a
923f22ef01cSRoman Divacky // fallthrough.
924f22ef01cSRoman Divacky if (!BBI.FalseBB)
925f22ef01cSRoman Divacky BBI.FalseBB = findFalseBlock(BBI.BB, BBI.TrueBB);
926f22ef01cSRoman Divacky if (!BBI.FalseBB) {
927f22ef01cSRoman Divacky // Malformed bcc? True and false blocks are the same?
928f22ef01cSRoman Divacky BBI.IsUnpredicable = true;
929d88c1a5aSDimitry Andric }
930f22ef01cSRoman Divacky }
931f22ef01cSRoman Divacky }
932f22ef01cSRoman Divacky
933d88c1a5aSDimitry Andric /// ScanInstructions - Scan all the instructions in the block to determine if
934d88c1a5aSDimitry Andric /// the block is predicable. In most cases, that means all the instructions
935d88c1a5aSDimitry Andric /// in the block are isPredicable(). Also checks if the block contains any
936d88c1a5aSDimitry Andric /// instruction which can clobber a predicate (e.g. condition code register).
937d88c1a5aSDimitry Andric /// If so, the block is not predicable unless it's the last instruction.
ScanInstructions(BBInfo & BBI,MachineBasicBlock::iterator & Begin,MachineBasicBlock::iterator & End,bool BranchUnpredicable) const938d88c1a5aSDimitry Andric void IfConverter::ScanInstructions(BBInfo &BBI,
939d88c1a5aSDimitry Andric MachineBasicBlock::iterator &Begin,
940d88c1a5aSDimitry Andric MachineBasicBlock::iterator &End,
941d88c1a5aSDimitry Andric bool BranchUnpredicable) const {
942d88c1a5aSDimitry Andric if (BBI.IsDone || BBI.IsUnpredicable)
943d88c1a5aSDimitry Andric return;
944d88c1a5aSDimitry Andric
945d88c1a5aSDimitry Andric bool AlreadyPredicated = !BBI.Predicate.empty();
946d88c1a5aSDimitry Andric
947f22ef01cSRoman Divacky BBI.NonPredSize = 0;
9482754fe60SDimitry Andric BBI.ExtraCost = 0;
9492754fe60SDimitry Andric BBI.ExtraCost2 = 0;
950f22ef01cSRoman Divacky BBI.ClobbersPred = false;
951d88c1a5aSDimitry Andric for (MachineInstr &MI : make_range(Begin, End)) {
9524ba319b5SDimitry Andric if (MI.isDebugInstr())
953ffd1746dSEd Schouten continue;
954ffd1746dSEd Schouten
9553ca95b02SDimitry Andric // It's unsafe to duplicate convergent instructions in this context, so set
9563ca95b02SDimitry Andric // BBI.CannotBeCopied to true if MI is convergent. To see why, consider the
9573ca95b02SDimitry Andric // following CFG, which is subject to our "simple" transformation.
9583ca95b02SDimitry Andric //
9593ca95b02SDimitry Andric // BB0 // if (c1) goto BB1; else goto BB2;
9603ca95b02SDimitry Andric // / \
9613ca95b02SDimitry Andric // BB1 |
9623ca95b02SDimitry Andric // | BB2 // if (c2) goto TBB; else goto FBB;
9633ca95b02SDimitry Andric // | / |
9643ca95b02SDimitry Andric // | / |
9653ca95b02SDimitry Andric // TBB |
9663ca95b02SDimitry Andric // | |
9673ca95b02SDimitry Andric // | FBB
9683ca95b02SDimitry Andric // |
9693ca95b02SDimitry Andric // exit
9703ca95b02SDimitry Andric //
9713ca95b02SDimitry Andric // Suppose we want to move TBB's contents up into BB1 and BB2 (in BB1 they'd
9723ca95b02SDimitry Andric // be unconditional, and in BB2, they'd be predicated upon c2), and suppose
9733ca95b02SDimitry Andric // TBB contains a convergent instruction. This is safe iff doing so does
9743ca95b02SDimitry Andric // not add a control-flow dependency to the convergent instruction -- i.e.,
9753ca95b02SDimitry Andric // it's safe iff the set of control flows that leads us to the convergent
9763ca95b02SDimitry Andric // instruction does not get smaller after the transformation.
9773ca95b02SDimitry Andric //
9783ca95b02SDimitry Andric // Originally we executed TBB if c1 || c2. After the transformation, there
9793ca95b02SDimitry Andric // are two copies of TBB's instructions. We get to the first if c1, and we
9803ca95b02SDimitry Andric // get to the second if !c1 && c2.
9813ca95b02SDimitry Andric //
9823ca95b02SDimitry Andric // There are clearly fewer ways to satisfy the condition "c1" than
9833ca95b02SDimitry Andric // "c1 || c2". Since we've shrunk the set of control flows which lead to
9843ca95b02SDimitry Andric // our convergent instruction, the transformation is unsafe.
9853ca95b02SDimitry Andric if (MI.isNotDuplicable() || MI.isConvergent())
986f22ef01cSRoman Divacky BBI.CannotBeCopied = true;
987f22ef01cSRoman Divacky
9883ca95b02SDimitry Andric bool isPredicated = TII->isPredicated(MI);
9893ca95b02SDimitry Andric bool isCondBr = BBI.IsBrAnalyzable && MI.isConditionalBranch();
990f22ef01cSRoman Divacky
991d88c1a5aSDimitry Andric if (BranchUnpredicable && MI.isBranch()) {
992d88c1a5aSDimitry Andric BBI.IsUnpredicable = true;
993d88c1a5aSDimitry Andric return;
994d88c1a5aSDimitry Andric }
995d88c1a5aSDimitry Andric
996f785676fSDimitry Andric // A conditional branch is not predicable, but it may be eliminated.
997f785676fSDimitry Andric if (isCondBr)
998f785676fSDimitry Andric continue;
999f785676fSDimitry Andric
10002754fe60SDimitry Andric if (!isPredicated) {
1001f22ef01cSRoman Divacky BBI.NonPredSize++;
10023ca95b02SDimitry Andric unsigned ExtraPredCost = TII->getPredicationCost(MI);
10033ca95b02SDimitry Andric unsigned NumCycles = SchedModel.computeInstrLatency(&MI, false);
10042754fe60SDimitry Andric if (NumCycles > 1)
10052754fe60SDimitry Andric BBI.ExtraCost += NumCycles-1;
10062754fe60SDimitry Andric BBI.ExtraCost2 += ExtraPredCost;
10072754fe60SDimitry Andric } else if (!AlreadyPredicated) {
1008f22ef01cSRoman Divacky // FIXME: This instruction is already predicated before the
1009f22ef01cSRoman Divacky // if-conversion pass. It's probably something like a conditional move.
1010f22ef01cSRoman Divacky // Mark this block unpredicable for now.
1011f22ef01cSRoman Divacky BBI.IsUnpredicable = true;
1012f22ef01cSRoman Divacky return;
1013f22ef01cSRoman Divacky }
1014f22ef01cSRoman Divacky
1015f22ef01cSRoman Divacky if (BBI.ClobbersPred && !isPredicated) {
1016f22ef01cSRoman Divacky // Predicate modification instruction should end the block (except for
1017f22ef01cSRoman Divacky // already predicated instructions and end of block branches).
1018f22ef01cSRoman Divacky // Predicate may have been modified, the subsequent (currently)
1019f22ef01cSRoman Divacky // unpredicated instructions cannot be correctly predicated.
1020f22ef01cSRoman Divacky BBI.IsUnpredicable = true;
1021f22ef01cSRoman Divacky return;
1022f22ef01cSRoman Divacky }
1023f22ef01cSRoman Divacky
1024f22ef01cSRoman Divacky // FIXME: Make use of PredDefs? e.g. ADDC, SUBC sets predicates but are
1025f22ef01cSRoman Divacky // still potentially predicable.
1026f22ef01cSRoman Divacky std::vector<MachineOperand> PredDefs;
10273ca95b02SDimitry Andric if (TII->DefinesPredicate(MI, PredDefs))
1028f22ef01cSRoman Divacky BBI.ClobbersPred = true;
1029f22ef01cSRoman Divacky
10303ca95b02SDimitry Andric if (!TII->isPredicable(MI)) {
1031f22ef01cSRoman Divacky BBI.IsUnpredicable = true;
1032f22ef01cSRoman Divacky return;
1033f22ef01cSRoman Divacky }
1034f22ef01cSRoman Divacky }
1035f22ef01cSRoman Divacky }
1036f22ef01cSRoman Divacky
1037d88c1a5aSDimitry Andric /// Determine if the block is a suitable candidate to be predicated by the
1038d88c1a5aSDimitry Andric /// specified predicate.
1039d88c1a5aSDimitry Andric /// @param BBI BBInfo for the block to check
1040d88c1a5aSDimitry Andric /// @param Pred Predicate array for the branch that leads to BBI
1041d88c1a5aSDimitry Andric /// @param isTriangle true if the Analysis is for a triangle
1042d88c1a5aSDimitry Andric /// @param RevBranch true if Reverse(Pred) leads to BBI (e.g. BBI is the false
1043d88c1a5aSDimitry Andric /// case
1044d88c1a5aSDimitry Andric /// @param hasCommonTail true if BBI shares a tail with a sibling block that
1045d88c1a5aSDimitry Andric /// contains any instruction that would make the block unpredicable.
FeasibilityAnalysis(BBInfo & BBI,SmallVectorImpl<MachineOperand> & Pred,bool isTriangle,bool RevBranch,bool hasCommonTail)1046f22ef01cSRoman Divacky bool IfConverter::FeasibilityAnalysis(BBInfo &BBI,
1047f22ef01cSRoman Divacky SmallVectorImpl<MachineOperand> &Pred,
1048d88c1a5aSDimitry Andric bool isTriangle, bool RevBranch,
1049d88c1a5aSDimitry Andric bool hasCommonTail) {
1050f22ef01cSRoman Divacky // If the block is dead or unpredicable, then it cannot be predicated.
1051d88c1a5aSDimitry Andric // Two blocks may share a common unpredicable tail, but this doesn't prevent
1052d88c1a5aSDimitry Andric // them from being if-converted. The non-shared portion is assumed to have
1053d88c1a5aSDimitry Andric // been checked
1054d88c1a5aSDimitry Andric if (BBI.IsDone || (BBI.IsUnpredicable && !hasCommonTail))
1055f22ef01cSRoman Divacky return false;
1056f22ef01cSRoman Divacky
1057ff0cc061SDimitry Andric // If it is already predicated but we couldn't analyze its terminator, the
1058ff0cc061SDimitry Andric // latter might fallthrough, but we can't determine where to.
1059ff0cc061SDimitry Andric // Conservatively avoid if-converting again.
1060ff0cc061SDimitry Andric if (BBI.Predicate.size() && !BBI.IsBrAnalyzable)
1061ff0cc061SDimitry Andric return false;
1062ff0cc061SDimitry Andric
1063f785676fSDimitry Andric // If it is already predicated, check if the new predicate subsumes
1064f785676fSDimitry Andric // its predicate.
1065f785676fSDimitry Andric if (BBI.Predicate.size() && !TII->SubsumesPredicate(Pred, BBI.Predicate))
1066f22ef01cSRoman Divacky return false;
1067f22ef01cSRoman Divacky
1068d88c1a5aSDimitry Andric if (!hasCommonTail && BBI.BrCond.size()) {
1069f22ef01cSRoman Divacky if (!isTriangle)
1070f22ef01cSRoman Divacky return false;
1071f22ef01cSRoman Divacky
1072f22ef01cSRoman Divacky // Test predicate subsumption.
1073f22ef01cSRoman Divacky SmallVector<MachineOperand, 4> RevPred(Pred.begin(), Pred.end());
1074f22ef01cSRoman Divacky SmallVector<MachineOperand, 4> Cond(BBI.BrCond.begin(), BBI.BrCond.end());
1075f22ef01cSRoman Divacky if (RevBranch) {
1076d88c1a5aSDimitry Andric if (TII->reverseBranchCondition(Cond))
1077f22ef01cSRoman Divacky return false;
1078f22ef01cSRoman Divacky }
1079d88c1a5aSDimitry Andric if (TII->reverseBranchCondition(RevPred) ||
1080f22ef01cSRoman Divacky !TII->SubsumesPredicate(Cond, RevPred))
1081f22ef01cSRoman Divacky return false;
1082f22ef01cSRoman Divacky }
1083f22ef01cSRoman Divacky
1084f22ef01cSRoman Divacky return true;
1085f22ef01cSRoman Divacky }
1086f22ef01cSRoman Divacky
1087d88c1a5aSDimitry Andric /// Analyze the structure of the sub-CFG starting from the specified block.
1088d88c1a5aSDimitry Andric /// Record its successors and whether it looks like an if-conversion candidate.
AnalyzeBlock(MachineBasicBlock & MBB,std::vector<std::unique_ptr<IfcvtToken>> & Tokens)10893ca95b02SDimitry Andric void IfConverter::AnalyzeBlock(
1090d88c1a5aSDimitry Andric MachineBasicBlock &MBB, std::vector<std::unique_ptr<IfcvtToken>> &Tokens) {
10913dac3a9bSDimitry Andric struct BBState {
1092d88c1a5aSDimitry Andric BBState(MachineBasicBlock &MBB) : MBB(&MBB), SuccsAnalyzed(false) {}
10933dac3a9bSDimitry Andric MachineBasicBlock *MBB;
10943dac3a9bSDimitry Andric
10953dac3a9bSDimitry Andric /// This flag is true if MBB's successors have been analyzed.
10963dac3a9bSDimitry Andric bool SuccsAnalyzed;
10973dac3a9bSDimitry Andric };
10983dac3a9bSDimitry Andric
10993dac3a9bSDimitry Andric // Push MBB to the stack.
11003dac3a9bSDimitry Andric SmallVector<BBState, 16> BBStack(1, MBB);
11013dac3a9bSDimitry Andric
11023dac3a9bSDimitry Andric while (!BBStack.empty()) {
11033dac3a9bSDimitry Andric BBState &State = BBStack.back();
11043dac3a9bSDimitry Andric MachineBasicBlock *BB = State.MBB;
1105f22ef01cSRoman Divacky BBInfo &BBI = BBAnalysis[BB->getNumber()];
1106f22ef01cSRoman Divacky
11073dac3a9bSDimitry Andric if (!State.SuccsAnalyzed) {
11083dac3a9bSDimitry Andric if (BBI.IsAnalyzed || BBI.IsBeingAnalyzed) {
11093dac3a9bSDimitry Andric BBStack.pop_back();
11103dac3a9bSDimitry Andric continue;
11113dac3a9bSDimitry Andric }
1112f22ef01cSRoman Divacky
1113f22ef01cSRoman Divacky BBI.BB = BB;
1114f22ef01cSRoman Divacky BBI.IsBeingAnalyzed = true;
1115f22ef01cSRoman Divacky
1116d88c1a5aSDimitry Andric AnalyzeBranches(BBI);
1117d88c1a5aSDimitry Andric MachineBasicBlock::iterator Begin = BBI.BB->begin();
1118d88c1a5aSDimitry Andric MachineBasicBlock::iterator End = BBI.BB->end();
1119d88c1a5aSDimitry Andric ScanInstructions(BBI, Begin, End);
1120f22ef01cSRoman Divacky
11213dac3a9bSDimitry Andric // Unanalyzable or ends with fallthrough or unconditional branch, or if is
11223dac3a9bSDimitry Andric // not considered for ifcvt anymore.
112317a519f9SDimitry Andric if (!BBI.IsBrAnalyzable || BBI.BrCond.empty() || BBI.IsDone) {
1124f22ef01cSRoman Divacky BBI.IsBeingAnalyzed = false;
1125f22ef01cSRoman Divacky BBI.IsAnalyzed = true;
11263dac3a9bSDimitry Andric BBStack.pop_back();
11273dac3a9bSDimitry Andric continue;
1128f22ef01cSRoman Divacky }
1129f22ef01cSRoman Divacky
1130f22ef01cSRoman Divacky // Do not ifcvt if either path is a back edge to the entry block.
1131f22ef01cSRoman Divacky if (BBI.TrueBB == BB || BBI.FalseBB == BB) {
1132f22ef01cSRoman Divacky BBI.IsBeingAnalyzed = false;
1133f22ef01cSRoman Divacky BBI.IsAnalyzed = true;
11343dac3a9bSDimitry Andric BBStack.pop_back();
11353dac3a9bSDimitry Andric continue;
1136f22ef01cSRoman Divacky }
1137f22ef01cSRoman Divacky
1138f22ef01cSRoman Divacky // Do not ifcvt if true and false fallthrough blocks are the same.
1139f22ef01cSRoman Divacky if (!BBI.FalseBB) {
1140f22ef01cSRoman Divacky BBI.IsBeingAnalyzed = false;
1141f22ef01cSRoman Divacky BBI.IsAnalyzed = true;
11423dac3a9bSDimitry Andric BBStack.pop_back();
11433dac3a9bSDimitry Andric continue;
1144f22ef01cSRoman Divacky }
1145f22ef01cSRoman Divacky
11463dac3a9bSDimitry Andric // Push the False and True blocks to the stack.
11473dac3a9bSDimitry Andric State.SuccsAnalyzed = true;
1148d88c1a5aSDimitry Andric BBStack.push_back(*BBI.FalseBB);
1149d88c1a5aSDimitry Andric BBStack.push_back(*BBI.TrueBB);
11503dac3a9bSDimitry Andric continue;
11513dac3a9bSDimitry Andric }
11523dac3a9bSDimitry Andric
11533dac3a9bSDimitry Andric BBInfo &TrueBBI = BBAnalysis[BBI.TrueBB->getNumber()];
11543dac3a9bSDimitry Andric BBInfo &FalseBBI = BBAnalysis[BBI.FalseBB->getNumber()];
1155f22ef01cSRoman Divacky
1156f22ef01cSRoman Divacky if (TrueBBI.IsDone && FalseBBI.IsDone) {
1157f22ef01cSRoman Divacky BBI.IsBeingAnalyzed = false;
1158f22ef01cSRoman Divacky BBI.IsAnalyzed = true;
11593dac3a9bSDimitry Andric BBStack.pop_back();
11603dac3a9bSDimitry Andric continue;
1161f22ef01cSRoman Divacky }
1162f22ef01cSRoman Divacky
11633dac3a9bSDimitry Andric SmallVector<MachineOperand, 4>
11643dac3a9bSDimitry Andric RevCond(BBI.BrCond.begin(), BBI.BrCond.end());
1165d88c1a5aSDimitry Andric bool CanRevCond = !TII->reverseBranchCondition(RevCond);
1166f22ef01cSRoman Divacky
1167f22ef01cSRoman Divacky unsigned Dups = 0;
1168f22ef01cSRoman Divacky unsigned Dups2 = 0;
11697ae0e2c9SDimitry Andric bool TNeedSub = !TrueBBI.Predicate.empty();
11707ae0e2c9SDimitry Andric bool FNeedSub = !FalseBBI.Predicate.empty();
1171f22ef01cSRoman Divacky bool Enqueued = false;
11722754fe60SDimitry Andric
11736122f3e6SDimitry Andric BranchProbability Prediction = MBPI->getEdgeProbability(BB, TrueBBI.BB);
11742754fe60SDimitry Andric
1175d88c1a5aSDimitry Andric if (CanRevCond) {
1176d88c1a5aSDimitry Andric BBInfo TrueBBICalc, FalseBBICalc;
1177d88c1a5aSDimitry Andric auto feasibleDiamond = [&]() {
1178d88c1a5aSDimitry Andric bool MeetsSize = MeetIfcvtSizeLimit(
1179d88c1a5aSDimitry Andric *TrueBBI.BB, (TrueBBICalc.NonPredSize - (Dups + Dups2) +
1180d88c1a5aSDimitry Andric TrueBBICalc.ExtraCost), TrueBBICalc.ExtraCost2,
1181d88c1a5aSDimitry Andric *FalseBBI.BB, (FalseBBICalc.NonPredSize - (Dups + Dups2) +
1182d88c1a5aSDimitry Andric FalseBBICalc.ExtraCost), FalseBBICalc.ExtraCost2,
1183d88c1a5aSDimitry Andric Prediction);
1184d88c1a5aSDimitry Andric bool TrueFeasible = FeasibilityAnalysis(TrueBBI, BBI.BrCond,
1185d88c1a5aSDimitry Andric /* IsTriangle */ false, /* RevCond */ false,
1186d88c1a5aSDimitry Andric /* hasCommonTail */ true);
1187d88c1a5aSDimitry Andric bool FalseFeasible = FeasibilityAnalysis(FalseBBI, RevCond,
1188d88c1a5aSDimitry Andric /* IsTriangle */ false, /* RevCond */ false,
1189d88c1a5aSDimitry Andric /* hasCommonTail */ true);
1190d88c1a5aSDimitry Andric return MeetsSize && TrueFeasible && FalseFeasible;
1191d88c1a5aSDimitry Andric };
1192d88c1a5aSDimitry Andric
1193d88c1a5aSDimitry Andric if (ValidDiamond(TrueBBI, FalseBBI, Dups, Dups2,
1194d88c1a5aSDimitry Andric TrueBBICalc, FalseBBICalc)) {
1195d88c1a5aSDimitry Andric if (feasibleDiamond()) {
1196f22ef01cSRoman Divacky // Diamond:
1197f22ef01cSRoman Divacky // EBB
1198f22ef01cSRoman Divacky // / \_
1199f22ef01cSRoman Divacky // | |
1200f22ef01cSRoman Divacky // TBB FBB
1201f22ef01cSRoman Divacky // \ /
1202f22ef01cSRoman Divacky // TailBB
1203f22ef01cSRoman Divacky // Note TailBB can be empty.
12043ca95b02SDimitry Andric Tokens.push_back(llvm::make_unique<IfcvtToken>(
1205d88c1a5aSDimitry Andric BBI, ICDiamond, TNeedSub | FNeedSub, Dups, Dups2,
1206d88c1a5aSDimitry Andric (bool) TrueBBICalc.ClobbersPred, (bool) FalseBBICalc.ClobbersPred));
1207f22ef01cSRoman Divacky Enqueued = true;
1208f22ef01cSRoman Divacky }
1209d88c1a5aSDimitry Andric } else if (ValidForkedDiamond(TrueBBI, FalseBBI, Dups, Dups2,
1210d88c1a5aSDimitry Andric TrueBBICalc, FalseBBICalc)) {
1211d88c1a5aSDimitry Andric if (feasibleDiamond()) {
1212d88c1a5aSDimitry Andric // ForkedDiamond:
1213d88c1a5aSDimitry Andric // if TBB and FBB have a common tail that includes their conditional
1214d88c1a5aSDimitry Andric // branch instructions, then we can If Convert this pattern.
1215d88c1a5aSDimitry Andric // EBB
1216d88c1a5aSDimitry Andric // _/ \_
1217d88c1a5aSDimitry Andric // | |
1218d88c1a5aSDimitry Andric // TBB FBB
1219d88c1a5aSDimitry Andric // / \ / \
1220d88c1a5aSDimitry Andric // FalseBB TrueBB FalseBB
1221d88c1a5aSDimitry Andric //
1222d88c1a5aSDimitry Andric Tokens.push_back(llvm::make_unique<IfcvtToken>(
1223d88c1a5aSDimitry Andric BBI, ICForkedDiamond, TNeedSub | FNeedSub, Dups, Dups2,
1224d88c1a5aSDimitry Andric (bool) TrueBBICalc.ClobbersPred, (bool) FalseBBICalc.ClobbersPred));
1225d88c1a5aSDimitry Andric Enqueued = true;
1226d88c1a5aSDimitry Andric }
1227d88c1a5aSDimitry Andric }
1228d88c1a5aSDimitry Andric }
1229f22ef01cSRoman Divacky
123017a519f9SDimitry Andric if (ValidTriangle(TrueBBI, FalseBBI, false, Dups, Prediction) &&
12312754fe60SDimitry Andric MeetIfcvtSizeLimit(*TrueBBI.BB, TrueBBI.NonPredSize + TrueBBI.ExtraCost,
123217a519f9SDimitry Andric TrueBBI.ExtraCost2, Prediction) &&
1233f22ef01cSRoman Divacky FeasibilityAnalysis(TrueBBI, BBI.BrCond, true)) {
1234f22ef01cSRoman Divacky // Triangle:
1235f22ef01cSRoman Divacky // EBB
1236f22ef01cSRoman Divacky // | \_
1237f22ef01cSRoman Divacky // | |
1238f22ef01cSRoman Divacky // | TBB
1239f22ef01cSRoman Divacky // | /
1240f22ef01cSRoman Divacky // FBB
12413ca95b02SDimitry Andric Tokens.push_back(
12423ca95b02SDimitry Andric llvm::make_unique<IfcvtToken>(BBI, ICTriangle, TNeedSub, Dups));
1243f22ef01cSRoman Divacky Enqueued = true;
1244f22ef01cSRoman Divacky }
1245f22ef01cSRoman Divacky
124617a519f9SDimitry Andric if (ValidTriangle(TrueBBI, FalseBBI, true, Dups, Prediction) &&
12472754fe60SDimitry Andric MeetIfcvtSizeLimit(*TrueBBI.BB, TrueBBI.NonPredSize + TrueBBI.ExtraCost,
124817a519f9SDimitry Andric TrueBBI.ExtraCost2, Prediction) &&
1249f22ef01cSRoman Divacky FeasibilityAnalysis(TrueBBI, BBI.BrCond, true, true)) {
12503ca95b02SDimitry Andric Tokens.push_back(
12513ca95b02SDimitry Andric llvm::make_unique<IfcvtToken>(BBI, ICTriangleRev, TNeedSub, Dups));
1252f22ef01cSRoman Divacky Enqueued = true;
1253f22ef01cSRoman Divacky }
1254f22ef01cSRoman Divacky
125517a519f9SDimitry Andric if (ValidSimple(TrueBBI, Dups, Prediction) &&
12562754fe60SDimitry Andric MeetIfcvtSizeLimit(*TrueBBI.BB, TrueBBI.NonPredSize + TrueBBI.ExtraCost,
125717a519f9SDimitry Andric TrueBBI.ExtraCost2, Prediction) &&
1258f22ef01cSRoman Divacky FeasibilityAnalysis(TrueBBI, BBI.BrCond)) {
1259f22ef01cSRoman Divacky // Simple (split, no rejoin):
1260f22ef01cSRoman Divacky // EBB
1261f22ef01cSRoman Divacky // | \_
1262f22ef01cSRoman Divacky // | |
1263f22ef01cSRoman Divacky // | TBB---> exit
1264f22ef01cSRoman Divacky // |
1265f22ef01cSRoman Divacky // FBB
12663ca95b02SDimitry Andric Tokens.push_back(
12673ca95b02SDimitry Andric llvm::make_unique<IfcvtToken>(BBI, ICSimple, TNeedSub, Dups));
1268f22ef01cSRoman Divacky Enqueued = true;
1269f22ef01cSRoman Divacky }
1270f22ef01cSRoman Divacky
1271f22ef01cSRoman Divacky if (CanRevCond) {
1272f22ef01cSRoman Divacky // Try the other path...
12732754fe60SDimitry Andric if (ValidTriangle(FalseBBI, TrueBBI, false, Dups,
127417a519f9SDimitry Andric Prediction.getCompl()) &&
12752754fe60SDimitry Andric MeetIfcvtSizeLimit(*FalseBBI.BB,
12762754fe60SDimitry Andric FalseBBI.NonPredSize + FalseBBI.ExtraCost,
127717a519f9SDimitry Andric FalseBBI.ExtraCost2, Prediction.getCompl()) &&
1278f22ef01cSRoman Divacky FeasibilityAnalysis(FalseBBI, RevCond, true)) {
12793ca95b02SDimitry Andric Tokens.push_back(llvm::make_unique<IfcvtToken>(BBI, ICTriangleFalse,
12803ca95b02SDimitry Andric FNeedSub, Dups));
1281f22ef01cSRoman Divacky Enqueued = true;
1282f22ef01cSRoman Divacky }
1283f22ef01cSRoman Divacky
12842754fe60SDimitry Andric if (ValidTriangle(FalseBBI, TrueBBI, true, Dups,
128517a519f9SDimitry Andric Prediction.getCompl()) &&
12862754fe60SDimitry Andric MeetIfcvtSizeLimit(*FalseBBI.BB,
12872754fe60SDimitry Andric FalseBBI.NonPredSize + FalseBBI.ExtraCost,
128817a519f9SDimitry Andric FalseBBI.ExtraCost2, Prediction.getCompl()) &&
1289f22ef01cSRoman Divacky FeasibilityAnalysis(FalseBBI, RevCond, true, true)) {
12903ca95b02SDimitry Andric Tokens.push_back(
12913ca95b02SDimitry Andric llvm::make_unique<IfcvtToken>(BBI, ICTriangleFRev, FNeedSub, Dups));
1292f22ef01cSRoman Divacky Enqueued = true;
1293f22ef01cSRoman Divacky }
1294f22ef01cSRoman Divacky
129517a519f9SDimitry Andric if (ValidSimple(FalseBBI, Dups, Prediction.getCompl()) &&
12962754fe60SDimitry Andric MeetIfcvtSizeLimit(*FalseBBI.BB,
12972754fe60SDimitry Andric FalseBBI.NonPredSize + FalseBBI.ExtraCost,
129817a519f9SDimitry Andric FalseBBI.ExtraCost2, Prediction.getCompl()) &&
1299f22ef01cSRoman Divacky FeasibilityAnalysis(FalseBBI, RevCond)) {
13003ca95b02SDimitry Andric Tokens.push_back(
13013ca95b02SDimitry Andric llvm::make_unique<IfcvtToken>(BBI, ICSimpleFalse, FNeedSub, Dups));
1302f22ef01cSRoman Divacky Enqueued = true;
1303f22ef01cSRoman Divacky }
1304f22ef01cSRoman Divacky }
1305f22ef01cSRoman Divacky
1306f22ef01cSRoman Divacky BBI.IsEnqueued = Enqueued;
1307f22ef01cSRoman Divacky BBI.IsBeingAnalyzed = false;
1308f22ef01cSRoman Divacky BBI.IsAnalyzed = true;
13093dac3a9bSDimitry Andric BBStack.pop_back();
13103dac3a9bSDimitry Andric }
1311f22ef01cSRoman Divacky }
1312f22ef01cSRoman Divacky
1313d88c1a5aSDimitry Andric /// Analyze all blocks and find entries for all if-conversion candidates.
AnalyzeBlocks(MachineFunction & MF,std::vector<std::unique_ptr<IfcvtToken>> & Tokens)13143ca95b02SDimitry Andric void IfConverter::AnalyzeBlocks(
13153ca95b02SDimitry Andric MachineFunction &MF, std::vector<std::unique_ptr<IfcvtToken>> &Tokens) {
1316d88c1a5aSDimitry Andric for (MachineBasicBlock &MBB : MF)
1317d88c1a5aSDimitry Andric AnalyzeBlock(MBB, Tokens);
1318f22ef01cSRoman Divacky
1319f22ef01cSRoman Divacky // Sort to favor more complex ifcvt scheme.
1320f22ef01cSRoman Divacky std::stable_sort(Tokens.begin(), Tokens.end(), IfcvtTokenCmp);
1321f22ef01cSRoman Divacky }
1322f22ef01cSRoman Divacky
1323d88c1a5aSDimitry Andric /// Returns true either if ToMBB is the next block after MBB or that all the
1324d88c1a5aSDimitry Andric /// intervening blocks are empty (given MBB can fall through to its next block).
canFallThroughTo(MachineBasicBlock & MBB,MachineBasicBlock & ToMBB)1325d88c1a5aSDimitry Andric static bool canFallThroughTo(MachineBasicBlock &MBB, MachineBasicBlock &ToMBB) {
1326d88c1a5aSDimitry Andric MachineFunction::iterator PI = MBB.getIterator();
132791bc56edSDimitry Andric MachineFunction::iterator I = std::next(PI);
1328d88c1a5aSDimitry Andric MachineFunction::iterator TI = ToMBB.getIterator();
1329d88c1a5aSDimitry Andric MachineFunction::iterator E = MBB.getParent()->end();
1330ffd1746dSEd Schouten while (I != TI) {
1331ffd1746dSEd Schouten // Check isSuccessor to avoid case where the next block is empty, but
1332ffd1746dSEd Schouten // it's not a successor.
13337d523365SDimitry Andric if (I == E || !I->empty() || !PI->isSuccessor(&*I))
1334f22ef01cSRoman Divacky return false;
1335ffd1746dSEd Schouten PI = I++;
1336ffd1746dSEd Schouten }
13375517e702SDimitry Andric // Finally see if the last I is indeed a successor to PI.
13385517e702SDimitry Andric return PI->isSuccessor(&*I);
1339f22ef01cSRoman Divacky }
1340f22ef01cSRoman Divacky
1341d88c1a5aSDimitry Andric /// Invalidate predecessor BB info so it would be re-analyzed to determine if it
1342d88c1a5aSDimitry Andric /// can be if-converted. If predecessor is already enqueued, dequeue it!
InvalidatePreds(MachineBasicBlock & MBB)1343d88c1a5aSDimitry Andric void IfConverter::InvalidatePreds(MachineBasicBlock &MBB) {
1344d88c1a5aSDimitry Andric for (const MachineBasicBlock *Predecessor : MBB.predecessors()) {
134539d628a0SDimitry Andric BBInfo &PBBI = BBAnalysis[Predecessor->getNumber()];
1346d88c1a5aSDimitry Andric if (PBBI.IsDone || PBBI.BB == &MBB)
1347f22ef01cSRoman Divacky continue;
1348f22ef01cSRoman Divacky PBBI.IsAnalyzed = false;
1349f22ef01cSRoman Divacky PBBI.IsEnqueued = false;
1350f22ef01cSRoman Divacky }
1351f22ef01cSRoman Divacky }
1352f22ef01cSRoman Divacky
1353d88c1a5aSDimitry Andric /// Inserts an unconditional branch from \p MBB to \p ToMBB.
InsertUncondBranch(MachineBasicBlock & MBB,MachineBasicBlock & ToMBB,const TargetInstrInfo * TII)1354d88c1a5aSDimitry Andric static void InsertUncondBranch(MachineBasicBlock &MBB, MachineBasicBlock &ToMBB,
1355f22ef01cSRoman Divacky const TargetInstrInfo *TII) {
1356ffd1746dSEd Schouten DebugLoc dl; // FIXME: this is nowhere
1357f22ef01cSRoman Divacky SmallVector<MachineOperand, 0> NoCond;
1358d88c1a5aSDimitry Andric TII->insertBranch(MBB, &ToMBB, nullptr, NoCond, dl);
1359f22ef01cSRoman Divacky }
1360f22ef01cSRoman Divacky
1361f785676fSDimitry Andric /// Behaves like LiveRegUnits::StepForward() but also adds implicit uses to all
1362d88c1a5aSDimitry Andric /// values defined in MI which are also live/used by MI.
UpdatePredRedefs(MachineInstr & MI,LivePhysRegs & Redefs)13633ca95b02SDimitry Andric static void UpdatePredRedefs(MachineInstr &MI, LivePhysRegs &Redefs) {
13642cab237bSDimitry Andric const TargetRegisterInfo *TRI = MI.getMF()->getSubtarget().getRegisterInfo();
1365d88c1a5aSDimitry Andric
1366d88c1a5aSDimitry Andric // Before stepping forward past MI, remember which regs were live
1367d88c1a5aSDimitry Andric // before MI. This is needed to set the Undef flag only when reg is
1368d88c1a5aSDimitry Andric // dead.
1369b5893f02SDimitry Andric SparseSet<MCPhysReg, identity<MCPhysReg>> LiveBeforeMI;
1370d88c1a5aSDimitry Andric LiveBeforeMI.setUniverse(TRI->getNumRegs());
1371d88c1a5aSDimitry Andric for (unsigned Reg : Redefs)
1372d88c1a5aSDimitry Andric LiveBeforeMI.insert(Reg);
1373d88c1a5aSDimitry Andric
1374b5893f02SDimitry Andric SmallVector<std::pair<MCPhysReg, const MachineOperand*>, 4> Clobbers;
13753ca95b02SDimitry Andric Redefs.stepForward(MI, Clobbers);
1376ffd1746dSEd Schouten
1377ff0cc061SDimitry Andric // Now add the implicit uses for each of the clobbered values.
1378d88c1a5aSDimitry Andric for (auto Clobber : Clobbers) {
1379ff0cc061SDimitry Andric // FIXME: Const cast here is nasty, but better than making StepForward
1380ff0cc061SDimitry Andric // take a mutable instruction instead of const.
1381d88c1a5aSDimitry Andric unsigned Reg = Clobber.first;
1382d88c1a5aSDimitry Andric MachineOperand &Op = const_cast<MachineOperand&>(*Clobber.second);
1383ff0cc061SDimitry Andric MachineInstr *OpMI = Op.getParent();
13842cab237bSDimitry Andric MachineInstrBuilder MIB(*OpMI->getMF(), OpMI);
1385ff0cc061SDimitry Andric if (Op.isRegMask()) {
1386ff0cc061SDimitry Andric // First handle regmasks. They clobber any entries in the mask which
1387ff0cc061SDimitry Andric // means that we need a def for those registers.
1388d88c1a5aSDimitry Andric if (LiveBeforeMI.count(Reg))
1389d88c1a5aSDimitry Andric MIB.addReg(Reg, RegState::Implicit);
1390ff0cc061SDimitry Andric
1391ff0cc061SDimitry Andric // We also need to add an implicit def of this register for the later
1392ff0cc061SDimitry Andric // use to read from.
1393ff0cc061SDimitry Andric // For the register allocator to have allocated a register clobbered
1394ff0cc061SDimitry Andric // by the call which is used later, it must be the case that
1395ff0cc061SDimitry Andric // the call doesn't return.
1396d88c1a5aSDimitry Andric MIB.addReg(Reg, RegState::Implicit | RegState::Define);
1397ff0cc061SDimitry Andric continue;
1398ff0cc061SDimitry Andric }
1399d88c1a5aSDimitry Andric if (LiveBeforeMI.count(Reg))
1400d88c1a5aSDimitry Andric MIB.addReg(Reg, RegState::Implicit);
1401d88c1a5aSDimitry Andric else {
1402d88c1a5aSDimitry Andric bool HasLiveSubReg = false;
1403d88c1a5aSDimitry Andric for (MCSubRegIterator S(Reg, TRI); S.isValid(); ++S) {
1404d88c1a5aSDimitry Andric if (!LiveBeforeMI.count(*S))
1405d88c1a5aSDimitry Andric continue;
1406d88c1a5aSDimitry Andric HasLiveSubReg = true;
1407d88c1a5aSDimitry Andric break;
1408d88c1a5aSDimitry Andric }
1409d88c1a5aSDimitry Andric if (HasLiveSubReg)
1410d88c1a5aSDimitry Andric MIB.addReg(Reg, RegState::Implicit);
1411d88c1a5aSDimitry Andric }
1412ffd1746dSEd Schouten }
1413ffd1746dSEd Schouten }
1414ffd1746dSEd Schouten
1415d88c1a5aSDimitry Andric /// If convert a simple (split, no rejoin) sub-CFG.
IfConvertSimple(BBInfo & BBI,IfcvtKind Kind)1416f22ef01cSRoman Divacky bool IfConverter::IfConvertSimple(BBInfo &BBI, IfcvtKind Kind) {
1417f22ef01cSRoman Divacky BBInfo &TrueBBI = BBAnalysis[BBI.TrueBB->getNumber()];
1418f22ef01cSRoman Divacky BBInfo &FalseBBI = BBAnalysis[BBI.FalseBB->getNumber()];
1419f22ef01cSRoman Divacky BBInfo *CvtBBI = &TrueBBI;
1420f22ef01cSRoman Divacky BBInfo *NextBBI = &FalseBBI;
1421f22ef01cSRoman Divacky
1422f22ef01cSRoman Divacky SmallVector<MachineOperand, 4> Cond(BBI.BrCond.begin(), BBI.BrCond.end());
1423f22ef01cSRoman Divacky if (Kind == ICSimpleFalse)
1424f22ef01cSRoman Divacky std::swap(CvtBBI, NextBBI);
1425f22ef01cSRoman Divacky
1426d88c1a5aSDimitry Andric MachineBasicBlock &CvtMBB = *CvtBBI->BB;
1427d88c1a5aSDimitry Andric MachineBasicBlock &NextMBB = *NextBBI->BB;
1428f22ef01cSRoman Divacky if (CvtBBI->IsDone ||
1429d88c1a5aSDimitry Andric (CvtBBI->CannotBeCopied && CvtMBB.pred_size() > 1)) {
1430f22ef01cSRoman Divacky // Something has changed. It's no longer safe to predicate this block.
1431f22ef01cSRoman Divacky BBI.IsAnalyzed = false;
1432f22ef01cSRoman Divacky CvtBBI->IsAnalyzed = false;
1433f22ef01cSRoman Divacky return false;
1434f22ef01cSRoman Divacky }
1435f22ef01cSRoman Divacky
1436d88c1a5aSDimitry Andric if (CvtMBB.hasAddressTaken())
1437284c1978SDimitry Andric // Conservatively abort if-conversion if BB's address is taken.
1438284c1978SDimitry Andric return false;
1439284c1978SDimitry Andric
1440f22ef01cSRoman Divacky if (Kind == ICSimpleFalse)
1441d88c1a5aSDimitry Andric if (TII->reverseBranchCondition(Cond))
1442dff0c46cSDimitry Andric llvm_unreachable("Unable to reverse branch condition!");
1443f22ef01cSRoman Divacky
144495ec533aSDimitry Andric Redefs.init(*TRI);
144595ec533aSDimitry Andric
144695ec533aSDimitry Andric if (MRI->tracksLiveness()) {
1447b5893f02SDimitry Andric // Initialize liveins to the first BB. These are potentially redefined by
1448ffd1746dSEd Schouten // predicated instructions.
1449d88c1a5aSDimitry Andric Redefs.addLiveIns(CvtMBB);
1450d88c1a5aSDimitry Andric Redefs.addLiveIns(NextMBB);
145195ec533aSDimitry Andric }
1452ffd1746dSEd Schouten
1453edd7eaddSDimitry Andric // Remove the branches from the entry so we can add the contents of the true
1454edd7eaddSDimitry Andric // block to it.
1455d88c1a5aSDimitry Andric BBI.NonPredSize -= TII->removeBranch(*BBI.BB);
1456edd7eaddSDimitry Andric
1457edd7eaddSDimitry Andric if (CvtMBB.pred_size() > 1) {
1458f22ef01cSRoman Divacky // Copy instructions in the true block, predicate them, and add them to
1459f22ef01cSRoman Divacky // the entry block.
1460f785676fSDimitry Andric CopyAndPredicateBlock(BBI, *CvtBBI, Cond);
1461284c1978SDimitry Andric
14622cab237bSDimitry Andric // Keep the CFG updated.
1463d88c1a5aSDimitry Andric BBI.BB->removeSuccessor(&CvtMBB, true);
1464f22ef01cSRoman Divacky } else {
1465edd7eaddSDimitry Andric // Predicate the instructions in the true block.
1466d88c1a5aSDimitry Andric PredicateBlock(*CvtBBI, CvtMBB.end(), Cond);
1467f22ef01cSRoman Divacky
14682cab237bSDimitry Andric // Merge converted block into entry block. The BB to Cvt edge is removed
14692cab237bSDimitry Andric // by MergeBlocks.
1470f22ef01cSRoman Divacky MergeBlocks(BBI, *CvtBBI);
1471f22ef01cSRoman Divacky }
1472f22ef01cSRoman Divacky
1473f22ef01cSRoman Divacky bool IterIfcvt = true;
1474d88c1a5aSDimitry Andric if (!canFallThroughTo(*BBI.BB, NextMBB)) {
1475d88c1a5aSDimitry Andric InsertUncondBranch(*BBI.BB, NextMBB, TII);
1476f22ef01cSRoman Divacky BBI.HasFallThrough = false;
1477f22ef01cSRoman Divacky // Now ifcvt'd block will look like this:
1478f22ef01cSRoman Divacky // BB:
1479f22ef01cSRoman Divacky // ...
1480f22ef01cSRoman Divacky // t, f = cmp
1481f22ef01cSRoman Divacky // if t op
1482f22ef01cSRoman Divacky // b BBf
1483f22ef01cSRoman Divacky //
1484f22ef01cSRoman Divacky // We cannot further ifcvt this block because the unconditional branch
1485f22ef01cSRoman Divacky // will have to be predicated on the new condition, that will not be
1486f22ef01cSRoman Divacky // available if cmp executes.
1487f22ef01cSRoman Divacky IterIfcvt = false;
1488f22ef01cSRoman Divacky }
1489f22ef01cSRoman Divacky
1490f22ef01cSRoman Divacky // Update block info. BB can be iteratively if-converted.
1491f22ef01cSRoman Divacky if (!IterIfcvt)
1492f22ef01cSRoman Divacky BBI.IsDone = true;
1493d88c1a5aSDimitry Andric InvalidatePreds(*BBI.BB);
1494f22ef01cSRoman Divacky CvtBBI->IsDone = true;
1495f22ef01cSRoman Divacky
1496f22ef01cSRoman Divacky // FIXME: Must maintain LiveIns.
1497f22ef01cSRoman Divacky return true;
1498f22ef01cSRoman Divacky }
1499f22ef01cSRoman Divacky
1500d88c1a5aSDimitry Andric /// If convert a triangle sub-CFG.
IfConvertTriangle(BBInfo & BBI,IfcvtKind Kind)1501f22ef01cSRoman Divacky bool IfConverter::IfConvertTriangle(BBInfo &BBI, IfcvtKind Kind) {
1502f22ef01cSRoman Divacky BBInfo &TrueBBI = BBAnalysis[BBI.TrueBB->getNumber()];
1503f22ef01cSRoman Divacky BBInfo &FalseBBI = BBAnalysis[BBI.FalseBB->getNumber()];
1504f22ef01cSRoman Divacky BBInfo *CvtBBI = &TrueBBI;
1505f22ef01cSRoman Divacky BBInfo *NextBBI = &FalseBBI;
1506ffd1746dSEd Schouten DebugLoc dl; // FIXME: this is nowhere
1507f22ef01cSRoman Divacky
1508f22ef01cSRoman Divacky SmallVector<MachineOperand, 4> Cond(BBI.BrCond.begin(), BBI.BrCond.end());
1509f22ef01cSRoman Divacky if (Kind == ICTriangleFalse || Kind == ICTriangleFRev)
1510f22ef01cSRoman Divacky std::swap(CvtBBI, NextBBI);
1511f22ef01cSRoman Divacky
1512d88c1a5aSDimitry Andric MachineBasicBlock &CvtMBB = *CvtBBI->BB;
1513d88c1a5aSDimitry Andric MachineBasicBlock &NextMBB = *NextBBI->BB;
1514f22ef01cSRoman Divacky if (CvtBBI->IsDone ||
1515d88c1a5aSDimitry Andric (CvtBBI->CannotBeCopied && CvtMBB.pred_size() > 1)) {
1516f22ef01cSRoman Divacky // Something has changed. It's no longer safe to predicate this block.
1517f22ef01cSRoman Divacky BBI.IsAnalyzed = false;
1518f22ef01cSRoman Divacky CvtBBI->IsAnalyzed = false;
1519f22ef01cSRoman Divacky return false;
1520f22ef01cSRoman Divacky }
1521f22ef01cSRoman Divacky
1522d88c1a5aSDimitry Andric if (CvtMBB.hasAddressTaken())
1523284c1978SDimitry Andric // Conservatively abort if-conversion if BB's address is taken.
1524284c1978SDimitry Andric return false;
1525284c1978SDimitry Andric
1526f22ef01cSRoman Divacky if (Kind == ICTriangleFalse || Kind == ICTriangleFRev)
1527d88c1a5aSDimitry Andric if (TII->reverseBranchCondition(Cond))
1528dff0c46cSDimitry Andric llvm_unreachable("Unable to reverse branch condition!");
1529f22ef01cSRoman Divacky
1530f22ef01cSRoman Divacky if (Kind == ICTriangleRev || Kind == ICTriangleFRev) {
1531d88c1a5aSDimitry Andric if (reverseBranchCondition(*CvtBBI)) {
1532f22ef01cSRoman Divacky // BB has been changed, modify its predecessors (except for this
1533f22ef01cSRoman Divacky // one) so they don't get ifcvt'ed based on bad intel.
1534d88c1a5aSDimitry Andric for (MachineBasicBlock *PBB : CvtMBB.predecessors()) {
1535f22ef01cSRoman Divacky if (PBB == BBI.BB)
1536f22ef01cSRoman Divacky continue;
1537f22ef01cSRoman Divacky BBInfo &PBBI = BBAnalysis[PBB->getNumber()];
1538f22ef01cSRoman Divacky if (PBBI.IsEnqueued) {
1539f22ef01cSRoman Divacky PBBI.IsAnalyzed = false;
1540f22ef01cSRoman Divacky PBBI.IsEnqueued = false;
1541f22ef01cSRoman Divacky }
1542f22ef01cSRoman Divacky }
1543f22ef01cSRoman Divacky }
1544f22ef01cSRoman Divacky }
1545f22ef01cSRoman Divacky
1546ffd1746dSEd Schouten // Initialize liveins to the first BB. These are potentially redefined by
1547ffd1746dSEd Schouten // predicated instructions.
1548d88c1a5aSDimitry Andric Redefs.init(*TRI);
154995ec533aSDimitry Andric if (MRI->tracksLiveness()) {
1550d88c1a5aSDimitry Andric Redefs.addLiveIns(CvtMBB);
1551d88c1a5aSDimitry Andric Redefs.addLiveIns(NextMBB);
155295ec533aSDimitry Andric }
1553f785676fSDimitry Andric
155491bc56edSDimitry Andric bool HasEarlyExit = CvtBBI->FalseBB != nullptr;
15557d523365SDimitry Andric BranchProbability CvtNext, CvtFalse, BBNext, BBCvt;
155639d628a0SDimitry Andric
155791bc56edSDimitry Andric if (HasEarlyExit) {
1558d88c1a5aSDimitry Andric // Get probabilities before modifying CvtMBB and BBI.BB.
1559d88c1a5aSDimitry Andric CvtNext = MBPI->getEdgeProbability(&CvtMBB, &NextMBB);
1560d88c1a5aSDimitry Andric CvtFalse = MBPI->getEdgeProbability(&CvtMBB, CvtBBI->FalseBB);
1561d88c1a5aSDimitry Andric BBNext = MBPI->getEdgeProbability(BBI.BB, &NextMBB);
1562d88c1a5aSDimitry Andric BBCvt = MBPI->getEdgeProbability(BBI.BB, &CvtMBB);
156391bc56edSDimitry Andric }
156439d628a0SDimitry Andric
1565edd7eaddSDimitry Andric // Remove the branches from the entry so we can add the contents of the true
1566edd7eaddSDimitry Andric // block to it.
1567d88c1a5aSDimitry Andric BBI.NonPredSize -= TII->removeBranch(*BBI.BB);
1568edd7eaddSDimitry Andric
1569edd7eaddSDimitry Andric if (CvtMBB.pred_size() > 1) {
1570f22ef01cSRoman Divacky // Copy instructions in the true block, predicate them, and add them to
1571f22ef01cSRoman Divacky // the entry block.
1572f785676fSDimitry Andric CopyAndPredicateBlock(BBI, *CvtBBI, Cond, true);
1573f22ef01cSRoman Divacky } else {
1574f22ef01cSRoman Divacky // Predicate the 'true' block after removing its branch.
1575d88c1a5aSDimitry Andric CvtBBI->NonPredSize -= TII->removeBranch(CvtMBB);
1576d88c1a5aSDimitry Andric PredicateBlock(*CvtBBI, CvtMBB.end(), Cond);
1577f22ef01cSRoman Divacky
15785517e702SDimitry Andric // Now merge the entry of the triangle with the true block.
1579ffd1746dSEd Schouten MergeBlocks(BBI, *CvtBBI, false);
1580f22ef01cSRoman Divacky }
1581f22ef01cSRoman Divacky
15822cab237bSDimitry Andric // Keep the CFG updated.
15832cab237bSDimitry Andric BBI.BB->removeSuccessor(&CvtMBB, true);
15842cab237bSDimitry Andric
1585f22ef01cSRoman Divacky // If 'true' block has a 'false' successor, add an exit branch to it.
1586f22ef01cSRoman Divacky if (HasEarlyExit) {
1587f22ef01cSRoman Divacky SmallVector<MachineOperand, 4> RevCond(CvtBBI->BrCond.begin(),
1588f22ef01cSRoman Divacky CvtBBI->BrCond.end());
1589d88c1a5aSDimitry Andric if (TII->reverseBranchCondition(RevCond))
1590dff0c46cSDimitry Andric llvm_unreachable("Unable to reverse branch condition!");
159191bc56edSDimitry Andric
15927d523365SDimitry Andric // Update the edge probability for both CvtBBI->FalseBB and NextBBI.
1593d88c1a5aSDimitry Andric // NewNext = New_Prob(BBI.BB, NextMBB) =
1594d88c1a5aSDimitry Andric // Prob(BBI.BB, NextMBB) +
1595d88c1a5aSDimitry Andric // Prob(BBI.BB, CvtMBB) * Prob(CvtMBB, NextMBB)
15967d523365SDimitry Andric // NewFalse = New_Prob(BBI.BB, CvtBBI->FalseBB) =
1597d88c1a5aSDimitry Andric // Prob(BBI.BB, CvtMBB) * Prob(CvtMBB, CvtBBI->FalseBB)
1598d88c1a5aSDimitry Andric auto NewTrueBB = getNextBlock(*BBI.BB);
15997d523365SDimitry Andric auto NewNext = BBNext + BBCvt * CvtNext;
1600d88c1a5aSDimitry Andric auto NewTrueBBIter = find(BBI.BB->successors(), NewTrueBB);
16017d523365SDimitry Andric if (NewTrueBBIter != BBI.BB->succ_end())
16027d523365SDimitry Andric BBI.BB->setSuccProbability(NewTrueBBIter, NewNext);
16037d523365SDimitry Andric
16047d523365SDimitry Andric auto NewFalse = BBCvt * CvtFalse;
1605d88c1a5aSDimitry Andric TII->insertBranch(*BBI.BB, CvtBBI->FalseBB, nullptr, RevCond, dl);
16067d523365SDimitry Andric BBI.BB->addSuccessor(CvtBBI->FalseBB, NewFalse);
1607f22ef01cSRoman Divacky }
1608f22ef01cSRoman Divacky
1609f22ef01cSRoman Divacky // Merge in the 'false' block if the 'false' block has no other
1610f22ef01cSRoman Divacky // predecessors. Otherwise, add an unconditional branch to 'false'.
1611f22ef01cSRoman Divacky bool FalseBBDead = false;
1612f22ef01cSRoman Divacky bool IterIfcvt = true;
1613d88c1a5aSDimitry Andric bool isFallThrough = canFallThroughTo(*BBI.BB, NextMBB);
1614f22ef01cSRoman Divacky if (!isFallThrough) {
1615f22ef01cSRoman Divacky // Only merge them if the true block does not fallthrough to the false
1616f22ef01cSRoman Divacky // block. By not merging them, we make it possible to iteratively
1617f22ef01cSRoman Divacky // ifcvt the blocks.
1618f22ef01cSRoman Divacky if (!HasEarlyExit &&
1619302affcbSDimitry Andric NextMBB.pred_size() == 1 && !NextBBI->HasFallThrough &&
1620d88c1a5aSDimitry Andric !NextMBB.hasAddressTaken()) {
1621f22ef01cSRoman Divacky MergeBlocks(BBI, *NextBBI);
1622f22ef01cSRoman Divacky FalseBBDead = true;
1623f22ef01cSRoman Divacky } else {
1624d88c1a5aSDimitry Andric InsertUncondBranch(*BBI.BB, NextMBB, TII);
1625f22ef01cSRoman Divacky BBI.HasFallThrough = false;
1626f22ef01cSRoman Divacky }
1627f22ef01cSRoman Divacky // Mixed predicated and unpredicated code. This cannot be iteratively
1628f22ef01cSRoman Divacky // predicated.
1629f22ef01cSRoman Divacky IterIfcvt = false;
1630f22ef01cSRoman Divacky }
1631f22ef01cSRoman Divacky
1632f22ef01cSRoman Divacky // Update block info. BB can be iteratively if-converted.
1633f22ef01cSRoman Divacky if (!IterIfcvt)
1634f22ef01cSRoman Divacky BBI.IsDone = true;
1635d88c1a5aSDimitry Andric InvalidatePreds(*BBI.BB);
1636f22ef01cSRoman Divacky CvtBBI->IsDone = true;
1637f22ef01cSRoman Divacky if (FalseBBDead)
1638f22ef01cSRoman Divacky NextBBI->IsDone = true;
1639f22ef01cSRoman Divacky
1640f22ef01cSRoman Divacky // FIXME: Must maintain LiveIns.
1641f22ef01cSRoman Divacky return true;
1642f22ef01cSRoman Divacky }
1643f22ef01cSRoman Divacky
1644d88c1a5aSDimitry Andric /// Common code shared between diamond conversions.
1645d88c1a5aSDimitry Andric /// \p BBI, \p TrueBBI, and \p FalseBBI form the diamond shape.
1646d88c1a5aSDimitry Andric /// \p NumDups1 - number of shared instructions at the beginning of \p TrueBBI
1647d88c1a5aSDimitry Andric /// and FalseBBI
1648d88c1a5aSDimitry Andric /// \p NumDups2 - number of shared instructions at the end of \p TrueBBI
1649d88c1a5aSDimitry Andric /// and \p FalseBBI
1650d88c1a5aSDimitry Andric /// \p RemoveBranch - Remove the common branch of the two blocks before
1651d88c1a5aSDimitry Andric /// predicating. Only false for unanalyzable fallthrough
1652d88c1a5aSDimitry Andric /// cases. The caller will replace the branch if necessary.
1653d88c1a5aSDimitry Andric /// \p MergeAddEdges - Add successor edges when merging blocks. Only false for
1654d88c1a5aSDimitry Andric /// unanalyzable fallthrough
IfConvertDiamondCommon(BBInfo & BBI,BBInfo & TrueBBI,BBInfo & FalseBBI,unsigned NumDups1,unsigned NumDups2,bool TClobbersPred,bool FClobbersPred,bool RemoveBranch,bool MergeAddEdges)1655d88c1a5aSDimitry Andric bool IfConverter::IfConvertDiamondCommon(
1656d88c1a5aSDimitry Andric BBInfo &BBI, BBInfo &TrueBBI, BBInfo &FalseBBI,
1657d88c1a5aSDimitry Andric unsigned NumDups1, unsigned NumDups2,
1658d88c1a5aSDimitry Andric bool TClobbersPred, bool FClobbersPred,
1659d88c1a5aSDimitry Andric bool RemoveBranch, bool MergeAddEdges) {
1660f22ef01cSRoman Divacky
1661f22ef01cSRoman Divacky if (TrueBBI.IsDone || FalseBBI.IsDone ||
1662d88c1a5aSDimitry Andric TrueBBI.BB->pred_size() > 1 || FalseBBI.BB->pred_size() > 1) {
1663f22ef01cSRoman Divacky // Something has changed. It's no longer safe to predicate these blocks.
1664f22ef01cSRoman Divacky BBI.IsAnalyzed = false;
1665f22ef01cSRoman Divacky TrueBBI.IsAnalyzed = false;
1666f22ef01cSRoman Divacky FalseBBI.IsAnalyzed = false;
1667f22ef01cSRoman Divacky return false;
1668f22ef01cSRoman Divacky }
1669f22ef01cSRoman Divacky
1670284c1978SDimitry Andric if (TrueBBI.BB->hasAddressTaken() || FalseBBI.BB->hasAddressTaken())
1671284c1978SDimitry Andric // Conservatively abort if-conversion if either BB has its address taken.
1672284c1978SDimitry Andric return false;
1673284c1978SDimitry Andric
1674ffd1746dSEd Schouten // Put the predicated instructions from the 'true' block before the
1675ffd1746dSEd Schouten // instructions from the 'false' block, unless the true block would clobber
1676ffd1746dSEd Schouten // the predicate, in which case, do the opposite.
1677f22ef01cSRoman Divacky BBInfo *BBI1 = &TrueBBI;
1678f22ef01cSRoman Divacky BBInfo *BBI2 = &FalseBBI;
1679f22ef01cSRoman Divacky SmallVector<MachineOperand, 4> RevCond(BBI.BrCond.begin(), BBI.BrCond.end());
1680d88c1a5aSDimitry Andric if (TII->reverseBranchCondition(RevCond))
1681dff0c46cSDimitry Andric llvm_unreachable("Unable to reverse branch condition!");
1682f22ef01cSRoman Divacky SmallVector<MachineOperand, 4> *Cond1 = &BBI.BrCond;
1683f22ef01cSRoman Divacky SmallVector<MachineOperand, 4> *Cond2 = &RevCond;
1684f22ef01cSRoman Divacky
1685f22ef01cSRoman Divacky // Figure out the more profitable ordering.
1686f22ef01cSRoman Divacky bool DoSwap = false;
1687d88c1a5aSDimitry Andric if (TClobbersPred && !FClobbersPred)
1688f22ef01cSRoman Divacky DoSwap = true;
1689d88c1a5aSDimitry Andric else if (!TClobbersPred && !FClobbersPred) {
1690f22ef01cSRoman Divacky if (TrueBBI.NonPredSize > FalseBBI.NonPredSize)
1691f22ef01cSRoman Divacky DoSwap = true;
1692d88c1a5aSDimitry Andric } else if (TClobbersPred && FClobbersPred)
1693d88c1a5aSDimitry Andric llvm_unreachable("Predicate info cannot be clobbered by both sides.");
1694f22ef01cSRoman Divacky if (DoSwap) {
1695f22ef01cSRoman Divacky std::swap(BBI1, BBI2);
1696f22ef01cSRoman Divacky std::swap(Cond1, Cond2);
1697f22ef01cSRoman Divacky }
1698f22ef01cSRoman Divacky
1699f22ef01cSRoman Divacky // Remove the conditional branch from entry to the blocks.
1700d88c1a5aSDimitry Andric BBI.NonPredSize -= TII->removeBranch(*BBI.BB);
1701f22ef01cSRoman Divacky
1702d88c1a5aSDimitry Andric MachineBasicBlock &MBB1 = *BBI1->BB;
1703d88c1a5aSDimitry Andric MachineBasicBlock &MBB2 = *BBI2->BB;
1704d88c1a5aSDimitry Andric
1705d88c1a5aSDimitry Andric // Initialize the Redefs:
1706d88c1a5aSDimitry Andric // - BB2 live-in regs need implicit uses before being redefined by BB1
1707d88c1a5aSDimitry Andric // instructions.
1708d88c1a5aSDimitry Andric // - BB1 live-out regs need implicit uses before being redefined by BB2
1709d88c1a5aSDimitry Andric // instructions. We start with BB1 live-ins so we have the live-out regs
1710d88c1a5aSDimitry Andric // after tracking the BB1 instructions.
1711d88c1a5aSDimitry Andric Redefs.init(*TRI);
171295ec533aSDimitry Andric if (MRI->tracksLiveness()) {
1713d88c1a5aSDimitry Andric Redefs.addLiveIns(MBB1);
1714d88c1a5aSDimitry Andric Redefs.addLiveIns(MBB2);
171595ec533aSDimitry Andric }
1716ffd1746dSEd Schouten
1717f22ef01cSRoman Divacky // Remove the duplicated instructions at the beginnings of both paths.
17186ccc06f6SDimitry Andric // Skip dbg_value instructions.
1719d88c1a5aSDimitry Andric MachineBasicBlock::iterator DI1 = MBB1.getFirstNonDebugInstr();
1720d88c1a5aSDimitry Andric MachineBasicBlock::iterator DI2 = MBB2.getFirstNonDebugInstr();
1721f22ef01cSRoman Divacky BBI1->NonPredSize -= NumDups1;
1722f22ef01cSRoman Divacky BBI2->NonPredSize -= NumDups1;
1723ffd1746dSEd Schouten
1724ffd1746dSEd Schouten // Skip past the dups on each side separately since there may be
17256ccc06f6SDimitry Andric // differing dbg_value entries. NumDups1 can include a "return"
17266ccc06f6SDimitry Andric // instruction, if it's not marked as "branch".
1727ffd1746dSEd Schouten for (unsigned i = 0; i < NumDups1; ++DI1) {
17286ccc06f6SDimitry Andric if (DI1 == MBB1.end())
17296ccc06f6SDimitry Andric break;
17304ba319b5SDimitry Andric if (!DI1->isDebugInstr())
1731ffd1746dSEd Schouten ++i;
1732ffd1746dSEd Schouten }
1733f22ef01cSRoman Divacky while (NumDups1 != 0) {
1734f22ef01cSRoman Divacky ++DI2;
17356ccc06f6SDimitry Andric if (DI2 == MBB2.end())
17366ccc06f6SDimitry Andric break;
17374ba319b5SDimitry Andric if (!DI2->isDebugInstr())
1738f22ef01cSRoman Divacky --NumDups1;
1739f22ef01cSRoman Divacky }
1740ffd1746dSEd Schouten
174195ec533aSDimitry Andric if (MRI->tracksLiveness()) {
1742d88c1a5aSDimitry Andric for (const MachineInstr &MI : make_range(MBB1.begin(), DI1)) {
1743b5893f02SDimitry Andric SmallVector<std::pair<MCPhysReg, const MachineOperand*>, 4> Dummy;
174495ec533aSDimitry Andric Redefs.stepForward(MI, Dummy);
174595ec533aSDimitry Andric }
1746f785676fSDimitry Andric }
17476ccc06f6SDimitry Andric
1748d88c1a5aSDimitry Andric BBI.BB->splice(BBI.BB->end(), &MBB1, MBB1.begin(), DI1);
1749d88c1a5aSDimitry Andric MBB2.erase(MBB2.begin(), DI2);
1750f22ef01cSRoman Divacky
17516ccc06f6SDimitry Andric // The branches have been checked to match, so it is safe to remove the
17526ccc06f6SDimitry Andric // branch in BB1 and rely on the copy in BB2. The complication is that
17536ccc06f6SDimitry Andric // the blocks may end with a return instruction, which may or may not
17546ccc06f6SDimitry Andric // be marked as "branch". If it's not, then it could be included in
17556ccc06f6SDimitry Andric // "dups1", leaving the blocks potentially empty after moving the common
17566ccc06f6SDimitry Andric // duplicates.
1757d88c1a5aSDimitry Andric #ifndef NDEBUG
1758d88c1a5aSDimitry Andric // Unanalyzable branches must match exactly. Check that now.
1759d88c1a5aSDimitry Andric if (!BBI1->IsBrAnalyzable)
1760d88c1a5aSDimitry Andric verifySameBranchInstructions(&MBB1, &MBB2);
1761d88c1a5aSDimitry Andric #endif
1762*ebfb7882SDimitry Andric // Remove duplicated instructions from the tail of MBB1: any branch
1763*ebfb7882SDimitry Andric // instructions, and the common instructions counted by NumDups2.
1764d88c1a5aSDimitry Andric DI1 = MBB1.end();
1765*ebfb7882SDimitry Andric while (DI1 != MBB1.begin()) {
1766*ebfb7882SDimitry Andric MachineBasicBlock::iterator Prev = std::prev(DI1);
1767*ebfb7882SDimitry Andric if (!Prev->isBranch() && !Prev->isDebugInstr())
1768*ebfb7882SDimitry Andric break;
1769*ebfb7882SDimitry Andric DI1 = Prev;
1770*ebfb7882SDimitry Andric }
1771ffd1746dSEd Schouten for (unsigned i = 0; i != NumDups2; ) {
1772ffd1746dSEd Schouten // NumDups2 only counted non-dbg_value instructions, so this won't
1773ffd1746dSEd Schouten // run off the head of the list.
1774d88c1a5aSDimitry Andric assert(DI1 != MBB1.begin());
1775f22ef01cSRoman Divacky --DI1;
1776ffd1746dSEd Schouten // skip dbg_value instructions
17774ba319b5SDimitry Andric if (!DI1->isDebugInstr())
1778ffd1746dSEd Schouten ++i;
1779ffd1746dSEd Schouten }
1780d88c1a5aSDimitry Andric MBB1.erase(DI1, MBB1.end());
1781f22ef01cSRoman Divacky
1782f22ef01cSRoman Divacky DI2 = BBI2->BB->end();
1783d88c1a5aSDimitry Andric // The branches have been checked to match. Skip over the branch in the false
1784d88c1a5aSDimitry Andric // block so that we don't try to predicate it.
1785d88c1a5aSDimitry Andric if (RemoveBranch)
1786d88c1a5aSDimitry Andric BBI2->NonPredSize -= TII->removeBranch(*BBI2->BB);
1787d88c1a5aSDimitry Andric else {
17886ccc06f6SDimitry Andric // Make DI2 point to the end of the range where the common "tail"
17896ccc06f6SDimitry Andric // instructions could be found.
17906ccc06f6SDimitry Andric while (DI2 != MBB2.begin()) {
17916ccc06f6SDimitry Andric MachineBasicBlock::iterator Prev = std::prev(DI2);
17924ba319b5SDimitry Andric if (!Prev->isBranch() && !Prev->isDebugInstr())
17936ccc06f6SDimitry Andric break;
17946ccc06f6SDimitry Andric DI2 = Prev;
17956ccc06f6SDimitry Andric }
1796d88c1a5aSDimitry Andric }
1797f22ef01cSRoman Divacky while (NumDups2 != 0) {
1798ffd1746dSEd Schouten // NumDups2 only counted non-dbg_value instructions, so this won't
1799ffd1746dSEd Schouten // run off the head of the list.
1800d88c1a5aSDimitry Andric assert(DI2 != MBB2.begin());
1801f22ef01cSRoman Divacky --DI2;
1802ffd1746dSEd Schouten // skip dbg_value instructions
18034ba319b5SDimitry Andric if (!DI2->isDebugInstr())
1804f22ef01cSRoman Divacky --NumDups2;
1805f22ef01cSRoman Divacky }
1806dff0c46cSDimitry Andric
1807dff0c46cSDimitry Andric // Remember which registers would later be defined by the false block.
1808dff0c46cSDimitry Andric // This allows us not to predicate instructions in the true block that would
1809dff0c46cSDimitry Andric // later be re-defined. That is, rather than
1810dff0c46cSDimitry Andric // subeq r0, r1, #1
1811dff0c46cSDimitry Andric // addne r0, r1, #1
1812dff0c46cSDimitry Andric // generate:
1813dff0c46cSDimitry Andric // sub r0, r1, #1
1814dff0c46cSDimitry Andric // addne r0, r1, #1
1815b5893f02SDimitry Andric SmallSet<MCPhysReg, 4> RedefsByFalse;
1816b5893f02SDimitry Andric SmallSet<MCPhysReg, 4> ExtUses;
1817d88c1a5aSDimitry Andric if (TII->isProfitableToUnpredicate(MBB1, MBB2)) {
1818d88c1a5aSDimitry Andric for (const MachineInstr &FI : make_range(MBB2.begin(), DI2)) {
18194ba319b5SDimitry Andric if (FI.isDebugInstr())
1820dff0c46cSDimitry Andric continue;
1821b5893f02SDimitry Andric SmallVector<MCPhysReg, 4> Defs;
1822d88c1a5aSDimitry Andric for (const MachineOperand &MO : FI.operands()) {
1823dff0c46cSDimitry Andric if (!MO.isReg())
1824dff0c46cSDimitry Andric continue;
1825dff0c46cSDimitry Andric unsigned Reg = MO.getReg();
1826dff0c46cSDimitry Andric if (!Reg)
1827dff0c46cSDimitry Andric continue;
1828dff0c46cSDimitry Andric if (MO.isDef()) {
1829dff0c46cSDimitry Andric Defs.push_back(Reg);
1830dff0c46cSDimitry Andric } else if (!RedefsByFalse.count(Reg)) {
1831dff0c46cSDimitry Andric // These are defined before ctrl flow reach the 'false' instructions.
1832dff0c46cSDimitry Andric // They cannot be modified by the 'true' instructions.
1833f785676fSDimitry Andric for (MCSubRegIterator SubRegs(Reg, TRI, /*IncludeSelf=*/true);
1834f785676fSDimitry Andric SubRegs.isValid(); ++SubRegs)
18357ae0e2c9SDimitry Andric ExtUses.insert(*SubRegs);
1836dff0c46cSDimitry Andric }
1837dff0c46cSDimitry Andric }
1838dff0c46cSDimitry Andric
1839b5893f02SDimitry Andric for (MCPhysReg Reg : Defs) {
1840dff0c46cSDimitry Andric if (!ExtUses.count(Reg)) {
1841f785676fSDimitry Andric for (MCSubRegIterator SubRegs(Reg, TRI, /*IncludeSelf=*/true);
1842f785676fSDimitry Andric SubRegs.isValid(); ++SubRegs)
18437ae0e2c9SDimitry Andric RedefsByFalse.insert(*SubRegs);
1844dff0c46cSDimitry Andric }
1845dff0c46cSDimitry Andric }
1846dff0c46cSDimitry Andric }
1847dff0c46cSDimitry Andric }
1848dff0c46cSDimitry Andric
1849dff0c46cSDimitry Andric // Predicate the 'true' block.
1850d88c1a5aSDimitry Andric PredicateBlock(*BBI1, MBB1.end(), *Cond1, &RedefsByFalse);
1851dff0c46cSDimitry Andric
18523ca95b02SDimitry Andric // After predicating BBI1, if there is a predicated terminator in BBI1 and
18533ca95b02SDimitry Andric // a non-predicated in BBI2, then we don't want to predicate the one from
18543ca95b02SDimitry Andric // BBI2. The reason is that if we merged these blocks, we would end up with
18553ca95b02SDimitry Andric // two predicated terminators in the same block.
18566ccc06f6SDimitry Andric // Also, if the branches in MBB1 and MBB2 were non-analyzable, then don't
18576ccc06f6SDimitry Andric // predicate them either. They were checked to be identical, and so the
18586ccc06f6SDimitry Andric // same branch would happen regardless of which path was taken.
1859d88c1a5aSDimitry Andric if (!MBB2.empty() && (DI2 == MBB2.end())) {
1860d88c1a5aSDimitry Andric MachineBasicBlock::iterator BBI1T = MBB1.getFirstTerminator();
1861d88c1a5aSDimitry Andric MachineBasicBlock::iterator BBI2T = MBB2.getFirstTerminator();
18626ccc06f6SDimitry Andric bool BB1Predicated = BBI1T != MBB1.end() && TII->isPredicated(*BBI1T);
18636ccc06f6SDimitry Andric bool BB2NonPredicated = BBI2T != MBB2.end() && !TII->isPredicated(*BBI2T);
18646ccc06f6SDimitry Andric if (BB2NonPredicated && (BB1Predicated || !BBI2->IsBrAnalyzable))
18653ca95b02SDimitry Andric --DI2;
18663ca95b02SDimitry Andric }
18673ca95b02SDimitry Andric
1868dff0c46cSDimitry Andric // Predicate the 'false' block.
1869f785676fSDimitry Andric PredicateBlock(*BBI2, DI2, *Cond2);
1870f22ef01cSRoman Divacky
1871f22ef01cSRoman Divacky // Merge the true block into the entry of the diamond.
1872d88c1a5aSDimitry Andric MergeBlocks(BBI, *BBI1, MergeAddEdges);
1873d88c1a5aSDimitry Andric MergeBlocks(BBI, *BBI2, MergeAddEdges);
1874d88c1a5aSDimitry Andric return true;
1875d88c1a5aSDimitry Andric }
1876d88c1a5aSDimitry Andric
1877d88c1a5aSDimitry Andric /// If convert an almost-diamond sub-CFG where the true
1878d88c1a5aSDimitry Andric /// and false blocks share a common tail.
IfConvertForkedDiamond(BBInfo & BBI,IfcvtKind Kind,unsigned NumDups1,unsigned NumDups2,bool TClobbersPred,bool FClobbersPred)1879d88c1a5aSDimitry Andric bool IfConverter::IfConvertForkedDiamond(
1880d88c1a5aSDimitry Andric BBInfo &BBI, IfcvtKind Kind,
1881d88c1a5aSDimitry Andric unsigned NumDups1, unsigned NumDups2,
1882d88c1a5aSDimitry Andric bool TClobbersPred, bool FClobbersPred) {
1883d88c1a5aSDimitry Andric BBInfo &TrueBBI = BBAnalysis[BBI.TrueBB->getNumber()];
1884d88c1a5aSDimitry Andric BBInfo &FalseBBI = BBAnalysis[BBI.FalseBB->getNumber()];
1885d88c1a5aSDimitry Andric
1886d88c1a5aSDimitry Andric // Save the debug location for later.
1887d88c1a5aSDimitry Andric DebugLoc dl;
1888d88c1a5aSDimitry Andric MachineBasicBlock::iterator TIE = TrueBBI.BB->getFirstTerminator();
1889d88c1a5aSDimitry Andric if (TIE != TrueBBI.BB->end())
1890d88c1a5aSDimitry Andric dl = TIE->getDebugLoc();
1891d88c1a5aSDimitry Andric // Removing branches from both blocks is safe, because we have already
1892d88c1a5aSDimitry Andric // determined that both blocks have the same branch instructions. The branch
1893d88c1a5aSDimitry Andric // will be added back at the end, unpredicated.
1894d88c1a5aSDimitry Andric if (!IfConvertDiamondCommon(
1895d88c1a5aSDimitry Andric BBI, TrueBBI, FalseBBI,
1896d88c1a5aSDimitry Andric NumDups1, NumDups2,
1897d88c1a5aSDimitry Andric TClobbersPred, FClobbersPred,
1898d88c1a5aSDimitry Andric /* RemoveBranch */ true, /* MergeAddEdges */ true))
1899d88c1a5aSDimitry Andric return false;
1900d88c1a5aSDimitry Andric
1901d88c1a5aSDimitry Andric // Add back the branch.
1902d88c1a5aSDimitry Andric // Debug location saved above when removing the branch from BBI2
1903d88c1a5aSDimitry Andric TII->insertBranch(*BBI.BB, TrueBBI.TrueBB, TrueBBI.FalseBB,
1904d88c1a5aSDimitry Andric TrueBBI.BrCond, dl);
1905d88c1a5aSDimitry Andric
1906d88c1a5aSDimitry Andric // Update block info.
1907d88c1a5aSDimitry Andric BBI.IsDone = TrueBBI.IsDone = FalseBBI.IsDone = true;
1908d88c1a5aSDimitry Andric InvalidatePreds(*BBI.BB);
1909d88c1a5aSDimitry Andric
1910d88c1a5aSDimitry Andric // FIXME: Must maintain LiveIns.
1911d88c1a5aSDimitry Andric return true;
1912d88c1a5aSDimitry Andric }
1913d88c1a5aSDimitry Andric
1914d88c1a5aSDimitry Andric /// If convert a diamond sub-CFG.
IfConvertDiamond(BBInfo & BBI,IfcvtKind Kind,unsigned NumDups1,unsigned NumDups2,bool TClobbersPred,bool FClobbersPred)1915d88c1a5aSDimitry Andric bool IfConverter::IfConvertDiamond(BBInfo &BBI, IfcvtKind Kind,
1916d88c1a5aSDimitry Andric unsigned NumDups1, unsigned NumDups2,
1917d88c1a5aSDimitry Andric bool TClobbersPred, bool FClobbersPred) {
1918d88c1a5aSDimitry Andric BBInfo &TrueBBI = BBAnalysis[BBI.TrueBB->getNumber()];
1919d88c1a5aSDimitry Andric BBInfo &FalseBBI = BBAnalysis[BBI.FalseBB->getNumber()];
1920d88c1a5aSDimitry Andric MachineBasicBlock *TailBB = TrueBBI.TrueBB;
1921d88c1a5aSDimitry Andric
1922d88c1a5aSDimitry Andric // True block must fall through or end with an unanalyzable terminator.
1923d88c1a5aSDimitry Andric if (!TailBB) {
1924d88c1a5aSDimitry Andric if (blockAlwaysFallThrough(TrueBBI))
1925d88c1a5aSDimitry Andric TailBB = FalseBBI.TrueBB;
1926d88c1a5aSDimitry Andric assert((TailBB || !TrueBBI.IsBrAnalyzable) && "Unexpected!");
1927d88c1a5aSDimitry Andric }
1928d88c1a5aSDimitry Andric
1929d88c1a5aSDimitry Andric if (!IfConvertDiamondCommon(
1930d88c1a5aSDimitry Andric BBI, TrueBBI, FalseBBI,
1931d88c1a5aSDimitry Andric NumDups1, NumDups2,
1932d88c1a5aSDimitry Andric TClobbersPred, FClobbersPred,
1933d88c1a5aSDimitry Andric /* RemoveBranch */ TrueBBI.IsBrAnalyzable,
1934d88c1a5aSDimitry Andric /* MergeAddEdges */ TailBB == nullptr))
1935d88c1a5aSDimitry Andric return false;
1936f22ef01cSRoman Divacky
1937f22ef01cSRoman Divacky // If the if-converted block falls through or unconditionally branches into
1938f22ef01cSRoman Divacky // the tail block, and the tail block does not have other predecessors, then
1939f22ef01cSRoman Divacky // fold the tail block in as well. Otherwise, unless it falls through to the
1940f22ef01cSRoman Divacky // tail, add a unconditional branch to it.
1941f22ef01cSRoman Divacky if (TailBB) {
19422cab237bSDimitry Andric // We need to remove the edges to the true and false blocks manually since
19432cab237bSDimitry Andric // we didn't let IfConvertDiamondCommon update the CFG.
19442cab237bSDimitry Andric BBI.BB->removeSuccessor(TrueBBI.BB);
19452cab237bSDimitry Andric BBI.BB->removeSuccessor(FalseBBI.BB, true);
19462cab237bSDimitry Andric
1947dff0c46cSDimitry Andric BBInfo &TailBBI = BBAnalysis[TailBB->getNumber()];
1948284c1978SDimitry Andric bool CanMergeTail = !TailBBI.HasFallThrough &&
1949284c1978SDimitry Andric !TailBBI.BB->hasAddressTaken();
19503ca95b02SDimitry Andric // The if-converted block can still have a predicated terminator
19513ca95b02SDimitry Andric // (e.g. a predicated return). If that is the case, we cannot merge
19523ca95b02SDimitry Andric // it with the tail block.
19533ca95b02SDimitry Andric MachineBasicBlock::const_iterator TI = BBI.BB->getFirstTerminator();
19543ca95b02SDimitry Andric if (TI != BBI.BB->end() && TII->isPredicated(*TI))
19553ca95b02SDimitry Andric CanMergeTail = false;
1956ffd1746dSEd Schouten // There may still be a fall-through edge from BBI1 or BBI2 to TailBB;
1957ffd1746dSEd Schouten // check if there are any other predecessors besides those.
1958ffd1746dSEd Schouten unsigned NumPreds = TailBB->pred_size();
1959ffd1746dSEd Schouten if (NumPreds > 1)
1960ffd1746dSEd Schouten CanMergeTail = false;
1961ffd1746dSEd Schouten else if (NumPreds == 1 && CanMergeTail) {
1962ffd1746dSEd Schouten MachineBasicBlock::pred_iterator PI = TailBB->pred_begin();
1963d88c1a5aSDimitry Andric if (*PI != TrueBBI.BB && *PI != FalseBBI.BB)
1964ffd1746dSEd Schouten CanMergeTail = false;
1965ffd1746dSEd Schouten }
1966ffd1746dSEd Schouten if (CanMergeTail) {
1967f22ef01cSRoman Divacky MergeBlocks(BBI, TailBBI);
1968f22ef01cSRoman Divacky TailBBI.IsDone = true;
1969f22ef01cSRoman Divacky } else {
19707d523365SDimitry Andric BBI.BB->addSuccessor(TailBB, BranchProbability::getOne());
1971d88c1a5aSDimitry Andric InsertUncondBranch(*BBI.BB, *TailBB, TII);
1972f22ef01cSRoman Divacky BBI.HasFallThrough = false;
1973f22ef01cSRoman Divacky }
1974f22ef01cSRoman Divacky }
1975f22ef01cSRoman Divacky
1976f22ef01cSRoman Divacky // Update block info.
1977f22ef01cSRoman Divacky BBI.IsDone = TrueBBI.IsDone = FalseBBI.IsDone = true;
1978d88c1a5aSDimitry Andric InvalidatePreds(*BBI.BB);
1979f22ef01cSRoman Divacky
1980f22ef01cSRoman Divacky // FIXME: Must maintain LiveIns.
1981f22ef01cSRoman Divacky return true;
1982f22ef01cSRoman Divacky }
1983f22ef01cSRoman Divacky
MaySpeculate(const MachineInstr & MI,SmallSet<MCPhysReg,4> & LaterRedefs)19843ca95b02SDimitry Andric static bool MaySpeculate(const MachineInstr &MI,
1985b5893f02SDimitry Andric SmallSet<MCPhysReg, 4> &LaterRedefs) {
1986dff0c46cSDimitry Andric bool SawStore = true;
19873ca95b02SDimitry Andric if (!MI.isSafeToMove(nullptr, SawStore))
1988dff0c46cSDimitry Andric return false;
1989dff0c46cSDimitry Andric
1990d88c1a5aSDimitry Andric for (const MachineOperand &MO : MI.operands()) {
1991dff0c46cSDimitry Andric if (!MO.isReg())
1992dff0c46cSDimitry Andric continue;
1993dff0c46cSDimitry Andric unsigned Reg = MO.getReg();
1994dff0c46cSDimitry Andric if (!Reg)
1995dff0c46cSDimitry Andric continue;
1996dff0c46cSDimitry Andric if (MO.isDef() && !LaterRedefs.count(Reg))
1997dff0c46cSDimitry Andric return false;
1998dff0c46cSDimitry Andric }
1999dff0c46cSDimitry Andric
2000dff0c46cSDimitry Andric return true;
2001dff0c46cSDimitry Andric }
2002dff0c46cSDimitry Andric
2003d88c1a5aSDimitry Andric /// Predicate instructions from the start of the block to the specified end with
2004d88c1a5aSDimitry Andric /// the specified condition.
PredicateBlock(BBInfo & BBI,MachineBasicBlock::iterator E,SmallVectorImpl<MachineOperand> & Cond,SmallSet<MCPhysReg,4> * LaterRedefs)2005f22ef01cSRoman Divacky void IfConverter::PredicateBlock(BBInfo &BBI,
2006f22ef01cSRoman Divacky MachineBasicBlock::iterator E,
2007ffd1746dSEd Schouten SmallVectorImpl<MachineOperand> &Cond,
2008b5893f02SDimitry Andric SmallSet<MCPhysReg, 4> *LaterRedefs) {
2009dff0c46cSDimitry Andric bool AnyUnpred = false;
201091bc56edSDimitry Andric bool MaySpec = LaterRedefs != nullptr;
2011d88c1a5aSDimitry Andric for (MachineInstr &I : make_range(BBI.BB->begin(), E)) {
20124ba319b5SDimitry Andric if (I.isDebugInstr() || TII->isPredicated(I))
2013f22ef01cSRoman Divacky continue;
2014dff0c46cSDimitry Andric // It may be possible not to predicate an instruction if it's the 'true'
2015dff0c46cSDimitry Andric // side of a diamond and the 'false' side may re-define the instruction's
2016dff0c46cSDimitry Andric // defs.
2017ff0cc061SDimitry Andric if (MaySpec && MaySpeculate(I, *LaterRedefs)) {
2018dff0c46cSDimitry Andric AnyUnpred = true;
2019dff0c46cSDimitry Andric continue;
2020dff0c46cSDimitry Andric }
2021dff0c46cSDimitry Andric // If any instruction is predicated, then every instruction after it must
2022dff0c46cSDimitry Andric // be predicated.
2023dff0c46cSDimitry Andric MaySpec = false;
2024f22ef01cSRoman Divacky if (!TII->PredicateInstruction(I, Cond)) {
2025f22ef01cSRoman Divacky #ifndef NDEBUG
20263ca95b02SDimitry Andric dbgs() << "Unable to predicate " << I << "!\n";
2027f22ef01cSRoman Divacky #endif
202891bc56edSDimitry Andric llvm_unreachable(nullptr);
2029f22ef01cSRoman Divacky }
2030ffd1746dSEd Schouten
2031ffd1746dSEd Schouten // If the predicated instruction now redefines a register as the result of
2032ffd1746dSEd Schouten // if-conversion, add an implicit kill.
203391bc56edSDimitry Andric UpdatePredRedefs(I, Redefs);
2034f22ef01cSRoman Divacky }
2035f22ef01cSRoman Divacky
2036ff0cc061SDimitry Andric BBI.Predicate.append(Cond.begin(), Cond.end());
2037f22ef01cSRoman Divacky
2038f22ef01cSRoman Divacky BBI.IsAnalyzed = false;
2039f22ef01cSRoman Divacky BBI.NonPredSize = 0;
2040f22ef01cSRoman Divacky
2041ffd1746dSEd Schouten ++NumIfConvBBs;
2042dff0c46cSDimitry Andric if (AnyUnpred)
2043dff0c46cSDimitry Andric ++NumUnpred;
2044f22ef01cSRoman Divacky }
2045f22ef01cSRoman Divacky
2046d88c1a5aSDimitry Andric /// Copy and predicate instructions from source BB to the destination block.
2047d88c1a5aSDimitry Andric /// Skip end of block branches if IgnoreBr is true.
CopyAndPredicateBlock(BBInfo & ToBBI,BBInfo & FromBBI,SmallVectorImpl<MachineOperand> & Cond,bool IgnoreBr)2048f22ef01cSRoman Divacky void IfConverter::CopyAndPredicateBlock(BBInfo &ToBBI, BBInfo &FromBBI,
2049f22ef01cSRoman Divacky SmallVectorImpl<MachineOperand> &Cond,
2050f22ef01cSRoman Divacky bool IgnoreBr) {
2051f22ef01cSRoman Divacky MachineFunction &MF = *ToBBI.BB->getParent();
2052f22ef01cSRoman Divacky
2053d88c1a5aSDimitry Andric MachineBasicBlock &FromMBB = *FromBBI.BB;
2054d88c1a5aSDimitry Andric for (MachineInstr &I : FromMBB) {
2055f22ef01cSRoman Divacky // Do not copy the end of the block branches.
20563ca95b02SDimitry Andric if (IgnoreBr && I.isBranch())
2057f22ef01cSRoman Divacky break;
2058f22ef01cSRoman Divacky
20593ca95b02SDimitry Andric MachineInstr *MI = MF.CloneMachineInstr(&I);
2060f22ef01cSRoman Divacky ToBBI.BB->insert(ToBBI.BB->end(), MI);
2061f22ef01cSRoman Divacky ToBBI.NonPredSize++;
20623ca95b02SDimitry Andric unsigned ExtraPredCost = TII->getPredicationCost(I);
20633ca95b02SDimitry Andric unsigned NumCycles = SchedModel.computeInstrLatency(&I, false);
20642754fe60SDimitry Andric if (NumCycles > 1)
20652754fe60SDimitry Andric ToBBI.ExtraCost += NumCycles-1;
20662754fe60SDimitry Andric ToBBI.ExtraCost2 += ExtraPredCost;
2067f22ef01cSRoman Divacky
20684ba319b5SDimitry Andric if (!TII->isPredicated(I) && !MI->isDebugInstr()) {
20693ca95b02SDimitry Andric if (!TII->PredicateInstruction(*MI, Cond)) {
2070f22ef01cSRoman Divacky #ifndef NDEBUG
20713ca95b02SDimitry Andric dbgs() << "Unable to predicate " << I << "!\n";
2072f22ef01cSRoman Divacky #endif
207391bc56edSDimitry Andric llvm_unreachable(nullptr);
2074f22ef01cSRoman Divacky }
2075f22ef01cSRoman Divacky }
2076f22ef01cSRoman Divacky
2077ffd1746dSEd Schouten // If the predicated instruction now redefines a register as the result of
2078ffd1746dSEd Schouten // if-conversion, add an implicit kill.
20793ca95b02SDimitry Andric UpdatePredRedefs(*MI, Redefs);
2080ffd1746dSEd Schouten }
2081ffd1746dSEd Schouten
2082ffd1746dSEd Schouten if (!IgnoreBr) {
2083d88c1a5aSDimitry Andric std::vector<MachineBasicBlock *> Succs(FromMBB.succ_begin(),
2084d88c1a5aSDimitry Andric FromMBB.succ_end());
2085d88c1a5aSDimitry Andric MachineBasicBlock *NBB = getNextBlock(FromMBB);
208691bc56edSDimitry Andric MachineBasicBlock *FallThrough = FromBBI.HasFallThrough ? NBB : nullptr;
2087f22ef01cSRoman Divacky
2088d88c1a5aSDimitry Andric for (MachineBasicBlock *Succ : Succs) {
2089f22ef01cSRoman Divacky // Fallthrough edge can't be transferred.
2090f22ef01cSRoman Divacky if (Succ == FallThrough)
2091f22ef01cSRoman Divacky continue;
2092f22ef01cSRoman Divacky ToBBI.BB->addSuccessor(Succ);
2093f22ef01cSRoman Divacky }
2094ffd1746dSEd Schouten }
2095f22ef01cSRoman Divacky
2096ff0cc061SDimitry Andric ToBBI.Predicate.append(FromBBI.Predicate.begin(), FromBBI.Predicate.end());
2097ff0cc061SDimitry Andric ToBBI.Predicate.append(Cond.begin(), Cond.end());
2098f22ef01cSRoman Divacky
2099f22ef01cSRoman Divacky ToBBI.ClobbersPred |= FromBBI.ClobbersPred;
2100f22ef01cSRoman Divacky ToBBI.IsAnalyzed = false;
2101f22ef01cSRoman Divacky
2102ffd1746dSEd Schouten ++NumDupBBs;
2103f22ef01cSRoman Divacky }
2104f22ef01cSRoman Divacky
2105d88c1a5aSDimitry Andric /// Move all instructions from FromBB to the end of ToBB. This will leave
2106d88c1a5aSDimitry Andric /// FromBB as an empty block, so remove all of its successor edges except for
2107d88c1a5aSDimitry Andric /// the fall-through edge. If AddEdges is true, i.e., when FromBBI's branch is
21082cab237bSDimitry Andric /// being moved, add those successor edges to ToBBI and remove the old edge
21092cab237bSDimitry Andric /// from ToBBI to FromBBI.
MergeBlocks(BBInfo & ToBBI,BBInfo & FromBBI,bool AddEdges)2110ffd1746dSEd Schouten void IfConverter::MergeBlocks(BBInfo &ToBBI, BBInfo &FromBBI, bool AddEdges) {
2111d88c1a5aSDimitry Andric MachineBasicBlock &FromMBB = *FromBBI.BB;
2112d88c1a5aSDimitry Andric assert(!FromMBB.hasAddressTaken() &&
2113284c1978SDimitry Andric "Removing a BB whose address is taken!");
2114284c1978SDimitry Andric
2115d88c1a5aSDimitry Andric // In case FromMBB contains terminators (e.g. return instruction),
21163ca95b02SDimitry Andric // first move the non-terminator instructions, then the terminators.
2117d88c1a5aSDimitry Andric MachineBasicBlock::iterator FromTI = FromMBB.getFirstTerminator();
21183ca95b02SDimitry Andric MachineBasicBlock::iterator ToTI = ToBBI.BB->getFirstTerminator();
2119d88c1a5aSDimitry Andric ToBBI.BB->splice(ToTI, &FromMBB, FromMBB.begin(), FromTI);
21203ca95b02SDimitry Andric
21213ca95b02SDimitry Andric // If FromBB has non-predicated terminator we should copy it at the end.
2122d88c1a5aSDimitry Andric if (FromTI != FromMBB.end() && !TII->isPredicated(*FromTI))
21233ca95b02SDimitry Andric ToTI = ToBBI.BB->end();
2124d88c1a5aSDimitry Andric ToBBI.BB->splice(ToTI, &FromMBB, FromTI, FromMBB.end());
2125f22ef01cSRoman Divacky
21267d523365SDimitry Andric // Force normalizing the successors' probabilities of ToBBI.BB to convert all
21277d523365SDimitry Andric // unknown probabilities into known ones.
21287d523365SDimitry Andric // FIXME: This usage is too tricky and in the future we would like to
21297d523365SDimitry Andric // eliminate all unknown probabilities in MBB.
21307a7e6055SDimitry Andric if (ToBBI.IsBrAnalyzable)
21317d523365SDimitry Andric ToBBI.BB->normalizeSuccProbs();
21327d523365SDimitry Andric
2133d88c1a5aSDimitry Andric SmallVector<MachineBasicBlock *, 4> FromSuccs(FromMBB.succ_begin(),
2134d88c1a5aSDimitry Andric FromMBB.succ_end());
2135d88c1a5aSDimitry Andric MachineBasicBlock *NBB = getNextBlock(FromMBB);
213691bc56edSDimitry Andric MachineBasicBlock *FallThrough = FromBBI.HasFallThrough ? NBB : nullptr;
2137d88c1a5aSDimitry Andric // The edge probability from ToBBI.BB to FromMBB, which is only needed when
2138d88c1a5aSDimitry Andric // AddEdges is true and FromMBB is a successor of ToBBI.BB.
21397d523365SDimitry Andric auto To2FromProb = BranchProbability::getZero();
2140d88c1a5aSDimitry Andric if (AddEdges && ToBBI.BB->isSuccessor(&FromMBB)) {
21412cab237bSDimitry Andric // Remove the old edge but remember the edge probability so we can calculate
21422cab237bSDimitry Andric // the correct weights on the new edges being added further down.
2143d88c1a5aSDimitry Andric To2FromProb = MBPI->getEdgeProbability(ToBBI.BB, &FromMBB);
21442cab237bSDimitry Andric ToBBI.BB->removeSuccessor(&FromMBB);
21457d523365SDimitry Andric }
2146f22ef01cSRoman Divacky
2147d88c1a5aSDimitry Andric for (MachineBasicBlock *Succ : FromSuccs) {
2148f22ef01cSRoman Divacky // Fallthrough edge can't be transferred.
2149f22ef01cSRoman Divacky if (Succ == FallThrough)
2150f22ef01cSRoman Divacky continue;
21517d523365SDimitry Andric
21527d523365SDimitry Andric auto NewProb = BranchProbability::getZero();
21537d523365SDimitry Andric if (AddEdges) {
21547d523365SDimitry Andric // Calculate the edge probability for the edge from ToBBI.BB to Succ,
2155d88c1a5aSDimitry Andric // which is a portion of the edge probability from FromMBB to Succ. The
2156d88c1a5aSDimitry Andric // portion ratio is the edge probability from ToBBI.BB to FromMBB (if
2157b5893f02SDimitry Andric // FromBBI is a successor of ToBBI.BB. See comment below for exception).
2158d88c1a5aSDimitry Andric NewProb = MBPI->getEdgeProbability(&FromMBB, Succ);
21597d523365SDimitry Andric
2160d88c1a5aSDimitry Andric // To2FromProb is 0 when FromMBB is not a successor of ToBBI.BB. This
2161d88c1a5aSDimitry Andric // only happens when if-converting a diamond CFG and FromMBB is the
2162d88c1a5aSDimitry Andric // tail BB. In this case FromMBB post-dominates ToBBI.BB and hence we
2163d88c1a5aSDimitry Andric // could just use the probabilities on FromMBB's out-edges when adding
21647d523365SDimitry Andric // new successors.
21657d523365SDimitry Andric if (!To2FromProb.isZero())
21667d523365SDimitry Andric NewProb *= To2FromProb;
21677d523365SDimitry Andric }
21687d523365SDimitry Andric
2169d88c1a5aSDimitry Andric FromMBB.removeSuccessor(Succ);
21707d523365SDimitry Andric
21717d523365SDimitry Andric if (AddEdges) {
21727d523365SDimitry Andric // If the edge from ToBBI.BB to Succ already exists, update the
21737d523365SDimitry Andric // probability of this edge by adding NewProb to it. An example is shown
2174d88c1a5aSDimitry Andric // below, in which A is ToBBI.BB and B is FromMBB. In this case we
21757d523365SDimitry Andric // don't have to set C as A's successor as it already is. We only need to
21767d523365SDimitry Andric // update the edge probability on A->C. Note that B will not be
21777d523365SDimitry Andric // immediately removed from A's successors. It is possible that B->D is
21787d523365SDimitry Andric // not removed either if D is a fallthrough of B. Later the edge A->D
21797d523365SDimitry Andric // (generated here) and B->D will be combined into one edge. To maintain
21807d523365SDimitry Andric // correct edge probability of this combined edge, we need to set the edge
21817d523365SDimitry Andric // probability of A->B to zero, which is already done above. The edge
21827d523365SDimitry Andric // probability on A->D is calculated by scaling the original probability
21837d523365SDimitry Andric // on A->B by the probability of B->D.
21847d523365SDimitry Andric //
21857d523365SDimitry Andric // Before ifcvt: After ifcvt (assume B->D is kept):
21867d523365SDimitry Andric //
21877d523365SDimitry Andric // A A
21887d523365SDimitry Andric // /| /|\
21897d523365SDimitry Andric // / B / B|
21907d523365SDimitry Andric // | /| | ||
21917d523365SDimitry Andric // |/ | | |/
21927d523365SDimitry Andric // C D C D
21937d523365SDimitry Andric //
21947d523365SDimitry Andric if (ToBBI.BB->isSuccessor(Succ))
21957d523365SDimitry Andric ToBBI.BB->setSuccProbability(
2196d88c1a5aSDimitry Andric find(ToBBI.BB->successors(), Succ),
21977d523365SDimitry Andric MBPI->getEdgeProbability(ToBBI.BB, Succ) + NewProb);
21987d523365SDimitry Andric else
21997d523365SDimitry Andric ToBBI.BB->addSuccessor(Succ, NewProb);
22007d523365SDimitry Andric }
2201f22ef01cSRoman Divacky }
2202f22ef01cSRoman Divacky
22032cab237bSDimitry Andric // Move the now empty FromMBB out of the way to the end of the function so
22042cab237bSDimitry Andric // it doesn't interfere with fallthrough checks done by canFallThroughTo().
22052cab237bSDimitry Andric MachineBasicBlock *Last = &*FromMBB.getParent()->rbegin();
22062cab237bSDimitry Andric if (Last != &FromMBB)
22072cab237bSDimitry Andric FromMBB.moveAfter(Last);
2208f22ef01cSRoman Divacky
22097d523365SDimitry Andric // Normalize the probabilities of ToBBI.BB's successors with all adjustment
22107d523365SDimitry Andric // we've done above.
22117a7e6055SDimitry Andric if (ToBBI.IsBrAnalyzable && FromBBI.IsBrAnalyzable)
22127d523365SDimitry Andric ToBBI.BB->normalizeSuccProbs();
22137d523365SDimitry Andric
2214ff0cc061SDimitry Andric ToBBI.Predicate.append(FromBBI.Predicate.begin(), FromBBI.Predicate.end());
2215f22ef01cSRoman Divacky FromBBI.Predicate.clear();
2216f22ef01cSRoman Divacky
2217f22ef01cSRoman Divacky ToBBI.NonPredSize += FromBBI.NonPredSize;
22182754fe60SDimitry Andric ToBBI.ExtraCost += FromBBI.ExtraCost;
22192754fe60SDimitry Andric ToBBI.ExtraCost2 += FromBBI.ExtraCost2;
2220f22ef01cSRoman Divacky FromBBI.NonPredSize = 0;
22212754fe60SDimitry Andric FromBBI.ExtraCost = 0;
22222754fe60SDimitry Andric FromBBI.ExtraCost2 = 0;
2223f22ef01cSRoman Divacky
2224f22ef01cSRoman Divacky ToBBI.ClobbersPred |= FromBBI.ClobbersPred;
2225f22ef01cSRoman Divacky ToBBI.HasFallThrough = FromBBI.HasFallThrough;
2226f22ef01cSRoman Divacky ToBBI.IsAnalyzed = false;
2227f22ef01cSRoman Divacky FromBBI.IsAnalyzed = false;
2228f22ef01cSRoman Divacky }
222997bc6c73SDimitry Andric
223097bc6c73SDimitry Andric FunctionPass *
createIfConverter(std::function<bool (const MachineFunction &)> Ftor)2231d88c1a5aSDimitry Andric llvm::createIfConverter(std::function<bool(const MachineFunction &)> Ftor) {
22323ca95b02SDimitry Andric return new IfConverter(std::move(Ftor));
223397bc6c73SDimitry Andric }
2234