//===-- PPCBranchSelector.cpp - Emit long conditional branches ------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file contains a pass that scans a machine function to determine which
// conditional branches need more than 16 bits of displacement to reach their
// target basic block.  It does this in two phases: one that calculates the
// positions of the basic blocks, and one that converts branch pseudo ops into
// machine branch opcodes.  This pass should be run last, just before the
// assembly printer.
//
//===----------------------------------------------------------------------===//
17f22ef01cSRoman Divacky
18139f7f9bSDimitry Andric #include "MCTargetDesc/PPCPredicates.h"
19db17bf38SDimitry Andric #include "PPC.h"
20f22ef01cSRoman Divacky #include "PPCInstrBuilder.h"
21f22ef01cSRoman Divacky #include "PPCInstrInfo.h"
22d88c1a5aSDimitry Andric #include "PPCSubtarget.h"
23f22ef01cSRoman Divacky #include "llvm/ADT/Statistic.h"
24139f7f9bSDimitry Andric #include "llvm/CodeGen/MachineFunctionPass.h"
25d88c1a5aSDimitry Andric #include "llvm/CodeGen/MachineRegisterInfo.h"
262cab237bSDimitry Andric #include "llvm/CodeGen/TargetSubtargetInfo.h"
27f22ef01cSRoman Divacky #include "llvm/Support/MathExtras.h"
28139f7f9bSDimitry Andric #include "llvm/Target/TargetMachine.h"
29f22ef01cSRoman Divacky using namespace llvm;
30f22ef01cSRoman Divacky
3191bc56edSDimitry Andric #define DEBUG_TYPE "ppc-branch-select"
3291bc56edSDimitry Andric
33f22ef01cSRoman Divacky STATISTIC(NumExpanded, "Number of branches expanded to long format");
34f22ef01cSRoman Divacky
35139f7f9bSDimitry Andric namespace llvm {
36139f7f9bSDimitry Andric void initializePPCBSelPass(PassRegistry&);
37139f7f9bSDimitry Andric }
38139f7f9bSDimitry Andric
39f22ef01cSRoman Divacky namespace {
40f22ef01cSRoman Divacky struct PPCBSel : public MachineFunctionPass {
41f22ef01cSRoman Divacky static char ID;
PPCBSel__anon4b43ba6c0111::PPCBSel42139f7f9bSDimitry Andric PPCBSel() : MachineFunctionPass(ID) {
43139f7f9bSDimitry Andric initializePPCBSelPass(*PassRegistry::getPassRegistry());
44139f7f9bSDimitry Andric }
45f22ef01cSRoman Divacky
46d88c1a5aSDimitry Andric // The sizes of the basic blocks in the function (the first
47d88c1a5aSDimitry Andric // element of the pair); the second element of the pair is the amount of the
48d88c1a5aSDimitry Andric // size that is due to potential padding.
49d88c1a5aSDimitry Andric std::vector<std::pair<unsigned, unsigned>> BlockSizes;
50f22ef01cSRoman Divacky
5191bc56edSDimitry Andric bool runOnMachineFunction(MachineFunction &Fn) override;
52f22ef01cSRoman Divacky
getRequiredProperties__anon4b43ba6c0111::PPCBSel533ca95b02SDimitry Andric MachineFunctionProperties getRequiredProperties() const override {
543ca95b02SDimitry Andric return MachineFunctionProperties().set(
55d88c1a5aSDimitry Andric MachineFunctionProperties::Property::NoVRegs);
563ca95b02SDimitry Andric }
573ca95b02SDimitry Andric
getPassName__anon4b43ba6c0111::PPCBSel58d88c1a5aSDimitry Andric StringRef getPassName() const override { return "PowerPC Branch Selector"; }
59f22ef01cSRoman Divacky };
60f22ef01cSRoman Divacky char PPCBSel::ID = 0;
61f22ef01cSRoman Divacky }
62f22ef01cSRoman Divacky
63139f7f9bSDimitry Andric INITIALIZE_PASS(PPCBSel, "ppc-branch-select", "PowerPC Branch Selector",
64139f7f9bSDimitry Andric false, false)
65139f7f9bSDimitry Andric
66f22ef01cSRoman Divacky /// createPPCBranchSelectionPass - returns an instance of the Branch Selection
67f22ef01cSRoman Divacky /// Pass
68f22ef01cSRoman Divacky ///
createPPCBranchSelectionPass()69f22ef01cSRoman Divacky FunctionPass *llvm::createPPCBranchSelectionPass() {
70f22ef01cSRoman Divacky return new PPCBSel();
71f22ef01cSRoman Divacky }
72f22ef01cSRoman Divacky
runOnMachineFunction(MachineFunction & Fn)73f22ef01cSRoman Divacky bool PPCBSel::runOnMachineFunction(MachineFunction &Fn) {
74e580952dSDimitry Andric const PPCInstrInfo *TII =
7539d628a0SDimitry Andric static_cast<const PPCInstrInfo *>(Fn.getSubtarget().getInstrInfo());
76f22ef01cSRoman Divacky // Give the blocks of the function a dense, in-order, numbering.
77f22ef01cSRoman Divacky Fn.RenumberBlocks();
78f22ef01cSRoman Divacky BlockSizes.resize(Fn.getNumBlockIDs());
79f22ef01cSRoman Divacky
8039d628a0SDimitry Andric auto GetAlignmentAdjustment =
817a7e6055SDimitry Andric [](MachineBasicBlock &MBB, unsigned Offset) -> unsigned {
8239d628a0SDimitry Andric unsigned Align = MBB.getAlignment();
8339d628a0SDimitry Andric if (!Align)
8439d628a0SDimitry Andric return 0;
8539d628a0SDimitry Andric
8639d628a0SDimitry Andric unsigned AlignAmt = 1 << Align;
8739d628a0SDimitry Andric unsigned ParentAlign = MBB.getParent()->getAlignment();
8839d628a0SDimitry Andric
8939d628a0SDimitry Andric if (Align <= ParentAlign)
9039d628a0SDimitry Andric return OffsetToAlignment(Offset, AlignAmt);
9139d628a0SDimitry Andric
9239d628a0SDimitry Andric // The alignment of this MBB is larger than the function's alignment, so we
9339d628a0SDimitry Andric // can't tell whether or not it will insert nops. Assume that it will.
9439d628a0SDimitry Andric return AlignAmt + OffsetToAlignment(Offset, AlignAmt);
9539d628a0SDimitry Andric };
9639d628a0SDimitry Andric
97d88c1a5aSDimitry Andric // We need to be careful about the offset of the first block in the function
98d88c1a5aSDimitry Andric // because it might not have the function's alignment. This happens because,
99d88c1a5aSDimitry Andric // under the ELFv2 ABI, for functions which require a TOC pointer, we add a
100d88c1a5aSDimitry Andric // two-instruction sequence to the start of the function.
101d88c1a5aSDimitry Andric // Note: This needs to be synchronized with the check in
102d88c1a5aSDimitry Andric // PPCLinuxAsmPrinter::EmitFunctionBodyStart.
103d88c1a5aSDimitry Andric unsigned InitialOffset = 0;
104d88c1a5aSDimitry Andric if (Fn.getSubtarget<PPCSubtarget>().isELFv2ABI() &&
105d88c1a5aSDimitry Andric !Fn.getRegInfo().use_empty(PPC::X2))
106d88c1a5aSDimitry Andric InitialOffset = 8;
107d88c1a5aSDimitry Andric
108f22ef01cSRoman Divacky // Measure each MBB and compute a size for the entire function.
109d88c1a5aSDimitry Andric unsigned FuncSize = InitialOffset;
110f22ef01cSRoman Divacky for (MachineFunction::iterator MFI = Fn.begin(), E = Fn.end(); MFI != E;
111f22ef01cSRoman Divacky ++MFI) {
1127d523365SDimitry Andric MachineBasicBlock *MBB = &*MFI;
113f22ef01cSRoman Divacky
11439d628a0SDimitry Andric // The end of the previous block may have extra nops if this block has an
11539d628a0SDimitry Andric // alignment requirement.
11639d628a0SDimitry Andric if (MBB->getNumber() > 0) {
11739d628a0SDimitry Andric unsigned AlignExtra = GetAlignmentAdjustment(*MBB, FuncSize);
118d88c1a5aSDimitry Andric
119d88c1a5aSDimitry Andric auto &BS = BlockSizes[MBB->getNumber()-1];
120d88c1a5aSDimitry Andric BS.first += AlignExtra;
121d88c1a5aSDimitry Andric BS.second = AlignExtra;
122d88c1a5aSDimitry Andric
12339d628a0SDimitry Andric FuncSize += AlignExtra;
12439d628a0SDimitry Andric }
12539d628a0SDimitry Andric
126f22ef01cSRoman Divacky unsigned BlockSize = 0;
1273ca95b02SDimitry Andric for (MachineInstr &MI : *MBB)
128d88c1a5aSDimitry Andric BlockSize += TII->getInstSizeInBytes(MI);
129f22ef01cSRoman Divacky
130d88c1a5aSDimitry Andric BlockSizes[MBB->getNumber()].first = BlockSize;
131f22ef01cSRoman Divacky FuncSize += BlockSize;
132f22ef01cSRoman Divacky }
133f22ef01cSRoman Divacky
134f22ef01cSRoman Divacky // If the entire function is smaller than the displacement of a branch field,
135f22ef01cSRoman Divacky // we know we don't need to shrink any branches in this function. This is a
136f22ef01cSRoman Divacky // common case.
137f22ef01cSRoman Divacky if (FuncSize < (1 << 15)) {
138f22ef01cSRoman Divacky BlockSizes.clear();
139f22ef01cSRoman Divacky return false;
140f22ef01cSRoman Divacky }
141f22ef01cSRoman Divacky
142f22ef01cSRoman Divacky // For each conditional branch, if the offset to its destination is larger
143f22ef01cSRoman Divacky // than the offset field allows, transform it into a long branch sequence
144f22ef01cSRoman Divacky // like this:
145f22ef01cSRoman Divacky // short branch:
146f22ef01cSRoman Divacky // bCC MBB
147f22ef01cSRoman Divacky // long branch:
148f22ef01cSRoman Divacky // b!CC $PC+8
149f22ef01cSRoman Divacky // b MBB
150f22ef01cSRoman Divacky //
151f22ef01cSRoman Divacky bool MadeChange = true;
152f22ef01cSRoman Divacky bool EverMadeChange = false;
153f22ef01cSRoman Divacky while (MadeChange) {
154f22ef01cSRoman Divacky // Iteratively expand branches until we reach a fixed point.
155f22ef01cSRoman Divacky MadeChange = false;
156f22ef01cSRoman Divacky
157f22ef01cSRoman Divacky for (MachineFunction::iterator MFI = Fn.begin(), E = Fn.end(); MFI != E;
158f22ef01cSRoman Divacky ++MFI) {
159f22ef01cSRoman Divacky MachineBasicBlock &MBB = *MFI;
160f22ef01cSRoman Divacky unsigned MBBStartOffset = 0;
161f22ef01cSRoman Divacky for (MachineBasicBlock::iterator I = MBB.begin(), E = MBB.end();
162f22ef01cSRoman Divacky I != E; ++I) {
16391bc56edSDimitry Andric MachineBasicBlock *Dest = nullptr;
164284c1978SDimitry Andric if (I->getOpcode() == PPC::BCC && !I->getOperand(2).isImm())
165284c1978SDimitry Andric Dest = I->getOperand(2).getMBB();
16691bc56edSDimitry Andric else if ((I->getOpcode() == PPC::BC || I->getOpcode() == PPC::BCn) &&
16791bc56edSDimitry Andric !I->getOperand(1).isImm())
16891bc56edSDimitry Andric Dest = I->getOperand(1).getMBB();
169284c1978SDimitry Andric else if ((I->getOpcode() == PPC::BDNZ8 || I->getOpcode() == PPC::BDNZ ||
170284c1978SDimitry Andric I->getOpcode() == PPC::BDZ8 || I->getOpcode() == PPC::BDZ) &&
171284c1978SDimitry Andric !I->getOperand(0).isImm())
172284c1978SDimitry Andric Dest = I->getOperand(0).getMBB();
173284c1978SDimitry Andric
174284c1978SDimitry Andric if (!Dest) {
175d88c1a5aSDimitry Andric MBBStartOffset += TII->getInstSizeInBytes(*I);
176f22ef01cSRoman Divacky continue;
177f22ef01cSRoman Divacky }
178f22ef01cSRoman Divacky
179f22ef01cSRoman Divacky // Determine the offset from the current branch to the destination
180f22ef01cSRoman Divacky // block.
181f22ef01cSRoman Divacky int BranchSize;
182f22ef01cSRoman Divacky if (Dest->getNumber() <= MBB.getNumber()) {
183f22ef01cSRoman Divacky // If this is a backwards branch, the delta is the offset from the
184f22ef01cSRoman Divacky // start of this block to this branch, plus the sizes of all blocks
185f22ef01cSRoman Divacky // from this block to the dest.
186f22ef01cSRoman Divacky BranchSize = MBBStartOffset;
187f22ef01cSRoman Divacky
188f22ef01cSRoman Divacky for (unsigned i = Dest->getNumber(), e = MBB.getNumber(); i != e; ++i)
189d88c1a5aSDimitry Andric BranchSize += BlockSizes[i].first;
190f22ef01cSRoman Divacky } else {
191f22ef01cSRoman Divacky // Otherwise, add the size of the blocks between this block and the
192f22ef01cSRoman Divacky // dest to the number of bytes left in this block.
193f22ef01cSRoman Divacky BranchSize = -MBBStartOffset;
194f22ef01cSRoman Divacky
195f22ef01cSRoman Divacky for (unsigned i = MBB.getNumber(), e = Dest->getNumber(); i != e; ++i)
196d88c1a5aSDimitry Andric BranchSize += BlockSizes[i].first;
197f22ef01cSRoman Divacky }
198f22ef01cSRoman Divacky
199f22ef01cSRoman Divacky // If this branch is in range, ignore it.
200f22ef01cSRoman Divacky if (isInt<16>(BranchSize)) {
201f22ef01cSRoman Divacky MBBStartOffset += 4;
202f22ef01cSRoman Divacky continue;
203f22ef01cSRoman Divacky }
204f22ef01cSRoman Divacky
205f22ef01cSRoman Divacky // Otherwise, we have to expand it to a long branch.
206d88c1a5aSDimitry Andric MachineInstr &OldBranch = *I;
207d88c1a5aSDimitry Andric DebugLoc dl = OldBranch.getDebugLoc();
2087ae0e2c9SDimitry Andric
2097ae0e2c9SDimitry Andric if (I->getOpcode() == PPC::BCC) {
210f22ef01cSRoman Divacky // The BCC operands are:
211f22ef01cSRoman Divacky // 0. PPC branch predicate
212f22ef01cSRoman Divacky // 1. CR register
213f22ef01cSRoman Divacky // 2. Target MBB
214f22ef01cSRoman Divacky PPC::Predicate Pred = (PPC::Predicate)I->getOperand(0).getImm();
215f22ef01cSRoman Divacky unsigned CRReg = I->getOperand(1).getReg();
216f22ef01cSRoman Divacky
217f22ef01cSRoman Divacky // Jump over the uncond branch inst (i.e. $PC+8) on opposite condition.
218f22ef01cSRoman Divacky BuildMI(MBB, I, dl, TII->get(PPC::BCC))
219f22ef01cSRoman Divacky .addImm(PPC::InvertPredicate(Pred)).addReg(CRReg).addImm(2);
22091bc56edSDimitry Andric } else if (I->getOpcode() == PPC::BC) {
22191bc56edSDimitry Andric unsigned CRBit = I->getOperand(0).getReg();
22291bc56edSDimitry Andric BuildMI(MBB, I, dl, TII->get(PPC::BCn)).addReg(CRBit).addImm(2);
22391bc56edSDimitry Andric } else if (I->getOpcode() == PPC::BCn) {
22491bc56edSDimitry Andric unsigned CRBit = I->getOperand(0).getReg();
22591bc56edSDimitry Andric BuildMI(MBB, I, dl, TII->get(PPC::BC)).addReg(CRBit).addImm(2);
2267ae0e2c9SDimitry Andric } else if (I->getOpcode() == PPC::BDNZ) {
2277ae0e2c9SDimitry Andric BuildMI(MBB, I, dl, TII->get(PPC::BDZ)).addImm(2);
2287ae0e2c9SDimitry Andric } else if (I->getOpcode() == PPC::BDNZ8) {
2297ae0e2c9SDimitry Andric BuildMI(MBB, I, dl, TII->get(PPC::BDZ8)).addImm(2);
2307ae0e2c9SDimitry Andric } else if (I->getOpcode() == PPC::BDZ) {
2317ae0e2c9SDimitry Andric BuildMI(MBB, I, dl, TII->get(PPC::BDNZ)).addImm(2);
2327ae0e2c9SDimitry Andric } else if (I->getOpcode() == PPC::BDZ8) {
2337ae0e2c9SDimitry Andric BuildMI(MBB, I, dl, TII->get(PPC::BDNZ8)).addImm(2);
2347ae0e2c9SDimitry Andric } else {
2357ae0e2c9SDimitry Andric llvm_unreachable("Unhandled branch type!");
2367ae0e2c9SDimitry Andric }
237f22ef01cSRoman Divacky
238f22ef01cSRoman Divacky // Uncond branch to the real destination.
239f22ef01cSRoman Divacky I = BuildMI(MBB, I, dl, TII->get(PPC::B)).addMBB(Dest);
240f22ef01cSRoman Divacky
241f22ef01cSRoman Divacky // Remove the old branch from the function.
242d88c1a5aSDimitry Andric OldBranch.eraseFromParent();
243f22ef01cSRoman Divacky
244f22ef01cSRoman Divacky // Remember that this instruction is 8-bytes, increase the size of the
245f22ef01cSRoman Divacky // block by 4, remember to iterate.
246d88c1a5aSDimitry Andric BlockSizes[MBB.getNumber()].first += 4;
247f22ef01cSRoman Divacky MBBStartOffset += 8;
248f22ef01cSRoman Divacky ++NumExpanded;
249f22ef01cSRoman Divacky MadeChange = true;
250f22ef01cSRoman Divacky }
251f22ef01cSRoman Divacky }
252d88c1a5aSDimitry Andric
253d88c1a5aSDimitry Andric if (MadeChange) {
254d88c1a5aSDimitry Andric // If we're going to iterate again, make sure we've updated our
255d88c1a5aSDimitry Andric // padding-based contributions to the block sizes.
256d88c1a5aSDimitry Andric unsigned Offset = InitialOffset;
257d88c1a5aSDimitry Andric for (MachineFunction::iterator MFI = Fn.begin(), E = Fn.end(); MFI != E;
258d88c1a5aSDimitry Andric ++MFI) {
259d88c1a5aSDimitry Andric MachineBasicBlock *MBB = &*MFI;
260d88c1a5aSDimitry Andric
261d88c1a5aSDimitry Andric if (MBB->getNumber() > 0) {
262d88c1a5aSDimitry Andric auto &BS = BlockSizes[MBB->getNumber()-1];
263d88c1a5aSDimitry Andric BS.first -= BS.second;
264d88c1a5aSDimitry Andric Offset -= BS.second;
265d88c1a5aSDimitry Andric
266d88c1a5aSDimitry Andric unsigned AlignExtra = GetAlignmentAdjustment(*MBB, Offset);
267d88c1a5aSDimitry Andric
268d88c1a5aSDimitry Andric BS.first += AlignExtra;
269d88c1a5aSDimitry Andric BS.second = AlignExtra;
270d88c1a5aSDimitry Andric
271d88c1a5aSDimitry Andric Offset += AlignExtra;
272d88c1a5aSDimitry Andric }
273d88c1a5aSDimitry Andric
274d88c1a5aSDimitry Andric Offset += BlockSizes[MBB->getNumber()].first;
275d88c1a5aSDimitry Andric }
276d88c1a5aSDimitry Andric }
277d88c1a5aSDimitry Andric
278f22ef01cSRoman Divacky EverMadeChange |= MadeChange;
279f22ef01cSRoman Divacky }
280f22ef01cSRoman Divacky
281f22ef01cSRoman Divacky BlockSizes.clear();
282f22ef01cSRoman Divacky return true;
283f22ef01cSRoman Divacky }
284