1 //===-- BranchRelaxation.cpp ----------------------------------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 
10 #include "llvm/CodeGen/Passes.h"
11 #include "llvm/ADT/SmallVector.h"
12 #include "llvm/ADT/Statistic.h"
13 #include "llvm/CodeGen/LivePhysRegs.h"
14 #include "llvm/CodeGen/MachineFunctionPass.h"
15 #include "llvm/CodeGen/RegisterScavenging.h"
16 #include "llvm/Target/TargetInstrInfo.h"
17 #include "llvm/Target/TargetSubtargetInfo.h"
18 #include "llvm/Support/Debug.h"
19 #include "llvm/Support/Format.h"
20 #include "llvm/Support/raw_ostream.h"
21 
22 using namespace llvm;
23 
24 #define DEBUG_TYPE "branch-relaxation"
25 
26 STATISTIC(NumSplit, "Number of basic blocks split");
27 STATISTIC(NumConditionalRelaxed, "Number of conditional branches relaxed");
28 STATISTIC(NumUnconditionalRelaxed, "Number of unconditional branches relaxed");
29 
30 #define BRANCH_RELAX_NAME "Branch relaxation pass"
31 
32 namespace {
33 class BranchRelaxation : public MachineFunctionPass {
34   /// BasicBlockInfo - Information about the offset and size of a single
35   /// basic block.
36   struct BasicBlockInfo {
37     /// Offset - Distance from the beginning of the function to the beginning
38     /// of this basic block.
39     ///
40     /// The offset is always aligned as required by the basic block.
41     unsigned Offset;
42 
43     /// Size - Size of the basic block in bytes.  If the block contains
44     /// inline assembly, this is a worst case estimate.
45     ///
46     /// The size does not include any alignment padding whether from the
47     /// beginning of the block, or from an aligned jump table at the end.
48     unsigned Size;
49 
50     BasicBlockInfo() : Offset(0), Size(0) {}
51 
52     /// Compute the offset immediately following this block. \p MBB is the next
53     /// block.
54     unsigned postOffset(const MachineBasicBlock &MBB) const {
55       unsigned PO = Offset + Size;
56       unsigned Align = MBB.getAlignment();
57       if (Align == 0)
58         return PO;
59 
60       unsigned AlignAmt = 1 << Align;
61       unsigned ParentAlign = MBB.getParent()->getAlignment();
62       if (Align <= ParentAlign)
63         return PO + OffsetToAlignment(PO, AlignAmt);
64 
65       // The alignment of this MBB is larger than the function's alignment, so we
66       // can't tell whether or not it will insert nops. Assume that it will.
67       return PO + AlignAmt + OffsetToAlignment(PO, AlignAmt);
68     }
69   };
70 
71   SmallVector<BasicBlockInfo, 16> BlockInfo;
72   std::unique_ptr<RegScavenger> RS;
73   LivePhysRegs LiveRegs;
74 
75   MachineFunction *MF;
76   const TargetRegisterInfo *TRI;
77   const TargetInstrInfo *TII;
78 
79   bool relaxBranchInstructions();
80   void scanFunction();
81 
82   MachineBasicBlock *createNewBlockAfter(MachineBasicBlock &BB);
83 
84   MachineBasicBlock *splitBlockBeforeInstr(MachineInstr &MI,
85                                            MachineBasicBlock *DestBB);
86   void adjustBlockOffsets(MachineBasicBlock &MBB);
87   bool isBlockInRange(const MachineInstr &MI, const MachineBasicBlock &BB) const;
88 
89   bool fixupConditionalBranch(MachineInstr &MI);
90   bool fixupUnconditionalBranch(MachineInstr &MI);
91   uint64_t computeBlockSize(const MachineBasicBlock &MBB) const;
92   unsigned getInstrOffset(const MachineInstr &MI) const;
93   void dumpBBs();
94   void verify();
95 
96 public:
97   static char ID;
98   BranchRelaxation() : MachineFunctionPass(ID) { }
99 
100   bool runOnMachineFunction(MachineFunction &MF) override;
101 
102   StringRef getPassName() const override {
103     return BRANCH_RELAX_NAME;
104   }
105 };
106 
107 }
108 
109 char BranchRelaxation::ID = 0;
110 char &llvm::BranchRelaxationPassID = BranchRelaxation::ID;
111 
112 INITIALIZE_PASS(BranchRelaxation, DEBUG_TYPE, BRANCH_RELAX_NAME, false, false)
113 
114 /// verify - check BBOffsets, BBSizes, alignment of islands
115 void BranchRelaxation::verify() {
116 #ifndef NDEBUG
117   unsigned PrevNum = MF->begin()->getNumber();
118   for (MachineBasicBlock &MBB : *MF) {
119     unsigned Align = MBB.getAlignment();
120     unsigned Num = MBB.getNumber();
121     assert(BlockInfo[Num].Offset % (1u << Align) == 0);
122     assert(!Num || BlockInfo[PrevNum].postOffset(MBB) <= BlockInfo[Num].Offset);
123     assert(BlockInfo[Num].Size == computeBlockSize(MBB));
124     PrevNum = Num;
125   }
126 #endif
127 }
128 
129 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
130 /// print block size and offset information - debugging
131 LLVM_DUMP_METHOD void BranchRelaxation::dumpBBs() {
132   for (auto &MBB : *MF) {
133     const BasicBlockInfo &BBI = BlockInfo[MBB.getNumber()];
134     dbgs() << format("BB#%u\toffset=%08x\t", MBB.getNumber(), BBI.Offset)
135            << format("size=%#x\n", BBI.Size);
136   }
137 }
138 #endif
139 
140 /// scanFunction - Do the initial scan of the function, building up
141 /// information about each block.
142 void BranchRelaxation::scanFunction() {
143   BlockInfo.clear();
144   BlockInfo.resize(MF->getNumBlockIDs());
145 
146   // First thing, compute the size of all basic blocks, and see if the function
147   // has any inline assembly in it. If so, we have to be conservative about
148   // alignment assumptions, as we don't know for sure the size of any
149   // instructions in the inline assembly.
150   for (MachineBasicBlock &MBB : *MF)
151     BlockInfo[MBB.getNumber()].Size = computeBlockSize(MBB);
152 
153   // Compute block offsets and known bits.
154   adjustBlockOffsets(*MF->begin());
155 }
156 
157 /// computeBlockSize - Compute the size for MBB.
158 uint64_t BranchRelaxation::computeBlockSize(const MachineBasicBlock &MBB) const {
159   uint64_t Size = 0;
160   for (const MachineInstr &MI : MBB)
161     Size += TII->getInstSizeInBytes(MI);
162   return Size;
163 }
164 
165 /// getInstrOffset - Return the current offset of the specified machine
166 /// instruction from the start of the function.  This offset changes as stuff is
167 /// moved around inside the function.
168 unsigned BranchRelaxation::getInstrOffset(const MachineInstr &MI) const {
169   const MachineBasicBlock *MBB = MI.getParent();
170 
171   // The offset is composed of two things: the sum of the sizes of all MBB's
172   // before this instruction's block, and the offset from the start of the block
173   // it is in.
174   unsigned Offset = BlockInfo[MBB->getNumber()].Offset;
175 
176   // Sum instructions before MI in MBB.
177   for (MachineBasicBlock::const_iterator I = MBB->begin(); &*I != &MI; ++I) {
178     assert(I != MBB->end() && "Didn't find MI in its own basic block?");
179     Offset += TII->getInstSizeInBytes(*I);
180   }
181 
182   return Offset;
183 }
184 
185 void BranchRelaxation::adjustBlockOffsets(MachineBasicBlock &Start) {
186   unsigned PrevNum = Start.getNumber();
187   for (auto &MBB : make_range(MachineFunction::iterator(Start), MF->end())) {
188     unsigned Num = MBB.getNumber();
189     if (!Num) // block zero is never changed from offset zero.
190       continue;
191     // Get the offset and known bits at the end of the layout predecessor.
192     // Include the alignment of the current block.
193     BlockInfo[Num].Offset = BlockInfo[PrevNum].postOffset(MBB);
194 
195     PrevNum = Num;
196   }
197 }
198 
199   /// Insert a new empty basic block and insert it after \BB
200 MachineBasicBlock *BranchRelaxation::createNewBlockAfter(MachineBasicBlock &BB) {
201   // Create a new MBB for the code after the OrigBB.
202   MachineBasicBlock *NewBB =
203       MF->CreateMachineBasicBlock(BB.getBasicBlock());
204   MF->insert(++BB.getIterator(), NewBB);
205 
206   // Insert an entry into BlockInfo to align it properly with the block numbers.
207   BlockInfo.insert(BlockInfo.begin() + NewBB->getNumber(), BasicBlockInfo());
208 
209   return NewBB;
210 }
211 
212 /// Split the basic block containing MI into two blocks, which are joined by
213 /// an unconditional branch.  Update data structures and renumber blocks to
214 /// account for this change and returns the newly created block.
215 MachineBasicBlock *BranchRelaxation::splitBlockBeforeInstr(MachineInstr &MI,
216                                                            MachineBasicBlock *DestBB) {
217   MachineBasicBlock *OrigBB = MI.getParent();
218 
219   // Create a new MBB for the code after the OrigBB.
220   MachineBasicBlock *NewBB =
221       MF->CreateMachineBasicBlock(OrigBB->getBasicBlock());
222   MF->insert(++OrigBB->getIterator(), NewBB);
223 
224   // Splice the instructions starting with MI over to NewBB.
225   NewBB->splice(NewBB->end(), OrigBB, MI.getIterator(), OrigBB->end());
226 
227   // Add an unconditional branch from OrigBB to NewBB.
228   // Note the new unconditional branch is not being recorded.
229   // There doesn't seem to be meaningful DebugInfo available; this doesn't
230   // correspond to anything in the source.
231   TII->insertUnconditionalBranch(*OrigBB, NewBB, DebugLoc());
232 
233   // Insert an entry into BlockInfo to align it properly with the block numbers.
234   BlockInfo.insert(BlockInfo.begin() + NewBB->getNumber(), BasicBlockInfo());
235 
236 
237   NewBB->transferSuccessors(OrigBB);
238   OrigBB->addSuccessor(NewBB);
239   OrigBB->addSuccessor(DestBB);
240 
241   // Cleanup potential unconditional branch to successor block.
242   // Note that updateTerminator may change the size of the blocks.
243   NewBB->updateTerminator();
244   OrigBB->updateTerminator();
245 
246   // Figure out how large the OrigBB is.  As the first half of the original
247   // block, it cannot contain a tablejump.  The size includes
248   // the new jump we added.  (It should be possible to do this without
249   // recounting everything, but it's very confusing, and this is rarely
250   // executed.)
251   BlockInfo[OrigBB->getNumber()].Size = computeBlockSize(*OrigBB);
252 
253   // Figure out how large the NewMBB is. As the second half of the original
254   // block, it may contain a tablejump.
255   BlockInfo[NewBB->getNumber()].Size = computeBlockSize(*NewBB);
256 
257   // All BBOffsets following these blocks must be modified.
258   adjustBlockOffsets(*OrigBB);
259 
260   // Need to fix live-in lists if we track liveness.
261   if (TRI->trackLivenessAfterRegAlloc(*MF))
262     computeLiveIns(LiveRegs, *TRI, *NewBB);
263 
264   ++NumSplit;
265 
266   return NewBB;
267 }
268 
269 /// isBlockInRange - Returns true if the distance between specific MI and
270 /// specific BB can fit in MI's displacement field.
271 bool BranchRelaxation::isBlockInRange(
272   const MachineInstr &MI, const MachineBasicBlock &DestBB) const {
273   int64_t BrOffset = getInstrOffset(MI);
274   int64_t DestOffset = BlockInfo[DestBB.getNumber()].Offset;
275 
276   if (TII->isBranchOffsetInRange(MI.getOpcode(), DestOffset - BrOffset))
277     return true;
278 
279   DEBUG(
280     dbgs() << "Out of range branch to destination BB#" << DestBB.getNumber()
281            << " from BB#" << MI.getParent()->getNumber()
282            << " to " << DestOffset
283            << " offset " << DestOffset - BrOffset
284            << '\t' << MI
285   );
286 
287   return false;
288 }
289 
290 /// fixupConditionalBranch - Fix up a conditional branch whose destination is
291 /// too far away to fit in its displacement field. It is converted to an inverse
292 /// conditional branch + an unconditional branch to the destination.
293 bool BranchRelaxation::fixupConditionalBranch(MachineInstr &MI) {
294   DebugLoc DL = MI.getDebugLoc();
295   MachineBasicBlock *MBB = MI.getParent();
296   MachineBasicBlock *TBB = nullptr, *FBB = nullptr;
297   SmallVector<MachineOperand, 4> Cond;
298 
299   bool Fail = TII->analyzeBranch(*MBB, TBB, FBB, Cond);
300   assert(!Fail && "branches to be relaxed must be analyzable");
301   (void)Fail;
302 
303   // Add an unconditional branch to the destination and invert the branch
304   // condition to jump over it:
305   // tbz L1
306   // =>
307   // tbnz L2
308   // b   L1
309   // L2:
310 
311   if (FBB && isBlockInRange(MI, *FBB)) {
312     // Last MI in the BB is an unconditional branch. We can simply invert the
313     // condition and swap destinations:
314     // beq L1
315     // b   L2
316     // =>
317     // bne L2
318     // b   L1
319     DEBUG(dbgs() << "  Invert condition and swap "
320                     "its destination with " << MBB->back());
321 
322     TII->reverseBranchCondition(Cond);
323     int OldSize = 0, NewSize = 0;
324     TII->removeBranch(*MBB, &OldSize);
325     TII->insertBranch(*MBB, FBB, TBB, Cond, DL, &NewSize);
326 
327     BlockInfo[MBB->getNumber()].Size += (NewSize - OldSize);
328     return true;
329   } else if (FBB) {
330     // We need to split the basic block here to obtain two long-range
331     // unconditional branches.
332     auto &NewBB = *MF->CreateMachineBasicBlock(MBB->getBasicBlock());
333     MF->insert(++MBB->getIterator(), &NewBB);
334 
335     // Insert an entry into BlockInfo to align it properly with the block
336     // numbers.
337     BlockInfo.insert(BlockInfo.begin() + NewBB.getNumber(), BasicBlockInfo());
338 
339     unsigned &NewBBSize = BlockInfo[NewBB.getNumber()].Size;
340     int NewBrSize;
341     TII->insertUnconditionalBranch(NewBB, FBB, DL, &NewBrSize);
342     NewBBSize += NewBrSize;
343 
344     // Update the successor lists according to the transformation to follow.
345     // Do it here since if there's no split, no update is needed.
346     MBB->replaceSuccessor(FBB, &NewBB);
347     NewBB.addSuccessor(FBB);
348   }
349 
350   // We now have an appropriate fall-through block in place (either naturally or
351   // just created), so we can invert the condition.
352   MachineBasicBlock &NextBB = *std::next(MachineFunction::iterator(MBB));
353 
354   DEBUG(dbgs() << "  Insert B to BB#" << TBB->getNumber()
355                << ", invert condition and change dest. to BB#"
356                << NextBB.getNumber() << '\n');
357 
358   unsigned &MBBSize = BlockInfo[MBB->getNumber()].Size;
359 
360   // Insert a new conditional branch and a new unconditional branch.
361   int RemovedSize = 0;
362   TII->reverseBranchCondition(Cond);
363   TII->removeBranch(*MBB, &RemovedSize);
364   MBBSize -= RemovedSize;
365 
366   int AddedSize = 0;
367   TII->insertBranch(*MBB, &NextBB, TBB, Cond, DL, &AddedSize);
368   MBBSize += AddedSize;
369 
370   // Finally, keep the block offsets up to date.
371   adjustBlockOffsets(*MBB);
372   return true;
373 }
374 
375 bool BranchRelaxation::fixupUnconditionalBranch(MachineInstr &MI) {
376   MachineBasicBlock *MBB = MI.getParent();
377 
378   unsigned OldBrSize = TII->getInstSizeInBytes(MI);
379   MachineBasicBlock *DestBB = TII->getBranchDestBlock(MI);
380 
381   int64_t DestOffset = BlockInfo[DestBB->getNumber()].Offset;
382   int64_t SrcOffset = getInstrOffset(MI);
383 
384   assert(!TII->isBranchOffsetInRange(MI.getOpcode(), DestOffset - SrcOffset));
385 
386   BlockInfo[MBB->getNumber()].Size -= OldBrSize;
387 
388   MachineBasicBlock *BranchBB = MBB;
389 
390   // If this was an expanded conditional branch, there is already a single
391   // unconditional branch in a block.
392   if (!MBB->empty()) {
393     BranchBB = createNewBlockAfter(*MBB);
394 
395     // Add live outs.
396     for (const MachineBasicBlock *Succ : MBB->successors()) {
397       for (const MachineBasicBlock::RegisterMaskPair &LiveIn : Succ->liveins())
398         BranchBB->addLiveIn(LiveIn);
399     }
400 
401     BranchBB->sortUniqueLiveIns();
402     BranchBB->addSuccessor(DestBB);
403     MBB->replaceSuccessor(DestBB, BranchBB);
404   }
405 
406   DebugLoc DL = MI.getDebugLoc();
407   MI.eraseFromParent();
408   BlockInfo[BranchBB->getNumber()].Size += TII->insertIndirectBranch(
409     *BranchBB, *DestBB, DL, DestOffset - SrcOffset, RS.get());
410 
411   adjustBlockOffsets(*MBB);
412   return true;
413 }
414 
415 bool BranchRelaxation::relaxBranchInstructions() {
416   bool Changed = false;
417 
418   // Relaxing branches involves creating new basic blocks, so re-eval
419   // end() for termination.
420   for (MachineFunction::iterator I = MF->begin(); I != MF->end(); ++I) {
421     MachineBasicBlock &MBB = *I;
422 
423     // Empty block?
424     MachineBasicBlock::iterator Last = MBB.getLastNonDebugInstr();
425     if (Last == MBB.end())
426       continue;
427 
428     // Expand the unconditional branch first if necessary. If there is a
429     // conditional branch, this will end up changing the branch destination of
430     // it to be over the newly inserted indirect branch block, which may avoid
431     // the need to try expanding the conditional branch first, saving an extra
432     // jump.
433     if (Last->isUnconditionalBranch()) {
434       // Unconditional branch destination might be unanalyzable, assume these
435       // are OK.
436       if (MachineBasicBlock *DestBB = TII->getBranchDestBlock(*Last)) {
437         if (!isBlockInRange(*Last, *DestBB)) {
438           fixupUnconditionalBranch(*Last);
439           ++NumUnconditionalRelaxed;
440           Changed = true;
441         }
442       }
443     }
444 
445     // Loop over the conditional branches.
446     MachineBasicBlock::iterator Next;
447     for (MachineBasicBlock::iterator J = MBB.getFirstTerminator();
448          J != MBB.end(); J = Next) {
449       Next = std::next(J);
450       MachineInstr &MI = *J;
451 
452       if (MI.isConditionalBranch()) {
453         MachineBasicBlock *DestBB = TII->getBranchDestBlock(MI);
454         if (!isBlockInRange(MI, *DestBB)) {
455           if (Next != MBB.end() && Next->isConditionalBranch()) {
456             // If there are multiple conditional branches, this isn't an
457             // analyzable block. Split later terminators into a new block so
458             // each one will be analyzable.
459 
460             splitBlockBeforeInstr(*Next, DestBB);
461           } else {
462             fixupConditionalBranch(MI);
463             ++NumConditionalRelaxed;
464           }
465 
466           Changed = true;
467 
468           // This may have modified all of the terminators, so start over.
469           Next = MBB.getFirstTerminator();
470         }
471       }
472     }
473   }
474 
475   return Changed;
476 }
477 
478 bool BranchRelaxation::runOnMachineFunction(MachineFunction &mf) {
479   MF = &mf;
480 
481   DEBUG(dbgs() << "***** BranchRelaxation *****\n");
482 
483   const TargetSubtargetInfo &ST = MF->getSubtarget();
484   TII = ST.getInstrInfo();
485 
486   TRI = ST.getRegisterInfo();
487   if (TRI->trackLivenessAfterRegAlloc(*MF))
488     RS.reset(new RegScavenger());
489 
490   // Renumber all of the machine basic blocks in the function, guaranteeing that
491   // the numbers agree with the position of the block in the function.
492   MF->RenumberBlocks();
493 
494   // Do the initial scan of the function, building up information about the
495   // sizes of each block.
496   scanFunction();
497 
498   DEBUG(dbgs() << "  Basic blocks before relaxation\n"; dumpBBs(););
499 
500   bool MadeChange = false;
501   while (relaxBranchInstructions())
502     MadeChange = true;
503 
504   // After a while, this might be made debug-only, but it is not expensive.
505   verify();
506 
507   DEBUG(dbgs() << "  Basic blocks after relaxation\n\n"; dumpBBs());
508 
509   BlockInfo.clear();
510 
511   return MadeChange;
512 }
513