1 //===-- BranchRelaxation.cpp ----------------------------------------------===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 10 #include "llvm/CodeGen/Passes.h" 11 #include "llvm/ADT/SmallVector.h" 12 #include "llvm/ADT/Statistic.h" 13 #include "llvm/CodeGen/LivePhysRegs.h" 14 #include "llvm/CodeGen/MachineFunctionPass.h" 15 #include "llvm/CodeGen/RegisterScavenging.h" 16 #include "llvm/Target/TargetInstrInfo.h" 17 #include "llvm/Target/TargetSubtargetInfo.h" 18 #include "llvm/Support/Debug.h" 19 #include "llvm/Support/Format.h" 20 #include "llvm/Support/raw_ostream.h" 21 22 using namespace llvm; 23 24 #define DEBUG_TYPE "branch-relaxation" 25 26 STATISTIC(NumSplit, "Number of basic blocks split"); 27 STATISTIC(NumConditionalRelaxed, "Number of conditional branches relaxed"); 28 STATISTIC(NumUnconditionalRelaxed, "Number of unconditional branches relaxed"); 29 30 #define BRANCH_RELAX_NAME "Branch relaxation pass" 31 32 namespace { 33 class BranchRelaxation : public MachineFunctionPass { 34 /// BasicBlockInfo - Information about the offset and size of a single 35 /// basic block. 36 struct BasicBlockInfo { 37 /// Offset - Distance from the beginning of the function to the beginning 38 /// of this basic block. 39 /// 40 /// The offset is always aligned as required by the basic block. 41 unsigned Offset; 42 43 /// Size - Size of the basic block in bytes. If the block contains 44 /// inline assembly, this is a worst case estimate. 45 /// 46 /// The size does not include any alignment padding whether from the 47 /// beginning of the block, or from an aligned jump table at the end. 48 unsigned Size; 49 50 BasicBlockInfo() : Offset(0), Size(0) {} 51 52 /// Compute the offset immediately following this block. \p MBB is the next 53 /// block. 54 unsigned postOffset(const MachineBasicBlock &MBB) const { 55 unsigned PO = Offset + Size; 56 unsigned Align = MBB.getAlignment(); 57 if (Align == 0) 58 return PO; 59 60 unsigned AlignAmt = 1 << Align; 61 unsigned ParentAlign = MBB.getParent()->getAlignment(); 62 if (Align <= ParentAlign) 63 return PO + OffsetToAlignment(PO, AlignAmt); 64 65 // The alignment of this MBB is larger than the function's alignment, so we 66 // can't tell whether or not it will insert nops. Assume that it will. 67 return PO + AlignAmt + OffsetToAlignment(PO, AlignAmt); 68 } 69 }; 70 71 SmallVector<BasicBlockInfo, 16> BlockInfo; 72 std::unique_ptr<RegScavenger> RS; 73 LivePhysRegs LiveRegs; 74 75 MachineFunction *MF; 76 const TargetRegisterInfo *TRI; 77 const TargetInstrInfo *TII; 78 79 bool relaxBranchInstructions(); 80 void scanFunction(); 81 82 MachineBasicBlock *createNewBlockAfter(MachineBasicBlock &BB); 83 84 MachineBasicBlock *splitBlockBeforeInstr(MachineInstr &MI, 85 MachineBasicBlock *DestBB); 86 void adjustBlockOffsets(MachineBasicBlock &MBB); 87 bool isBlockInRange(const MachineInstr &MI, const MachineBasicBlock &BB) const; 88 89 bool fixupConditionalBranch(MachineInstr &MI); 90 bool fixupUnconditionalBranch(MachineInstr &MI); 91 uint64_t computeBlockSize(const MachineBasicBlock &MBB) const; 92 unsigned getInstrOffset(const MachineInstr &MI) const; 93 void dumpBBs(); 94 void verify(); 95 96 public: 97 static char ID; 98 BranchRelaxation() : MachineFunctionPass(ID) { } 99 100 bool runOnMachineFunction(MachineFunction &MF) override; 101 102 StringRef getPassName() const override { 103 return BRANCH_RELAX_NAME; 104 } 105 }; 106 107 } 108 109 char BranchRelaxation::ID = 0; 110 char &llvm::BranchRelaxationPassID = BranchRelaxation::ID; 111 112 INITIALIZE_PASS(BranchRelaxation, DEBUG_TYPE, BRANCH_RELAX_NAME, false, false) 113 114 /// verify - check BBOffsets, BBSizes, alignment of islands 115 void BranchRelaxation::verify() { 116 #ifndef NDEBUG 117 unsigned PrevNum = MF->begin()->getNumber(); 118 for (MachineBasicBlock &MBB : *MF) { 119 unsigned Align = MBB.getAlignment(); 120 unsigned Num = MBB.getNumber(); 121 assert(BlockInfo[Num].Offset % (1u << Align) == 0); 122 assert(!Num || BlockInfo[PrevNum].postOffset(MBB) <= BlockInfo[Num].Offset); 123 assert(BlockInfo[Num].Size == computeBlockSize(MBB)); 124 PrevNum = Num; 125 } 126 #endif 127 } 128 129 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP) 130 /// print block size and offset information - debugging 131 LLVM_DUMP_METHOD void BranchRelaxation::dumpBBs() { 132 for (auto &MBB : *MF) { 133 const BasicBlockInfo &BBI = BlockInfo[MBB.getNumber()]; 134 dbgs() << format("BB#%u\toffset=%08x\t", MBB.getNumber(), BBI.Offset) 135 << format("size=%#x\n", BBI.Size); 136 } 137 } 138 #endif 139 140 /// scanFunction - Do the initial scan of the function, building up 141 /// information about each block. 142 void BranchRelaxation::scanFunction() { 143 BlockInfo.clear(); 144 BlockInfo.resize(MF->getNumBlockIDs()); 145 146 // First thing, compute the size of all basic blocks, and see if the function 147 // has any inline assembly in it. If so, we have to be conservative about 148 // alignment assumptions, as we don't know for sure the size of any 149 // instructions in the inline assembly. 150 for (MachineBasicBlock &MBB : *MF) 151 BlockInfo[MBB.getNumber()].Size = computeBlockSize(MBB); 152 153 // Compute block offsets and known bits. 154 adjustBlockOffsets(*MF->begin()); 155 } 156 157 /// computeBlockSize - Compute the size for MBB. 158 uint64_t BranchRelaxation::computeBlockSize(const MachineBasicBlock &MBB) const { 159 uint64_t Size = 0; 160 for (const MachineInstr &MI : MBB) 161 Size += TII->getInstSizeInBytes(MI); 162 return Size; 163 } 164 165 /// getInstrOffset - Return the current offset of the specified machine 166 /// instruction from the start of the function. This offset changes as stuff is 167 /// moved around inside the function. 168 unsigned BranchRelaxation::getInstrOffset(const MachineInstr &MI) const { 169 const MachineBasicBlock *MBB = MI.getParent(); 170 171 // The offset is composed of two things: the sum of the sizes of all MBB's 172 // before this instruction's block, and the offset from the start of the block 173 // it is in. 174 unsigned Offset = BlockInfo[MBB->getNumber()].Offset; 175 176 // Sum instructions before MI in MBB. 177 for (MachineBasicBlock::const_iterator I = MBB->begin(); &*I != &MI; ++I) { 178 assert(I != MBB->end() && "Didn't find MI in its own basic block?"); 179 Offset += TII->getInstSizeInBytes(*I); 180 } 181 182 return Offset; 183 } 184 185 void BranchRelaxation::adjustBlockOffsets(MachineBasicBlock &Start) { 186 unsigned PrevNum = Start.getNumber(); 187 for (auto &MBB : make_range(MachineFunction::iterator(Start), MF->end())) { 188 unsigned Num = MBB.getNumber(); 189 if (!Num) // block zero is never changed from offset zero. 190 continue; 191 // Get the offset and known bits at the end of the layout predecessor. 192 // Include the alignment of the current block. 193 BlockInfo[Num].Offset = BlockInfo[PrevNum].postOffset(MBB); 194 195 PrevNum = Num; 196 } 197 } 198 199 /// Insert a new empty basic block and insert it after \BB 200 MachineBasicBlock *BranchRelaxation::createNewBlockAfter(MachineBasicBlock &BB) { 201 // Create a new MBB for the code after the OrigBB. 202 MachineBasicBlock *NewBB = 203 MF->CreateMachineBasicBlock(BB.getBasicBlock()); 204 MF->insert(++BB.getIterator(), NewBB); 205 206 // Insert an entry into BlockInfo to align it properly with the block numbers. 207 BlockInfo.insert(BlockInfo.begin() + NewBB->getNumber(), BasicBlockInfo()); 208 209 return NewBB; 210 } 211 212 /// Split the basic block containing MI into two blocks, which are joined by 213 /// an unconditional branch. Update data structures and renumber blocks to 214 /// account for this change and returns the newly created block. 215 MachineBasicBlock *BranchRelaxation::splitBlockBeforeInstr(MachineInstr &MI, 216 MachineBasicBlock *DestBB) { 217 MachineBasicBlock *OrigBB = MI.getParent(); 218 219 // Create a new MBB for the code after the OrigBB. 220 MachineBasicBlock *NewBB = 221 MF->CreateMachineBasicBlock(OrigBB->getBasicBlock()); 222 MF->insert(++OrigBB->getIterator(), NewBB); 223 224 // Splice the instructions starting with MI over to NewBB. 225 NewBB->splice(NewBB->end(), OrigBB, MI.getIterator(), OrigBB->end()); 226 227 // Add an unconditional branch from OrigBB to NewBB. 228 // Note the new unconditional branch is not being recorded. 229 // There doesn't seem to be meaningful DebugInfo available; this doesn't 230 // correspond to anything in the source. 231 TII->insertUnconditionalBranch(*OrigBB, NewBB, DebugLoc()); 232 233 // Insert an entry into BlockInfo to align it properly with the block numbers. 234 BlockInfo.insert(BlockInfo.begin() + NewBB->getNumber(), BasicBlockInfo()); 235 236 237 NewBB->transferSuccessors(OrigBB); 238 OrigBB->addSuccessor(NewBB); 239 OrigBB->addSuccessor(DestBB); 240 241 // Cleanup potential unconditional branch to successor block. 242 // Note that updateTerminator may change the size of the blocks. 243 NewBB->updateTerminator(); 244 OrigBB->updateTerminator(); 245 246 // Figure out how large the OrigBB is. As the first half of the original 247 // block, it cannot contain a tablejump. The size includes 248 // the new jump we added. (It should be possible to do this without 249 // recounting everything, but it's very confusing, and this is rarely 250 // executed.) 251 BlockInfo[OrigBB->getNumber()].Size = computeBlockSize(*OrigBB); 252 253 // Figure out how large the NewMBB is. As the second half of the original 254 // block, it may contain a tablejump. 255 BlockInfo[NewBB->getNumber()].Size = computeBlockSize(*NewBB); 256 257 // All BBOffsets following these blocks must be modified. 258 adjustBlockOffsets(*OrigBB); 259 260 // Need to fix live-in lists if we track liveness. 261 if (TRI->trackLivenessAfterRegAlloc(*MF)) 262 computeLiveIns(LiveRegs, *TRI, *NewBB); 263 264 ++NumSplit; 265 266 return NewBB; 267 } 268 269 /// isBlockInRange - Returns true if the distance between specific MI and 270 /// specific BB can fit in MI's displacement field. 271 bool BranchRelaxation::isBlockInRange( 272 const MachineInstr &MI, const MachineBasicBlock &DestBB) const { 273 int64_t BrOffset = getInstrOffset(MI); 274 int64_t DestOffset = BlockInfo[DestBB.getNumber()].Offset; 275 276 if (TII->isBranchOffsetInRange(MI.getOpcode(), DestOffset - BrOffset)) 277 return true; 278 279 DEBUG( 280 dbgs() << "Out of range branch to destination BB#" << DestBB.getNumber() 281 << " from BB#" << MI.getParent()->getNumber() 282 << " to " << DestOffset 283 << " offset " << DestOffset - BrOffset 284 << '\t' << MI 285 ); 286 287 return false; 288 } 289 290 /// fixupConditionalBranch - Fix up a conditional branch whose destination is 291 /// too far away to fit in its displacement field. It is converted to an inverse 292 /// conditional branch + an unconditional branch to the destination. 293 bool BranchRelaxation::fixupConditionalBranch(MachineInstr &MI) { 294 DebugLoc DL = MI.getDebugLoc(); 295 MachineBasicBlock *MBB = MI.getParent(); 296 MachineBasicBlock *TBB = nullptr, *FBB = nullptr; 297 SmallVector<MachineOperand, 4> Cond; 298 299 bool Fail = TII->analyzeBranch(*MBB, TBB, FBB, Cond); 300 assert(!Fail && "branches to be relaxed must be analyzable"); 301 (void)Fail; 302 303 // Add an unconditional branch to the destination and invert the branch 304 // condition to jump over it: 305 // tbz L1 306 // => 307 // tbnz L2 308 // b L1 309 // L2: 310 311 if (FBB && isBlockInRange(MI, *FBB)) { 312 // Last MI in the BB is an unconditional branch. We can simply invert the 313 // condition and swap destinations: 314 // beq L1 315 // b L2 316 // => 317 // bne L2 318 // b L1 319 DEBUG(dbgs() << " Invert condition and swap " 320 "its destination with " << MBB->back()); 321 322 TII->reverseBranchCondition(Cond); 323 int OldSize = 0, NewSize = 0; 324 TII->removeBranch(*MBB, &OldSize); 325 TII->insertBranch(*MBB, FBB, TBB, Cond, DL, &NewSize); 326 327 BlockInfo[MBB->getNumber()].Size += (NewSize - OldSize); 328 return true; 329 } else if (FBB) { 330 // We need to split the basic block here to obtain two long-range 331 // unconditional branches. 332 auto &NewBB = *MF->CreateMachineBasicBlock(MBB->getBasicBlock()); 333 MF->insert(++MBB->getIterator(), &NewBB); 334 335 // Insert an entry into BlockInfo to align it properly with the block 336 // numbers. 337 BlockInfo.insert(BlockInfo.begin() + NewBB.getNumber(), BasicBlockInfo()); 338 339 unsigned &NewBBSize = BlockInfo[NewBB.getNumber()].Size; 340 int NewBrSize; 341 TII->insertUnconditionalBranch(NewBB, FBB, DL, &NewBrSize); 342 NewBBSize += NewBrSize; 343 344 // Update the successor lists according to the transformation to follow. 345 // Do it here since if there's no split, no update is needed. 346 MBB->replaceSuccessor(FBB, &NewBB); 347 NewBB.addSuccessor(FBB); 348 } 349 350 // We now have an appropriate fall-through block in place (either naturally or 351 // just created), so we can invert the condition. 352 MachineBasicBlock &NextBB = *std::next(MachineFunction::iterator(MBB)); 353 354 DEBUG(dbgs() << " Insert B to BB#" << TBB->getNumber() 355 << ", invert condition and change dest. to BB#" 356 << NextBB.getNumber() << '\n'); 357 358 unsigned &MBBSize = BlockInfo[MBB->getNumber()].Size; 359 360 // Insert a new conditional branch and a new unconditional branch. 361 int RemovedSize = 0; 362 TII->reverseBranchCondition(Cond); 363 TII->removeBranch(*MBB, &RemovedSize); 364 MBBSize -= RemovedSize; 365 366 int AddedSize = 0; 367 TII->insertBranch(*MBB, &NextBB, TBB, Cond, DL, &AddedSize); 368 MBBSize += AddedSize; 369 370 // Finally, keep the block offsets up to date. 371 adjustBlockOffsets(*MBB); 372 return true; 373 } 374 375 bool BranchRelaxation::fixupUnconditionalBranch(MachineInstr &MI) { 376 MachineBasicBlock *MBB = MI.getParent(); 377 378 unsigned OldBrSize = TII->getInstSizeInBytes(MI); 379 MachineBasicBlock *DestBB = TII->getBranchDestBlock(MI); 380 381 int64_t DestOffset = BlockInfo[DestBB->getNumber()].Offset; 382 int64_t SrcOffset = getInstrOffset(MI); 383 384 assert(!TII->isBranchOffsetInRange(MI.getOpcode(), DestOffset - SrcOffset)); 385 386 BlockInfo[MBB->getNumber()].Size -= OldBrSize; 387 388 MachineBasicBlock *BranchBB = MBB; 389 390 // If this was an expanded conditional branch, there is already a single 391 // unconditional branch in a block. 392 if (!MBB->empty()) { 393 BranchBB = createNewBlockAfter(*MBB); 394 395 // Add live outs. 396 for (const MachineBasicBlock *Succ : MBB->successors()) { 397 for (const MachineBasicBlock::RegisterMaskPair &LiveIn : Succ->liveins()) 398 BranchBB->addLiveIn(LiveIn); 399 } 400 401 BranchBB->sortUniqueLiveIns(); 402 BranchBB->addSuccessor(DestBB); 403 MBB->replaceSuccessor(DestBB, BranchBB); 404 } 405 406 DebugLoc DL = MI.getDebugLoc(); 407 MI.eraseFromParent(); 408 BlockInfo[BranchBB->getNumber()].Size += TII->insertIndirectBranch( 409 *BranchBB, *DestBB, DL, DestOffset - SrcOffset, RS.get()); 410 411 adjustBlockOffsets(*MBB); 412 return true; 413 } 414 415 bool BranchRelaxation::relaxBranchInstructions() { 416 bool Changed = false; 417 418 // Relaxing branches involves creating new basic blocks, so re-eval 419 // end() for termination. 420 for (MachineFunction::iterator I = MF->begin(); I != MF->end(); ++I) { 421 MachineBasicBlock &MBB = *I; 422 423 // Empty block? 424 MachineBasicBlock::iterator Last = MBB.getLastNonDebugInstr(); 425 if (Last == MBB.end()) 426 continue; 427 428 // Expand the unconditional branch first if necessary. If there is a 429 // conditional branch, this will end up changing the branch destination of 430 // it to be over the newly inserted indirect branch block, which may avoid 431 // the need to try expanding the conditional branch first, saving an extra 432 // jump. 433 if (Last->isUnconditionalBranch()) { 434 // Unconditional branch destination might be unanalyzable, assume these 435 // are OK. 436 if (MachineBasicBlock *DestBB = TII->getBranchDestBlock(*Last)) { 437 if (!isBlockInRange(*Last, *DestBB)) { 438 fixupUnconditionalBranch(*Last); 439 ++NumUnconditionalRelaxed; 440 Changed = true; 441 } 442 } 443 } 444 445 // Loop over the conditional branches. 446 MachineBasicBlock::iterator Next; 447 for (MachineBasicBlock::iterator J = MBB.getFirstTerminator(); 448 J != MBB.end(); J = Next) { 449 Next = std::next(J); 450 MachineInstr &MI = *J; 451 452 if (MI.isConditionalBranch()) { 453 MachineBasicBlock *DestBB = TII->getBranchDestBlock(MI); 454 if (!isBlockInRange(MI, *DestBB)) { 455 if (Next != MBB.end() && Next->isConditionalBranch()) { 456 // If there are multiple conditional branches, this isn't an 457 // analyzable block. Split later terminators into a new block so 458 // each one will be analyzable. 459 460 splitBlockBeforeInstr(*Next, DestBB); 461 } else { 462 fixupConditionalBranch(MI); 463 ++NumConditionalRelaxed; 464 } 465 466 Changed = true; 467 468 // This may have modified all of the terminators, so start over. 469 Next = MBB.getFirstTerminator(); 470 } 471 } 472 } 473 } 474 475 return Changed; 476 } 477 478 bool BranchRelaxation::runOnMachineFunction(MachineFunction &mf) { 479 MF = &mf; 480 481 DEBUG(dbgs() << "***** BranchRelaxation *****\n"); 482 483 const TargetSubtargetInfo &ST = MF->getSubtarget(); 484 TII = ST.getInstrInfo(); 485 486 TRI = ST.getRegisterInfo(); 487 if (TRI->trackLivenessAfterRegAlloc(*MF)) 488 RS.reset(new RegScavenger()); 489 490 // Renumber all of the machine basic blocks in the function, guaranteeing that 491 // the numbers agree with the position of the block in the function. 492 MF->RenumberBlocks(); 493 494 // Do the initial scan of the function, building up information about the 495 // sizes of each block. 496 scanFunction(); 497 498 DEBUG(dbgs() << " Basic blocks before relaxation\n"; dumpBBs();); 499 500 bool MadeChange = false; 501 while (relaxBranchInstructions()) 502 MadeChange = true; 503 504 // After a while, this might be made debug-only, but it is not expensive. 505 verify(); 506 507 DEBUG(dbgs() << " Basic blocks after relaxation\n\n"; dumpBBs()); 508 509 BlockInfo.clear(); 510 511 return MadeChange; 512 } 513