1 //===- LoopSimplify.cpp - Loop Canonicalization Pass ----------------------===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This pass performs several transformations to transform natural loops into a 11 // simpler form, which makes subsequent analyses and transformations simpler and 12 // more effective. 13 // 14 // Loop pre-header insertion guarantees that there is a single, non-critical 15 // entry edge from outside of the loop to the loop header. This simplifies a 16 // number of analyses and transformations, such as LICM. 17 // 18 // Loop exit-block insertion guarantees that all exit blocks from the loop 19 // (blocks which are outside of the loop that have predecessors inside of the 20 // loop) only have predecessors from inside of the loop (and are thus dominated 21 // by the loop header). This simplifies transformations such as store-sinking 22 // that are built into LICM. 23 // 24 // This pass also guarantees that loops will have exactly one backedge. 25 // 26 // Note that the simplifycfg pass will clean up blocks which are split out but 27 // end up being unnecessary, so usage of this pass should not pessimize 28 // generated code. 29 // 30 // This pass obviously modifies the CFG, but updates loop information and 31 // dominator information. 32 // 33 //===----------------------------------------------------------------------===// 34 35 #define DEBUG_TYPE "loopsimplify" 36 #include "llvm/Transforms/Scalar.h" 37 #include "llvm/Constants.h" 38 #include "llvm/Instructions.h" 39 #include "llvm/Function.h" 40 #include "llvm/LLVMContext.h" 41 #include "llvm/Type.h" 42 #include "llvm/Analysis/AliasAnalysis.h" 43 #include "llvm/Analysis/Dominators.h" 44 #include "llvm/Analysis/LoopInfo.h" 45 #include "llvm/Transforms/Utils/BasicBlockUtils.h" 46 #include "llvm/Transforms/Utils/Local.h" 47 #include "llvm/Support/CFG.h" 48 #include "llvm/Support/Compiler.h" 49 #include "llvm/ADT/SetOperations.h" 50 #include "llvm/ADT/SetVector.h" 51 #include "llvm/ADT/Statistic.h" 52 #include "llvm/ADT/DepthFirstIterator.h" 53 using namespace llvm; 54 55 STATISTIC(NumInserted, "Number of pre-header or exit blocks inserted"); 56 STATISTIC(NumNested , "Number of nested loops split out"); 57 58 namespace { 59 struct VISIBILITY_HIDDEN LoopSimplify : public FunctionPass { 60 static char ID; // Pass identification, replacement for typeid 61 LoopSimplify() : FunctionPass(&ID) {} 62 63 // AA - If we have an alias analysis object to update, this is it, otherwise 64 // this is null. 65 AliasAnalysis *AA; 66 LoopInfo *LI; 67 DominatorTree *DT; 68 virtual bool runOnFunction(Function &F); 69 70 virtual void getAnalysisUsage(AnalysisUsage &AU) const { 71 // We need loop information to identify the loops... 72 AU.addRequired<LoopInfo>(); 73 AU.addRequired<DominatorTree>(); 74 75 AU.addPreserved<LoopInfo>(); 76 AU.addPreserved<DominatorTree>(); 77 AU.addPreserved<DominanceFrontier>(); 78 AU.addPreserved<AliasAnalysis>(); 79 AU.addPreservedID(BreakCriticalEdgesID); // No critical edges added. 80 } 81 82 /// verifyAnalysis() - Verify loop nest. 83 void verifyAnalysis() const { 84 #ifndef NDEBUG 85 LoopInfo *NLI = &getAnalysis<LoopInfo>(); 86 for (LoopInfo::iterator I = NLI->begin(), E = NLI->end(); I != E; ++I) 87 (*I)->verifyLoop(); 88 #endif 89 } 90 91 private: 92 bool ProcessLoop(Loop *L); 93 BasicBlock *RewriteLoopExitBlock(Loop *L, BasicBlock *Exit); 94 BasicBlock *InsertPreheaderForLoop(Loop *L); 95 Loop *SeparateNestedLoop(Loop *L); 96 void InsertUniqueBackedgeBlock(Loop *L, BasicBlock *Preheader); 97 void PlaceSplitBlockCarefully(BasicBlock *NewBB, 98 SmallVectorImpl<BasicBlock*> &SplitPreds, 99 Loop *L); 100 }; 101 } 102 103 char LoopSimplify::ID = 0; 104 static RegisterPass<LoopSimplify> 105 X("loopsimplify", "Canonicalize natural loops", true); 106 107 // Publically exposed interface to pass... 108 const PassInfo *const llvm::LoopSimplifyID = &X; 109 FunctionPass *llvm::createLoopSimplifyPass() { return new LoopSimplify(); } 110 111 /// runOnFunction - Run down all loops in the CFG (recursively, but we could do 112 /// it in any convenient order) inserting preheaders... 113 /// 114 bool LoopSimplify::runOnFunction(Function &F) { 115 bool Changed = false; 116 LI = &getAnalysis<LoopInfo>(); 117 AA = getAnalysisIfAvailable<AliasAnalysis>(); 118 DT = &getAnalysis<DominatorTree>(); 119 120 // Check to see that no blocks (other than the header) in loops have 121 // predecessors that are not in loops. This is not valid for natural loops, 122 // but can occur if the blocks are unreachable. Since they are unreachable we 123 // can just shamelessly destroy their terminators to make them not branch into 124 // the loop! 125 for (Function::iterator BB = F.begin(), E = F.end(); BB != E; ++BB) { 126 // This case can only occur for unreachable blocks. Blocks that are 127 // unreachable can't be in loops, so filter those blocks out. 128 if (LI->getLoopFor(BB)) continue; 129 130 bool BlockUnreachable = false; 131 TerminatorInst *TI = BB->getTerminator(); 132 133 // Check to see if any successors of this block are non-loop-header loops 134 // that are not the header. 135 for (unsigned i = 0, e = TI->getNumSuccessors(); i != e; ++i) { 136 // If this successor is not in a loop, BB is clearly ok. 137 Loop *L = LI->getLoopFor(TI->getSuccessor(i)); 138 if (!L) continue; 139 140 // If the succ is the loop header, and if L is a top-level loop, then this 141 // is an entrance into a loop through the header, which is also ok. 142 if (L->getHeader() == TI->getSuccessor(i) && L->getParentLoop() == 0) 143 continue; 144 145 // Otherwise, this is an entrance into a loop from some place invalid. 146 // Either the loop structure is invalid and this is not a natural loop (in 147 // which case the compiler is buggy somewhere else) or BB is unreachable. 148 BlockUnreachable = true; 149 break; 150 } 151 152 // If this block is ok, check the next one. 153 if (!BlockUnreachable) continue; 154 155 // Otherwise, this block is dead. To clean up the CFG and to allow later 156 // loop transformations to ignore this case, we delete the edges into the 157 // loop by replacing the terminator. 158 159 // Remove PHI entries from the successors. 160 for (unsigned i = 0, e = TI->getNumSuccessors(); i != e; ++i) 161 TI->getSuccessor(i)->removePredecessor(BB); 162 163 // Add a new unreachable instruction before the old terminator. 164 new UnreachableInst(TI); 165 166 // Delete the dead terminator. 167 if (AA) AA->deleteValue(TI); 168 if (!TI->use_empty()) 169 TI->replaceAllUsesWith(F.getContext().getUndef(TI->getType())); 170 TI->eraseFromParent(); 171 Changed |= true; 172 } 173 174 for (LoopInfo::iterator I = LI->begin(), E = LI->end(); I != E; ++I) 175 Changed |= ProcessLoop(*I); 176 177 return Changed; 178 } 179 180 /// ProcessLoop - Walk the loop structure in depth first order, ensuring that 181 /// all loops have preheaders. 182 /// 183 bool LoopSimplify::ProcessLoop(Loop *L) { 184 bool Changed = false; 185 ReprocessLoop: 186 187 // Canonicalize inner loops before outer loops. Inner loop canonicalization 188 // can provide work for the outer loop to canonicalize. 189 for (Loop::iterator I = L->begin(), E = L->end(); I != E; ++I) 190 Changed |= ProcessLoop(*I); 191 192 assert(L->getBlocks()[0] == L->getHeader() && 193 "Header isn't first block in loop?"); 194 195 // Does the loop already have a preheader? If so, don't insert one. 196 BasicBlock *Preheader = L->getLoopPreheader(); 197 if (!Preheader) { 198 Preheader = InsertPreheaderForLoop(L); 199 NumInserted++; 200 Changed = true; 201 } 202 203 // Next, check to make sure that all exit nodes of the loop only have 204 // predecessors that are inside of the loop. This check guarantees that the 205 // loop preheader/header will dominate the exit blocks. If the exit block has 206 // predecessors from outside of the loop, split the edge now. 207 SmallVector<BasicBlock*, 8> ExitBlocks; 208 L->getExitBlocks(ExitBlocks); 209 210 SetVector<BasicBlock*> ExitBlockSet(ExitBlocks.begin(), ExitBlocks.end()); 211 for (SetVector<BasicBlock*>::iterator I = ExitBlockSet.begin(), 212 E = ExitBlockSet.end(); I != E; ++I) { 213 BasicBlock *ExitBlock = *I; 214 for (pred_iterator PI = pred_begin(ExitBlock), PE = pred_end(ExitBlock); 215 PI != PE; ++PI) 216 // Must be exactly this loop: no subloops, parent loops, or non-loop preds 217 // allowed. 218 if (!L->contains(*PI)) { 219 RewriteLoopExitBlock(L, ExitBlock); 220 NumInserted++; 221 Changed = true; 222 break; 223 } 224 } 225 226 // If the header has more than two predecessors at this point (from the 227 // preheader and from multiple backedges), we must adjust the loop. 228 unsigned NumBackedges = L->getNumBackEdges(); 229 if (NumBackedges != 1) { 230 // If this is really a nested loop, rip it out into a child loop. Don't do 231 // this for loops with a giant number of backedges, just factor them into a 232 // common backedge instead. 233 if (NumBackedges < 8) { 234 if (Loop *NL = SeparateNestedLoop(L)) { 235 ++NumNested; 236 // This is a big restructuring change, reprocess the whole loop. 237 ProcessLoop(NL); 238 Changed = true; 239 // GCC doesn't tail recursion eliminate this. 240 goto ReprocessLoop; 241 } 242 } 243 244 // If we either couldn't, or didn't want to, identify nesting of the loops, 245 // insert a new block that all backedges target, then make it jump to the 246 // loop header. 247 InsertUniqueBackedgeBlock(L, Preheader); 248 NumInserted++; 249 Changed = true; 250 } 251 252 // Scan over the PHI nodes in the loop header. Since they now have only two 253 // incoming values (the loop is canonicalized), we may have simplified the PHI 254 // down to 'X = phi [X, Y]', which should be replaced with 'Y'. 255 PHINode *PN; 256 for (BasicBlock::iterator I = L->getHeader()->begin(); 257 (PN = dyn_cast<PHINode>(I++)); ) 258 if (Value *V = PN->hasConstantValue()) { 259 if (AA) AA->deleteValue(PN); 260 PN->replaceAllUsesWith(V); 261 PN->eraseFromParent(); 262 } 263 264 // If this loop has muliple exits and the exits all go to the same 265 // block, attempt to merge the exits. This helps several passes, such 266 // as LoopRotation, which do not support loops with multiple exits. 267 // SimplifyCFG also does this (and this code uses the same utility 268 // function), however this code is loop-aware, where SimplifyCFG is 269 // not. That gives it the advantage of being able to hoist 270 // loop-invariant instructions out of the way to open up more 271 // opportunities, and the disadvantage of having the responsibility 272 // to preserve dominator information. 273 if (ExitBlocks.size() > 1 && L->getUniqueExitBlock()) { 274 SmallVector<BasicBlock*, 8> ExitingBlocks; 275 L->getExitingBlocks(ExitingBlocks); 276 for (unsigned i = 0, e = ExitingBlocks.size(); i != e; ++i) { 277 BasicBlock *ExitingBlock = ExitingBlocks[i]; 278 if (!ExitingBlock->getSinglePredecessor()) continue; 279 BranchInst *BI = dyn_cast<BranchInst>(ExitingBlock->getTerminator()); 280 if (!BI || !BI->isConditional()) continue; 281 CmpInst *CI = dyn_cast<CmpInst>(BI->getCondition()); 282 if (!CI || CI->getParent() != ExitingBlock) continue; 283 284 // Attempt to hoist out all instructions except for the 285 // comparison and the branch. 286 bool AllInvariant = true; 287 for (BasicBlock::iterator I = ExitingBlock->begin(); &*I != BI; ) { 288 Instruction *Inst = I++; 289 if (Inst == CI) 290 continue; 291 if (!L->makeLoopInvariant(Inst, Changed, Preheader->getTerminator())) { 292 AllInvariant = false; 293 break; 294 } 295 } 296 if (!AllInvariant) continue; 297 298 // The block has now been cleared of all instructions except for 299 // a comparison and a conditional branch. SimplifyCFG may be able 300 // to fold it now. 301 if (!FoldBranchToCommonDest(BI)) continue; 302 303 // Success. The block is now dead, so remove it from the loop, 304 // update the dominator tree and dominance frontier, and delete it. 305 assert(pred_begin(ExitingBlock) == pred_end(ExitingBlock)); 306 Changed = true; 307 LI->removeBlock(ExitingBlock); 308 309 DominanceFrontier *DF = getAnalysisIfAvailable<DominanceFrontier>(); 310 DomTreeNode *Node = DT->getNode(ExitingBlock); 311 const std::vector<DomTreeNodeBase<BasicBlock> *> &Children = 312 Node->getChildren(); 313 for (unsigned k = 0, g = Children.size(); k != g; ++k) { 314 DT->changeImmediateDominator(Children[k], Node->getIDom()); 315 if (DF) DF->changeImmediateDominator(Children[k]->getBlock(), 316 Node->getIDom()->getBlock(), 317 DT); 318 } 319 DT->eraseNode(ExitingBlock); 320 if (DF) DF->removeBlock(ExitingBlock); 321 322 BI->getSuccessor(0)->removePredecessor(ExitingBlock); 323 BI->getSuccessor(1)->removePredecessor(ExitingBlock); 324 ExitingBlock->eraseFromParent(); 325 } 326 } 327 328 return Changed; 329 } 330 331 /// InsertPreheaderForLoop - Once we discover that a loop doesn't have a 332 /// preheader, this method is called to insert one. This method has two phases: 333 /// preheader insertion and analysis updating. 334 /// 335 BasicBlock *LoopSimplify::InsertPreheaderForLoop(Loop *L) { 336 BasicBlock *Header = L->getHeader(); 337 338 // Compute the set of predecessors of the loop that are not in the loop. 339 SmallVector<BasicBlock*, 8> OutsideBlocks; 340 for (pred_iterator PI = pred_begin(Header), PE = pred_end(Header); 341 PI != PE; ++PI) 342 if (!L->contains(*PI)) // Coming in from outside the loop? 343 OutsideBlocks.push_back(*PI); // Keep track of it... 344 345 // Split out the loop pre-header. 346 BasicBlock *NewBB = 347 SplitBlockPredecessors(Header, &OutsideBlocks[0], OutsideBlocks.size(), 348 ".preheader", this); 349 350 351 //===--------------------------------------------------------------------===// 352 // Update analysis results now that we have performed the transformation 353 // 354 355 // We know that we have loop information to update... update it now. 356 if (Loop *Parent = L->getParentLoop()) 357 Parent->addBasicBlockToLoop(NewBB, LI->getBase()); 358 359 // Make sure that NewBB is put someplace intelligent, which doesn't mess up 360 // code layout too horribly. 361 PlaceSplitBlockCarefully(NewBB, OutsideBlocks, L); 362 363 return NewBB; 364 } 365 366 /// RewriteLoopExitBlock - Ensure that the loop preheader dominates all exit 367 /// blocks. This method is used to split exit blocks that have predecessors 368 /// outside of the loop. 369 BasicBlock *LoopSimplify::RewriteLoopExitBlock(Loop *L, BasicBlock *Exit) { 370 SmallVector<BasicBlock*, 8> LoopBlocks; 371 for (pred_iterator I = pred_begin(Exit), E = pred_end(Exit); I != E; ++I) 372 if (L->contains(*I)) 373 LoopBlocks.push_back(*I); 374 375 assert(!LoopBlocks.empty() && "No edges coming in from outside the loop?"); 376 BasicBlock *NewBB = SplitBlockPredecessors(Exit, &LoopBlocks[0], 377 LoopBlocks.size(), ".loopexit", 378 this); 379 380 // Update Loop Information - we know that the new block will be in whichever 381 // loop the Exit block is in. Note that it may not be in that immediate loop, 382 // if the successor is some other loop header. In that case, we continue 383 // walking up the loop tree to find a loop that contains both the successor 384 // block and the predecessor block. 385 Loop *SuccLoop = LI->getLoopFor(Exit); 386 while (SuccLoop && !SuccLoop->contains(L->getHeader())) 387 SuccLoop = SuccLoop->getParentLoop(); 388 if (SuccLoop) 389 SuccLoop->addBasicBlockToLoop(NewBB, LI->getBase()); 390 391 return NewBB; 392 } 393 394 /// AddBlockAndPredsToSet - Add the specified block, and all of its 395 /// predecessors, to the specified set, if it's not already in there. Stop 396 /// predecessor traversal when we reach StopBlock. 397 static void AddBlockAndPredsToSet(BasicBlock *InputBB, BasicBlock *StopBlock, 398 std::set<BasicBlock*> &Blocks) { 399 std::vector<BasicBlock *> WorkList; 400 WorkList.push_back(InputBB); 401 do { 402 BasicBlock *BB = WorkList.back(); WorkList.pop_back(); 403 if (Blocks.insert(BB).second && BB != StopBlock) 404 // If BB is not already processed and it is not a stop block then 405 // insert its predecessor in the work list 406 for (pred_iterator I = pred_begin(BB), E = pred_end(BB); I != E; ++I) { 407 BasicBlock *WBB = *I; 408 WorkList.push_back(WBB); 409 } 410 } while(!WorkList.empty()); 411 } 412 413 /// FindPHIToPartitionLoops - The first part of loop-nestification is to find a 414 /// PHI node that tells us how to partition the loops. 415 static PHINode *FindPHIToPartitionLoops(Loop *L, DominatorTree *DT, 416 AliasAnalysis *AA) { 417 for (BasicBlock::iterator I = L->getHeader()->begin(); isa<PHINode>(I); ) { 418 PHINode *PN = cast<PHINode>(I); 419 ++I; 420 if (Value *V = PN->hasConstantValue()) 421 if (!isa<Instruction>(V) || DT->dominates(cast<Instruction>(V), PN)) { 422 // This is a degenerate PHI already, don't modify it! 423 PN->replaceAllUsesWith(V); 424 if (AA) AA->deleteValue(PN); 425 PN->eraseFromParent(); 426 continue; 427 } 428 429 // Scan this PHI node looking for a use of the PHI node by itself. 430 for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) 431 if (PN->getIncomingValue(i) == PN && 432 L->contains(PN->getIncomingBlock(i))) 433 // We found something tasty to remove. 434 return PN; 435 } 436 return 0; 437 } 438 439 // PlaceSplitBlockCarefully - If the block isn't already, move the new block to 440 // right after some 'outside block' block. This prevents the preheader from 441 // being placed inside the loop body, e.g. when the loop hasn't been rotated. 442 void LoopSimplify::PlaceSplitBlockCarefully(BasicBlock *NewBB, 443 SmallVectorImpl<BasicBlock*> &SplitPreds, 444 Loop *L) { 445 // Check to see if NewBB is already well placed. 446 Function::iterator BBI = NewBB; --BBI; 447 for (unsigned i = 0, e = SplitPreds.size(); i != e; ++i) { 448 if (&*BBI == SplitPreds[i]) 449 return; 450 } 451 452 // If it isn't already after an outside block, move it after one. This is 453 // always good as it makes the uncond branch from the outside block into a 454 // fall-through. 455 456 // Figure out *which* outside block to put this after. Prefer an outside 457 // block that neighbors a BB actually in the loop. 458 BasicBlock *FoundBB = 0; 459 for (unsigned i = 0, e = SplitPreds.size(); i != e; ++i) { 460 Function::iterator BBI = SplitPreds[i]; 461 if (++BBI != NewBB->getParent()->end() && 462 L->contains(BBI)) { 463 FoundBB = SplitPreds[i]; 464 break; 465 } 466 } 467 468 // If our heuristic for a *good* bb to place this after doesn't find 469 // anything, just pick something. It's likely better than leaving it within 470 // the loop. 471 if (!FoundBB) 472 FoundBB = SplitPreds[0]; 473 NewBB->moveAfter(FoundBB); 474 } 475 476 477 /// SeparateNestedLoop - If this loop has multiple backedges, try to pull one of 478 /// them out into a nested loop. This is important for code that looks like 479 /// this: 480 /// 481 /// Loop: 482 /// ... 483 /// br cond, Loop, Next 484 /// ... 485 /// br cond2, Loop, Out 486 /// 487 /// To identify this common case, we look at the PHI nodes in the header of the 488 /// loop. PHI nodes with unchanging values on one backedge correspond to values 489 /// that change in the "outer" loop, but not in the "inner" loop. 490 /// 491 /// If we are able to separate out a loop, return the new outer loop that was 492 /// created. 493 /// 494 Loop *LoopSimplify::SeparateNestedLoop(Loop *L) { 495 PHINode *PN = FindPHIToPartitionLoops(L, DT, AA); 496 if (PN == 0) return 0; // No known way to partition. 497 498 // Pull out all predecessors that have varying values in the loop. This 499 // handles the case when a PHI node has multiple instances of itself as 500 // arguments. 501 SmallVector<BasicBlock*, 8> OuterLoopPreds; 502 for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) 503 if (PN->getIncomingValue(i) != PN || 504 !L->contains(PN->getIncomingBlock(i))) 505 OuterLoopPreds.push_back(PN->getIncomingBlock(i)); 506 507 BasicBlock *Header = L->getHeader(); 508 BasicBlock *NewBB = SplitBlockPredecessors(Header, &OuterLoopPreds[0], 509 OuterLoopPreds.size(), 510 ".outer", this); 511 512 // Make sure that NewBB is put someplace intelligent, which doesn't mess up 513 // code layout too horribly. 514 PlaceSplitBlockCarefully(NewBB, OuterLoopPreds, L); 515 516 // Create the new outer loop. 517 Loop *NewOuter = new Loop(); 518 519 // Change the parent loop to use the outer loop as its child now. 520 if (Loop *Parent = L->getParentLoop()) 521 Parent->replaceChildLoopWith(L, NewOuter); 522 else 523 LI->changeTopLevelLoop(L, NewOuter); 524 525 // This block is going to be our new header block: add it to this loop and all 526 // parent loops. 527 NewOuter->addBasicBlockToLoop(NewBB, LI->getBase()); 528 529 // L is now a subloop of our outer loop. 530 NewOuter->addChildLoop(L); 531 532 for (Loop::block_iterator I = L->block_begin(), E = L->block_end(); 533 I != E; ++I) 534 NewOuter->addBlockEntry(*I); 535 536 // Determine which blocks should stay in L and which should be moved out to 537 // the Outer loop now. 538 std::set<BasicBlock*> BlocksInL; 539 for (pred_iterator PI = pred_begin(Header), E = pred_end(Header); PI!=E; ++PI) 540 if (DT->dominates(Header, *PI)) 541 AddBlockAndPredsToSet(*PI, Header, BlocksInL); 542 543 544 // Scan all of the loop children of L, moving them to OuterLoop if they are 545 // not part of the inner loop. 546 const std::vector<Loop*> &SubLoops = L->getSubLoops(); 547 for (size_t I = 0; I != SubLoops.size(); ) 548 if (BlocksInL.count(SubLoops[I]->getHeader())) 549 ++I; // Loop remains in L 550 else 551 NewOuter->addChildLoop(L->removeChildLoop(SubLoops.begin() + I)); 552 553 // Now that we know which blocks are in L and which need to be moved to 554 // OuterLoop, move any blocks that need it. 555 for (unsigned i = 0; i != L->getBlocks().size(); ++i) { 556 BasicBlock *BB = L->getBlocks()[i]; 557 if (!BlocksInL.count(BB)) { 558 // Move this block to the parent, updating the exit blocks sets 559 L->removeBlockFromLoop(BB); 560 if ((*LI)[BB] == L) 561 LI->changeLoopFor(BB, NewOuter); 562 --i; 563 } 564 } 565 566 return NewOuter; 567 } 568 569 570 571 /// InsertUniqueBackedgeBlock - This method is called when the specified loop 572 /// has more than one backedge in it. If this occurs, revector all of these 573 /// backedges to target a new basic block and have that block branch to the loop 574 /// header. This ensures that loops have exactly one backedge. 575 /// 576 void LoopSimplify::InsertUniqueBackedgeBlock(Loop *L, BasicBlock *Preheader) { 577 assert(L->getNumBackEdges() > 1 && "Must have > 1 backedge!"); 578 579 // Get information about the loop 580 BasicBlock *Header = L->getHeader(); 581 Function *F = Header->getParent(); 582 583 // Figure out which basic blocks contain back-edges to the loop header. 584 std::vector<BasicBlock*> BackedgeBlocks; 585 for (pred_iterator I = pred_begin(Header), E = pred_end(Header); I != E; ++I) 586 if (*I != Preheader) BackedgeBlocks.push_back(*I); 587 588 // Create and insert the new backedge block... 589 BasicBlock *BEBlock = BasicBlock::Create(Header->getName()+".backedge", F); 590 BranchInst *BETerminator = BranchInst::Create(Header, BEBlock); 591 592 // Move the new backedge block to right after the last backedge block. 593 Function::iterator InsertPos = BackedgeBlocks.back(); ++InsertPos; 594 F->getBasicBlockList().splice(InsertPos, F->getBasicBlockList(), BEBlock); 595 596 // Now that the block has been inserted into the function, create PHI nodes in 597 // the backedge block which correspond to any PHI nodes in the header block. 598 for (BasicBlock::iterator I = Header->begin(); isa<PHINode>(I); ++I) { 599 PHINode *PN = cast<PHINode>(I); 600 PHINode *NewPN = PHINode::Create(PN->getType(), PN->getName()+".be", 601 BETerminator); 602 NewPN->reserveOperandSpace(BackedgeBlocks.size()); 603 if (AA) AA->copyValue(PN, NewPN); 604 605 // Loop over the PHI node, moving all entries except the one for the 606 // preheader over to the new PHI node. 607 unsigned PreheaderIdx = ~0U; 608 bool HasUniqueIncomingValue = true; 609 Value *UniqueValue = 0; 610 for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) { 611 BasicBlock *IBB = PN->getIncomingBlock(i); 612 Value *IV = PN->getIncomingValue(i); 613 if (IBB == Preheader) { 614 PreheaderIdx = i; 615 } else { 616 NewPN->addIncoming(IV, IBB); 617 if (HasUniqueIncomingValue) { 618 if (UniqueValue == 0) 619 UniqueValue = IV; 620 else if (UniqueValue != IV) 621 HasUniqueIncomingValue = false; 622 } 623 } 624 } 625 626 // Delete all of the incoming values from the old PN except the preheader's 627 assert(PreheaderIdx != ~0U && "PHI has no preheader entry??"); 628 if (PreheaderIdx != 0) { 629 PN->setIncomingValue(0, PN->getIncomingValue(PreheaderIdx)); 630 PN->setIncomingBlock(0, PN->getIncomingBlock(PreheaderIdx)); 631 } 632 // Nuke all entries except the zero'th. 633 for (unsigned i = 0, e = PN->getNumIncomingValues()-1; i != e; ++i) 634 PN->removeIncomingValue(e-i, false); 635 636 // Finally, add the newly constructed PHI node as the entry for the BEBlock. 637 PN->addIncoming(NewPN, BEBlock); 638 639 // As an optimization, if all incoming values in the new PhiNode (which is a 640 // subset of the incoming values of the old PHI node) have the same value, 641 // eliminate the PHI Node. 642 if (HasUniqueIncomingValue) { 643 NewPN->replaceAllUsesWith(UniqueValue); 644 if (AA) AA->deleteValue(NewPN); 645 BEBlock->getInstList().erase(NewPN); 646 } 647 } 648 649 // Now that all of the PHI nodes have been inserted and adjusted, modify the 650 // backedge blocks to just to the BEBlock instead of the header. 651 for (unsigned i = 0, e = BackedgeBlocks.size(); i != e; ++i) { 652 TerminatorInst *TI = BackedgeBlocks[i]->getTerminator(); 653 for (unsigned Op = 0, e = TI->getNumSuccessors(); Op != e; ++Op) 654 if (TI->getSuccessor(Op) == Header) 655 TI->setSuccessor(Op, BEBlock); 656 } 657 658 //===--- Update all analyses which we must preserve now -----------------===// 659 660 // Update Loop Information - we know that this block is now in the current 661 // loop and all parent loops. 662 L->addBasicBlockToLoop(BEBlock, LI->getBase()); 663 664 // Update dominator information 665 DT->splitBlock(BEBlock); 666 if (DominanceFrontier *DF = getAnalysisIfAvailable<DominanceFrontier>()) 667 DF->splitBlock(BEBlock); 668 } 669