1 //===- IVUsers.cpp - Induction Variable Users -------------------*- C++ -*-===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This file implements bookkeeping for "interesting" users of expressions 11 // computed from induction variables. 12 // 13 //===----------------------------------------------------------------------===// 14 15 #define DEBUG_TYPE "iv-users" 16 #include "llvm/Analysis/IVUsers.h" 17 #include "llvm/ADT/STLExtras.h" 18 #include "llvm/Analysis/LoopPass.h" 19 #include "llvm/Analysis/ScalarEvolutionExpressions.h" 20 #include "llvm/Analysis/ValueTracking.h" 21 #include "llvm/IR/Constants.h" 22 #include "llvm/IR/DataLayout.h" 23 #include "llvm/IR/DerivedTypes.h" 24 #include "llvm/IR/Dominators.h" 25 #include "llvm/IR/Instructions.h" 26 #include "llvm/IR/Type.h" 27 #include "llvm/Support/Debug.h" 28 #include "llvm/Support/raw_ostream.h" 29 #include <algorithm> 30 using namespace llvm; 31 32 char IVUsers::ID = 0; 33 INITIALIZE_PASS_BEGIN(IVUsers, "iv-users", 34 "Induction Variable Users", false, true) 35 INITIALIZE_PASS_DEPENDENCY(LoopInfo) 36 INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass) 37 INITIALIZE_PASS_DEPENDENCY(ScalarEvolution) 38 INITIALIZE_PASS_END(IVUsers, "iv-users", 39 "Induction Variable Users", false, true) 40 41 Pass *llvm::createIVUsersPass() { 42 return new IVUsers(); 43 } 44 45 /// isInteresting - Test whether the given expression is "interesting" when 46 /// used by the given expression, within the context of analyzing the 47 /// given loop. 48 static bool isInteresting(const SCEV *S, const Instruction *I, const Loop *L, 49 ScalarEvolution *SE, LoopInfo *LI) { 50 // An addrec is interesting if it's affine or if it has an interesting start. 51 if (const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(S)) { 52 // Keep things simple. Don't touch loop-variant strides unless they're 53 // only used outside the loop and we can simplify them. 54 if (AR->getLoop() == L) 55 return AR->isAffine() || 56 (!L->contains(I) && 57 SE->getSCEVAtScope(AR, LI->getLoopFor(I->getParent())) != AR); 58 // Otherwise recurse to see if the start value is interesting, and that 59 // the step value is not interesting, since we don't yet know how to 60 // do effective SCEV expansions for addrecs with interesting steps. 61 return isInteresting(AR->getStart(), I, L, SE, LI) && 62 !isInteresting(AR->getStepRecurrence(*SE), I, L, SE, LI); 63 } 64 65 // An add is interesting if exactly one of its operands is interesting. 66 if (const SCEVAddExpr *Add = dyn_cast<SCEVAddExpr>(S)) { 67 bool AnyInterestingYet = false; 68 for (SCEVAddExpr::op_iterator OI = Add->op_begin(), OE = Add->op_end(); 69 OI != OE; ++OI) 70 if (isInteresting(*OI, I, L, SE, LI)) { 71 if (AnyInterestingYet) 72 return false; 73 AnyInterestingYet = true; 74 } 75 return AnyInterestingYet; 76 } 77 78 // Nothing else is interesting here. 79 return false; 80 } 81 82 /// Return true if all loop headers that dominate this block are in simplified 83 /// form. 84 static bool isSimplifiedLoopNest(BasicBlock *BB, const DominatorTree *DT, 85 const LoopInfo *LI, 86 SmallPtrSet<Loop*,16> &SimpleLoopNests) { 87 Loop *NearestLoop = 0; 88 for (DomTreeNode *Rung = DT->getNode(BB); 89 Rung; Rung = Rung->getIDom()) { 90 BasicBlock *DomBB = Rung->getBlock(); 91 Loop *DomLoop = LI->getLoopFor(DomBB); 92 if (DomLoop && DomLoop->getHeader() == DomBB) { 93 // If the domtree walk reaches a loop with no preheader, return false. 94 if (!DomLoop->isLoopSimplifyForm()) 95 return false; 96 // If we have already checked this loop nest, stop checking. 97 if (SimpleLoopNests.count(DomLoop)) 98 break; 99 // If we have not already checked this loop nest, remember the loop 100 // header nearest to BB. The nearest loop may not contain BB. 101 if (!NearestLoop) 102 NearestLoop = DomLoop; 103 } 104 } 105 if (NearestLoop) 106 SimpleLoopNests.insert(NearestLoop); 107 return true; 108 } 109 110 /// AddUsersImpl - Inspect the specified instruction. If it is a 111 /// reducible SCEV, recursively add its users to the IVUsesByStride set and 112 /// return true. Otherwise, return false. 113 bool IVUsers::AddUsersImpl(Instruction *I, 114 SmallPtrSet<Loop*,16> &SimpleLoopNests) { 115 // Add this IV user to the Processed set before returning false to ensure that 116 // all IV users are members of the set. See IVUsers::isIVUserOrOperand. 117 if (!Processed.insert(I)) 118 return true; // Instruction already handled. 119 120 if (!SE->isSCEVable(I->getType())) 121 return false; // Void and FP expressions cannot be reduced. 122 123 // IVUsers is used by LSR which assumes that all SCEV expressions are safe to 124 // pass to SCEVExpander. Expressions are not safe to expand if they represent 125 // operations that are not safe to speculate, namely integer division. 126 if (!isa<PHINode>(I) && !isSafeToSpeculativelyExecute(I, TD)) 127 return false; 128 129 // LSR is not APInt clean, do not touch integers bigger than 64-bits. 130 // Also avoid creating IVs of non-native types. For example, we don't want a 131 // 64-bit IV in 32-bit code just because the loop has one 64-bit cast. 132 uint64_t Width = SE->getTypeSizeInBits(I->getType()); 133 if (Width > 64 || (TD && !TD->isLegalInteger(Width))) 134 return false; 135 136 // Get the symbolic expression for this instruction. 137 const SCEV *ISE = SE->getSCEV(I); 138 139 // If we've come to an uninteresting expression, stop the traversal and 140 // call this a user. 141 if (!isInteresting(ISE, I, L, SE, LI)) 142 return false; 143 144 SmallPtrSet<Instruction *, 4> UniqueUsers; 145 for (Value::use_iterator UI = I->use_begin(), E = I->use_end(); 146 UI != E; ++UI) { 147 Instruction *User = cast<Instruction>(*UI); 148 if (!UniqueUsers.insert(User)) 149 continue; 150 151 // Do not infinitely recurse on PHI nodes. 152 if (isa<PHINode>(User) && Processed.count(User)) 153 continue; 154 155 // Only consider IVUsers that are dominated by simplified loop 156 // headers. Otherwise, SCEVExpander will crash. 157 BasicBlock *UseBB = User->getParent(); 158 // A phi's use is live out of its predecessor block. 159 if (PHINode *PHI = dyn_cast<PHINode>(User)) { 160 unsigned OperandNo = UI.getOperandNo(); 161 unsigned ValNo = PHINode::getIncomingValueNumForOperand(OperandNo); 162 UseBB = PHI->getIncomingBlock(ValNo); 163 } 164 if (!isSimplifiedLoopNest(UseBB, DT, LI, SimpleLoopNests)) 165 return false; 166 167 // Descend recursively, but not into PHI nodes outside the current loop. 168 // It's important to see the entire expression outside the loop to get 169 // choices that depend on addressing mode use right, although we won't 170 // consider references outside the loop in all cases. 171 // If User is already in Processed, we don't want to recurse into it again, 172 // but do want to record a second reference in the same instruction. 173 bool AddUserToIVUsers = false; 174 if (LI->getLoopFor(User->getParent()) != L) { 175 if (isa<PHINode>(User) || Processed.count(User) || 176 !AddUsersImpl(User, SimpleLoopNests)) { 177 DEBUG(dbgs() << "FOUND USER in other loop: " << *User << '\n' 178 << " OF SCEV: " << *ISE << '\n'); 179 AddUserToIVUsers = true; 180 } 181 } else if (Processed.count(User) || !AddUsersImpl(User, SimpleLoopNests)) { 182 DEBUG(dbgs() << "FOUND USER: " << *User << '\n' 183 << " OF SCEV: " << *ISE << '\n'); 184 AddUserToIVUsers = true; 185 } 186 187 if (AddUserToIVUsers) { 188 // Okay, we found a user that we cannot reduce. 189 IVUses.push_back(new IVStrideUse(this, User, I)); 190 IVStrideUse &NewUse = IVUses.back(); 191 // Autodetect the post-inc loop set, populating NewUse.PostIncLoops. 192 // The regular return value here is discarded; instead of recording 193 // it, we just recompute it when we need it. 194 ISE = TransformForPostIncUse(NormalizeAutodetect, 195 ISE, User, I, 196 NewUse.PostIncLoops, 197 *SE, *DT); 198 DEBUG(if (SE->getSCEV(I) != ISE) 199 dbgs() << " NORMALIZED TO: " << *ISE << '\n'); 200 } 201 } 202 return true; 203 } 204 205 bool IVUsers::AddUsersIfInteresting(Instruction *I) { 206 // SCEVExpander can only handle users that are dominated by simplified loop 207 // entries. Keep track of all loops that are only dominated by other simple 208 // loops so we don't traverse the domtree for each user. 209 SmallPtrSet<Loop*,16> SimpleLoopNests; 210 211 return AddUsersImpl(I, SimpleLoopNests); 212 } 213 214 IVStrideUse &IVUsers::AddUser(Instruction *User, Value *Operand) { 215 IVUses.push_back(new IVStrideUse(this, User, Operand)); 216 return IVUses.back(); 217 } 218 219 IVUsers::IVUsers() 220 : LoopPass(ID) { 221 initializeIVUsersPass(*PassRegistry::getPassRegistry()); 222 } 223 224 void IVUsers::getAnalysisUsage(AnalysisUsage &AU) const { 225 AU.addRequired<LoopInfo>(); 226 AU.addRequired<DominatorTreeWrapperPass>(); 227 AU.addRequired<ScalarEvolution>(); 228 AU.setPreservesAll(); 229 } 230 231 bool IVUsers::runOnLoop(Loop *l, LPPassManager &LPM) { 232 233 L = l; 234 LI = &getAnalysis<LoopInfo>(); 235 DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree(); 236 SE = &getAnalysis<ScalarEvolution>(); 237 TD = getAnalysisIfAvailable<DataLayout>(); 238 239 // Find all uses of induction variables in this loop, and categorize 240 // them by stride. Start by finding all of the PHI nodes in the header for 241 // this loop. If they are induction variables, inspect their uses. 242 for (BasicBlock::iterator I = L->getHeader()->begin(); isa<PHINode>(I); ++I) 243 (void)AddUsersIfInteresting(I); 244 245 return false; 246 } 247 248 void IVUsers::print(raw_ostream &OS, const Module *M) const { 249 OS << "IV Users for loop "; 250 L->getHeader()->printAsOperand(OS, false); 251 if (SE->hasLoopInvariantBackedgeTakenCount(L)) { 252 OS << " with backedge-taken count " 253 << *SE->getBackedgeTakenCount(L); 254 } 255 OS << ":\n"; 256 257 for (ilist<IVStrideUse>::const_iterator UI = IVUses.begin(), 258 E = IVUses.end(); UI != E; ++UI) { 259 OS << " "; 260 UI->getOperandValToReplace()->printAsOperand(OS, false); 261 OS << " = " << *getReplacementExpr(*UI); 262 for (PostIncLoopSet::const_iterator 263 I = UI->PostIncLoops.begin(), 264 E = UI->PostIncLoops.end(); I != E; ++I) { 265 OS << " (post-inc with loop "; 266 (*I)->getHeader()->printAsOperand(OS, false); 267 OS << ")"; 268 } 269 OS << " in "; 270 UI->getUser()->print(OS); 271 OS << '\n'; 272 } 273 } 274 275 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP) 276 void IVUsers::dump() const { 277 print(dbgs()); 278 } 279 #endif 280 281 void IVUsers::releaseMemory() { 282 Processed.clear(); 283 IVUses.clear(); 284 } 285 286 /// getReplacementExpr - Return a SCEV expression which computes the 287 /// value of the OperandValToReplace. 288 const SCEV *IVUsers::getReplacementExpr(const IVStrideUse &IU) const { 289 return SE->getSCEV(IU.getOperandValToReplace()); 290 } 291 292 /// getExpr - Return the expression for the use. 293 const SCEV *IVUsers::getExpr(const IVStrideUse &IU) const { 294 return 295 TransformForPostIncUse(Normalize, getReplacementExpr(IU), 296 IU.getUser(), IU.getOperandValToReplace(), 297 const_cast<PostIncLoopSet &>(IU.getPostIncLoops()), 298 *SE, *DT); 299 } 300 301 static const SCEVAddRecExpr *findAddRecForLoop(const SCEV *S, const Loop *L) { 302 if (const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(S)) { 303 if (AR->getLoop() == L) 304 return AR; 305 return findAddRecForLoop(AR->getStart(), L); 306 } 307 308 if (const SCEVAddExpr *Add = dyn_cast<SCEVAddExpr>(S)) { 309 for (SCEVAddExpr::op_iterator I = Add->op_begin(), E = Add->op_end(); 310 I != E; ++I) 311 if (const SCEVAddRecExpr *AR = findAddRecForLoop(*I, L)) 312 return AR; 313 return 0; 314 } 315 316 return 0; 317 } 318 319 const SCEV *IVUsers::getStride(const IVStrideUse &IU, const Loop *L) const { 320 if (const SCEVAddRecExpr *AR = findAddRecForLoop(getExpr(IU), L)) 321 return AR->getStepRecurrence(*SE); 322 return 0; 323 } 324 325 void IVStrideUse::transformToPostInc(const Loop *L) { 326 PostIncLoops.insert(L); 327 } 328 329 void IVStrideUse::deleted() { 330 // Remove this user from the list. 331 Parent->Processed.erase(this->getUser()); 332 Parent->IVUses.erase(this); 333 // this now dangles! 334 } 335