1 //===- LoopDeletion.cpp - Dead Loop Deletion Pass ---------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements the Dead Loop Deletion Pass. This pass is responsible
10 // for eliminating loops with non-infinite computable trip counts that have no
11 // side effects or volatile instructions, and do not contribute to the
12 // computation of the function's return value.
13 //
14 //===----------------------------------------------------------------------===//
15 
16 #include "llvm/Transforms/Scalar/LoopDeletion.h"
17 #include "llvm/ADT/SmallVector.h"
18 #include "llvm/ADT/Statistic.h"
19 #include "llvm/Analysis/CFG.h"
20 #include "llvm/Analysis/GlobalsModRef.h"
21 #include "llvm/Analysis/InstructionSimplify.h"
22 #include "llvm/Analysis/LoopIterator.h"
23 #include "llvm/Analysis/LoopPass.h"
24 #include "llvm/Analysis/MemorySSA.h"
25 #include "llvm/Analysis/OptimizationRemarkEmitter.h"
26 #include "llvm/IR/Dominators.h"
27 
28 #include "llvm/IR/PatternMatch.h"
29 #include "llvm/InitializePasses.h"
30 #include "llvm/Transforms/Scalar.h"
31 #include "llvm/Transforms/Scalar/LoopPassManager.h"
32 #include "llvm/Transforms/Utils/LoopUtils.h"
33 
34 using namespace llvm;
35 
36 #define DEBUG_TYPE "loop-delete"
37 
38 STATISTIC(NumDeleted, "Number of loops deleted");
39 
40 static cl::opt<bool> EnableSymbolicExecution(
41     "loop-deletion-enable-symbolic-execution", cl::Hidden, cl::init(true),
42     cl::desc("Break backedge through symbolic execution of 1st iteration "
43              "attempting to prove that the backedge is never taken"));
44 
45 enum class LoopDeletionResult {
46   Unmodified,
47   Modified,
48   Deleted,
49 };
50 
51 static LoopDeletionResult merge(LoopDeletionResult A, LoopDeletionResult B) {
52   if (A == LoopDeletionResult::Deleted || B == LoopDeletionResult::Deleted)
53     return LoopDeletionResult::Deleted;
54   if (A == LoopDeletionResult::Modified || B == LoopDeletionResult::Modified)
55     return LoopDeletionResult::Modified;
56   return LoopDeletionResult::Unmodified;
57 }
58 
59 /// Determines if a loop is dead.
60 ///
61 /// This assumes that we've already checked for unique exit and exiting blocks,
62 /// and that the code is in LCSSA form.
63 static bool isLoopDead(Loop *L, ScalarEvolution &SE,
64                        SmallVectorImpl<BasicBlock *> &ExitingBlocks,
65                        BasicBlock *ExitBlock, bool &Changed,
66                        BasicBlock *Preheader, LoopInfo &LI) {
67   // Make sure that all PHI entries coming from the loop are loop invariant.
68   // Because the code is in LCSSA form, any values used outside of the loop
69   // must pass through a PHI in the exit block, meaning that this check is
70   // sufficient to guarantee that no loop-variant values are used outside
71   // of the loop.
72   bool AllEntriesInvariant = true;
73   bool AllOutgoingValuesSame = true;
74   if (!L->hasNoExitBlocks()) {
75     for (PHINode &P : ExitBlock->phis()) {
76       Value *incoming = P.getIncomingValueForBlock(ExitingBlocks[0]);
77 
78       // Make sure all exiting blocks produce the same incoming value for the
79       // block. If there are different incoming values for different exiting
80       // blocks, then it is impossible to statically determine which value
81       // should be used.
82       AllOutgoingValuesSame =
83           all_of(makeArrayRef(ExitingBlocks).slice(1), [&](BasicBlock *BB) {
84             return incoming == P.getIncomingValueForBlock(BB);
85           });
86 
87       if (!AllOutgoingValuesSame)
88         break;
89 
90       if (Instruction *I = dyn_cast<Instruction>(incoming))
91         if (!L->makeLoopInvariant(I, Changed, Preheader->getTerminator())) {
92           AllEntriesInvariant = false;
93           break;
94         }
95     }
96   }
97 
98   if (Changed)
99     SE.forgetLoopDispositions(L);
100 
101   if (!AllEntriesInvariant || !AllOutgoingValuesSame)
102     return false;
103 
104   // Make sure that no instructions in the block have potential side-effects.
105   // This includes instructions that could write to memory, and loads that are
106   // marked volatile.
107   for (auto &I : L->blocks())
108     if (any_of(*I, [](Instruction &I) {
109           return I.mayHaveSideEffects() && !I.isDroppable();
110         }))
111       return false;
112 
113   // The loop or any of its sub-loops looping infinitely is legal. The loop can
114   // only be considered dead if either
115   // a. the function is mustprogress.
116   // b. all (sub-)loops are mustprogress or have a known trip-count.
117   if (L->getHeader()->getParent()->mustProgress())
118     return true;
119 
120   LoopBlocksRPO RPOT(L);
121   RPOT.perform(&LI);
122   // If the loop contains an irreducible cycle, it may loop infinitely.
123   if (containsIrreducibleCFG<const BasicBlock *>(RPOT, LI))
124     return false;
125 
126   SmallVector<Loop *, 8> WorkList;
127   WorkList.push_back(L);
128   while (!WorkList.empty()) {
129     Loop *Current = WorkList.pop_back_val();
130     if (hasMustProgress(Current))
131       continue;
132 
133     const SCEV *S = SE.getConstantMaxBackedgeTakenCount(Current);
134     if (isa<SCEVCouldNotCompute>(S)) {
135       LLVM_DEBUG(
136           dbgs() << "Could not compute SCEV MaxBackedgeTakenCount and was "
137                     "not required to make progress.\n");
138       return false;
139     }
140     WorkList.append(Current->begin(), Current->end());
141   }
142   return true;
143 }
144 
145 /// This function returns true if there is no viable path from the
146 /// entry block to the header of \p L. Right now, it only does
147 /// a local search to save compile time.
148 static bool isLoopNeverExecuted(Loop *L) {
149   using namespace PatternMatch;
150 
151   auto *Preheader = L->getLoopPreheader();
152   // TODO: We can relax this constraint, since we just need a loop
153   // predecessor.
154   assert(Preheader && "Needs preheader!");
155 
156   if (Preheader->isEntryBlock())
157     return false;
158   // All predecessors of the preheader should have a constant conditional
159   // branch, with the loop's preheader as not-taken.
160   for (auto *Pred: predecessors(Preheader)) {
161     BasicBlock *Taken, *NotTaken;
162     ConstantInt *Cond;
163     if (!match(Pred->getTerminator(),
164                m_Br(m_ConstantInt(Cond), Taken, NotTaken)))
165       return false;
166     if (!Cond->getZExtValue())
167       std::swap(Taken, NotTaken);
168     if (Taken == Preheader)
169       return false;
170   }
171   assert(!pred_empty(Preheader) &&
172          "Preheader should have predecessors at this point!");
173   // All the predecessors have the loop preheader as not-taken target.
174   return true;
175 }
176 
177 static Value *
178 getValueOnFirstIteration(Value *V, DenseMap<Value *, Value *> &FirstIterValue,
179                          const SimplifyQuery &SQ) {
180   // Quick hack: do not flood cache with non-instruction values.
181   if (!isa<Instruction>(V))
182     return V;
183   // Do we already know cached result?
184   auto Existing = FirstIterValue.find(V);
185   if (Existing != FirstIterValue.end())
186     return Existing->second;
187   Value *FirstIterV = nullptr;
188   if (auto *BO = dyn_cast<BinaryOperator>(V)) {
189     Value *LHS =
190         getValueOnFirstIteration(BO->getOperand(0), FirstIterValue, SQ);
191     Value *RHS =
192         getValueOnFirstIteration(BO->getOperand(1), FirstIterValue, SQ);
193     FirstIterV = SimplifyBinOp(BO->getOpcode(), LHS, RHS, SQ);
194   }
195   if (!FirstIterV)
196     FirstIterV = V;
197   FirstIterValue[V] = FirstIterV;
198   return FirstIterV;
199 }
200 
201 // Try to prove that one of conditions that dominates the latch must exit on 1st
202 // iteration.
203 static bool canProveExitOnFirstIteration(Loop *L, DominatorTree &DT,
204                                          LoopInfo &LI) {
205   // Disabled by option.
206   if (!EnableSymbolicExecution)
207     return false;
208 
209   BasicBlock *Predecessor = L->getLoopPredecessor();
210   BasicBlock *Latch = L->getLoopLatch();
211 
212   if (!Predecessor || !Latch)
213     return false;
214 
215   LoopBlocksRPO RPOT(L);
216   RPOT.perform(&LI);
217 
218   // For the optimization to be correct, we need RPOT to have a property that
219   // each block is processed after all its predecessors, which may only be
220   // violated for headers of the current loop and all nested loops. Irreducible
221   // CFG provides multiple ways to break this assumption, so we do not want to
222   // deal with it.
223   if (containsIrreducibleCFG<const BasicBlock *>(RPOT, LI))
224     return false;
225 
226   BasicBlock *Header = L->getHeader();
227   // Blocks that are reachable on the 1st iteration.
228   SmallPtrSet<BasicBlock *, 4> LiveBlocks;
229   // Edges that are reachable on the 1st iteration.
230   DenseSet<BasicBlockEdge> LiveEdges;
231   LiveBlocks.insert(L->getHeader());
232 
233   SmallPtrSet<BasicBlock *, 4> Visited;
234   auto MarkLiveEdge = [&](BasicBlock *From, BasicBlock *To) {
235     assert(LiveBlocks.count(From) && "Must be live!");
236     assert((LI.isLoopHeader(To) || !Visited.count(To)) &&
237            "Only canonical backedges are allowed. Irreducible CFG?");
238     assert((LiveBlocks.count(To) || !Visited.count(To)) &&
239            "We already discarded this block as dead!");
240     LiveBlocks.insert(To);
241     LiveEdges.insert({ From, To });
242   };
243 
244   auto MarkAllSuccessorsLive = [&](BasicBlock *BB) {
245     for (auto *Succ : successors(BB))
246       MarkLiveEdge(BB, Succ);
247   };
248 
249   // Check if there is only one value coming from all live predecessor blocks.
250   // Note that because we iterate in RPOT, we have already visited all its
251   // (non-latch) predecessors.
252   auto GetSoleInputOnFirstIteration = [&](PHINode & PN)->Value * {
253     BasicBlock *BB = PN.getParent();
254     bool HasLivePreds = false;
255     (void)HasLivePreds;
256     if (BB == Header)
257       return PN.getIncomingValueForBlock(Predecessor);
258     Value *OnlyInput = nullptr;
259     for (auto *Pred : predecessors(BB))
260       if (LiveEdges.count({ Pred, BB })) {
261         HasLivePreds = true;
262         Value *Incoming = PN.getIncomingValueForBlock(Pred);
263         // Skip undefs. If they are present, we can assume they are equal to
264         // the non-undef input.
265         if (isa<UndefValue>(Incoming))
266           continue;
267         // Two inputs.
268         if (OnlyInput && OnlyInput != Incoming)
269           return nullptr;
270         OnlyInput = Incoming;
271       }
272 
273     assert(HasLivePreds && "No live predecessors?");
274     // If all incoming live value were undefs, return undef.
275     return OnlyInput ? OnlyInput : UndefValue::get(PN.getType());
276   };
277   DenseMap<Value *, Value *> FirstIterValue;
278 
279   // Use the following algorithm to prove we never take the latch on the 1st
280   // iteration:
281   // 1. Traverse in topological order, so that whenever we visit a block, all
282   //    its predecessors are already visited.
283   // 2. If we can prove that the block may have only 1 predecessor on the 1st
284   //    iteration, map all its phis onto input from this predecessor.
285   // 3a. If we can prove which successor of out block is taken on the 1st
286   //     iteration, mark this successor live.
287   // 3b. If we cannot prove it, conservatively assume that all successors are
288   //     live.
289   auto &DL = L->getHeader()->getModule()->getDataLayout();
290   const SimplifyQuery SQ(DL);
291   for (auto *BB : RPOT) {
292     Visited.insert(BB);
293 
294     // This block is not reachable on the 1st iterations.
295     if (!LiveBlocks.count(BB))
296       continue;
297 
298     // Skip inner loops.
299     if (LI.getLoopFor(BB) != L) {
300       MarkAllSuccessorsLive(BB);
301       continue;
302     }
303 
304     // If Phi has only one input from all live input blocks, use it.
305     for (auto &PN : BB->phis()) {
306       if (!PN.getType()->isIntegerTy())
307         continue;
308       auto *Incoming = GetSoleInputOnFirstIteration(PN);
309       if (Incoming && DT.dominates(Incoming, BB->getTerminator())) {
310         Value *FirstIterV =
311             getValueOnFirstIteration(Incoming, FirstIterValue, SQ);
312         FirstIterValue[&PN] = FirstIterV;
313       }
314     }
315 
316     using namespace PatternMatch;
317     ICmpInst::Predicate Pred;
318     Value *LHS, *RHS;
319     BasicBlock *IfTrue, *IfFalse;
320     auto *Term = BB->getTerminator();
321     // TODO: Handle switch.
322     if (!match(Term, m_Br(m_ICmp(Pred, m_Value(LHS), m_Value(RHS)),
323                           m_BasicBlock(IfTrue), m_BasicBlock(IfFalse)))) {
324       MarkAllSuccessorsLive(BB);
325       continue;
326     }
327 
328     if (!LHS->getType()->isIntegerTy()) {
329       MarkAllSuccessorsLive(BB);
330       continue;
331     }
332 
333     // Can we prove constant true or false for this condition?
334     LHS = getValueOnFirstIteration(LHS, FirstIterValue, SQ);
335     RHS = getValueOnFirstIteration(RHS, FirstIterValue, SQ);
336     auto *KnownCondition =
337         dyn_cast_or_null<ConstantInt>(SimplifyICmpInst(Pred, LHS, RHS, SQ));
338     if (!KnownCondition) {
339       MarkAllSuccessorsLive(BB);
340       continue;
341     }
342     if (KnownCondition->isAllOnesValue())
343       MarkLiveEdge(BB, IfTrue);
344     else
345       MarkLiveEdge(BB, IfFalse);
346   }
347 
348   // We can break the latch if it wasn't live.
349   return !LiveEdges.count({ Latch, Header });
350 }
351 
352 /// If we can prove the backedge is untaken, remove it.  This destroys the
353 /// loop, but leaves the (now trivially loop invariant) control flow and
354 /// side effects (if any) in place.
355 static LoopDeletionResult
356 breakBackedgeIfNotTaken(Loop *L, DominatorTree &DT, ScalarEvolution &SE,
357                         LoopInfo &LI, MemorySSA *MSSA,
358                         OptimizationRemarkEmitter &ORE) {
359   assert(L->isLCSSAForm(DT) && "Expected LCSSA!");
360 
361   if (!L->getLoopLatch())
362     return LoopDeletionResult::Unmodified;
363 
364   auto *BTC = SE.getBackedgeTakenCount(L);
365   if (!isa<SCEVCouldNotCompute>(BTC) && SE.isKnownNonZero(BTC))
366     return LoopDeletionResult::Unmodified;
367   if (!BTC->isZero() && !canProveExitOnFirstIteration(L, DT, LI))
368     return LoopDeletionResult::Unmodified;
369 
370   breakLoopBackedge(L, DT, SE, LI, MSSA);
371   return LoopDeletionResult::Deleted;
372 }
373 
374 /// Remove a loop if it is dead.
375 ///
376 /// A loop is considered dead either if it does not impact the observable
377 /// behavior of the program other than finite running time, or if it is
378 /// required to make progress by an attribute such as 'mustprogress' or
379 /// 'llvm.loop.mustprogress' and does not make any. This may remove
380 /// infinite loops that have been required to make progress.
381 ///
382 /// This entire process relies pretty heavily on LoopSimplify form and LCSSA in
383 /// order to make various safety checks work.
384 ///
385 /// \returns true if any changes were made. This may mutate the loop even if it
386 /// is unable to delete it due to hoisting trivially loop invariant
387 /// instructions out of the loop.
388 static LoopDeletionResult deleteLoopIfDead(Loop *L, DominatorTree &DT,
389                                            ScalarEvolution &SE, LoopInfo &LI,
390                                            MemorySSA *MSSA,
391                                            OptimizationRemarkEmitter &ORE) {
392   assert(L->isLCSSAForm(DT) && "Expected LCSSA!");
393 
394   // We can only remove the loop if there is a preheader that we can branch from
395   // after removing it. Also, if LoopSimplify form is not available, stay out
396   // of trouble.
397   BasicBlock *Preheader = L->getLoopPreheader();
398   if (!Preheader || !L->hasDedicatedExits()) {
399     LLVM_DEBUG(
400         dbgs()
401         << "Deletion requires Loop with preheader and dedicated exits.\n");
402     return LoopDeletionResult::Unmodified;
403   }
404 
405   BasicBlock *ExitBlock = L->getUniqueExitBlock();
406 
407   if (ExitBlock && isLoopNeverExecuted(L)) {
408     LLVM_DEBUG(dbgs() << "Loop is proven to never execute, delete it!");
409     // We need to forget the loop before setting the incoming values of the exit
410     // phis to undef, so we properly invalidate the SCEV expressions for those
411     // phis.
412     SE.forgetLoop(L);
413     // Set incoming value to undef for phi nodes in the exit block.
414     for (PHINode &P : ExitBlock->phis()) {
415       std::fill(P.incoming_values().begin(), P.incoming_values().end(),
416                 UndefValue::get(P.getType()));
417     }
418     ORE.emit([&]() {
419       return OptimizationRemark(DEBUG_TYPE, "NeverExecutes", L->getStartLoc(),
420                                 L->getHeader())
421              << "Loop deleted because it never executes";
422     });
423     deleteDeadLoop(L, &DT, &SE, &LI, MSSA);
424     ++NumDeleted;
425     return LoopDeletionResult::Deleted;
426   }
427 
428   // The remaining checks below are for a loop being dead because all statements
429   // in the loop are invariant.
430   SmallVector<BasicBlock *, 4> ExitingBlocks;
431   L->getExitingBlocks(ExitingBlocks);
432 
433   // We require that the loop has at most one exit block. Otherwise, we'd be in
434   // the situation of needing to be able to solve statically which exit block
435   // will be branched to, or trying to preserve the branching logic in a loop
436   // invariant manner.
437   if (!ExitBlock && !L->hasNoExitBlocks()) {
438     LLVM_DEBUG(dbgs() << "Deletion requires at most one exit block.\n");
439     return LoopDeletionResult::Unmodified;
440   }
441   // Finally, we have to check that the loop really is dead.
442   bool Changed = false;
443   if (!isLoopDead(L, SE, ExitingBlocks, ExitBlock, Changed, Preheader, LI)) {
444     LLVM_DEBUG(dbgs() << "Loop is not invariant, cannot delete.\n");
445     return Changed ? LoopDeletionResult::Modified
446                    : LoopDeletionResult::Unmodified;
447   }
448 
449   LLVM_DEBUG(dbgs() << "Loop is invariant, delete it!");
450   ORE.emit([&]() {
451     return OptimizationRemark(DEBUG_TYPE, "Invariant", L->getStartLoc(),
452                               L->getHeader())
453            << "Loop deleted because it is invariant";
454   });
455   deleteDeadLoop(L, &DT, &SE, &LI, MSSA);
456   ++NumDeleted;
457 
458   return LoopDeletionResult::Deleted;
459 }
460 
461 PreservedAnalyses LoopDeletionPass::run(Loop &L, LoopAnalysisManager &AM,
462                                         LoopStandardAnalysisResults &AR,
463                                         LPMUpdater &Updater) {
464 
465   LLVM_DEBUG(dbgs() << "Analyzing Loop for deletion: ");
466   LLVM_DEBUG(L.dump());
467   std::string LoopName = std::string(L.getName());
468   // For the new PM, we can't use OptimizationRemarkEmitter as an analysis
469   // pass. Function analyses need to be preserved across loop transformations
470   // but ORE cannot be preserved (see comment before the pass definition).
471   OptimizationRemarkEmitter ORE(L.getHeader()->getParent());
472   auto Result = deleteLoopIfDead(&L, AR.DT, AR.SE, AR.LI, AR.MSSA, ORE);
473 
474   // If we can prove the backedge isn't taken, just break it and be done.  This
475   // leaves the loop structure in place which means it can handle dispatching
476   // to the right exit based on whatever loop invariant structure remains.
477   if (Result != LoopDeletionResult::Deleted)
478     Result = merge(Result, breakBackedgeIfNotTaken(&L, AR.DT, AR.SE, AR.LI,
479                                                    AR.MSSA, ORE));
480 
481   if (Result == LoopDeletionResult::Unmodified)
482     return PreservedAnalyses::all();
483 
484   if (Result == LoopDeletionResult::Deleted)
485     Updater.markLoopAsDeleted(L, LoopName);
486 
487   auto PA = getLoopPassPreservedAnalyses();
488   if (AR.MSSA)
489     PA.preserve<MemorySSAAnalysis>();
490   return PA;
491 }
492 
493 namespace {
494 class LoopDeletionLegacyPass : public LoopPass {
495 public:
496   static char ID; // Pass ID, replacement for typeid
497   LoopDeletionLegacyPass() : LoopPass(ID) {
498     initializeLoopDeletionLegacyPassPass(*PassRegistry::getPassRegistry());
499   }
500 
501   // Possibly eliminate loop L if it is dead.
502   bool runOnLoop(Loop *L, LPPassManager &) override;
503 
504   void getAnalysisUsage(AnalysisUsage &AU) const override {
505     AU.addPreserved<MemorySSAWrapperPass>();
506     getLoopAnalysisUsage(AU);
507   }
508 };
509 }
510 
511 char LoopDeletionLegacyPass::ID = 0;
512 INITIALIZE_PASS_BEGIN(LoopDeletionLegacyPass, "loop-deletion",
513                       "Delete dead loops", false, false)
514 INITIALIZE_PASS_DEPENDENCY(LoopPass)
515 INITIALIZE_PASS_END(LoopDeletionLegacyPass, "loop-deletion",
516                     "Delete dead loops", false, false)
517 
518 Pass *llvm::createLoopDeletionPass() { return new LoopDeletionLegacyPass(); }
519 
520 bool LoopDeletionLegacyPass::runOnLoop(Loop *L, LPPassManager &LPM) {
521   if (skipLoop(L))
522     return false;
523   DominatorTree &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree();
524   ScalarEvolution &SE = getAnalysis<ScalarEvolutionWrapperPass>().getSE();
525   LoopInfo &LI = getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
526   auto *MSSAAnalysis = getAnalysisIfAvailable<MemorySSAWrapperPass>();
527   MemorySSA *MSSA = nullptr;
528   if (MSSAAnalysis)
529     MSSA = &MSSAAnalysis->getMSSA();
530   // For the old PM, we can't use OptimizationRemarkEmitter as an analysis
531   // pass.  Function analyses need to be preserved across loop transformations
532   // but ORE cannot be preserved (see comment before the pass definition).
533   OptimizationRemarkEmitter ORE(L->getHeader()->getParent());
534 
535   LLVM_DEBUG(dbgs() << "Analyzing Loop for deletion: ");
536   LLVM_DEBUG(L->dump());
537 
538   LoopDeletionResult Result = deleteLoopIfDead(L, DT, SE, LI, MSSA, ORE);
539 
540   // If we can prove the backedge isn't taken, just break it and be done.  This
541   // leaves the loop structure in place which means it can handle dispatching
542   // to the right exit based on whatever loop invariant structure remains.
543   if (Result != LoopDeletionResult::Deleted)
544     Result = merge(Result, breakBackedgeIfNotTaken(L, DT, SE, LI, MSSA, ORE));
545 
546   if (Result == LoopDeletionResult::Deleted)
547     LPM.markLoopAsDeleted(*L);
548 
549   return Result != LoopDeletionResult::Unmodified;
550 }
551