1215746b4SAdam Nemet //===- LoopVersioning.cpp - Utility to version a loop ---------------------===//
2215746b4SAdam Nemet //
3215746b4SAdam Nemet //                     The LLVM Compiler Infrastructure
4215746b4SAdam Nemet //
5215746b4SAdam Nemet // This file is distributed under the University of Illinois Open Source
6215746b4SAdam Nemet // License. See LICENSE.TXT for details.
7215746b4SAdam Nemet //
8215746b4SAdam Nemet //===----------------------------------------------------------------------===//
9215746b4SAdam Nemet //
10215746b4SAdam Nemet // This file defines a utility class to perform loop versioning.  The versioned
11215746b4SAdam Nemet // loop speculates that otherwise may-aliasing memory accesses don't overlap and
12215746b4SAdam Nemet // emits checks to prove this.
13215746b4SAdam Nemet //
14215746b4SAdam Nemet //===----------------------------------------------------------------------===//
15215746b4SAdam Nemet 
1694c83370SDavid Blaikie #include "llvm/Transforms/Utils/LoopVersioning.h"
17215746b4SAdam Nemet #include "llvm/Analysis/LoopAccessAnalysis.h"
18215746b4SAdam Nemet #include "llvm/Analysis/LoopInfo.h"
192910a4f6SSilviu Baranga #include "llvm/Analysis/ScalarEvolutionExpander.h"
20215746b4SAdam Nemet #include "llvm/IR/Dominators.h"
215eccf07dSAdam Nemet #include "llvm/IR/MDBuilder.h"
22215746b4SAdam Nemet #include "llvm/Transforms/Utils/BasicBlockUtils.h"
23215746b4SAdam Nemet #include "llvm/Transforms/Utils/Cloning.h"
24215746b4SAdam Nemet 
25215746b4SAdam Nemet using namespace llvm;
26215746b4SAdam Nemet 
275eccf07dSAdam Nemet static cl::opt<bool>
285eccf07dSAdam Nemet     AnnotateNoAlias("loop-version-annotate-no-alias", cl::init(true),
295eccf07dSAdam Nemet                     cl::Hidden,
305eccf07dSAdam Nemet                     cl::desc("Add no-alias annotation for instructions that "
315eccf07dSAdam Nemet                              "are disambiguated by memchecks"));
325eccf07dSAdam Nemet 
332910a4f6SSilviu Baranga LoopVersioning::LoopVersioning(const LoopAccessInfo &LAI, Loop *L, LoopInfo *LI,
342910a4f6SSilviu Baranga                                DominatorTree *DT, ScalarEvolution *SE,
352910a4f6SSilviu Baranga                                bool UseLAIChecks)
362910a4f6SSilviu Baranga     : VersionedLoop(L), NonVersionedLoop(nullptr), LAI(LAI), LI(LI), DT(DT),
372910a4f6SSilviu Baranga       SE(SE) {
38215746b4SAdam Nemet   assert(L->getExitBlock() && "No single exit block");
39215746b4SAdam Nemet   assert(L->getLoopPreheader() && "No preheader");
402910a4f6SSilviu Baranga   if (UseLAIChecks) {
412910a4f6SSilviu Baranga     setAliasChecks(LAI.getRuntimePointerChecking()->getChecks());
429cd9a7e3SSilviu Baranga     setSCEVChecks(LAI.PSE.getUnionPredicate());
432910a4f6SSilviu Baranga   }
44215746b4SAdam Nemet }
45215746b4SAdam Nemet 
462910a4f6SSilviu Baranga void LoopVersioning::setAliasChecks(
472910a4f6SSilviu Baranga     const SmallVector<RuntimePointerChecking::PointerCheck, 4> Checks) {
482910a4f6SSilviu Baranga   AliasChecks = std::move(Checks);
492910a4f6SSilviu Baranga }
502910a4f6SSilviu Baranga 
512910a4f6SSilviu Baranga void LoopVersioning::setSCEVChecks(SCEVUnionPredicate Check) {
522910a4f6SSilviu Baranga   Preds = std::move(Check);
53dfaeb33eSAdam Nemet }
54dfaeb33eSAdam Nemet 
55e4813409SAdam Nemet void LoopVersioning::versionLoop(
56e4813409SAdam Nemet     const SmallVectorImpl<Instruction *> &DefsUsedOutside) {
57215746b4SAdam Nemet   Instruction *FirstCheckInst;
58215746b4SAdam Nemet   Instruction *MemRuntimeCheck;
592910a4f6SSilviu Baranga   Value *SCEVRuntimeCheck;
602910a4f6SSilviu Baranga   Value *RuntimeCheck = nullptr;
612910a4f6SSilviu Baranga 
62215746b4SAdam Nemet   // Add the memcheck in the original preheader (this is empty initially).
632910a4f6SSilviu Baranga   BasicBlock *RuntimeCheckBB = VersionedLoop->getLoopPreheader();
64215746b4SAdam Nemet   std::tie(FirstCheckInst, MemRuntimeCheck) =
652910a4f6SSilviu Baranga       LAI.addRuntimeChecks(RuntimeCheckBB->getTerminator(), AliasChecks);
66215746b4SAdam Nemet 
679cd9a7e3SSilviu Baranga   const SCEVUnionPredicate &Pred = LAI.PSE.getUnionPredicate();
682910a4f6SSilviu Baranga   SCEVExpander Exp(*SE, RuntimeCheckBB->getModule()->getDataLayout(),
692910a4f6SSilviu Baranga                    "scev.check");
702910a4f6SSilviu Baranga   SCEVRuntimeCheck =
712910a4f6SSilviu Baranga       Exp.expandCodeForPredicate(&Pred, RuntimeCheckBB->getTerminator());
722910a4f6SSilviu Baranga   auto *CI = dyn_cast<ConstantInt>(SCEVRuntimeCheck);
732910a4f6SSilviu Baranga 
742910a4f6SSilviu Baranga   // Discard the SCEV runtime check if it is always true.
752910a4f6SSilviu Baranga   if (CI && CI->isZero())
762910a4f6SSilviu Baranga     SCEVRuntimeCheck = nullptr;
772910a4f6SSilviu Baranga 
782910a4f6SSilviu Baranga   if (MemRuntimeCheck && SCEVRuntimeCheck) {
792910a4f6SSilviu Baranga     RuntimeCheck = BinaryOperator::Create(Instruction::Or, MemRuntimeCheck,
802910a4f6SSilviu Baranga                                           SCEVRuntimeCheck, "ldist.safe");
812910a4f6SSilviu Baranga     if (auto *I = dyn_cast<Instruction>(RuntimeCheck))
822910a4f6SSilviu Baranga       I->insertBefore(RuntimeCheckBB->getTerminator());
832910a4f6SSilviu Baranga   } else
842910a4f6SSilviu Baranga     RuntimeCheck = MemRuntimeCheck ? MemRuntimeCheck : SCEVRuntimeCheck;
852910a4f6SSilviu Baranga 
862910a4f6SSilviu Baranga   assert(RuntimeCheck && "called even though we don't need "
872910a4f6SSilviu Baranga                          "any runtime checks");
882910a4f6SSilviu Baranga 
89215746b4SAdam Nemet   // Rename the block to make the IR more readable.
902910a4f6SSilviu Baranga   RuntimeCheckBB->setName(VersionedLoop->getHeader()->getName() +
912910a4f6SSilviu Baranga                           ".lver.check");
92215746b4SAdam Nemet 
93215746b4SAdam Nemet   // Create empty preheader for the loop (and after cloning for the
94215746b4SAdam Nemet   // non-versioned loop).
952910a4f6SSilviu Baranga   BasicBlock *PH =
962910a4f6SSilviu Baranga       SplitBlock(RuntimeCheckBB, RuntimeCheckBB->getTerminator(), DT, LI);
97215746b4SAdam Nemet   PH->setName(VersionedLoop->getHeader()->getName() + ".ph");
98215746b4SAdam Nemet 
99215746b4SAdam Nemet   // Clone the loop including the preheader.
100215746b4SAdam Nemet   //
101215746b4SAdam Nemet   // FIXME: This does not currently preserve SimplifyLoop because the exit
102215746b4SAdam Nemet   // block is a join between the two loops.
103215746b4SAdam Nemet   SmallVector<BasicBlock *, 8> NonVersionedLoopBlocks;
104215746b4SAdam Nemet   NonVersionedLoop =
1052910a4f6SSilviu Baranga       cloneLoopWithPreheader(PH, RuntimeCheckBB, VersionedLoop, VMap,
1062910a4f6SSilviu Baranga                              ".lver.orig", LI, DT, NonVersionedLoopBlocks);
107215746b4SAdam Nemet   remapInstructionsInBlocks(NonVersionedLoopBlocks, VMap);
108215746b4SAdam Nemet 
109215746b4SAdam Nemet   // Insert the conditional branch based on the result of the memchecks.
1102910a4f6SSilviu Baranga   Instruction *OrigTerm = RuntimeCheckBB->getTerminator();
111215746b4SAdam Nemet   BranchInst::Create(NonVersionedLoop->getLoopPreheader(),
1122910a4f6SSilviu Baranga                      VersionedLoop->getLoopPreheader(), RuntimeCheck, OrigTerm);
113215746b4SAdam Nemet   OrigTerm->eraseFromParent();
114215746b4SAdam Nemet 
115215746b4SAdam Nemet   // The loops merge in the original exit block.  This is now dominated by the
116215746b4SAdam Nemet   // memchecking block.
1172910a4f6SSilviu Baranga   DT->changeImmediateDominator(VersionedLoop->getExitBlock(), RuntimeCheckBB);
118e4813409SAdam Nemet 
119e4813409SAdam Nemet   // Adds the necessary PHI nodes for the versioned loops based on the
120e4813409SAdam Nemet   // loop-defined values used outside of the loop.
121e4813409SAdam Nemet   addPHINodes(DefsUsedOutside);
122215746b4SAdam Nemet }
123215746b4SAdam Nemet 
124215746b4SAdam Nemet void LoopVersioning::addPHINodes(
125215746b4SAdam Nemet     const SmallVectorImpl<Instruction *> &DefsUsedOutside) {
126215746b4SAdam Nemet   BasicBlock *PHIBlock = VersionedLoop->getExitBlock();
127215746b4SAdam Nemet   assert(PHIBlock && "No single successor to loop exit block");
128215746b4SAdam Nemet 
129215746b4SAdam Nemet   for (auto *Inst : DefsUsedOutside) {
130215746b4SAdam Nemet     auto *NonVersionedLoopInst = cast<Instruction>(VMap[Inst]);
131215746b4SAdam Nemet     PHINode *PN;
132215746b4SAdam Nemet 
133215746b4SAdam Nemet     // First see if we have a single-operand PHI with the value defined by the
134215746b4SAdam Nemet     // original loop.
135215746b4SAdam Nemet     for (auto I = PHIBlock->begin(); (PN = dyn_cast<PHINode>(I)); ++I) {
136215746b4SAdam Nemet       assert(PN->getNumOperands() == 1 &&
137215746b4SAdam Nemet              "Exit block should only have on predecessor");
138215746b4SAdam Nemet       if (PN->getIncomingValue(0) == Inst)
139215746b4SAdam Nemet         break;
140215746b4SAdam Nemet     }
141215746b4SAdam Nemet     // If not create it.
142215746b4SAdam Nemet     if (!PN) {
143215746b4SAdam Nemet       PN = PHINode::Create(Inst->getType(), 2, Inst->getName() + ".lver",
1445b4c837cSDuncan P. N. Exon Smith                            &PHIBlock->front());
145215746b4SAdam Nemet       for (auto *User : Inst->users())
146215746b4SAdam Nemet         if (!VersionedLoop->contains(cast<Instruction>(User)->getParent()))
147215746b4SAdam Nemet           User->replaceUsesOfWith(Inst, PN);
148215746b4SAdam Nemet       PN->addIncoming(Inst, VersionedLoop->getExitingBlock());
149215746b4SAdam Nemet     }
150215746b4SAdam Nemet     // Add the new incoming value from the non-versioned loop.
151215746b4SAdam Nemet     PN->addIncoming(NonVersionedLoopInst, NonVersionedLoop->getExitingBlock());
152215746b4SAdam Nemet   }
153215746b4SAdam Nemet }
154d52ed841SAdam Nemet 
1555eccf07dSAdam Nemet void LoopVersioning::prepareNoAliasMetadata() {
1565eccf07dSAdam Nemet   // We need to turn the no-alias relation between pointer checking groups into
1575eccf07dSAdam Nemet   // no-aliasing annotations between instructions.
1585eccf07dSAdam Nemet   //
1595eccf07dSAdam Nemet   // We accomplish this by mapping each pointer checking group (a set of
1605eccf07dSAdam Nemet   // pointers memchecked together) to an alias scope and then also mapping each
1615eccf07dSAdam Nemet   // group to the list of scopes it can't alias.
1625eccf07dSAdam Nemet 
1635eccf07dSAdam Nemet   const RuntimePointerChecking *RtPtrChecking = LAI.getRuntimePointerChecking();
1645eccf07dSAdam Nemet   LLVMContext &Context = VersionedLoop->getHeader()->getContext();
1655eccf07dSAdam Nemet 
1665eccf07dSAdam Nemet   // First allocate an aliasing scope for each pointer checking group.
1675eccf07dSAdam Nemet   //
1685eccf07dSAdam Nemet   // While traversing through the checking groups in the loop, also create a
1695eccf07dSAdam Nemet   // reverse map from pointers to the pointer checking group they were assigned
1705eccf07dSAdam Nemet   // to.
1715eccf07dSAdam Nemet   MDBuilder MDB(Context);
1725eccf07dSAdam Nemet   MDNode *Domain = MDB.createAnonymousAliasScopeDomain("LVerDomain");
1735eccf07dSAdam Nemet 
1745eccf07dSAdam Nemet   for (const auto &Group : RtPtrChecking->CheckingGroups) {
1755eccf07dSAdam Nemet     GroupToScope[&Group] = MDB.createAnonymousAliasScope(Domain);
1765eccf07dSAdam Nemet 
1775eccf07dSAdam Nemet     for (unsigned PtrIdx : Group.Members)
1785eccf07dSAdam Nemet       PtrToGroup[RtPtrChecking->getPointerInfo(PtrIdx).PointerValue] = &Group;
1795eccf07dSAdam Nemet   }
1805eccf07dSAdam Nemet 
1815eccf07dSAdam Nemet   // Go through the checks and for each pointer group, collect the scopes for
1825eccf07dSAdam Nemet   // each non-aliasing pointer group.
1835eccf07dSAdam Nemet   DenseMap<const RuntimePointerChecking::CheckingPtrGroup *,
1845eccf07dSAdam Nemet            SmallVector<Metadata *, 4>>
1855eccf07dSAdam Nemet       GroupToNonAliasingScopes;
1865eccf07dSAdam Nemet 
1875eccf07dSAdam Nemet   for (const auto &Check : AliasChecks)
1885eccf07dSAdam Nemet     GroupToNonAliasingScopes[Check.first].push_back(GroupToScope[Check.second]);
1895eccf07dSAdam Nemet 
1905eccf07dSAdam Nemet   // Finally, transform the above to actually map to scope list which is what
1915eccf07dSAdam Nemet   // the metadata uses.
1925eccf07dSAdam Nemet 
1935eccf07dSAdam Nemet   for (auto Pair : GroupToNonAliasingScopes)
1945eccf07dSAdam Nemet     GroupToNonAliasingScopeList[Pair.first] = MDNode::get(Context, Pair.second);
1955eccf07dSAdam Nemet }
1965eccf07dSAdam Nemet 
1975eccf07dSAdam Nemet void LoopVersioning::annotateLoopWithNoAlias() {
1985eccf07dSAdam Nemet   if (!AnnotateNoAlias)
1995eccf07dSAdam Nemet     return;
2005eccf07dSAdam Nemet 
2015eccf07dSAdam Nemet   // First prepare the maps.
2025eccf07dSAdam Nemet   prepareNoAliasMetadata();
2035eccf07dSAdam Nemet 
2045eccf07dSAdam Nemet   // Add the scope and no-alias metadata to the instructions.
2055eccf07dSAdam Nemet   for (Instruction *I : LAI.getDepChecker().getMemoryInstructions()) {
2065eccf07dSAdam Nemet     annotateInstWithNoAlias(I);
2075eccf07dSAdam Nemet   }
2085eccf07dSAdam Nemet }
2095eccf07dSAdam Nemet 
210*b0c4eae0SAdam Nemet void LoopVersioning::annotateInstWithNoAlias(Instruction *VersionedInst,
211*b0c4eae0SAdam Nemet                                              const Instruction *OrigInst) {
2125eccf07dSAdam Nemet   if (!AnnotateNoAlias)
2135eccf07dSAdam Nemet     return;
2145eccf07dSAdam Nemet 
2155eccf07dSAdam Nemet   LLVMContext &Context = VersionedLoop->getHeader()->getContext();
216*b0c4eae0SAdam Nemet   const Value *Ptr = isa<LoadInst>(OrigInst)
217*b0c4eae0SAdam Nemet                          ? cast<LoadInst>(OrigInst)->getPointerOperand()
218*b0c4eae0SAdam Nemet                          : cast<StoreInst>(OrigInst)->getPointerOperand();
2195eccf07dSAdam Nemet 
2205eccf07dSAdam Nemet   // Find the group for the pointer and then add the scope metadata.
2215eccf07dSAdam Nemet   auto Group = PtrToGroup.find(Ptr);
2225eccf07dSAdam Nemet   if (Group != PtrToGroup.end()) {
223*b0c4eae0SAdam Nemet     VersionedInst->setMetadata(
2245eccf07dSAdam Nemet         LLVMContext::MD_alias_scope,
225*b0c4eae0SAdam Nemet         MDNode::concatenate(
226*b0c4eae0SAdam Nemet             VersionedInst->getMetadata(LLVMContext::MD_alias_scope),
2275eccf07dSAdam Nemet             MDNode::get(Context, GroupToScope[Group->second])));
2285eccf07dSAdam Nemet 
2295eccf07dSAdam Nemet     // Add the no-alias metadata.
2305eccf07dSAdam Nemet     auto NonAliasingScopeList = GroupToNonAliasingScopeList.find(Group->second);
2315eccf07dSAdam Nemet     if (NonAliasingScopeList != GroupToNonAliasingScopeList.end())
232*b0c4eae0SAdam Nemet       VersionedInst->setMetadata(
2335eccf07dSAdam Nemet           LLVMContext::MD_noalias,
234*b0c4eae0SAdam Nemet           MDNode::concatenate(
235*b0c4eae0SAdam Nemet               VersionedInst->getMetadata(LLVMContext::MD_noalias),
2365eccf07dSAdam Nemet               NonAliasingScopeList->second));
2375eccf07dSAdam Nemet   }
2385eccf07dSAdam Nemet }
2395eccf07dSAdam Nemet 
240d52ed841SAdam Nemet namespace {
241d52ed841SAdam Nemet /// \brief Also expose this is a pass.  Currently this is only used for
242d52ed841SAdam Nemet /// unit-testing.  It adds all memchecks necessary to remove all may-aliasing
243d52ed841SAdam Nemet /// array accesses from the loop.
244d52ed841SAdam Nemet class LoopVersioningPass : public FunctionPass {
245d52ed841SAdam Nemet public:
246d52ed841SAdam Nemet   LoopVersioningPass() : FunctionPass(ID) {
247d52ed841SAdam Nemet     initializeLoopVersioningPassPass(*PassRegistry::getPassRegistry());
248d52ed841SAdam Nemet   }
249d52ed841SAdam Nemet 
250d52ed841SAdam Nemet   bool runOnFunction(Function &F) override {
251d52ed841SAdam Nemet     auto *LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
252d52ed841SAdam Nemet     auto *LAA = &getAnalysis<LoopAccessAnalysis>();
253d52ed841SAdam Nemet     auto *DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();
254d52ed841SAdam Nemet     auto *SE = &getAnalysis<ScalarEvolutionWrapperPass>().getSE();
255d52ed841SAdam Nemet 
256d52ed841SAdam Nemet     // Build up a worklist of inner-loops to version. This is necessary as the
257d52ed841SAdam Nemet     // act of versioning a loop creates new loops and can invalidate iterators
258d52ed841SAdam Nemet     // across the loops.
259d52ed841SAdam Nemet     SmallVector<Loop *, 8> Worklist;
260d52ed841SAdam Nemet 
261d52ed841SAdam Nemet     for (Loop *TopLevelLoop : *LI)
262d52ed841SAdam Nemet       for (Loop *L : depth_first(TopLevelLoop))
263d52ed841SAdam Nemet         // We only handle inner-most loops.
264d52ed841SAdam Nemet         if (L->empty())
265d52ed841SAdam Nemet           Worklist.push_back(L);
266d52ed841SAdam Nemet 
267d52ed841SAdam Nemet     // Now walk the identified inner loops.
268d52ed841SAdam Nemet     bool Changed = false;
269d52ed841SAdam Nemet     for (Loop *L : Worklist) {
270d52ed841SAdam Nemet       const LoopAccessInfo &LAI = LAA->getInfo(L, ValueToValueMap());
271d52ed841SAdam Nemet       if (LAI.getNumRuntimePointerChecks() ||
272d52ed841SAdam Nemet           !LAI.PSE.getUnionPredicate().isAlwaysTrue()) {
273d52ed841SAdam Nemet         LoopVersioning LVer(LAI, L, LI, DT, SE);
274d52ed841SAdam Nemet         LVer.versionLoop();
2755eccf07dSAdam Nemet         LVer.annotateLoopWithNoAlias();
276d52ed841SAdam Nemet         Changed = true;
277d52ed841SAdam Nemet       }
278d52ed841SAdam Nemet     }
279d52ed841SAdam Nemet 
280d52ed841SAdam Nemet     return Changed;
281d52ed841SAdam Nemet   }
282d52ed841SAdam Nemet 
283d52ed841SAdam Nemet   void getAnalysisUsage(AnalysisUsage &AU) const override {
284d52ed841SAdam Nemet     AU.addRequired<LoopInfoWrapperPass>();
285d52ed841SAdam Nemet     AU.addPreserved<LoopInfoWrapperPass>();
286d52ed841SAdam Nemet     AU.addRequired<LoopAccessAnalysis>();
287d52ed841SAdam Nemet     AU.addRequired<DominatorTreeWrapperPass>();
288d52ed841SAdam Nemet     AU.addPreserved<DominatorTreeWrapperPass>();
289d52ed841SAdam Nemet     AU.addRequired<ScalarEvolutionWrapperPass>();
290d52ed841SAdam Nemet   }
291d52ed841SAdam Nemet 
292d52ed841SAdam Nemet   static char ID;
293d52ed841SAdam Nemet };
294d52ed841SAdam Nemet }
295d52ed841SAdam Nemet 
// Name under which the pass is registered; it is reused as the debug type.
#define LVER_OPTION "loop-versioning"
#define DEBUG_TYPE LVER_OPTION

// Definition of the pass identifier declared inside LoopVersioningPass.
char LoopVersioningPass::ID;
// Human-readable pass name handed to the registration macros below.
static const char LVer_name[] = "Loop Versioning";

// Register the pass and list the analysis passes it depends on.
INITIALIZE_PASS_BEGIN(LoopVersioningPass, LVER_OPTION, LVer_name, false, false)
INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)
INITIALIZE_PASS_DEPENDENCY(LoopAccessAnalysis)
INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
INITIALIZE_PASS_DEPENDENCY(ScalarEvolutionWrapperPass)
INITIALIZE_PASS_END(LoopVersioningPass, LVER_OPTION, LVer_name, false, false)
308d52ed841SAdam Nemet 
309d52ed841SAdam Nemet namespace llvm {
310d52ed841SAdam Nemet FunctionPass *createLoopVersioningPass() {
311d52ed841SAdam Nemet   return new LoopVersioningPass();
312d52ed841SAdam Nemet }
313d52ed841SAdam Nemet }
314