//===- LoopVersioning.cpp - Utility to version a loop ---------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file defines a utility class to perform loop versioning.  The versioned
// loop speculates that otherwise may-aliasing memory accesses don't overlap and
// emits checks to prove this.
//
//===----------------------------------------------------------------------===//
15215746b4SAdam Nemet 
#include "llvm/Transforms/Utils/LoopVersioning.h"
#include "llvm/ADT/SmallVector.h"
#include "llvm/Analysis/LoopAccessAnalysis.h"
#include "llvm/Analysis/LoopInfo.h"
#include "llvm/Analysis/ScalarEvolutionExpander.h"
#include "llvm/IR/Dominators.h"
#include "llvm/IR/MDBuilder.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/Transforms/Utils/BasicBlockUtils.h"
#include "llvm/Transforms/Utils/Cloning.h"

using namespace llvm;
26215746b4SAdam Nemet 
27*5eccf07dSAdam Nemet static cl::opt<bool>
28*5eccf07dSAdam Nemet     AnnotateNoAlias("loop-version-annotate-no-alias", cl::init(true),
29*5eccf07dSAdam Nemet                     cl::Hidden,
30*5eccf07dSAdam Nemet                     cl::desc("Add no-alias annotation for instructions that "
31*5eccf07dSAdam Nemet                              "are disambiguated by memchecks"));
32*5eccf07dSAdam Nemet 
332910a4f6SSilviu Baranga LoopVersioning::LoopVersioning(const LoopAccessInfo &LAI, Loop *L, LoopInfo *LI,
342910a4f6SSilviu Baranga                                DominatorTree *DT, ScalarEvolution *SE,
352910a4f6SSilviu Baranga                                bool UseLAIChecks)
362910a4f6SSilviu Baranga     : VersionedLoop(L), NonVersionedLoop(nullptr), LAI(LAI), LI(LI), DT(DT),
372910a4f6SSilviu Baranga       SE(SE) {
38215746b4SAdam Nemet   assert(L->getExitBlock() && "No single exit block");
39215746b4SAdam Nemet   assert(L->getLoopPreheader() && "No preheader");
402910a4f6SSilviu Baranga   if (UseLAIChecks) {
412910a4f6SSilviu Baranga     setAliasChecks(LAI.getRuntimePointerChecking()->getChecks());
429cd9a7e3SSilviu Baranga     setSCEVChecks(LAI.PSE.getUnionPredicate());
432910a4f6SSilviu Baranga   }
44215746b4SAdam Nemet }
45215746b4SAdam Nemet 
462910a4f6SSilviu Baranga void LoopVersioning::setAliasChecks(
472910a4f6SSilviu Baranga     const SmallVector<RuntimePointerChecking::PointerCheck, 4> Checks) {
482910a4f6SSilviu Baranga   AliasChecks = std::move(Checks);
492910a4f6SSilviu Baranga }
502910a4f6SSilviu Baranga 
512910a4f6SSilviu Baranga void LoopVersioning::setSCEVChecks(SCEVUnionPredicate Check) {
522910a4f6SSilviu Baranga   Preds = std::move(Check);
53dfaeb33eSAdam Nemet }
54dfaeb33eSAdam Nemet 
55e4813409SAdam Nemet void LoopVersioning::versionLoop(
56e4813409SAdam Nemet     const SmallVectorImpl<Instruction *> &DefsUsedOutside) {
57215746b4SAdam Nemet   Instruction *FirstCheckInst;
58215746b4SAdam Nemet   Instruction *MemRuntimeCheck;
592910a4f6SSilviu Baranga   Value *SCEVRuntimeCheck;
602910a4f6SSilviu Baranga   Value *RuntimeCheck = nullptr;
612910a4f6SSilviu Baranga 
62215746b4SAdam Nemet   // Add the memcheck in the original preheader (this is empty initially).
632910a4f6SSilviu Baranga   BasicBlock *RuntimeCheckBB = VersionedLoop->getLoopPreheader();
64215746b4SAdam Nemet   std::tie(FirstCheckInst, MemRuntimeCheck) =
652910a4f6SSilviu Baranga       LAI.addRuntimeChecks(RuntimeCheckBB->getTerminator(), AliasChecks);
66215746b4SAdam Nemet 
679cd9a7e3SSilviu Baranga   const SCEVUnionPredicate &Pred = LAI.PSE.getUnionPredicate();
682910a4f6SSilviu Baranga   SCEVExpander Exp(*SE, RuntimeCheckBB->getModule()->getDataLayout(),
692910a4f6SSilviu Baranga                    "scev.check");
702910a4f6SSilviu Baranga   SCEVRuntimeCheck =
712910a4f6SSilviu Baranga       Exp.expandCodeForPredicate(&Pred, RuntimeCheckBB->getTerminator());
722910a4f6SSilviu Baranga   auto *CI = dyn_cast<ConstantInt>(SCEVRuntimeCheck);
732910a4f6SSilviu Baranga 
742910a4f6SSilviu Baranga   // Discard the SCEV runtime check if it is always true.
752910a4f6SSilviu Baranga   if (CI && CI->isZero())
762910a4f6SSilviu Baranga     SCEVRuntimeCheck = nullptr;
772910a4f6SSilviu Baranga 
782910a4f6SSilviu Baranga   if (MemRuntimeCheck && SCEVRuntimeCheck) {
792910a4f6SSilviu Baranga     RuntimeCheck = BinaryOperator::Create(Instruction::Or, MemRuntimeCheck,
802910a4f6SSilviu Baranga                                           SCEVRuntimeCheck, "ldist.safe");
812910a4f6SSilviu Baranga     if (auto *I = dyn_cast<Instruction>(RuntimeCheck))
822910a4f6SSilviu Baranga       I->insertBefore(RuntimeCheckBB->getTerminator());
832910a4f6SSilviu Baranga   } else
842910a4f6SSilviu Baranga     RuntimeCheck = MemRuntimeCheck ? MemRuntimeCheck : SCEVRuntimeCheck;
852910a4f6SSilviu Baranga 
862910a4f6SSilviu Baranga   assert(RuntimeCheck && "called even though we don't need "
872910a4f6SSilviu Baranga                          "any runtime checks");
882910a4f6SSilviu Baranga 
89215746b4SAdam Nemet   // Rename the block to make the IR more readable.
902910a4f6SSilviu Baranga   RuntimeCheckBB->setName(VersionedLoop->getHeader()->getName() +
912910a4f6SSilviu Baranga                           ".lver.check");
92215746b4SAdam Nemet 
93215746b4SAdam Nemet   // Create empty preheader for the loop (and after cloning for the
94215746b4SAdam Nemet   // non-versioned loop).
952910a4f6SSilviu Baranga   BasicBlock *PH =
962910a4f6SSilviu Baranga       SplitBlock(RuntimeCheckBB, RuntimeCheckBB->getTerminator(), DT, LI);
97215746b4SAdam Nemet   PH->setName(VersionedLoop->getHeader()->getName() + ".ph");
98215746b4SAdam Nemet 
99215746b4SAdam Nemet   // Clone the loop including the preheader.
100215746b4SAdam Nemet   //
101215746b4SAdam Nemet   // FIXME: This does not currently preserve SimplifyLoop because the exit
102215746b4SAdam Nemet   // block is a join between the two loops.
103215746b4SAdam Nemet   SmallVector<BasicBlock *, 8> NonVersionedLoopBlocks;
104215746b4SAdam Nemet   NonVersionedLoop =
1052910a4f6SSilviu Baranga       cloneLoopWithPreheader(PH, RuntimeCheckBB, VersionedLoop, VMap,
1062910a4f6SSilviu Baranga                              ".lver.orig", LI, DT, NonVersionedLoopBlocks);
107215746b4SAdam Nemet   remapInstructionsInBlocks(NonVersionedLoopBlocks, VMap);
108215746b4SAdam Nemet 
109215746b4SAdam Nemet   // Insert the conditional branch based on the result of the memchecks.
1102910a4f6SSilviu Baranga   Instruction *OrigTerm = RuntimeCheckBB->getTerminator();
111215746b4SAdam Nemet   BranchInst::Create(NonVersionedLoop->getLoopPreheader(),
1122910a4f6SSilviu Baranga                      VersionedLoop->getLoopPreheader(), RuntimeCheck, OrigTerm);
113215746b4SAdam Nemet   OrigTerm->eraseFromParent();
114215746b4SAdam Nemet 
115215746b4SAdam Nemet   // The loops merge in the original exit block.  This is now dominated by the
116215746b4SAdam Nemet   // memchecking block.
1172910a4f6SSilviu Baranga   DT->changeImmediateDominator(VersionedLoop->getExitBlock(), RuntimeCheckBB);
118e4813409SAdam Nemet 
119e4813409SAdam Nemet   // Adds the necessary PHI nodes for the versioned loops based on the
120e4813409SAdam Nemet   // loop-defined values used outside of the loop.
121e4813409SAdam Nemet   addPHINodes(DefsUsedOutside);
122215746b4SAdam Nemet }
123215746b4SAdam Nemet 
124215746b4SAdam Nemet void LoopVersioning::addPHINodes(
125215746b4SAdam Nemet     const SmallVectorImpl<Instruction *> &DefsUsedOutside) {
126215746b4SAdam Nemet   BasicBlock *PHIBlock = VersionedLoop->getExitBlock();
127215746b4SAdam Nemet   assert(PHIBlock && "No single successor to loop exit block");
128215746b4SAdam Nemet 
129215746b4SAdam Nemet   for (auto *Inst : DefsUsedOutside) {
130215746b4SAdam Nemet     auto *NonVersionedLoopInst = cast<Instruction>(VMap[Inst]);
131215746b4SAdam Nemet     PHINode *PN;
132215746b4SAdam Nemet 
133215746b4SAdam Nemet     // First see if we have a single-operand PHI with the value defined by the
134215746b4SAdam Nemet     // original loop.
135215746b4SAdam Nemet     for (auto I = PHIBlock->begin(); (PN = dyn_cast<PHINode>(I)); ++I) {
136215746b4SAdam Nemet       assert(PN->getNumOperands() == 1 &&
137215746b4SAdam Nemet              "Exit block should only have on predecessor");
138215746b4SAdam Nemet       if (PN->getIncomingValue(0) == Inst)
139215746b4SAdam Nemet         break;
140215746b4SAdam Nemet     }
141215746b4SAdam Nemet     // If not create it.
142215746b4SAdam Nemet     if (!PN) {
143215746b4SAdam Nemet       PN = PHINode::Create(Inst->getType(), 2, Inst->getName() + ".lver",
1445b4c837cSDuncan P. N. Exon Smith                            &PHIBlock->front());
145215746b4SAdam Nemet       for (auto *User : Inst->users())
146215746b4SAdam Nemet         if (!VersionedLoop->contains(cast<Instruction>(User)->getParent()))
147215746b4SAdam Nemet           User->replaceUsesOfWith(Inst, PN);
148215746b4SAdam Nemet       PN->addIncoming(Inst, VersionedLoop->getExitingBlock());
149215746b4SAdam Nemet     }
150215746b4SAdam Nemet     // Add the new incoming value from the non-versioned loop.
151215746b4SAdam Nemet     PN->addIncoming(NonVersionedLoopInst, NonVersionedLoop->getExitingBlock());
152215746b4SAdam Nemet   }
153215746b4SAdam Nemet }
154d52ed841SAdam Nemet 
155*5eccf07dSAdam Nemet void LoopVersioning::prepareNoAliasMetadata() {
156*5eccf07dSAdam Nemet   // We need to turn the no-alias relation between pointer checking groups into
157*5eccf07dSAdam Nemet   // no-aliasing annotations between instructions.
158*5eccf07dSAdam Nemet   //
159*5eccf07dSAdam Nemet   // We accomplish this by mapping each pointer checking group (a set of
160*5eccf07dSAdam Nemet   // pointers memchecked together) to an alias scope and then also mapping each
161*5eccf07dSAdam Nemet   // group to the list of scopes it can't alias.
162*5eccf07dSAdam Nemet 
163*5eccf07dSAdam Nemet   const RuntimePointerChecking *RtPtrChecking = LAI.getRuntimePointerChecking();
164*5eccf07dSAdam Nemet   LLVMContext &Context = VersionedLoop->getHeader()->getContext();
165*5eccf07dSAdam Nemet 
166*5eccf07dSAdam Nemet   // First allocate an aliasing scope for each pointer checking group.
167*5eccf07dSAdam Nemet   //
168*5eccf07dSAdam Nemet   // While traversing through the checking groups in the loop, also create a
169*5eccf07dSAdam Nemet   // reverse map from pointers to the pointer checking group they were assigned
170*5eccf07dSAdam Nemet   // to.
171*5eccf07dSAdam Nemet   MDBuilder MDB(Context);
172*5eccf07dSAdam Nemet   MDNode *Domain = MDB.createAnonymousAliasScopeDomain("LVerDomain");
173*5eccf07dSAdam Nemet 
174*5eccf07dSAdam Nemet   for (const auto &Group : RtPtrChecking->CheckingGroups) {
175*5eccf07dSAdam Nemet     GroupToScope[&Group] = MDB.createAnonymousAliasScope(Domain);
176*5eccf07dSAdam Nemet 
177*5eccf07dSAdam Nemet     for (unsigned PtrIdx : Group.Members)
178*5eccf07dSAdam Nemet       PtrToGroup[RtPtrChecking->getPointerInfo(PtrIdx).PointerValue] = &Group;
179*5eccf07dSAdam Nemet   }
180*5eccf07dSAdam Nemet 
181*5eccf07dSAdam Nemet   // Go through the checks and for each pointer group, collect the scopes for
182*5eccf07dSAdam Nemet   // each non-aliasing pointer group.
183*5eccf07dSAdam Nemet   DenseMap<const RuntimePointerChecking::CheckingPtrGroup *,
184*5eccf07dSAdam Nemet            SmallVector<Metadata *, 4>>
185*5eccf07dSAdam Nemet       GroupToNonAliasingScopes;
186*5eccf07dSAdam Nemet 
187*5eccf07dSAdam Nemet   for (const auto &Check : AliasChecks)
188*5eccf07dSAdam Nemet     GroupToNonAliasingScopes[Check.first].push_back(GroupToScope[Check.second]);
189*5eccf07dSAdam Nemet 
190*5eccf07dSAdam Nemet   // Finally, transform the above to actually map to scope list which is what
191*5eccf07dSAdam Nemet   // the metadata uses.
192*5eccf07dSAdam Nemet 
193*5eccf07dSAdam Nemet   for (auto Pair : GroupToNonAliasingScopes)
194*5eccf07dSAdam Nemet     GroupToNonAliasingScopeList[Pair.first] = MDNode::get(Context, Pair.second);
195*5eccf07dSAdam Nemet }
196*5eccf07dSAdam Nemet 
197*5eccf07dSAdam Nemet void LoopVersioning::annotateLoopWithNoAlias() {
198*5eccf07dSAdam Nemet   if (!AnnotateNoAlias)
199*5eccf07dSAdam Nemet     return;
200*5eccf07dSAdam Nemet 
201*5eccf07dSAdam Nemet   // First prepare the maps.
202*5eccf07dSAdam Nemet   prepareNoAliasMetadata();
203*5eccf07dSAdam Nemet 
204*5eccf07dSAdam Nemet   // Add the scope and no-alias metadata to the instructions.
205*5eccf07dSAdam Nemet   for (Instruction *I : LAI.getDepChecker().getMemoryInstructions()) {
206*5eccf07dSAdam Nemet     annotateInstWithNoAlias(I);
207*5eccf07dSAdam Nemet   }
208*5eccf07dSAdam Nemet }
209*5eccf07dSAdam Nemet 
210*5eccf07dSAdam Nemet void LoopVersioning::annotateInstWithNoAlias(Instruction *I) {
211*5eccf07dSAdam Nemet   if (!AnnotateNoAlias)
212*5eccf07dSAdam Nemet     return;
213*5eccf07dSAdam Nemet 
214*5eccf07dSAdam Nemet   LLVMContext &Context = VersionedLoop->getHeader()->getContext();
215*5eccf07dSAdam Nemet   Value *Ptr = isa<LoadInst>(I) ? cast<LoadInst>(I)->getPointerOperand()
216*5eccf07dSAdam Nemet                                 : cast<StoreInst>(I)->getPointerOperand();
217*5eccf07dSAdam Nemet 
218*5eccf07dSAdam Nemet   // Find the group for the pointer and then add the scope metadata.
219*5eccf07dSAdam Nemet   auto Group = PtrToGroup.find(Ptr);
220*5eccf07dSAdam Nemet   if (Group != PtrToGroup.end()) {
221*5eccf07dSAdam Nemet     I->setMetadata(
222*5eccf07dSAdam Nemet         LLVMContext::MD_alias_scope,
223*5eccf07dSAdam Nemet         MDNode::concatenate(I->getMetadata(LLVMContext::MD_alias_scope),
224*5eccf07dSAdam Nemet                             MDNode::get(Context, GroupToScope[Group->second])));
225*5eccf07dSAdam Nemet 
226*5eccf07dSAdam Nemet     // Add the no-alias metadata.
227*5eccf07dSAdam Nemet     auto NonAliasingScopeList = GroupToNonAliasingScopeList.find(Group->second);
228*5eccf07dSAdam Nemet     if (NonAliasingScopeList != GroupToNonAliasingScopeList.end())
229*5eccf07dSAdam Nemet       I->setMetadata(
230*5eccf07dSAdam Nemet           LLVMContext::MD_noalias,
231*5eccf07dSAdam Nemet           MDNode::concatenate(I->getMetadata(LLVMContext::MD_noalias),
232*5eccf07dSAdam Nemet                               NonAliasingScopeList->second));
233*5eccf07dSAdam Nemet   }
234*5eccf07dSAdam Nemet }
235*5eccf07dSAdam Nemet 
236d52ed841SAdam Nemet namespace {
237d52ed841SAdam Nemet /// \brief Also expose this is a pass.  Currently this is only used for
238d52ed841SAdam Nemet /// unit-testing.  It adds all memchecks necessary to remove all may-aliasing
239d52ed841SAdam Nemet /// array accesses from the loop.
240d52ed841SAdam Nemet class LoopVersioningPass : public FunctionPass {
241d52ed841SAdam Nemet public:
242d52ed841SAdam Nemet   LoopVersioningPass() : FunctionPass(ID) {
243d52ed841SAdam Nemet     initializeLoopVersioningPassPass(*PassRegistry::getPassRegistry());
244d52ed841SAdam Nemet   }
245d52ed841SAdam Nemet 
246d52ed841SAdam Nemet   bool runOnFunction(Function &F) override {
247d52ed841SAdam Nemet     auto *LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
248d52ed841SAdam Nemet     auto *LAA = &getAnalysis<LoopAccessAnalysis>();
249d52ed841SAdam Nemet     auto *DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();
250d52ed841SAdam Nemet     auto *SE = &getAnalysis<ScalarEvolutionWrapperPass>().getSE();
251d52ed841SAdam Nemet 
252d52ed841SAdam Nemet     // Build up a worklist of inner-loops to version. This is necessary as the
253d52ed841SAdam Nemet     // act of versioning a loop creates new loops and can invalidate iterators
254d52ed841SAdam Nemet     // across the loops.
255d52ed841SAdam Nemet     SmallVector<Loop *, 8> Worklist;
256d52ed841SAdam Nemet 
257d52ed841SAdam Nemet     for (Loop *TopLevelLoop : *LI)
258d52ed841SAdam Nemet       for (Loop *L : depth_first(TopLevelLoop))
259d52ed841SAdam Nemet         // We only handle inner-most loops.
260d52ed841SAdam Nemet         if (L->empty())
261d52ed841SAdam Nemet           Worklist.push_back(L);
262d52ed841SAdam Nemet 
263d52ed841SAdam Nemet     // Now walk the identified inner loops.
264d52ed841SAdam Nemet     bool Changed = false;
265d52ed841SAdam Nemet     for (Loop *L : Worklist) {
266d52ed841SAdam Nemet       const LoopAccessInfo &LAI = LAA->getInfo(L, ValueToValueMap());
267d52ed841SAdam Nemet       if (LAI.getNumRuntimePointerChecks() ||
268d52ed841SAdam Nemet           !LAI.PSE.getUnionPredicate().isAlwaysTrue()) {
269d52ed841SAdam Nemet         LoopVersioning LVer(LAI, L, LI, DT, SE);
270d52ed841SAdam Nemet         LVer.versionLoop();
271*5eccf07dSAdam Nemet         LVer.annotateLoopWithNoAlias();
272d52ed841SAdam Nemet         Changed = true;
273d52ed841SAdam Nemet       }
274d52ed841SAdam Nemet     }
275d52ed841SAdam Nemet 
276d52ed841SAdam Nemet     return Changed;
277d52ed841SAdam Nemet   }
278d52ed841SAdam Nemet 
279d52ed841SAdam Nemet   void getAnalysisUsage(AnalysisUsage &AU) const override {
280d52ed841SAdam Nemet     AU.addRequired<LoopInfoWrapperPass>();
281d52ed841SAdam Nemet     AU.addPreserved<LoopInfoWrapperPass>();
282d52ed841SAdam Nemet     AU.addRequired<LoopAccessAnalysis>();
283d52ed841SAdam Nemet     AU.addRequired<DominatorTreeWrapperPass>();
284d52ed841SAdam Nemet     AU.addPreserved<DominatorTreeWrapperPass>();
285d52ed841SAdam Nemet     AU.addRequired<ScalarEvolutionWrapperPass>();
286d52ed841SAdam Nemet   }
287d52ed841SAdam Nemet 
288d52ed841SAdam Nemet   static char ID;
289d52ed841SAdam Nemet };
290d52ed841SAdam Nemet }
291d52ed841SAdam Nemet 
292d52ed841SAdam Nemet #define LVER_OPTION "loop-versioning"
293d52ed841SAdam Nemet #define DEBUG_TYPE LVER_OPTION
294d52ed841SAdam Nemet 
295d52ed841SAdam Nemet char LoopVersioningPass::ID;
296d52ed841SAdam Nemet static const char LVer_name[] = "Loop Versioning";
297d52ed841SAdam Nemet 
298d52ed841SAdam Nemet INITIALIZE_PASS_BEGIN(LoopVersioningPass, LVER_OPTION, LVer_name, false, false)
299d52ed841SAdam Nemet INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)
300d52ed841SAdam Nemet INITIALIZE_PASS_DEPENDENCY(LoopAccessAnalysis)
301d52ed841SAdam Nemet INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
302d52ed841SAdam Nemet INITIALIZE_PASS_DEPENDENCY(ScalarEvolutionWrapperPass)
303d52ed841SAdam Nemet INITIALIZE_PASS_END(LoopVersioningPass, LVER_OPTION, LVer_name, false, false)
304d52ed841SAdam Nemet 
305d52ed841SAdam Nemet namespace llvm {
306d52ed841SAdam Nemet FunctionPass *createLoopVersioningPass() {
307d52ed841SAdam Nemet   return new LoopVersioningPass();
308d52ed841SAdam Nemet }
309d52ed841SAdam Nemet }
310