10456327cSAdam Nemet //===- LoopAccessAnalysis.cpp - Loop Access Analysis Implementation --------==//
20456327cSAdam Nemet //
30456327cSAdam Nemet //                     The LLVM Compiler Infrastructure
40456327cSAdam Nemet //
50456327cSAdam Nemet // This file is distributed under the University of Illinois Open Source
60456327cSAdam Nemet // License. See LICENSE.TXT for details.
70456327cSAdam Nemet //
80456327cSAdam Nemet //===----------------------------------------------------------------------===//
90456327cSAdam Nemet //
100456327cSAdam Nemet // The implementation for the loop memory dependence that was originally
110456327cSAdam Nemet // developed for the loop vectorizer.
120456327cSAdam Nemet //
130456327cSAdam Nemet //===----------------------------------------------------------------------===//
140456327cSAdam Nemet 
150456327cSAdam Nemet #include "llvm/Analysis/LoopAccessAnalysis.h"
160456327cSAdam Nemet #include "llvm/Analysis/LoopInfo.h"
177206d7a5SAdam Nemet #include "llvm/Analysis/ScalarEvolutionExpander.h"
18799003bfSBenjamin Kramer #include "llvm/Analysis/TargetLibraryInfo.h"
190456327cSAdam Nemet #include "llvm/Analysis/ValueTracking.h"
200456327cSAdam Nemet #include "llvm/IR/DiagnosticInfo.h"
210456327cSAdam Nemet #include "llvm/IR/Dominators.h"
227206d7a5SAdam Nemet #include "llvm/IR/IRBuilder.h"
230456327cSAdam Nemet #include "llvm/Support/Debug.h"
24799003bfSBenjamin Kramer #include "llvm/Support/raw_ostream.h"
250456327cSAdam Nemet #include "llvm/Transforms/Utils/VectorUtils.h"
260456327cSAdam Nemet using namespace llvm;
270456327cSAdam Nemet 
28339f42b3SAdam Nemet #define DEBUG_TYPE "loop-accesses"
290456327cSAdam Nemet 
30f219c647SAdam Nemet static cl::opt<unsigned, true>
31f219c647SAdam Nemet VectorizationFactor("force-vector-width", cl::Hidden,
32f219c647SAdam Nemet                     cl::desc("Sets the SIMD width. Zero is autoselect."),
33f219c647SAdam Nemet                     cl::location(VectorizerParams::VectorizationFactor));
341d862af7SAdam Nemet unsigned VectorizerParams::VectorizationFactor;
35f219c647SAdam Nemet 
36f219c647SAdam Nemet static cl::opt<unsigned, true>
37f219c647SAdam Nemet VectorizationInterleave("force-vector-interleave", cl::Hidden,
38f219c647SAdam Nemet                         cl::desc("Sets the vectorization interleave count. "
39f219c647SAdam Nemet                                  "Zero is autoselect."),
40f219c647SAdam Nemet                         cl::location(
41f219c647SAdam Nemet                             VectorizerParams::VectorizationInterleave));
421d862af7SAdam Nemet unsigned VectorizerParams::VectorizationInterleave;
43f219c647SAdam Nemet 
441d862af7SAdam Nemet static cl::opt<unsigned, true> RuntimeMemoryCheckThreshold(
451d862af7SAdam Nemet     "runtime-memory-check-threshold", cl::Hidden,
461d862af7SAdam Nemet     cl::desc("When performing memory disambiguation checks at runtime do not "
471d862af7SAdam Nemet              "generate more than this number of comparisons (default = 8)."),
481d862af7SAdam Nemet     cl::location(VectorizerParams::RuntimeMemoryCheckThreshold), cl::init(8));
491d862af7SAdam Nemet unsigned VectorizerParams::RuntimeMemoryCheckThreshold;
50f219c647SAdam Nemet 
51f219c647SAdam Nemet /// Maximum SIMD width.
52f219c647SAdam Nemet const unsigned VectorizerParams::MaxVectorWidth = 64;
53f219c647SAdam Nemet 
549c926579SAdam Nemet /// \brief We collect interesting dependences up to this threshold.
559c926579SAdam Nemet static cl::opt<unsigned> MaxInterestingDependence(
569c926579SAdam Nemet     "max-interesting-dependences", cl::Hidden,
579c926579SAdam Nemet     cl::desc("Maximum number of interesting dependences collected by "
589c926579SAdam Nemet              "loop-access analysis (default = 100)"),
599c926579SAdam Nemet     cl::init(100));
609c926579SAdam Nemet 
61f219c647SAdam Nemet bool VectorizerParams::isInterleaveForced() {
62f219c647SAdam Nemet   return ::VectorizationInterleave.getNumOccurrences() > 0;
63f219c647SAdam Nemet }
64f219c647SAdam Nemet 
652bd6e984SAdam Nemet void LoopAccessReport::emitAnalysis(const LoopAccessReport &Message,
660456327cSAdam Nemet                                     const Function *TheFunction,
67339f42b3SAdam Nemet                                     const Loop *TheLoop,
68339f42b3SAdam Nemet                                     const char *PassName) {
690456327cSAdam Nemet   DebugLoc DL = TheLoop->getStartLoc();
703e87634fSAdam Nemet   if (const Instruction *I = Message.getInstr())
710456327cSAdam Nemet     DL = I->getDebugLoc();
72339f42b3SAdam Nemet   emitOptimizationRemarkAnalysis(TheFunction->getContext(), PassName,
730456327cSAdam Nemet                                  *TheFunction, DL, Message.str());
740456327cSAdam Nemet }
750456327cSAdam Nemet 
760456327cSAdam Nemet Value *llvm::stripIntegerCast(Value *V) {
770456327cSAdam Nemet   if (CastInst *CI = dyn_cast<CastInst>(V))
780456327cSAdam Nemet     if (CI->getOperand(0)->getType()->isIntegerTy())
790456327cSAdam Nemet       return CI->getOperand(0);
800456327cSAdam Nemet   return V;
810456327cSAdam Nemet }
820456327cSAdam Nemet 
830456327cSAdam Nemet const SCEV *llvm::replaceSymbolicStrideSCEV(ScalarEvolution *SE,
848bc61df9SAdam Nemet                                             const ValueToValueMap &PtrToStride,
850456327cSAdam Nemet                                             Value *Ptr, Value *OrigPtr) {
860456327cSAdam Nemet 
870456327cSAdam Nemet   const SCEV *OrigSCEV = SE->getSCEV(Ptr);
880456327cSAdam Nemet 
890456327cSAdam Nemet   // If there is an entry in the map return the SCEV of the pointer with the
900456327cSAdam Nemet   // symbolic stride replaced by one.
918bc61df9SAdam Nemet   ValueToValueMap::const_iterator SI =
928bc61df9SAdam Nemet       PtrToStride.find(OrigPtr ? OrigPtr : Ptr);
930456327cSAdam Nemet   if (SI != PtrToStride.end()) {
940456327cSAdam Nemet     Value *StrideVal = SI->second;
950456327cSAdam Nemet 
960456327cSAdam Nemet     // Strip casts.
970456327cSAdam Nemet     StrideVal = stripIntegerCast(StrideVal);
980456327cSAdam Nemet 
990456327cSAdam Nemet     // Replace symbolic stride by one.
1000456327cSAdam Nemet     Value *One = ConstantInt::get(StrideVal->getType(), 1);
1010456327cSAdam Nemet     ValueToValueMap RewriteMap;
1020456327cSAdam Nemet     RewriteMap[StrideVal] = One;
1030456327cSAdam Nemet 
1040456327cSAdam Nemet     const SCEV *ByOne =
1050456327cSAdam Nemet         SCEVParameterRewriter::rewrite(OrigSCEV, *SE, RewriteMap, true);
106339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Replacing SCEV: " << *OrigSCEV << " by: " << *ByOne
1070456327cSAdam Nemet                  << "\n");
1080456327cSAdam Nemet     return ByOne;
1090456327cSAdam Nemet   }
1100456327cSAdam Nemet 
1110456327cSAdam Nemet   // Otherwise, just return the SCEV of the original pointer.
1120456327cSAdam Nemet   return SE->getSCEV(Ptr);
1130456327cSAdam Nemet }
1140456327cSAdam Nemet 
1158bc61df9SAdam Nemet void LoopAccessInfo::RuntimePointerCheck::insert(
1168bc61df9SAdam Nemet     ScalarEvolution *SE, Loop *Lp, Value *Ptr, bool WritePtr, unsigned DepSetId,
1178bc61df9SAdam Nemet     unsigned ASId, const ValueToValueMap &Strides) {
1180456327cSAdam Nemet   // Get the stride replaced scev.
1190456327cSAdam Nemet   const SCEV *Sc = replaceSymbolicStrideSCEV(SE, Strides, Ptr);
1200456327cSAdam Nemet   const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(Sc);
1210456327cSAdam Nemet   assert(AR && "Invalid addrec expression");
1220456327cSAdam Nemet   const SCEV *Ex = SE->getBackedgeTakenCount(Lp);
1230456327cSAdam Nemet   const SCEV *ScEnd = AR->evaluateAtIteration(Ex, *SE);
1240456327cSAdam Nemet   Pointers.push_back(Ptr);
1250456327cSAdam Nemet   Starts.push_back(AR->getStart());
1260456327cSAdam Nemet   Ends.push_back(ScEnd);
1270456327cSAdam Nemet   IsWritePtr.push_back(WritePtr);
1280456327cSAdam Nemet   DependencySetId.push_back(DepSetId);
1290456327cSAdam Nemet   AliasSetId.push_back(ASId);
1300456327cSAdam Nemet }
1310456327cSAdam Nemet 
132ec1e2bb6SAdam Nemet bool LoopAccessInfo::RuntimePointerCheck::needsChecking(
133ec1e2bb6SAdam Nemet     unsigned I, unsigned J, const SmallVectorImpl<int> *PtrPartition) const {
134a8945b77SAdam Nemet   // No need to check if two readonly pointers intersect.
135a8945b77SAdam Nemet   if (!IsWritePtr[I] && !IsWritePtr[J])
136a8945b77SAdam Nemet     return false;
137a8945b77SAdam Nemet 
138a8945b77SAdam Nemet   // Only need to check pointers between two different dependency sets.
139a8945b77SAdam Nemet   if (DependencySetId[I] == DependencySetId[J])
140a8945b77SAdam Nemet     return false;
141a8945b77SAdam Nemet 
142a8945b77SAdam Nemet   // Only need to check pointers in the same alias set.
143a8945b77SAdam Nemet   if (AliasSetId[I] != AliasSetId[J])
144a8945b77SAdam Nemet     return false;
145a8945b77SAdam Nemet 
146ec1e2bb6SAdam Nemet   // If PtrPartition is set omit checks between pointers of the same partition.
147ec1e2bb6SAdam Nemet   // Partition number -1 means that the pointer is used in multiple partitions.
148ec1e2bb6SAdam Nemet   // In this case we can't omit the check.
149ec1e2bb6SAdam Nemet   if (PtrPartition && (*PtrPartition)[I] != -1 &&
150ec1e2bb6SAdam Nemet       (*PtrPartition)[I] == (*PtrPartition)[J])
151ec1e2bb6SAdam Nemet     return false;
152ec1e2bb6SAdam Nemet 
153a8945b77SAdam Nemet   return true;
154a8945b77SAdam Nemet }
155a8945b77SAdam Nemet 
156ec1e2bb6SAdam Nemet void LoopAccessInfo::RuntimePointerCheck::print(
157ec1e2bb6SAdam Nemet     raw_ostream &OS, unsigned Depth,
158ec1e2bb6SAdam Nemet     const SmallVectorImpl<int> *PtrPartition) const {
159e91cc6efSAdam Nemet   unsigned NumPointers = Pointers.size();
160e91cc6efSAdam Nemet   if (NumPointers == 0)
161e91cc6efSAdam Nemet     return;
162e91cc6efSAdam Nemet 
163e91cc6efSAdam Nemet   OS.indent(Depth) << "Run-time memory checks:\n";
164e91cc6efSAdam Nemet   unsigned N = 0;
165e91cc6efSAdam Nemet   for (unsigned I = 0; I < NumPointers; ++I)
166e91cc6efSAdam Nemet     for (unsigned J = I + 1; J < NumPointers; ++J)
167ec1e2bb6SAdam Nemet       if (needsChecking(I, J, PtrPartition)) {
168e91cc6efSAdam Nemet         OS.indent(Depth) << N++ << ":\n";
169ec1e2bb6SAdam Nemet         OS.indent(Depth + 2) << *Pointers[I];
170ec1e2bb6SAdam Nemet         if (PtrPartition)
171ec1e2bb6SAdam Nemet           OS << " (Partition: " << (*PtrPartition)[I] << ")";
172ec1e2bb6SAdam Nemet         OS << "\n";
173ec1e2bb6SAdam Nemet         OS.indent(Depth + 2) << *Pointers[J];
174ec1e2bb6SAdam Nemet         if (PtrPartition)
175ec1e2bb6SAdam Nemet           OS << " (Partition: " << (*PtrPartition)[J] << ")";
176ec1e2bb6SAdam Nemet         OS << "\n";
177e91cc6efSAdam Nemet       }
178e91cc6efSAdam Nemet }
179e91cc6efSAdam Nemet 
18098a13719SSilviu Baranga unsigned LoopAccessInfo::RuntimePointerCheck::getNumberOfChecks(
18151870d16SAdam Nemet     const SmallVectorImpl<int> *PtrPartition) const {
18251870d16SAdam Nemet   unsigned NumPointers = Pointers.size();
18398a13719SSilviu Baranga   unsigned CheckCount = 0;
18451870d16SAdam Nemet 
18551870d16SAdam Nemet   for (unsigned I = 0; I < NumPointers; ++I)
18651870d16SAdam Nemet     for (unsigned J = I + 1; J < NumPointers; ++J)
18751870d16SAdam Nemet       if (needsChecking(I, J, PtrPartition))
18898a13719SSilviu Baranga         CheckCount++;
18998a13719SSilviu Baranga   return CheckCount;
19098a13719SSilviu Baranga }
19198a13719SSilviu Baranga 
19298a13719SSilviu Baranga bool LoopAccessInfo::RuntimePointerCheck::needsAnyChecking(
19398a13719SSilviu Baranga     const SmallVectorImpl<int> *PtrPartition) const {
19498a13719SSilviu Baranga   return getNumberOfChecks(PtrPartition) != 0;
19551870d16SAdam Nemet }
19651870d16SAdam Nemet 
1970456327cSAdam Nemet namespace {
1980456327cSAdam Nemet /// \brief Analyses memory accesses in a loop.
1990456327cSAdam Nemet ///
2000456327cSAdam Nemet /// Checks whether run time pointer checks are needed and builds sets for data
2010456327cSAdam Nemet /// dependence checking.
2020456327cSAdam Nemet class AccessAnalysis {
2030456327cSAdam Nemet public:
2040456327cSAdam Nemet   /// \brief Read or write access location.
2050456327cSAdam Nemet   typedef PointerIntPair<Value *, 1, bool> MemAccessInfo;
2060456327cSAdam Nemet   typedef SmallPtrSet<MemAccessInfo, 8> MemAccessInfoSet;
2070456327cSAdam Nemet 
208e2b885c4SAdam Nemet   AccessAnalysis(const DataLayout &Dl, AliasAnalysis *AA, LoopInfo *LI,
209dee666bcSAdam Nemet                  MemoryDepChecker::DepCandidates &DA)
210e2b885c4SAdam Nemet       : DL(Dl), AST(*AA), LI(LI), DepCands(DA), IsRTCheckNeeded(false) {}
2110456327cSAdam Nemet 
2120456327cSAdam Nemet   /// \brief Register a load  and whether it is only read from.
213ac80dc75SChandler Carruth   void addLoad(MemoryLocation &Loc, bool IsReadOnly) {
2140456327cSAdam Nemet     Value *Ptr = const_cast<Value*>(Loc.Ptr);
215*ecbd1682SChandler Carruth     AST.add(Ptr, MemoryLocation::UnknownSize, Loc.AATags);
2160456327cSAdam Nemet     Accesses.insert(MemAccessInfo(Ptr, false));
2170456327cSAdam Nemet     if (IsReadOnly)
2180456327cSAdam Nemet       ReadOnlyPtr.insert(Ptr);
2190456327cSAdam Nemet   }
2200456327cSAdam Nemet 
2210456327cSAdam Nemet   /// \brief Register a store.
222ac80dc75SChandler Carruth   void addStore(MemoryLocation &Loc) {
2230456327cSAdam Nemet     Value *Ptr = const_cast<Value*>(Loc.Ptr);
224*ecbd1682SChandler Carruth     AST.add(Ptr, MemoryLocation::UnknownSize, Loc.AATags);
2250456327cSAdam Nemet     Accesses.insert(MemAccessInfo(Ptr, true));
2260456327cSAdam Nemet   }
2270456327cSAdam Nemet 
2280456327cSAdam Nemet   /// \brief Check whether we can check the pointers at runtime for
22998a13719SSilviu Baranga   /// non-intersection. Returns true when we have 0 pointers
23098a13719SSilviu Baranga   /// (a check on 0 pointers for non-intersection will always return true).
23130f16e16SAdam Nemet   bool canCheckPtrAtRT(LoopAccessInfo::RuntimePointerCheck &RtCheck,
23298a13719SSilviu Baranga                        bool &NeedRTCheck, ScalarEvolution *SE, Loop *TheLoop,
23398a13719SSilviu Baranga                        const ValueToValueMap &Strides,
2340456327cSAdam Nemet                        bool ShouldCheckStride = false);
2350456327cSAdam Nemet 
2360456327cSAdam Nemet   /// \brief Goes over all memory accesses, checks whether a RT check is needed
2370456327cSAdam Nemet   /// and builds sets of dependent accesses.
2380456327cSAdam Nemet   void buildDependenceSets() {
2390456327cSAdam Nemet     processMemAccesses();
2400456327cSAdam Nemet   }
2410456327cSAdam Nemet 
2420456327cSAdam Nemet   bool isRTCheckNeeded() { return IsRTCheckNeeded; }
2430456327cSAdam Nemet 
2440456327cSAdam Nemet   bool isDependencyCheckNeeded() { return !CheckDeps.empty(); }
245df3dc5b9SAdam Nemet 
246df3dc5b9SAdam Nemet   /// We decided that no dependence analysis would be used.  Reset the state.
247df3dc5b9SAdam Nemet   void resetDepChecks(MemoryDepChecker &DepChecker) {
248df3dc5b9SAdam Nemet     CheckDeps.clear();
249df3dc5b9SAdam Nemet     DepChecker.clearInterestingDependences();
250df3dc5b9SAdam Nemet   }
2510456327cSAdam Nemet 
2520456327cSAdam Nemet   MemAccessInfoSet &getDependenciesToCheck() { return CheckDeps; }
2530456327cSAdam Nemet 
2540456327cSAdam Nemet private:
2550456327cSAdam Nemet   typedef SetVector<MemAccessInfo> PtrAccessSet;
2560456327cSAdam Nemet 
2570456327cSAdam Nemet   /// \brief Go over all memory access and check whether runtime pointer checks
2580456327cSAdam Nemet   /// are needed /// and build sets of dependency check candidates.
2590456327cSAdam Nemet   void processMemAccesses();
2600456327cSAdam Nemet 
2610456327cSAdam Nemet   /// Set of all accesses.
2620456327cSAdam Nemet   PtrAccessSet Accesses;
2630456327cSAdam Nemet 
264a28d91d8SMehdi Amini   const DataLayout &DL;
265a28d91d8SMehdi Amini 
2660456327cSAdam Nemet   /// Set of accesses that need a further dependence check.
2670456327cSAdam Nemet   MemAccessInfoSet CheckDeps;
2680456327cSAdam Nemet 
2690456327cSAdam Nemet   /// Set of pointers that are read only.
2700456327cSAdam Nemet   SmallPtrSet<Value*, 16> ReadOnlyPtr;
2710456327cSAdam Nemet 
2720456327cSAdam Nemet   /// An alias set tracker to partition the access set by underlying object and
2730456327cSAdam Nemet   //intrinsic property (such as TBAA metadata).
2740456327cSAdam Nemet   AliasSetTracker AST;
2750456327cSAdam Nemet 
276e2b885c4SAdam Nemet   LoopInfo *LI;
277e2b885c4SAdam Nemet 
2780456327cSAdam Nemet   /// Sets of potentially dependent accesses - members of one set share an
2790456327cSAdam Nemet   /// underlying pointer. The set "CheckDeps" identfies which sets really need a
2800456327cSAdam Nemet   /// dependence check.
281dee666bcSAdam Nemet   MemoryDepChecker::DepCandidates &DepCands;
2820456327cSAdam Nemet 
2830456327cSAdam Nemet   bool IsRTCheckNeeded;
2840456327cSAdam Nemet };
2850456327cSAdam Nemet 
2860456327cSAdam Nemet } // end anonymous namespace
2870456327cSAdam Nemet 
2880456327cSAdam Nemet /// \brief Check whether a pointer can participate in a runtime bounds check.
2898bc61df9SAdam Nemet static bool hasComputableBounds(ScalarEvolution *SE,
2908bc61df9SAdam Nemet                                 const ValueToValueMap &Strides, Value *Ptr) {
2910456327cSAdam Nemet   const SCEV *PtrScev = replaceSymbolicStrideSCEV(SE, Strides, Ptr);
2920456327cSAdam Nemet   const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(PtrScev);
2930456327cSAdam Nemet   if (!AR)
2940456327cSAdam Nemet     return false;
2950456327cSAdam Nemet 
2960456327cSAdam Nemet   return AR->isAffine();
2970456327cSAdam Nemet }
2980456327cSAdam Nemet 
2990456327cSAdam Nemet bool AccessAnalysis::canCheckPtrAtRT(
30098a13719SSilviu Baranga     LoopAccessInfo::RuntimePointerCheck &RtCheck, bool &NeedRTCheck,
3018bc61df9SAdam Nemet     ScalarEvolution *SE, Loop *TheLoop, const ValueToValueMap &StridesMap,
3028bc61df9SAdam Nemet     bool ShouldCheckStride) {
3030456327cSAdam Nemet   // Find pointers with computable bounds. We are going to use this information
3040456327cSAdam Nemet   // to place a runtime bound check.
3050456327cSAdam Nemet   bool CanDoRT = true;
3060456327cSAdam Nemet 
30798a13719SSilviu Baranga   NeedRTCheck = false;
30898a13719SSilviu Baranga   if (!IsRTCheckNeeded) return true;
30998a13719SSilviu Baranga 
3100456327cSAdam Nemet   bool IsDepCheckNeeded = isDependencyCheckNeeded();
3110456327cSAdam Nemet 
3120456327cSAdam Nemet   // We assign a consecutive id to access from different alias sets.
3130456327cSAdam Nemet   // Accesses between different groups doesn't need to be checked.
3140456327cSAdam Nemet   unsigned ASId = 1;
3150456327cSAdam Nemet   for (auto &AS : AST) {
3160456327cSAdam Nemet     // We assign consecutive id to access from different dependence sets.
3170456327cSAdam Nemet     // Accesses within the same set don't need a runtime check.
3180456327cSAdam Nemet     unsigned RunningDepId = 1;
3190456327cSAdam Nemet     DenseMap<Value *, unsigned> DepSetId;
3200456327cSAdam Nemet 
3210456327cSAdam Nemet     for (auto A : AS) {
3220456327cSAdam Nemet       Value *Ptr = A.getValue();
3230456327cSAdam Nemet       bool IsWrite = Accesses.count(MemAccessInfo(Ptr, true));
3240456327cSAdam Nemet       MemAccessInfo Access(Ptr, IsWrite);
3250456327cSAdam Nemet 
3260456327cSAdam Nemet       if (hasComputableBounds(SE, StridesMap, Ptr) &&
327a28d91d8SMehdi Amini           // When we run after a failing dependency check we have to make sure
328a28d91d8SMehdi Amini           // we don't have wrapping pointers.
3290456327cSAdam Nemet           (!ShouldCheckStride ||
330a28d91d8SMehdi Amini            isStridedPtr(SE, Ptr, TheLoop, StridesMap) == 1)) {
3310456327cSAdam Nemet         // The id of the dependence set.
3320456327cSAdam Nemet         unsigned DepId;
3330456327cSAdam Nemet 
3340456327cSAdam Nemet         if (IsDepCheckNeeded) {
3350456327cSAdam Nemet           Value *Leader = DepCands.getLeaderValue(Access).getPointer();
3360456327cSAdam Nemet           unsigned &LeaderId = DepSetId[Leader];
3370456327cSAdam Nemet           if (!LeaderId)
3380456327cSAdam Nemet             LeaderId = RunningDepId++;
3390456327cSAdam Nemet           DepId = LeaderId;
3400456327cSAdam Nemet         } else
3410456327cSAdam Nemet           // Each access has its own dependence set.
3420456327cSAdam Nemet           DepId = RunningDepId++;
3430456327cSAdam Nemet 
3440456327cSAdam Nemet         RtCheck.insert(SE, TheLoop, Ptr, IsWrite, DepId, ASId, StridesMap);
3450456327cSAdam Nemet 
346339f42b3SAdam Nemet         DEBUG(dbgs() << "LAA: Found a runtime check ptr:" << *Ptr << '\n');
3470456327cSAdam Nemet       } else {
348f10ca278SAdam Nemet         DEBUG(dbgs() << "LAA: Can't find bounds for ptr:" << *Ptr << '\n');
3490456327cSAdam Nemet         CanDoRT = false;
3500456327cSAdam Nemet       }
3510456327cSAdam Nemet     }
3520456327cSAdam Nemet 
3530456327cSAdam Nemet     ++ASId;
3540456327cSAdam Nemet   }
3550456327cSAdam Nemet 
35698a13719SSilviu Baranga   // We need a runtime check if there are any accesses that need checking.
35798a13719SSilviu Baranga   // However, some accesses cannot be checked (for example because we
35898a13719SSilviu Baranga   // can't determine their bounds). In these cases we would need a check
35998a13719SSilviu Baranga   // but wouldn't be able to add it.
36098a13719SSilviu Baranga   NeedRTCheck = !CanDoRT || RtCheck.needsAnyChecking(nullptr);
36198a13719SSilviu Baranga 
3620456327cSAdam Nemet   // If the pointers that we would use for the bounds comparison have different
3630456327cSAdam Nemet   // address spaces, assume the values aren't directly comparable, so we can't
3640456327cSAdam Nemet   // use them for the runtime check. We also have to assume they could
3650456327cSAdam Nemet   // overlap. In the future there should be metadata for whether address spaces
3660456327cSAdam Nemet   // are disjoint.
3670456327cSAdam Nemet   unsigned NumPointers = RtCheck.Pointers.size();
3680456327cSAdam Nemet   for (unsigned i = 0; i < NumPointers; ++i) {
3690456327cSAdam Nemet     for (unsigned j = i + 1; j < NumPointers; ++j) {
3700456327cSAdam Nemet       // Only need to check pointers between two different dependency sets.
3710456327cSAdam Nemet       if (RtCheck.DependencySetId[i] == RtCheck.DependencySetId[j])
3720456327cSAdam Nemet        continue;
3730456327cSAdam Nemet       // Only need to check pointers in the same alias set.
3740456327cSAdam Nemet       if (RtCheck.AliasSetId[i] != RtCheck.AliasSetId[j])
3750456327cSAdam Nemet         continue;
3760456327cSAdam Nemet 
3770456327cSAdam Nemet       Value *PtrI = RtCheck.Pointers[i];
3780456327cSAdam Nemet       Value *PtrJ = RtCheck.Pointers[j];
3790456327cSAdam Nemet 
3800456327cSAdam Nemet       unsigned ASi = PtrI->getType()->getPointerAddressSpace();
3810456327cSAdam Nemet       unsigned ASj = PtrJ->getType()->getPointerAddressSpace();
3820456327cSAdam Nemet       if (ASi != ASj) {
383339f42b3SAdam Nemet         DEBUG(dbgs() << "LAA: Runtime check would require comparison between"
3840456327cSAdam Nemet                        " different address spaces\n");
3850456327cSAdam Nemet         return false;
3860456327cSAdam Nemet       }
3870456327cSAdam Nemet     }
3880456327cSAdam Nemet   }
3890456327cSAdam Nemet 
3900456327cSAdam Nemet   return CanDoRT;
3910456327cSAdam Nemet }
3920456327cSAdam Nemet 
3930456327cSAdam Nemet void AccessAnalysis::processMemAccesses() {
3940456327cSAdam Nemet   // We process the set twice: first we process read-write pointers, last we
3950456327cSAdam Nemet   // process read-only pointers. This allows us to skip dependence tests for
3960456327cSAdam Nemet   // read-only pointers.
3970456327cSAdam Nemet 
398339f42b3SAdam Nemet   DEBUG(dbgs() << "LAA: Processing memory accesses...\n");
3990456327cSAdam Nemet   DEBUG(dbgs() << "  AST: "; AST.dump());
4009c926579SAdam Nemet   DEBUG(dbgs() << "LAA:   Accesses(" << Accesses.size() << "):\n");
4010456327cSAdam Nemet   DEBUG({
4020456327cSAdam Nemet     for (auto A : Accesses)
4030456327cSAdam Nemet       dbgs() << "\t" << *A.getPointer() << " (" <<
4040456327cSAdam Nemet                 (A.getInt() ? "write" : (ReadOnlyPtr.count(A.getPointer()) ?
4050456327cSAdam Nemet                                          "read-only" : "read")) << ")\n";
4060456327cSAdam Nemet   });
4070456327cSAdam Nemet 
4080456327cSAdam Nemet   // The AliasSetTracker has nicely partitioned our pointers by metadata
4090456327cSAdam Nemet   // compatibility and potential for underlying-object overlap. As a result, we
4100456327cSAdam Nemet   // only need to check for potential pointer dependencies within each alias
4110456327cSAdam Nemet   // set.
4120456327cSAdam Nemet   for (auto &AS : AST) {
4130456327cSAdam Nemet     // Note that both the alias-set tracker and the alias sets themselves used
4140456327cSAdam Nemet     // linked lists internally and so the iteration order here is deterministic
4150456327cSAdam Nemet     // (matching the original instruction order within each set).
4160456327cSAdam Nemet 
4170456327cSAdam Nemet     bool SetHasWrite = false;
4180456327cSAdam Nemet 
4190456327cSAdam Nemet     // Map of pointers to last access encountered.
4200456327cSAdam Nemet     typedef DenseMap<Value*, MemAccessInfo> UnderlyingObjToAccessMap;
4210456327cSAdam Nemet     UnderlyingObjToAccessMap ObjToLastAccess;
4220456327cSAdam Nemet 
4230456327cSAdam Nemet     // Set of access to check after all writes have been processed.
4240456327cSAdam Nemet     PtrAccessSet DeferredAccesses;
4250456327cSAdam Nemet 
4260456327cSAdam Nemet     // Iterate over each alias set twice, once to process read/write pointers,
4270456327cSAdam Nemet     // and then to process read-only pointers.
4280456327cSAdam Nemet     for (int SetIteration = 0; SetIteration < 2; ++SetIteration) {
4290456327cSAdam Nemet       bool UseDeferred = SetIteration > 0;
4300456327cSAdam Nemet       PtrAccessSet &S = UseDeferred ? DeferredAccesses : Accesses;
4310456327cSAdam Nemet 
4320456327cSAdam Nemet       for (auto AV : AS) {
4330456327cSAdam Nemet         Value *Ptr = AV.getValue();
4340456327cSAdam Nemet 
4350456327cSAdam Nemet         // For a single memory access in AliasSetTracker, Accesses may contain
4360456327cSAdam Nemet         // both read and write, and they both need to be handled for CheckDeps.
4370456327cSAdam Nemet         for (auto AC : S) {
4380456327cSAdam Nemet           if (AC.getPointer() != Ptr)
4390456327cSAdam Nemet             continue;
4400456327cSAdam Nemet 
4410456327cSAdam Nemet           bool IsWrite = AC.getInt();
4420456327cSAdam Nemet 
4430456327cSAdam Nemet           // If we're using the deferred access set, then it contains only
4440456327cSAdam Nemet           // reads.
4450456327cSAdam Nemet           bool IsReadOnlyPtr = ReadOnlyPtr.count(Ptr) && !IsWrite;
4460456327cSAdam Nemet           if (UseDeferred && !IsReadOnlyPtr)
4470456327cSAdam Nemet             continue;
4480456327cSAdam Nemet           // Otherwise, the pointer must be in the PtrAccessSet, either as a
4490456327cSAdam Nemet           // read or a write.
4500456327cSAdam Nemet           assert(((IsReadOnlyPtr && UseDeferred) || IsWrite ||
4510456327cSAdam Nemet                   S.count(MemAccessInfo(Ptr, false))) &&
4520456327cSAdam Nemet                  "Alias-set pointer not in the access set?");
4530456327cSAdam Nemet 
4540456327cSAdam Nemet           MemAccessInfo Access(Ptr, IsWrite);
4550456327cSAdam Nemet           DepCands.insert(Access);
4560456327cSAdam Nemet 
4570456327cSAdam Nemet           // Memorize read-only pointers for later processing and skip them in
4580456327cSAdam Nemet           // the first round (they need to be checked after we have seen all
4590456327cSAdam Nemet           // write pointers). Note: we also mark pointer that are not
4600456327cSAdam Nemet           // consecutive as "read-only" pointers (so that we check
4610456327cSAdam Nemet           // "a[b[i]] +="). Hence, we need the second check for "!IsWrite".
4620456327cSAdam Nemet           if (!UseDeferred && IsReadOnlyPtr) {
4630456327cSAdam Nemet             DeferredAccesses.insert(Access);
4640456327cSAdam Nemet             continue;
4650456327cSAdam Nemet           }
4660456327cSAdam Nemet 
4670456327cSAdam Nemet           // If this is a write - check other reads and writes for conflicts. If
4680456327cSAdam Nemet           // this is a read only check other writes for conflicts (but only if
4690456327cSAdam Nemet           // there is no other write to the ptr - this is an optimization to
4700456327cSAdam Nemet           // catch "a[i] = a[i] + " without having to do a dependence check).
4710456327cSAdam Nemet           if ((IsWrite || IsReadOnlyPtr) && SetHasWrite) {
4720456327cSAdam Nemet             CheckDeps.insert(Access);
4730456327cSAdam Nemet             IsRTCheckNeeded = true;
4740456327cSAdam Nemet           }
4750456327cSAdam Nemet 
4760456327cSAdam Nemet           if (IsWrite)
4770456327cSAdam Nemet             SetHasWrite = true;
4780456327cSAdam Nemet 
4790456327cSAdam Nemet           // Create sets of pointers connected by a shared alias set and
4800456327cSAdam Nemet           // underlying object.
4810456327cSAdam Nemet           typedef SmallVector<Value *, 16> ValueVector;
4820456327cSAdam Nemet           ValueVector TempObjects;
483e2b885c4SAdam Nemet 
484e2b885c4SAdam Nemet           GetUnderlyingObjects(Ptr, TempObjects, DL, LI);
485e2b885c4SAdam Nemet           DEBUG(dbgs() << "Underlying objects for pointer " << *Ptr << "\n");
4860456327cSAdam Nemet           for (Value *UnderlyingObj : TempObjects) {
4870456327cSAdam Nemet             UnderlyingObjToAccessMap::iterator Prev =
4880456327cSAdam Nemet                 ObjToLastAccess.find(UnderlyingObj);
4890456327cSAdam Nemet             if (Prev != ObjToLastAccess.end())
4900456327cSAdam Nemet               DepCands.unionSets(Access, Prev->second);
4910456327cSAdam Nemet 
4920456327cSAdam Nemet             ObjToLastAccess[UnderlyingObj] = Access;
493e2b885c4SAdam Nemet             DEBUG(dbgs() << "  " << *UnderlyingObj << "\n");
4940456327cSAdam Nemet           }
4950456327cSAdam Nemet         }
4960456327cSAdam Nemet       }
4970456327cSAdam Nemet     }
4980456327cSAdam Nemet   }
4990456327cSAdam Nemet }
5000456327cSAdam Nemet 
5010456327cSAdam Nemet static bool isInBoundsGep(Value *Ptr) {
5020456327cSAdam Nemet   if (GetElementPtrInst *GEP = dyn_cast<GetElementPtrInst>(Ptr))
5030456327cSAdam Nemet     return GEP->isInBounds();
5040456327cSAdam Nemet   return false;
5050456327cSAdam Nemet }
5060456327cSAdam Nemet 
5070456327cSAdam Nemet /// \brief Check whether the access through \p Ptr has a constant stride.
50832c05396SHao Liu int llvm::isStridedPtr(ScalarEvolution *SE, Value *Ptr, const Loop *Lp,
509a28d91d8SMehdi Amini                        const ValueToValueMap &StridesMap) {
5100456327cSAdam Nemet   const Type *Ty = Ptr->getType();
5110456327cSAdam Nemet   assert(Ty->isPointerTy() && "Unexpected non-ptr");
5120456327cSAdam Nemet 
5130456327cSAdam Nemet   // Make sure that the pointer does not point to aggregate types.
5140456327cSAdam Nemet   const PointerType *PtrTy = cast<PointerType>(Ty);
5150456327cSAdam Nemet   if (PtrTy->getElementType()->isAggregateType()) {
516339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Bad stride - Not a pointer to a scalar type"
517339f42b3SAdam Nemet           << *Ptr << "\n");
5180456327cSAdam Nemet     return 0;
5190456327cSAdam Nemet   }
5200456327cSAdam Nemet 
5210456327cSAdam Nemet   const SCEV *PtrScev = replaceSymbolicStrideSCEV(SE, StridesMap, Ptr);
5220456327cSAdam Nemet 
5230456327cSAdam Nemet   const SCEVAddRecExpr *AR = dyn_cast<SCEVAddRecExpr>(PtrScev);
5240456327cSAdam Nemet   if (!AR) {
525339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Bad stride - Not an AddRecExpr pointer "
52604d4163eSAdam Nemet           << *Ptr << " SCEV: " << *PtrScev << "\n");
5270456327cSAdam Nemet     return 0;
5280456327cSAdam Nemet   }
5290456327cSAdam Nemet 
5300456327cSAdam Nemet   // The accesss function must stride over the innermost loop.
5310456327cSAdam Nemet   if (Lp != AR->getLoop()) {
532339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Bad stride - Not striding over innermost loop " <<
53304d4163eSAdam Nemet           *Ptr << " SCEV: " << *PtrScev << "\n");
5340456327cSAdam Nemet   }
5350456327cSAdam Nemet 
5360456327cSAdam Nemet   // The address calculation must not wrap. Otherwise, a dependence could be
5370456327cSAdam Nemet   // inverted.
5380456327cSAdam Nemet   // An inbounds getelementptr that is a AddRec with a unit stride
5390456327cSAdam Nemet   // cannot wrap per definition. The unit stride requirement is checked later.
5400456327cSAdam Nemet   // An getelementptr without an inbounds attribute and unit stride would have
5410456327cSAdam Nemet   // to access the pointer value "0" which is undefined behavior in address
5420456327cSAdam Nemet   // space 0, therefore we can also vectorize this case.
5430456327cSAdam Nemet   bool IsInBoundsGEP = isInBoundsGep(Ptr);
5440456327cSAdam Nemet   bool IsNoWrapAddRec = AR->getNoWrapFlags(SCEV::NoWrapMask);
5450456327cSAdam Nemet   bool IsInAddressSpaceZero = PtrTy->getAddressSpace() == 0;
5460456327cSAdam Nemet   if (!IsNoWrapAddRec && !IsInBoundsGEP && !IsInAddressSpaceZero) {
547339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Bad stride - Pointer may wrap in the address space "
5480456327cSAdam Nemet           << *Ptr << " SCEV: " << *PtrScev << "\n");
5490456327cSAdam Nemet     return 0;
5500456327cSAdam Nemet   }
5510456327cSAdam Nemet 
5520456327cSAdam Nemet   // Check the step is constant.
5530456327cSAdam Nemet   const SCEV *Step = AR->getStepRecurrence(*SE);
5540456327cSAdam Nemet 
5550456327cSAdam Nemet   // Calculate the pointer stride and check if it is consecutive.
5560456327cSAdam Nemet   const SCEVConstant *C = dyn_cast<SCEVConstant>(Step);
5570456327cSAdam Nemet   if (!C) {
558339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Bad stride - Not a constant strided " << *Ptr <<
55904d4163eSAdam Nemet           " SCEV: " << *PtrScev << "\n");
5600456327cSAdam Nemet     return 0;
5610456327cSAdam Nemet   }
5620456327cSAdam Nemet 
563a28d91d8SMehdi Amini   auto &DL = Lp->getHeader()->getModule()->getDataLayout();
564a28d91d8SMehdi Amini   int64_t Size = DL.getTypeAllocSize(PtrTy->getElementType());
5650456327cSAdam Nemet   const APInt &APStepVal = C->getValue()->getValue();
5660456327cSAdam Nemet 
5670456327cSAdam Nemet   // Huge step value - give up.
5680456327cSAdam Nemet   if (APStepVal.getBitWidth() > 64)
5690456327cSAdam Nemet     return 0;
5700456327cSAdam Nemet 
5710456327cSAdam Nemet   int64_t StepVal = APStepVal.getSExtValue();
5720456327cSAdam Nemet 
5730456327cSAdam Nemet   // Strided access.
5740456327cSAdam Nemet   int64_t Stride = StepVal / Size;
5750456327cSAdam Nemet   int64_t Rem = StepVal % Size;
5760456327cSAdam Nemet   if (Rem)
5770456327cSAdam Nemet     return 0;
5780456327cSAdam Nemet 
5790456327cSAdam Nemet   // If the SCEV could wrap but we have an inbounds gep with a unit stride we
5800456327cSAdam Nemet   // know we can't "wrap around the address space". In case of address space
5810456327cSAdam Nemet   // zero we know that this won't happen without triggering undefined behavior.
5820456327cSAdam Nemet   if (!IsNoWrapAddRec && (IsInBoundsGEP || IsInAddressSpaceZero) &&
5830456327cSAdam Nemet       Stride != 1 && Stride != -1)
5840456327cSAdam Nemet     return 0;
5850456327cSAdam Nemet 
5860456327cSAdam Nemet   return Stride;
5870456327cSAdam Nemet }
5880456327cSAdam Nemet 
5899c926579SAdam Nemet bool MemoryDepChecker::Dependence::isSafeForVectorization(DepType Type) {
5909c926579SAdam Nemet   switch (Type) {
5919c926579SAdam Nemet   case NoDep:
5929c926579SAdam Nemet   case Forward:
5939c926579SAdam Nemet   case BackwardVectorizable:
5949c926579SAdam Nemet     return true;
5959c926579SAdam Nemet 
5969c926579SAdam Nemet   case Unknown:
5979c926579SAdam Nemet   case ForwardButPreventsForwarding:
5989c926579SAdam Nemet   case Backward:
5999c926579SAdam Nemet   case BackwardVectorizableButPreventsForwarding:
6009c926579SAdam Nemet     return false;
6019c926579SAdam Nemet   }
602d388e930SDavid Majnemer   llvm_unreachable("unexpected DepType!");
6039c926579SAdam Nemet }
6049c926579SAdam Nemet 
6059c926579SAdam Nemet bool MemoryDepChecker::Dependence::isInterestingDependence(DepType Type) {
6069c926579SAdam Nemet   switch (Type) {
6079c926579SAdam Nemet   case NoDep:
6089c926579SAdam Nemet   case Forward:
6099c926579SAdam Nemet     return false;
6109c926579SAdam Nemet 
6119c926579SAdam Nemet   case BackwardVectorizable:
6129c926579SAdam Nemet   case Unknown:
6139c926579SAdam Nemet   case ForwardButPreventsForwarding:
6149c926579SAdam Nemet   case Backward:
6159c926579SAdam Nemet   case BackwardVectorizableButPreventsForwarding:
6169c926579SAdam Nemet     return true;
6179c926579SAdam Nemet   }
618d388e930SDavid Majnemer   llvm_unreachable("unexpected DepType!");
6199c926579SAdam Nemet }
6209c926579SAdam Nemet 
6219c926579SAdam Nemet bool MemoryDepChecker::Dependence::isPossiblyBackward() const {
6229c926579SAdam Nemet   switch (Type) {
6239c926579SAdam Nemet   case NoDep:
6249c926579SAdam Nemet   case Forward:
6259c926579SAdam Nemet   case ForwardButPreventsForwarding:
6269c926579SAdam Nemet     return false;
6279c926579SAdam Nemet 
6289c926579SAdam Nemet   case Unknown:
6299c926579SAdam Nemet   case BackwardVectorizable:
6309c926579SAdam Nemet   case Backward:
6319c926579SAdam Nemet   case BackwardVectorizableButPreventsForwarding:
6329c926579SAdam Nemet     return true;
6339c926579SAdam Nemet   }
634d388e930SDavid Majnemer   llvm_unreachable("unexpected DepType!");
6359c926579SAdam Nemet }
6369c926579SAdam Nemet 
6370456327cSAdam Nemet bool MemoryDepChecker::couldPreventStoreLoadForward(unsigned Distance,
6380456327cSAdam Nemet                                                     unsigned TypeByteSize) {
6390456327cSAdam Nemet   // If loads occur at a distance that is not a multiple of a feasible vector
6400456327cSAdam Nemet   // factor store-load forwarding does not take place.
6410456327cSAdam Nemet   // Positive dependences might cause troubles because vectorizing them might
6420456327cSAdam Nemet   // prevent store-load forwarding making vectorized code run a lot slower.
6430456327cSAdam Nemet   //   a[i] = a[i-3] ^ a[i-8];
6440456327cSAdam Nemet   //   The stores to a[i:i+1] don't align with the stores to a[i-3:i-2] and
6450456327cSAdam Nemet   //   hence on your typical architecture store-load forwarding does not take
6460456327cSAdam Nemet   //   place. Vectorizing in such cases does not make sense.
6470456327cSAdam Nemet   // Store-load forwarding distance.
6480456327cSAdam Nemet   const unsigned NumCyclesForStoreLoadThroughMemory = 8*TypeByteSize;
6490456327cSAdam Nemet   // Maximum vector factor.
650f219c647SAdam Nemet   unsigned MaxVFWithoutSLForwardIssues =
651f219c647SAdam Nemet     VectorizerParams::MaxVectorWidth * TypeByteSize;
6520456327cSAdam Nemet   if(MaxSafeDepDistBytes < MaxVFWithoutSLForwardIssues)
6530456327cSAdam Nemet     MaxVFWithoutSLForwardIssues = MaxSafeDepDistBytes;
6540456327cSAdam Nemet 
6550456327cSAdam Nemet   for (unsigned vf = 2*TypeByteSize; vf <= MaxVFWithoutSLForwardIssues;
6560456327cSAdam Nemet        vf *= 2) {
6570456327cSAdam Nemet     if (Distance % vf && Distance / vf < NumCyclesForStoreLoadThroughMemory) {
6580456327cSAdam Nemet       MaxVFWithoutSLForwardIssues = (vf >>=1);
6590456327cSAdam Nemet       break;
6600456327cSAdam Nemet     }
6610456327cSAdam Nemet   }
6620456327cSAdam Nemet 
6630456327cSAdam Nemet   if (MaxVFWithoutSLForwardIssues< 2*TypeByteSize) {
664339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Distance " << Distance <<
66504d4163eSAdam Nemet           " that could cause a store-load forwarding conflict\n");
6660456327cSAdam Nemet     return true;
6670456327cSAdam Nemet   }
6680456327cSAdam Nemet 
6690456327cSAdam Nemet   if (MaxVFWithoutSLForwardIssues < MaxSafeDepDistBytes &&
670f219c647SAdam Nemet       MaxVFWithoutSLForwardIssues !=
671f219c647SAdam Nemet       VectorizerParams::MaxVectorWidth * TypeByteSize)
6720456327cSAdam Nemet     MaxSafeDepDistBytes = MaxVFWithoutSLForwardIssues;
6730456327cSAdam Nemet   return false;
6740456327cSAdam Nemet }
6750456327cSAdam Nemet 
676751004a6SHao Liu /// \brief Check the dependence for two accesses with the same stride \p Stride.
677751004a6SHao Liu /// \p Distance is the positive distance and \p TypeByteSize is type size in
678751004a6SHao Liu /// bytes.
679751004a6SHao Liu ///
680751004a6SHao Liu /// \returns true if they are independent.
681751004a6SHao Liu static bool areStridedAccessesIndependent(unsigned Distance, unsigned Stride,
682751004a6SHao Liu                                           unsigned TypeByteSize) {
683751004a6SHao Liu   assert(Stride > 1 && "The stride must be greater than 1");
684751004a6SHao Liu   assert(TypeByteSize > 0 && "The type size in byte must be non-zero");
685751004a6SHao Liu   assert(Distance > 0 && "The distance must be non-zero");
686751004a6SHao Liu 
687751004a6SHao Liu   // Skip if the distance is not multiple of type byte size.
688751004a6SHao Liu   if (Distance % TypeByteSize)
689751004a6SHao Liu     return false;
690751004a6SHao Liu 
691751004a6SHao Liu   unsigned ScaledDist = Distance / TypeByteSize;
692751004a6SHao Liu 
693751004a6SHao Liu   // No dependence if the scaled distance is not multiple of the stride.
694751004a6SHao Liu   // E.g.
695751004a6SHao Liu   //      for (i = 0; i < 1024 ; i += 4)
696751004a6SHao Liu   //        A[i+2] = A[i] + 1;
697751004a6SHao Liu   //
698751004a6SHao Liu   // Two accesses in memory (scaled distance is 2, stride is 4):
699751004a6SHao Liu   //     | A[0] |      |      |      | A[4] |      |      |      |
700751004a6SHao Liu   //     |      |      | A[2] |      |      |      | A[6] |      |
701751004a6SHao Liu   //
702751004a6SHao Liu   // E.g.
703751004a6SHao Liu   //      for (i = 0; i < 1024 ; i += 3)
704751004a6SHao Liu   //        A[i+4] = A[i] + 1;
705751004a6SHao Liu   //
706751004a6SHao Liu   // Two accesses in memory (scaled distance is 4, stride is 3):
707751004a6SHao Liu   //     | A[0] |      |      | A[3] |      |      | A[6] |      |      |
708751004a6SHao Liu   //     |      |      |      |      | A[4] |      |      | A[7] |      |
709751004a6SHao Liu   return ScaledDist % Stride;
710751004a6SHao Liu }
711751004a6SHao Liu 
7129c926579SAdam Nemet MemoryDepChecker::Dependence::DepType
7139c926579SAdam Nemet MemoryDepChecker::isDependent(const MemAccessInfo &A, unsigned AIdx,
7140456327cSAdam Nemet                               const MemAccessInfo &B, unsigned BIdx,
7158bc61df9SAdam Nemet                               const ValueToValueMap &Strides) {
7160456327cSAdam Nemet   assert (AIdx < BIdx && "Must pass arguments in program order");
7170456327cSAdam Nemet 
7180456327cSAdam Nemet   Value *APtr = A.getPointer();
7190456327cSAdam Nemet   Value *BPtr = B.getPointer();
7200456327cSAdam Nemet   bool AIsWrite = A.getInt();
7210456327cSAdam Nemet   bool BIsWrite = B.getInt();
7220456327cSAdam Nemet 
7230456327cSAdam Nemet   // Two reads are independent.
7240456327cSAdam Nemet   if (!AIsWrite && !BIsWrite)
7259c926579SAdam Nemet     return Dependence::NoDep;
7260456327cSAdam Nemet 
7270456327cSAdam Nemet   // We cannot check pointers in different address spaces.
7280456327cSAdam Nemet   if (APtr->getType()->getPointerAddressSpace() !=
7290456327cSAdam Nemet       BPtr->getType()->getPointerAddressSpace())
7309c926579SAdam Nemet     return Dependence::Unknown;
7310456327cSAdam Nemet 
7320456327cSAdam Nemet   const SCEV *AScev = replaceSymbolicStrideSCEV(SE, Strides, APtr);
7330456327cSAdam Nemet   const SCEV *BScev = replaceSymbolicStrideSCEV(SE, Strides, BPtr);
7340456327cSAdam Nemet 
735a28d91d8SMehdi Amini   int StrideAPtr = isStridedPtr(SE, APtr, InnermostLoop, Strides);
736a28d91d8SMehdi Amini   int StrideBPtr = isStridedPtr(SE, BPtr, InnermostLoop, Strides);
7370456327cSAdam Nemet 
7380456327cSAdam Nemet   const SCEV *Src = AScev;
7390456327cSAdam Nemet   const SCEV *Sink = BScev;
7400456327cSAdam Nemet 
7410456327cSAdam Nemet   // If the induction step is negative we have to invert source and sink of the
7420456327cSAdam Nemet   // dependence.
7430456327cSAdam Nemet   if (StrideAPtr < 0) {
7440456327cSAdam Nemet     //Src = BScev;
7450456327cSAdam Nemet     //Sink = AScev;
7460456327cSAdam Nemet     std::swap(APtr, BPtr);
7470456327cSAdam Nemet     std::swap(Src, Sink);
7480456327cSAdam Nemet     std::swap(AIsWrite, BIsWrite);
7490456327cSAdam Nemet     std::swap(AIdx, BIdx);
7500456327cSAdam Nemet     std::swap(StrideAPtr, StrideBPtr);
7510456327cSAdam Nemet   }
7520456327cSAdam Nemet 
7530456327cSAdam Nemet   const SCEV *Dist = SE->getMinusSCEV(Sink, Src);
7540456327cSAdam Nemet 
755339f42b3SAdam Nemet   DEBUG(dbgs() << "LAA: Src Scev: " << *Src << "Sink Scev: " << *Sink
7560456327cSAdam Nemet         << "(Induction step: " << StrideAPtr <<  ")\n");
757339f42b3SAdam Nemet   DEBUG(dbgs() << "LAA: Distance for " << *InstMap[AIdx] << " to "
7580456327cSAdam Nemet         << *InstMap[BIdx] << ": " << *Dist << "\n");
7590456327cSAdam Nemet 
7600456327cSAdam Nemet   // Need consecutive accesses. We don't want to vectorize
7610456327cSAdam Nemet   // "A[B[i]] += ..." and similar code or pointer arithmetic that could wrap in
7620456327cSAdam Nemet   // the address space.
7630456327cSAdam Nemet   if (!StrideAPtr || !StrideBPtr || StrideAPtr != StrideBPtr){
7640456327cSAdam Nemet     DEBUG(dbgs() << "Non-consecutive pointer access\n");
7659c926579SAdam Nemet     return Dependence::Unknown;
7660456327cSAdam Nemet   }
7670456327cSAdam Nemet 
7680456327cSAdam Nemet   const SCEVConstant *C = dyn_cast<SCEVConstant>(Dist);
7690456327cSAdam Nemet   if (!C) {
770339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Dependence because of non-constant distance\n");
7710456327cSAdam Nemet     ShouldRetryWithRuntimeCheck = true;
7729c926579SAdam Nemet     return Dependence::Unknown;
7730456327cSAdam Nemet   }
7740456327cSAdam Nemet 
7750456327cSAdam Nemet   Type *ATy = APtr->getType()->getPointerElementType();
7760456327cSAdam Nemet   Type *BTy = BPtr->getType()->getPointerElementType();
777a28d91d8SMehdi Amini   auto &DL = InnermostLoop->getHeader()->getModule()->getDataLayout();
778a28d91d8SMehdi Amini   unsigned TypeByteSize = DL.getTypeAllocSize(ATy);
7790456327cSAdam Nemet 
7800456327cSAdam Nemet   // Negative distances are not plausible dependencies.
7810456327cSAdam Nemet   const APInt &Val = C->getValue()->getValue();
7820456327cSAdam Nemet   if (Val.isNegative()) {
7830456327cSAdam Nemet     bool IsTrueDataDependence = (AIsWrite && !BIsWrite);
7840456327cSAdam Nemet     if (IsTrueDataDependence &&
7850456327cSAdam Nemet         (couldPreventStoreLoadForward(Val.abs().getZExtValue(), TypeByteSize) ||
7860456327cSAdam Nemet          ATy != BTy))
7879c926579SAdam Nemet       return Dependence::ForwardButPreventsForwarding;
7880456327cSAdam Nemet 
789339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Dependence is negative: NoDep\n");
7909c926579SAdam Nemet     return Dependence::Forward;
7910456327cSAdam Nemet   }
7920456327cSAdam Nemet 
7930456327cSAdam Nemet   // Write to the same location with the same size.
7940456327cSAdam Nemet   // Could be improved to assert type sizes are the same (i32 == float, etc).
7950456327cSAdam Nemet   if (Val == 0) {
7960456327cSAdam Nemet     if (ATy == BTy)
7979c926579SAdam Nemet       return Dependence::NoDep;
798339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Zero dependence difference but different types\n");
7999c926579SAdam Nemet     return Dependence::Unknown;
8000456327cSAdam Nemet   }
8010456327cSAdam Nemet 
8020456327cSAdam Nemet   assert(Val.isStrictlyPositive() && "Expect a positive value");
8030456327cSAdam Nemet 
8040456327cSAdam Nemet   if (ATy != BTy) {
80504d4163eSAdam Nemet     DEBUG(dbgs() <<
806339f42b3SAdam Nemet           "LAA: ReadWrite-Write positive dependency with different types\n");
8079c926579SAdam Nemet     return Dependence::Unknown;
8080456327cSAdam Nemet   }
8090456327cSAdam Nemet 
8100456327cSAdam Nemet   unsigned Distance = (unsigned) Val.getZExtValue();
8110456327cSAdam Nemet 
812751004a6SHao Liu   unsigned Stride = std::abs(StrideAPtr);
813751004a6SHao Liu   if (Stride > 1 &&
814751004a6SHao Liu       areStridedAccessesIndependent(Distance, Stride, TypeByteSize))
815751004a6SHao Liu     return Dependence::NoDep;
816751004a6SHao Liu 
8170456327cSAdam Nemet   // Bail out early if passed-in parameters make vectorization not feasible.
818f219c647SAdam Nemet   unsigned ForcedFactor = (VectorizerParams::VectorizationFactor ?
819f219c647SAdam Nemet                            VectorizerParams::VectorizationFactor : 1);
820f219c647SAdam Nemet   unsigned ForcedUnroll = (VectorizerParams::VectorizationInterleave ?
821f219c647SAdam Nemet                            VectorizerParams::VectorizationInterleave : 1);
822751004a6SHao Liu   // The minimum number of iterations for a vectorized/unrolled version.
823751004a6SHao Liu   unsigned MinNumIter = std::max(ForcedFactor * ForcedUnroll, 2U);
8240456327cSAdam Nemet 
825751004a6SHao Liu   // It's not vectorizable if the distance is smaller than the minimum distance
826751004a6SHao Liu   // needed for a vectroized/unrolled version. Vectorizing one iteration in
827751004a6SHao Liu   // front needs TypeByteSize * Stride. Vectorizing the last iteration needs
828751004a6SHao Liu   // TypeByteSize (No need to plus the last gap distance).
829751004a6SHao Liu   //
830751004a6SHao Liu   // E.g. Assume one char is 1 byte in memory and one int is 4 bytes.
831751004a6SHao Liu   //      foo(int *A) {
832751004a6SHao Liu   //        int *B = (int *)((char *)A + 14);
833751004a6SHao Liu   //        for (i = 0 ; i < 1024 ; i += 2)
834751004a6SHao Liu   //          B[i] = A[i] + 1;
835751004a6SHao Liu   //      }
836751004a6SHao Liu   //
837751004a6SHao Liu   // Two accesses in memory (stride is 2):
838751004a6SHao Liu   //     | A[0] |      | A[2] |      | A[4] |      | A[6] |      |
839751004a6SHao Liu   //                              | B[0] |      | B[2] |      | B[4] |
840751004a6SHao Liu   //
841751004a6SHao Liu   // Distance needs for vectorizing iterations except the last iteration:
842751004a6SHao Liu   // 4 * 2 * (MinNumIter - 1). Distance needs for the last iteration: 4.
843751004a6SHao Liu   // So the minimum distance needed is: 4 * 2 * (MinNumIter - 1) + 4.
844751004a6SHao Liu   //
845751004a6SHao Liu   // If MinNumIter is 2, it is vectorizable as the minimum distance needed is
846751004a6SHao Liu   // 12, which is less than distance.
847751004a6SHao Liu   //
848751004a6SHao Liu   // If MinNumIter is 4 (Say if a user forces the vectorization factor to be 4),
849751004a6SHao Liu   // the minimum distance needed is 28, which is greater than distance. It is
850751004a6SHao Liu   // not safe to do vectorization.
851751004a6SHao Liu   unsigned MinDistanceNeeded =
852751004a6SHao Liu       TypeByteSize * Stride * (MinNumIter - 1) + TypeByteSize;
853751004a6SHao Liu   if (MinDistanceNeeded > Distance) {
854751004a6SHao Liu     DEBUG(dbgs() << "LAA: Failure because of positive distance " << Distance
855751004a6SHao Liu                  << '\n');
856751004a6SHao Liu     return Dependence::Backward;
857751004a6SHao Liu   }
858751004a6SHao Liu 
859751004a6SHao Liu   // Unsafe if the minimum distance needed is greater than max safe distance.
860751004a6SHao Liu   if (MinDistanceNeeded > MaxSafeDepDistBytes) {
861751004a6SHao Liu     DEBUG(dbgs() << "LAA: Failure because it needs at least "
862751004a6SHao Liu                  << MinDistanceNeeded << " size in bytes");
8639c926579SAdam Nemet     return Dependence::Backward;
8640456327cSAdam Nemet   }
8650456327cSAdam Nemet 
8669cc0c399SAdam Nemet   // Positive distance bigger than max vectorization factor.
867751004a6SHao Liu   // FIXME: Should use max factor instead of max distance in bytes, which could
868751004a6SHao Liu   // not handle different types.
869751004a6SHao Liu   // E.g. Assume one char is 1 byte in memory and one int is 4 bytes.
870751004a6SHao Liu   //      void foo (int *A, char *B) {
871751004a6SHao Liu   //        for (unsigned i = 0; i < 1024; i++) {
872751004a6SHao Liu   //          A[i+2] = A[i] + 1;
873751004a6SHao Liu   //          B[i+2] = B[i] + 1;
874751004a6SHao Liu   //        }
875751004a6SHao Liu   //      }
876751004a6SHao Liu   //
877751004a6SHao Liu   // This case is currently unsafe according to the max safe distance. If we
878751004a6SHao Liu   // analyze the two accesses on array B, the max safe dependence distance
879751004a6SHao Liu   // is 2. Then we analyze the accesses on array A, the minimum distance needed
880751004a6SHao Liu   // is 8, which is less than 2 and forbidden vectorization, But actually
881751004a6SHao Liu   // both A and B could be vectorized by 2 iterations.
882751004a6SHao Liu   MaxSafeDepDistBytes =
883751004a6SHao Liu       Distance < MaxSafeDepDistBytes ? Distance : MaxSafeDepDistBytes;
8840456327cSAdam Nemet 
8850456327cSAdam Nemet   bool IsTrueDataDependence = (!AIsWrite && BIsWrite);
8860456327cSAdam Nemet   if (IsTrueDataDependence &&
8870456327cSAdam Nemet       couldPreventStoreLoadForward(Distance, TypeByteSize))
8889c926579SAdam Nemet     return Dependence::BackwardVectorizableButPreventsForwarding;
8890456327cSAdam Nemet 
890751004a6SHao Liu   DEBUG(dbgs() << "LAA: Positive distance " << Val.getSExtValue()
891751004a6SHao Liu                << " with max VF = "
892751004a6SHao Liu                << MaxSafeDepDistBytes / (TypeByteSize * Stride) << '\n');
8930456327cSAdam Nemet 
8949c926579SAdam Nemet   return Dependence::BackwardVectorizable;
8950456327cSAdam Nemet }
8960456327cSAdam Nemet 
897dee666bcSAdam Nemet bool MemoryDepChecker::areDepsSafe(DepCandidates &AccessSets,
8980456327cSAdam Nemet                                    MemAccessInfoSet &CheckDeps,
8998bc61df9SAdam Nemet                                    const ValueToValueMap &Strides) {
9000456327cSAdam Nemet 
9010456327cSAdam Nemet   MaxSafeDepDistBytes = -1U;
9020456327cSAdam Nemet   while (!CheckDeps.empty()) {
9030456327cSAdam Nemet     MemAccessInfo CurAccess = *CheckDeps.begin();
9040456327cSAdam Nemet 
9050456327cSAdam Nemet     // Get the relevant memory access set.
9060456327cSAdam Nemet     EquivalenceClasses<MemAccessInfo>::iterator I =
9070456327cSAdam Nemet       AccessSets.findValue(AccessSets.getLeaderValue(CurAccess));
9080456327cSAdam Nemet 
9090456327cSAdam Nemet     // Check accesses within this set.
9100456327cSAdam Nemet     EquivalenceClasses<MemAccessInfo>::member_iterator AI, AE;
9110456327cSAdam Nemet     AI = AccessSets.member_begin(I), AE = AccessSets.member_end();
9120456327cSAdam Nemet 
9130456327cSAdam Nemet     // Check every access pair.
9140456327cSAdam Nemet     while (AI != AE) {
9150456327cSAdam Nemet       CheckDeps.erase(*AI);
9160456327cSAdam Nemet       EquivalenceClasses<MemAccessInfo>::member_iterator OI = std::next(AI);
9170456327cSAdam Nemet       while (OI != AE) {
9180456327cSAdam Nemet         // Check every accessing instruction pair in program order.
9190456327cSAdam Nemet         for (std::vector<unsigned>::iterator I1 = Accesses[*AI].begin(),
9200456327cSAdam Nemet              I1E = Accesses[*AI].end(); I1 != I1E; ++I1)
9210456327cSAdam Nemet           for (std::vector<unsigned>::iterator I2 = Accesses[*OI].begin(),
9220456327cSAdam Nemet                I2E = Accesses[*OI].end(); I2 != I2E; ++I2) {
9239c926579SAdam Nemet             auto A = std::make_pair(&*AI, *I1);
9249c926579SAdam Nemet             auto B = std::make_pair(&*OI, *I2);
9259c926579SAdam Nemet 
9269c926579SAdam Nemet             assert(*I1 != *I2);
9279c926579SAdam Nemet             if (*I1 > *I2)
9289c926579SAdam Nemet               std::swap(A, B);
9299c926579SAdam Nemet 
9309c926579SAdam Nemet             Dependence::DepType Type =
9319c926579SAdam Nemet                 isDependent(*A.first, A.second, *B.first, B.second, Strides);
9329c926579SAdam Nemet             SafeForVectorization &= Dependence::isSafeForVectorization(Type);
9339c926579SAdam Nemet 
9349c926579SAdam Nemet             // Gather dependences unless we accumulated MaxInterestingDependence
9359c926579SAdam Nemet             // dependences.  In that case return as soon as we find the first
9369c926579SAdam Nemet             // unsafe dependence.  This puts a limit on this quadratic
9379c926579SAdam Nemet             // algorithm.
9389c926579SAdam Nemet             if (RecordInterestingDependences) {
9399c926579SAdam Nemet               if (Dependence::isInterestingDependence(Type))
9409c926579SAdam Nemet                 InterestingDependences.push_back(
9419c926579SAdam Nemet                     Dependence(A.second, B.second, Type));
9429c926579SAdam Nemet 
9439c926579SAdam Nemet               if (InterestingDependences.size() >= MaxInterestingDependence) {
9449c926579SAdam Nemet                 RecordInterestingDependences = false;
9459c926579SAdam Nemet                 InterestingDependences.clear();
9469c926579SAdam Nemet                 DEBUG(dbgs() << "Too many dependences, stopped recording\n");
9479c926579SAdam Nemet               }
9489c926579SAdam Nemet             }
9499c926579SAdam Nemet             if (!RecordInterestingDependences && !SafeForVectorization)
9500456327cSAdam Nemet               return false;
9510456327cSAdam Nemet           }
9520456327cSAdam Nemet         ++OI;
9530456327cSAdam Nemet       }
9540456327cSAdam Nemet       AI++;
9550456327cSAdam Nemet     }
9560456327cSAdam Nemet   }
9579c926579SAdam Nemet 
9589c926579SAdam Nemet   DEBUG(dbgs() << "Total Interesting Dependences: "
9599c926579SAdam Nemet                << InterestingDependences.size() << "\n");
9609c926579SAdam Nemet   return SafeForVectorization;
9610456327cSAdam Nemet }
9620456327cSAdam Nemet 
963ec1e2bb6SAdam Nemet SmallVector<Instruction *, 4>
964ec1e2bb6SAdam Nemet MemoryDepChecker::getInstructionsForAccess(Value *Ptr, bool isWrite) const {
965ec1e2bb6SAdam Nemet   MemAccessInfo Access(Ptr, isWrite);
966ec1e2bb6SAdam Nemet   auto &IndexVector = Accesses.find(Access)->second;
967ec1e2bb6SAdam Nemet 
968ec1e2bb6SAdam Nemet   SmallVector<Instruction *, 4> Insts;
969ec1e2bb6SAdam Nemet   std::transform(IndexVector.begin(), IndexVector.end(),
970ec1e2bb6SAdam Nemet                  std::back_inserter(Insts),
971ec1e2bb6SAdam Nemet                  [&](unsigned Idx) { return this->InstMap[Idx]; });
972ec1e2bb6SAdam Nemet   return Insts;
973ec1e2bb6SAdam Nemet }
974ec1e2bb6SAdam Nemet 
97558913d65SAdam Nemet const char *MemoryDepChecker::Dependence::DepName[] = {
97658913d65SAdam Nemet     "NoDep", "Unknown", "Forward", "ForwardButPreventsForwarding", "Backward",
97758913d65SAdam Nemet     "BackwardVectorizable", "BackwardVectorizableButPreventsForwarding"};
97858913d65SAdam Nemet 
97958913d65SAdam Nemet void MemoryDepChecker::Dependence::print(
98058913d65SAdam Nemet     raw_ostream &OS, unsigned Depth,
98158913d65SAdam Nemet     const SmallVectorImpl<Instruction *> &Instrs) const {
98258913d65SAdam Nemet   OS.indent(Depth) << DepName[Type] << ":\n";
98358913d65SAdam Nemet   OS.indent(Depth + 2) << *Instrs[Source] << " -> \n";
98458913d65SAdam Nemet   OS.indent(Depth + 2) << *Instrs[Destination] << "\n";
98558913d65SAdam Nemet }
98658913d65SAdam Nemet 
987929c38e8SAdam Nemet bool LoopAccessInfo::canAnalyzeLoop() {
9888dcb3b6aSAdam Nemet   // We need to have a loop header.
9898dcb3b6aSAdam Nemet   DEBUG(dbgs() << "LAA: Found a loop: " <<
9908dcb3b6aSAdam Nemet         TheLoop->getHeader()->getName() << '\n');
9918dcb3b6aSAdam Nemet 
992929c38e8SAdam Nemet     // We can only analyze innermost loops.
993929c38e8SAdam Nemet   if (!TheLoop->empty()) {
9948dcb3b6aSAdam Nemet     DEBUG(dbgs() << "LAA: loop is not the innermost loop\n");
9952bd6e984SAdam Nemet     emitAnalysis(LoopAccessReport() << "loop is not the innermost loop");
996929c38e8SAdam Nemet     return false;
997929c38e8SAdam Nemet   }
998929c38e8SAdam Nemet 
999929c38e8SAdam Nemet   // We must have a single backedge.
1000929c38e8SAdam Nemet   if (TheLoop->getNumBackEdges() != 1) {
10018dcb3b6aSAdam Nemet     DEBUG(dbgs() << "LAA: loop control flow is not understood by analyzer\n");
1002929c38e8SAdam Nemet     emitAnalysis(
10032bd6e984SAdam Nemet         LoopAccessReport() <<
1004929c38e8SAdam Nemet         "loop control flow is not understood by analyzer");
1005929c38e8SAdam Nemet     return false;
1006929c38e8SAdam Nemet   }
1007929c38e8SAdam Nemet 
1008929c38e8SAdam Nemet   // We must have a single exiting block.
1009929c38e8SAdam Nemet   if (!TheLoop->getExitingBlock()) {
10108dcb3b6aSAdam Nemet     DEBUG(dbgs() << "LAA: loop control flow is not understood by analyzer\n");
1011929c38e8SAdam Nemet     emitAnalysis(
10122bd6e984SAdam Nemet         LoopAccessReport() <<
1013929c38e8SAdam Nemet         "loop control flow is not understood by analyzer");
1014929c38e8SAdam Nemet     return false;
1015929c38e8SAdam Nemet   }
1016929c38e8SAdam Nemet 
1017929c38e8SAdam Nemet   // We only handle bottom-tested loops, i.e. loop in which the condition is
1018929c38e8SAdam Nemet   // checked at the end of each iteration. With that we can assume that all
1019929c38e8SAdam Nemet   // instructions in the loop are executed the same number of times.
1020929c38e8SAdam Nemet   if (TheLoop->getExitingBlock() != TheLoop->getLoopLatch()) {
10218dcb3b6aSAdam Nemet     DEBUG(dbgs() << "LAA: loop control flow is not understood by analyzer\n");
1022929c38e8SAdam Nemet     emitAnalysis(
10232bd6e984SAdam Nemet         LoopAccessReport() <<
1024929c38e8SAdam Nemet         "loop control flow is not understood by analyzer");
1025929c38e8SAdam Nemet     return false;
1026929c38e8SAdam Nemet   }
1027929c38e8SAdam Nemet 
1028929c38e8SAdam Nemet   // ScalarEvolution needs to be able to find the exit count.
1029929c38e8SAdam Nemet   const SCEV *ExitCount = SE->getBackedgeTakenCount(TheLoop);
1030929c38e8SAdam Nemet   if (ExitCount == SE->getCouldNotCompute()) {
10312bd6e984SAdam Nemet     emitAnalysis(LoopAccessReport() <<
1032929c38e8SAdam Nemet                  "could not determine number of loop iterations");
1033929c38e8SAdam Nemet     DEBUG(dbgs() << "LAA: SCEV could not compute the loop exit count.\n");
1034929c38e8SAdam Nemet     return false;
1035929c38e8SAdam Nemet   }
1036929c38e8SAdam Nemet 
1037929c38e8SAdam Nemet   return true;
1038929c38e8SAdam Nemet }
1039929c38e8SAdam Nemet 
10408bc61df9SAdam Nemet void LoopAccessInfo::analyzeLoop(const ValueToValueMap &Strides) {
10410456327cSAdam Nemet 
10420456327cSAdam Nemet   typedef SmallVector<Value*, 16> ValueVector;
10430456327cSAdam Nemet   typedef SmallPtrSet<Value*, 16> ValueSet;
10440456327cSAdam Nemet 
10450456327cSAdam Nemet   // Holds the Load and Store *instructions*.
10460456327cSAdam Nemet   ValueVector Loads;
10470456327cSAdam Nemet   ValueVector Stores;
10480456327cSAdam Nemet 
10490456327cSAdam Nemet   // Holds all the different accesses in the loop.
10500456327cSAdam Nemet   unsigned NumReads = 0;
10510456327cSAdam Nemet   unsigned NumReadWrites = 0;
10520456327cSAdam Nemet 
10530456327cSAdam Nemet   PtrRtCheck.Pointers.clear();
10540456327cSAdam Nemet   PtrRtCheck.Need = false;
10550456327cSAdam Nemet 
10560456327cSAdam Nemet   const bool IsAnnotatedParallel = TheLoop->isAnnotatedParallel();
10570456327cSAdam Nemet 
10580456327cSAdam Nemet   // For each block.
10590456327cSAdam Nemet   for (Loop::block_iterator bb = TheLoop->block_begin(),
10600456327cSAdam Nemet        be = TheLoop->block_end(); bb != be; ++bb) {
10610456327cSAdam Nemet 
10620456327cSAdam Nemet     // Scan the BB and collect legal loads and stores.
10630456327cSAdam Nemet     for (BasicBlock::iterator it = (*bb)->begin(), e = (*bb)->end(); it != e;
10640456327cSAdam Nemet          ++it) {
10650456327cSAdam Nemet 
10660456327cSAdam Nemet       // If this is a load, save it. If this instruction can read from memory
10670456327cSAdam Nemet       // but is not a load, then we quit. Notice that we don't handle function
10680456327cSAdam Nemet       // calls that read or write.
10690456327cSAdam Nemet       if (it->mayReadFromMemory()) {
10700456327cSAdam Nemet         // Many math library functions read the rounding mode. We will only
10710456327cSAdam Nemet         // vectorize a loop if it contains known function calls that don't set
10720456327cSAdam Nemet         // the flag. Therefore, it is safe to ignore this read from memory.
10730456327cSAdam Nemet         CallInst *Call = dyn_cast<CallInst>(it);
10740456327cSAdam Nemet         if (Call && getIntrinsicIDForCall(Call, TLI))
10750456327cSAdam Nemet           continue;
10760456327cSAdam Nemet 
10779b3cf604SMichael Zolotukhin         // If the function has an explicit vectorized counterpart, we can safely
10789b3cf604SMichael Zolotukhin         // assume that it can be vectorized.
10799b3cf604SMichael Zolotukhin         if (Call && !Call->isNoBuiltin() && Call->getCalledFunction() &&
10809b3cf604SMichael Zolotukhin             TLI->isFunctionVectorizable(Call->getCalledFunction()->getName()))
10819b3cf604SMichael Zolotukhin           continue;
10829b3cf604SMichael Zolotukhin 
10830456327cSAdam Nemet         LoadInst *Ld = dyn_cast<LoadInst>(it);
10840456327cSAdam Nemet         if (!Ld || (!Ld->isSimple() && !IsAnnotatedParallel)) {
10852bd6e984SAdam Nemet           emitAnalysis(LoopAccessReport(Ld)
10860456327cSAdam Nemet                        << "read with atomic ordering or volatile read");
1087339f42b3SAdam Nemet           DEBUG(dbgs() << "LAA: Found a non-simple load.\n");
1088436018c3SAdam Nemet           CanVecMem = false;
1089436018c3SAdam Nemet           return;
10900456327cSAdam Nemet         }
10910456327cSAdam Nemet         NumLoads++;
10920456327cSAdam Nemet         Loads.push_back(Ld);
10930456327cSAdam Nemet         DepChecker.addAccess(Ld);
10940456327cSAdam Nemet         continue;
10950456327cSAdam Nemet       }
10960456327cSAdam Nemet 
10970456327cSAdam Nemet       // Save 'store' instructions. Abort if other instructions write to memory.
10980456327cSAdam Nemet       if (it->mayWriteToMemory()) {
10990456327cSAdam Nemet         StoreInst *St = dyn_cast<StoreInst>(it);
11000456327cSAdam Nemet         if (!St) {
11012bd6e984SAdam Nemet           emitAnalysis(LoopAccessReport(it) <<
110204d4163eSAdam Nemet                        "instruction cannot be vectorized");
1103436018c3SAdam Nemet           CanVecMem = false;
1104436018c3SAdam Nemet           return;
11050456327cSAdam Nemet         }
11060456327cSAdam Nemet         if (!St->isSimple() && !IsAnnotatedParallel) {
11072bd6e984SAdam Nemet           emitAnalysis(LoopAccessReport(St)
11080456327cSAdam Nemet                        << "write with atomic ordering or volatile write");
1109339f42b3SAdam Nemet           DEBUG(dbgs() << "LAA: Found a non-simple store.\n");
1110436018c3SAdam Nemet           CanVecMem = false;
1111436018c3SAdam Nemet           return;
11120456327cSAdam Nemet         }
11130456327cSAdam Nemet         NumStores++;
11140456327cSAdam Nemet         Stores.push_back(St);
11150456327cSAdam Nemet         DepChecker.addAccess(St);
11160456327cSAdam Nemet       }
11170456327cSAdam Nemet     } // Next instr.
11180456327cSAdam Nemet   } // Next block.
11190456327cSAdam Nemet 
11200456327cSAdam Nemet   // Now we have two lists that hold the loads and the stores.
11210456327cSAdam Nemet   // Next, we find the pointers that they use.
11220456327cSAdam Nemet 
11230456327cSAdam Nemet   // Check if we see any stores. If there are no stores, then we don't
11240456327cSAdam Nemet   // care if the pointers are *restrict*.
11250456327cSAdam Nemet   if (!Stores.size()) {
1126339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Found a read-only loop!\n");
1127436018c3SAdam Nemet     CanVecMem = true;
1128436018c3SAdam Nemet     return;
11290456327cSAdam Nemet   }
11300456327cSAdam Nemet 
1131dee666bcSAdam Nemet   MemoryDepChecker::DepCandidates DependentAccesses;
1132a28d91d8SMehdi Amini   AccessAnalysis Accesses(TheLoop->getHeader()->getModule()->getDataLayout(),
1133e2b885c4SAdam Nemet                           AA, LI, DependentAccesses);
11340456327cSAdam Nemet 
11350456327cSAdam Nemet   // Holds the analyzed pointers. We don't want to call GetUnderlyingObjects
11360456327cSAdam Nemet   // multiple times on the same object. If the ptr is accessed twice, once
11370456327cSAdam Nemet   // for read and once for write, it will only appear once (on the write
11380456327cSAdam Nemet   // list). This is okay, since we are going to check for conflicts between
11390456327cSAdam Nemet   // writes and between reads and writes, but not between reads and reads.
11400456327cSAdam Nemet   ValueSet Seen;
11410456327cSAdam Nemet 
11420456327cSAdam Nemet   ValueVector::iterator I, IE;
11430456327cSAdam Nemet   for (I = Stores.begin(), IE = Stores.end(); I != IE; ++I) {
11440456327cSAdam Nemet     StoreInst *ST = cast<StoreInst>(*I);
11450456327cSAdam Nemet     Value* Ptr = ST->getPointerOperand();
1146ce48250fSAdam Nemet     // Check for store to loop invariant address.
1147ce48250fSAdam Nemet     StoreToLoopInvariantAddress |= isUniform(Ptr);
11480456327cSAdam Nemet     // If we did *not* see this pointer before, insert it to  the read-write
11490456327cSAdam Nemet     // list. At this phase it is only a 'write' list.
11500456327cSAdam Nemet     if (Seen.insert(Ptr).second) {
11510456327cSAdam Nemet       ++NumReadWrites;
11520456327cSAdam Nemet 
1153ac80dc75SChandler Carruth       MemoryLocation Loc = MemoryLocation::get(ST);
11540456327cSAdam Nemet       // The TBAA metadata could have a control dependency on the predication
11550456327cSAdam Nemet       // condition, so we cannot rely on it when determining whether or not we
11560456327cSAdam Nemet       // need runtime pointer checks.
115701abb2c3SAdam Nemet       if (blockNeedsPredication(ST->getParent(), TheLoop, DT))
11580456327cSAdam Nemet         Loc.AATags.TBAA = nullptr;
11590456327cSAdam Nemet 
11600456327cSAdam Nemet       Accesses.addStore(Loc);
11610456327cSAdam Nemet     }
11620456327cSAdam Nemet   }
11630456327cSAdam Nemet 
11640456327cSAdam Nemet   if (IsAnnotatedParallel) {
116504d4163eSAdam Nemet     DEBUG(dbgs()
1166339f42b3SAdam Nemet           << "LAA: A loop annotated parallel, ignore memory dependency "
11670456327cSAdam Nemet           << "checks.\n");
1168436018c3SAdam Nemet     CanVecMem = true;
1169436018c3SAdam Nemet     return;
11700456327cSAdam Nemet   }
11710456327cSAdam Nemet 
11720456327cSAdam Nemet   for (I = Loads.begin(), IE = Loads.end(); I != IE; ++I) {
11730456327cSAdam Nemet     LoadInst *LD = cast<LoadInst>(*I);
11740456327cSAdam Nemet     Value* Ptr = LD->getPointerOperand();
11750456327cSAdam Nemet     // If we did *not* see this pointer before, insert it to the
11760456327cSAdam Nemet     // read list. If we *did* see it before, then it is already in
11770456327cSAdam Nemet     // the read-write list. This allows us to vectorize expressions
11780456327cSAdam Nemet     // such as A[i] += x;  Because the address of A[i] is a read-write
11790456327cSAdam Nemet     // pointer. This only works if the index of A[i] is consecutive.
11800456327cSAdam Nemet     // If the address of i is unknown (for example A[B[i]]) then we may
11810456327cSAdam Nemet     // read a few words, modify, and write a few words, and some of the
11820456327cSAdam Nemet     // words may be written to the same address.
11830456327cSAdam Nemet     bool IsReadOnlyPtr = false;
1184a28d91d8SMehdi Amini     if (Seen.insert(Ptr).second || !isStridedPtr(SE, Ptr, TheLoop, Strides)) {
11850456327cSAdam Nemet       ++NumReads;
11860456327cSAdam Nemet       IsReadOnlyPtr = true;
11870456327cSAdam Nemet     }
11880456327cSAdam Nemet 
1189ac80dc75SChandler Carruth     MemoryLocation Loc = MemoryLocation::get(LD);
11900456327cSAdam Nemet     // The TBAA metadata could have a control dependency on the predication
11910456327cSAdam Nemet     // condition, so we cannot rely on it when determining whether or not we
11920456327cSAdam Nemet     // need runtime pointer checks.
119301abb2c3SAdam Nemet     if (blockNeedsPredication(LD->getParent(), TheLoop, DT))
11940456327cSAdam Nemet       Loc.AATags.TBAA = nullptr;
11950456327cSAdam Nemet 
11960456327cSAdam Nemet     Accesses.addLoad(Loc, IsReadOnlyPtr);
11970456327cSAdam Nemet   }
11980456327cSAdam Nemet 
11990456327cSAdam Nemet   // If we write (or read-write) to a single destination and there are no
12000456327cSAdam Nemet   // other reads in this loop then is it safe to vectorize.
12010456327cSAdam Nemet   if (NumReadWrites == 1 && NumReads == 0) {
1202339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Found a write-only loop!\n");
1203436018c3SAdam Nemet     CanVecMem = true;
1204436018c3SAdam Nemet     return;
12050456327cSAdam Nemet   }
12060456327cSAdam Nemet 
12070456327cSAdam Nemet   // Build dependence sets and check whether we need a runtime pointer bounds
12080456327cSAdam Nemet   // check.
12090456327cSAdam Nemet   Accesses.buildDependenceSets();
12100456327cSAdam Nemet 
12110456327cSAdam Nemet   // Find pointers with computable bounds. We are going to use this information
12120456327cSAdam Nemet   // to place a runtime bound check.
121398a13719SSilviu Baranga   bool NeedRTCheck;
121498a13719SSilviu Baranga   bool CanDoRT = Accesses.canCheckPtrAtRT(PtrRtCheck,
121598a13719SSilviu Baranga                                           NeedRTCheck, SE,
121698a13719SSilviu Baranga                                           TheLoop, Strides);
12170456327cSAdam Nemet 
121898a13719SSilviu Baranga   DEBUG(dbgs() << "LAA: We need to do "
121998a13719SSilviu Baranga                << PtrRtCheck.getNumberOfChecks(nullptr)
122098a13719SSilviu Baranga                << " pointer comparisons.\n");
12210456327cSAdam Nemet 
1222949e91a6SAdam Nemet   // Check that we found the bounds for the pointer.
1223b6dc76ffSAdam Nemet   if (CanDoRT)
1224339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: We can perform a memory runtime check if needed.\n");
1225b6dc76ffSAdam Nemet   else if (NeedRTCheck) {
12262bd6e984SAdam Nemet     emitAnalysis(LoopAccessReport() << "cannot identify array bounds");
1227339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: We can't vectorize because we can't find " <<
122804d4163eSAdam Nemet           "the array bounds.\n");
12290456327cSAdam Nemet     PtrRtCheck.reset();
1230436018c3SAdam Nemet     CanVecMem = false;
1231436018c3SAdam Nemet     return;
12320456327cSAdam Nemet   }
12330456327cSAdam Nemet 
12340456327cSAdam Nemet   PtrRtCheck.Need = NeedRTCheck;
12350456327cSAdam Nemet 
1236436018c3SAdam Nemet   CanVecMem = true;
12370456327cSAdam Nemet   if (Accesses.isDependencyCheckNeeded()) {
1238339f42b3SAdam Nemet     DEBUG(dbgs() << "LAA: Checking memory dependencies\n");
12390456327cSAdam Nemet     CanVecMem = DepChecker.areDepsSafe(
12400456327cSAdam Nemet         DependentAccesses, Accesses.getDependenciesToCheck(), Strides);
12410456327cSAdam Nemet     MaxSafeDepDistBytes = DepChecker.getMaxSafeDepDistBytes();
12420456327cSAdam Nemet 
12430456327cSAdam Nemet     if (!CanVecMem && DepChecker.shouldRetryWithRuntimeCheck()) {
1244339f42b3SAdam Nemet       DEBUG(dbgs() << "LAA: Retrying with memory checks\n");
12450456327cSAdam Nemet       NeedRTCheck = true;
12460456327cSAdam Nemet 
12470456327cSAdam Nemet       // Clear the dependency checks. We assume they are not needed.
1248df3dc5b9SAdam Nemet       Accesses.resetDepChecks(DepChecker);
12490456327cSAdam Nemet 
12500456327cSAdam Nemet       PtrRtCheck.reset();
12510456327cSAdam Nemet       PtrRtCheck.Need = true;
12520456327cSAdam Nemet 
125398a13719SSilviu Baranga       CanDoRT = Accesses.canCheckPtrAtRT(PtrRtCheck, NeedRTCheck, SE,
12540456327cSAdam Nemet                                          TheLoop, Strides, true);
125598a13719SSilviu Baranga 
1256949e91a6SAdam Nemet       // Check that we found the bounds for the pointer.
125798a13719SSilviu Baranga       if (NeedRTCheck && !CanDoRT) {
12582bd6e984SAdam Nemet         emitAnalysis(LoopAccessReport()
12590456327cSAdam Nemet                      << "cannot check memory dependencies at runtime");
1260b6dc76ffSAdam Nemet         DEBUG(dbgs() << "LAA: Can't vectorize with memory checks\n");
1261b6dc76ffSAdam Nemet         PtrRtCheck.reset();
1262b6dc76ffSAdam Nemet         CanVecMem = false;
1263b6dc76ffSAdam Nemet         return;
1264b6dc76ffSAdam Nemet       }
1265b6dc76ffSAdam Nemet 
12660456327cSAdam Nemet       CanVecMem = true;
12670456327cSAdam Nemet     }
12680456327cSAdam Nemet   }
12690456327cSAdam Nemet 
12704bb90a71SAdam Nemet   if (CanVecMem)
12714bb90a71SAdam Nemet     DEBUG(dbgs() << "LAA: No unsafe dependent memory operations in loop.  We"
12724bb90a71SAdam Nemet                  << (NeedRTCheck ? "" : " don't")
12734bb90a71SAdam Nemet                  << " need a runtime memory check.\n");
12744bb90a71SAdam Nemet   else {
12752bd6e984SAdam Nemet     emitAnalysis(LoopAccessReport() <<
127604d4163eSAdam Nemet                  "unsafe dependent memory operations in loop");
12774bb90a71SAdam Nemet     DEBUG(dbgs() << "LAA: unsafe dependent memory operations in loop\n");
12784bb90a71SAdam Nemet   }
12790456327cSAdam Nemet }
12800456327cSAdam Nemet 
128101abb2c3SAdam Nemet bool LoopAccessInfo::blockNeedsPredication(BasicBlock *BB, Loop *TheLoop,
128201abb2c3SAdam Nemet                                            DominatorTree *DT)  {
12830456327cSAdam Nemet   assert(TheLoop->contains(BB) && "Unknown block used");
12840456327cSAdam Nemet 
12850456327cSAdam Nemet   // Blocks that do not dominate the latch need predication.
12860456327cSAdam Nemet   BasicBlock* Latch = TheLoop->getLoopLatch();
12870456327cSAdam Nemet   return !DT->dominates(BB, Latch);
12880456327cSAdam Nemet }
12890456327cSAdam Nemet 
12902bd6e984SAdam Nemet void LoopAccessInfo::emitAnalysis(LoopAccessReport &Message) {
1291c922853bSAdam Nemet   assert(!Report && "Multiple reports generated");
1292c922853bSAdam Nemet   Report = Message;
12930456327cSAdam Nemet }
12940456327cSAdam Nemet 
129557ac766eSAdam Nemet bool LoopAccessInfo::isUniform(Value *V) const {
12960456327cSAdam Nemet   return (SE->isLoopInvariant(SE->getSCEV(V), TheLoop));
12970456327cSAdam Nemet }
12987206d7a5SAdam Nemet 
12997206d7a5SAdam Nemet // FIXME: this function is currently a duplicate of the one in
13007206d7a5SAdam Nemet // LoopVectorize.cpp.
13017206d7a5SAdam Nemet static Instruction *getFirstInst(Instruction *FirstInst, Value *V,
13027206d7a5SAdam Nemet                                  Instruction *Loc) {
13037206d7a5SAdam Nemet   if (FirstInst)
13047206d7a5SAdam Nemet     return FirstInst;
13057206d7a5SAdam Nemet   if (Instruction *I = dyn_cast<Instruction>(V))
13067206d7a5SAdam Nemet     return I->getParent() == Loc->getParent() ? I : nullptr;
13077206d7a5SAdam Nemet   return nullptr;
13087206d7a5SAdam Nemet }
13097206d7a5SAdam Nemet 
1310ec1e2bb6SAdam Nemet std::pair<Instruction *, Instruction *> LoopAccessInfo::addRuntimeCheck(
1311ec1e2bb6SAdam Nemet     Instruction *Loc, const SmallVectorImpl<int> *PtrPartition) const {
13127206d7a5SAdam Nemet   if (!PtrRtCheck.Need)
131390fec840SAdam Nemet     return std::make_pair(nullptr, nullptr);
13147206d7a5SAdam Nemet 
13157206d7a5SAdam Nemet   unsigned NumPointers = PtrRtCheck.Pointers.size();
13167206d7a5SAdam Nemet   SmallVector<TrackingVH<Value> , 2> Starts;
13177206d7a5SAdam Nemet   SmallVector<TrackingVH<Value> , 2> Ends;
13187206d7a5SAdam Nemet 
13197206d7a5SAdam Nemet   LLVMContext &Ctx = Loc->getContext();
1320a28d91d8SMehdi Amini   SCEVExpander Exp(*SE, DL, "induction");
13217206d7a5SAdam Nemet   Instruction *FirstInst = nullptr;
13227206d7a5SAdam Nemet 
13237206d7a5SAdam Nemet   for (unsigned i = 0; i < NumPointers; ++i) {
13247206d7a5SAdam Nemet     Value *Ptr = PtrRtCheck.Pointers[i];
13257206d7a5SAdam Nemet     const SCEV *Sc = SE->getSCEV(Ptr);
13267206d7a5SAdam Nemet 
13277206d7a5SAdam Nemet     if (SE->isLoopInvariant(Sc, TheLoop)) {
1328339f42b3SAdam Nemet       DEBUG(dbgs() << "LAA: Adding RT check for a loop invariant ptr:" <<
132904d4163eSAdam Nemet             *Ptr <<"\n");
13307206d7a5SAdam Nemet       Starts.push_back(Ptr);
13317206d7a5SAdam Nemet       Ends.push_back(Ptr);
13327206d7a5SAdam Nemet     } else {
1333339f42b3SAdam Nemet       DEBUG(dbgs() << "LAA: Adding RT check for range:" << *Ptr << '\n');
13347206d7a5SAdam Nemet       unsigned AS = Ptr->getType()->getPointerAddressSpace();
13357206d7a5SAdam Nemet 
13367206d7a5SAdam Nemet       // Use this type for pointer arithmetic.
13377206d7a5SAdam Nemet       Type *PtrArithTy = Type::getInt8PtrTy(Ctx, AS);
13387206d7a5SAdam Nemet 
13397206d7a5SAdam Nemet       Value *Start = Exp.expandCodeFor(PtrRtCheck.Starts[i], PtrArithTy, Loc);
13407206d7a5SAdam Nemet       Value *End = Exp.expandCodeFor(PtrRtCheck.Ends[i], PtrArithTy, Loc);
13417206d7a5SAdam Nemet       Starts.push_back(Start);
13427206d7a5SAdam Nemet       Ends.push_back(End);
13437206d7a5SAdam Nemet     }
13447206d7a5SAdam Nemet   }
13457206d7a5SAdam Nemet 
13467206d7a5SAdam Nemet   IRBuilder<> ChkBuilder(Loc);
13477206d7a5SAdam Nemet   // Our instructions might fold to a constant.
13487206d7a5SAdam Nemet   Value *MemoryRuntimeCheck = nullptr;
13497206d7a5SAdam Nemet   for (unsigned i = 0; i < NumPointers; ++i) {
13507206d7a5SAdam Nemet     for (unsigned j = i+1; j < NumPointers; ++j) {
1351ec1e2bb6SAdam Nemet       if (!PtrRtCheck.needsChecking(i, j, PtrPartition))
13527206d7a5SAdam Nemet         continue;
13537206d7a5SAdam Nemet 
13547206d7a5SAdam Nemet       unsigned AS0 = Starts[i]->getType()->getPointerAddressSpace();
13557206d7a5SAdam Nemet       unsigned AS1 = Starts[j]->getType()->getPointerAddressSpace();
13567206d7a5SAdam Nemet 
13577206d7a5SAdam Nemet       assert((AS0 == Ends[j]->getType()->getPointerAddressSpace()) &&
13587206d7a5SAdam Nemet              (AS1 == Ends[i]->getType()->getPointerAddressSpace()) &&
13597206d7a5SAdam Nemet              "Trying to bounds check pointers with different address spaces");
13607206d7a5SAdam Nemet 
13617206d7a5SAdam Nemet       Type *PtrArithTy0 = Type::getInt8PtrTy(Ctx, AS0);
13627206d7a5SAdam Nemet       Type *PtrArithTy1 = Type::getInt8PtrTy(Ctx, AS1);
13637206d7a5SAdam Nemet 
13647206d7a5SAdam Nemet       Value *Start0 = ChkBuilder.CreateBitCast(Starts[i], PtrArithTy0, "bc");
13657206d7a5SAdam Nemet       Value *Start1 = ChkBuilder.CreateBitCast(Starts[j], PtrArithTy1, "bc");
13667206d7a5SAdam Nemet       Value *End0 =   ChkBuilder.CreateBitCast(Ends[i],   PtrArithTy1, "bc");
13677206d7a5SAdam Nemet       Value *End1 =   ChkBuilder.CreateBitCast(Ends[j],   PtrArithTy0, "bc");
13687206d7a5SAdam Nemet 
13697206d7a5SAdam Nemet       Value *Cmp0 = ChkBuilder.CreateICmpULE(Start0, End1, "bound0");
13707206d7a5SAdam Nemet       FirstInst = getFirstInst(FirstInst, Cmp0, Loc);
13717206d7a5SAdam Nemet       Value *Cmp1 = ChkBuilder.CreateICmpULE(Start1, End0, "bound1");
13727206d7a5SAdam Nemet       FirstInst = getFirstInst(FirstInst, Cmp1, Loc);
13737206d7a5SAdam Nemet       Value *IsConflict = ChkBuilder.CreateAnd(Cmp0, Cmp1, "found.conflict");
13747206d7a5SAdam Nemet       FirstInst = getFirstInst(FirstInst, IsConflict, Loc);
13757206d7a5SAdam Nemet       if (MemoryRuntimeCheck) {
13767206d7a5SAdam Nemet         IsConflict = ChkBuilder.CreateOr(MemoryRuntimeCheck, IsConflict,
13777206d7a5SAdam Nemet                                          "conflict.rdx");
13787206d7a5SAdam Nemet         FirstInst = getFirstInst(FirstInst, IsConflict, Loc);
13797206d7a5SAdam Nemet       }
13807206d7a5SAdam Nemet       MemoryRuntimeCheck = IsConflict;
13817206d7a5SAdam Nemet     }
13827206d7a5SAdam Nemet   }
13837206d7a5SAdam Nemet 
138490fec840SAdam Nemet   if (!MemoryRuntimeCheck)
138590fec840SAdam Nemet     return std::make_pair(nullptr, nullptr);
138690fec840SAdam Nemet 
13877206d7a5SAdam Nemet   // We have to do this trickery because the IRBuilder might fold the check to a
13887206d7a5SAdam Nemet   // constant expression in which case there is no Instruction anchored in a
13897206d7a5SAdam Nemet   // the block.
13907206d7a5SAdam Nemet   Instruction *Check = BinaryOperator::CreateAnd(MemoryRuntimeCheck,
13917206d7a5SAdam Nemet                                                  ConstantInt::getTrue(Ctx));
13927206d7a5SAdam Nemet   ChkBuilder.Insert(Check, "memcheck.conflict");
13937206d7a5SAdam Nemet   FirstInst = getFirstInst(FirstInst, Check, Loc);
13947206d7a5SAdam Nemet   return std::make_pair(FirstInst, Check);
13957206d7a5SAdam Nemet }
13963bfd93d7SAdam Nemet 
13973bfd93d7SAdam Nemet LoopAccessInfo::LoopAccessInfo(Loop *L, ScalarEvolution *SE,
1398a28d91d8SMehdi Amini                                const DataLayout &DL,
13993bfd93d7SAdam Nemet                                const TargetLibraryInfo *TLI, AliasAnalysis *AA,
1400e2b885c4SAdam Nemet                                DominatorTree *DT, LoopInfo *LI,
14018bc61df9SAdam Nemet                                const ValueToValueMap &Strides)
140298a13719SSilviu Baranga     : DepChecker(SE, L), TheLoop(L), SE(SE), DL(DL),
1403e2b885c4SAdam Nemet       TLI(TLI), AA(AA), DT(DT), LI(LI), NumLoads(0), NumStores(0),
1404ce48250fSAdam Nemet       MaxSafeDepDistBytes(-1U), CanVecMem(false),
1405ce48250fSAdam Nemet       StoreToLoopInvariantAddress(false) {
1406929c38e8SAdam Nemet   if (canAnalyzeLoop())
14073bfd93d7SAdam Nemet     analyzeLoop(Strides);
14083bfd93d7SAdam Nemet }
14093bfd93d7SAdam Nemet 
1410e91cc6efSAdam Nemet void LoopAccessInfo::print(raw_ostream &OS, unsigned Depth) const {
1411e91cc6efSAdam Nemet   if (CanVecMem) {
141226da8e98SAdam Nemet     if (PtrRtCheck.Need)
1413e91cc6efSAdam Nemet       OS.indent(Depth) << "Memory dependences are safe with run-time checks\n";
141426da8e98SAdam Nemet     else
141526da8e98SAdam Nemet       OS.indent(Depth) << "Memory dependences are safe\n";
1416e91cc6efSAdam Nemet   }
1417e91cc6efSAdam Nemet 
1418e91cc6efSAdam Nemet   if (Report)
1419e91cc6efSAdam Nemet     OS.indent(Depth) << "Report: " << Report->str() << "\n";
1420e91cc6efSAdam Nemet 
142158913d65SAdam Nemet   if (auto *InterestingDependences = DepChecker.getInterestingDependences()) {
142258913d65SAdam Nemet     OS.indent(Depth) << "Interesting Dependences:\n";
142358913d65SAdam Nemet     for (auto &Dep : *InterestingDependences) {
142458913d65SAdam Nemet       Dep.print(OS, Depth + 2, DepChecker.getMemoryInstructions());
142558913d65SAdam Nemet       OS << "\n";
142658913d65SAdam Nemet     }
142758913d65SAdam Nemet   } else
142858913d65SAdam Nemet     OS.indent(Depth) << "Too many interesting dependences, not recorded\n";
1429e91cc6efSAdam Nemet 
1430e91cc6efSAdam Nemet   // List the pair of accesses need run-time checks to prove independence.
1431e91cc6efSAdam Nemet   PtrRtCheck.print(OS, Depth);
1432e91cc6efSAdam Nemet   OS << "\n";
1433c3384320SAdam Nemet 
1434c3384320SAdam Nemet   OS.indent(Depth) << "Store to invariant address was "
1435c3384320SAdam Nemet                    << (StoreToLoopInvariantAddress ? "" : "not ")
1436c3384320SAdam Nemet                    << "found in loop.\n";
1437e91cc6efSAdam Nemet }
1438e91cc6efSAdam Nemet 
14398bc61df9SAdam Nemet const LoopAccessInfo &
14408bc61df9SAdam Nemet LoopAccessAnalysis::getInfo(Loop *L, const ValueToValueMap &Strides) {
14413bfd93d7SAdam Nemet   auto &LAI = LoopAccessInfoMap[L];
14423bfd93d7SAdam Nemet 
14433bfd93d7SAdam Nemet #ifndef NDEBUG
14443bfd93d7SAdam Nemet   assert((!LAI || LAI->NumSymbolicStrides == Strides.size()) &&
14453bfd93d7SAdam Nemet          "Symbolic strides changed for loop");
14463bfd93d7SAdam Nemet #endif
14473bfd93d7SAdam Nemet 
14483bfd93d7SAdam Nemet   if (!LAI) {
1449a28d91d8SMehdi Amini     const DataLayout &DL = L->getHeader()->getModule()->getDataLayout();
1450e2b885c4SAdam Nemet     LAI = llvm::make_unique<LoopAccessInfo>(L, SE, DL, TLI, AA, DT, LI,
1451e2b885c4SAdam Nemet                                             Strides);
14523bfd93d7SAdam Nemet #ifndef NDEBUG
14533bfd93d7SAdam Nemet     LAI->NumSymbolicStrides = Strides.size();
14543bfd93d7SAdam Nemet #endif
14553bfd93d7SAdam Nemet   }
14563bfd93d7SAdam Nemet   return *LAI.get();
14573bfd93d7SAdam Nemet }
14583bfd93d7SAdam Nemet 
1459e91cc6efSAdam Nemet void LoopAccessAnalysis::print(raw_ostream &OS, const Module *M) const {
1460e91cc6efSAdam Nemet   LoopAccessAnalysis &LAA = *const_cast<LoopAccessAnalysis *>(this);
1461e91cc6efSAdam Nemet 
1462e91cc6efSAdam Nemet   ValueToValueMap NoSymbolicStrides;
1463e91cc6efSAdam Nemet 
1464e91cc6efSAdam Nemet   for (Loop *TopLevelLoop : *LI)
1465e91cc6efSAdam Nemet     for (Loop *L : depth_first(TopLevelLoop)) {
1466e91cc6efSAdam Nemet       OS.indent(2) << L->getHeader()->getName() << ":\n";
1467e91cc6efSAdam Nemet       auto &LAI = LAA.getInfo(L, NoSymbolicStrides);
1468e91cc6efSAdam Nemet       LAI.print(OS, 4);
1469e91cc6efSAdam Nemet     }
1470e91cc6efSAdam Nemet }
1471e91cc6efSAdam Nemet 
14723bfd93d7SAdam Nemet bool LoopAccessAnalysis::runOnFunction(Function &F) {
14733bfd93d7SAdam Nemet   SE = &getAnalysis<ScalarEvolution>();
14743bfd93d7SAdam Nemet   auto *TLIP = getAnalysisIfAvailable<TargetLibraryInfoWrapperPass>();
14753bfd93d7SAdam Nemet   TLI = TLIP ? &TLIP->getTLI() : nullptr;
14763bfd93d7SAdam Nemet   AA = &getAnalysis<AliasAnalysis>();
14773bfd93d7SAdam Nemet   DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();
1478e2b885c4SAdam Nemet   LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
14793bfd93d7SAdam Nemet 
14803bfd93d7SAdam Nemet   return false;
14813bfd93d7SAdam Nemet }
14823bfd93d7SAdam Nemet 
14833bfd93d7SAdam Nemet void LoopAccessAnalysis::getAnalysisUsage(AnalysisUsage &AU) const {
14843bfd93d7SAdam Nemet     AU.addRequired<ScalarEvolution>();
14853bfd93d7SAdam Nemet     AU.addRequired<AliasAnalysis>();
14863bfd93d7SAdam Nemet     AU.addRequired<DominatorTreeWrapperPass>();
1487e91cc6efSAdam Nemet     AU.addRequired<LoopInfoWrapperPass>();
14883bfd93d7SAdam Nemet 
14893bfd93d7SAdam Nemet     AU.setPreservesAll();
14903bfd93d7SAdam Nemet }
14913bfd93d7SAdam Nemet 
14923bfd93d7SAdam Nemet char LoopAccessAnalysis::ID = 0;
14933bfd93d7SAdam Nemet static const char laa_name[] = "Loop Access Analysis";
14943bfd93d7SAdam Nemet #define LAA_NAME "loop-accesses"
14953bfd93d7SAdam Nemet 
14963bfd93d7SAdam Nemet INITIALIZE_PASS_BEGIN(LoopAccessAnalysis, LAA_NAME, laa_name, false, true)
14973bfd93d7SAdam Nemet INITIALIZE_AG_DEPENDENCY(AliasAnalysis)
14983bfd93d7SAdam Nemet INITIALIZE_PASS_DEPENDENCY(ScalarEvolution)
14993bfd93d7SAdam Nemet INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
1500e91cc6efSAdam Nemet INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)
15013bfd93d7SAdam Nemet INITIALIZE_PASS_END(LoopAccessAnalysis, LAA_NAME, laa_name, false, true)
15023bfd93d7SAdam Nemet 
15033bfd93d7SAdam Nemet namespace llvm {
15043bfd93d7SAdam Nemet   Pass *createLAAPass() {
15053bfd93d7SAdam Nemet     return new LoopAccessAnalysis();
15063bfd93d7SAdam Nemet   }
15073bfd93d7SAdam Nemet }
1508