19d9cb274SAdam Nemet //===-------- LoopDataPrefetch.cpp - Loop Data Prefetching Pass -----------===//
29d9cb274SAdam Nemet //
39d9cb274SAdam Nemet //                     The LLVM Compiler Infrastructure
49d9cb274SAdam Nemet //
59d9cb274SAdam Nemet // This file is distributed under the University of Illinois Open Source
69d9cb274SAdam Nemet // License. See LICENSE.TXT for details.
79d9cb274SAdam Nemet //
89d9cb274SAdam Nemet //===----------------------------------------------------------------------===//
99d9cb274SAdam Nemet //
109d9cb274SAdam Nemet // This file implements a Loop Data Prefetching Pass.
119d9cb274SAdam Nemet //
129d9cb274SAdam Nemet //===----------------------------------------------------------------------===//
139d9cb274SAdam Nemet 
141eca6bc6STeresa Johnson #include "llvm/Transforms/Scalar/LoopDataPrefetch.h"
151eca6bc6STeresa Johnson 
169d9cb274SAdam Nemet #define DEBUG_TYPE "loop-data-prefetch"
179d9cb274SAdam Nemet #include "llvm/ADT/DepthFirstIterator.h"
189d9cb274SAdam Nemet #include "llvm/ADT/Statistic.h"
19*aec2fa35SDaniel Jasper #include "llvm/Analysis/AssumptionCache.h"
209d9cb274SAdam Nemet #include "llvm/Analysis/CodeMetrics.h"
219d9cb274SAdam Nemet #include "llvm/Analysis/InstructionSimplify.h"
229d9cb274SAdam Nemet #include "llvm/Analysis/LoopInfo.h"
239e6e63fbSAdam Nemet #include "llvm/Analysis/OptimizationDiagnosticInfo.h"
249d9cb274SAdam Nemet #include "llvm/Analysis/ScalarEvolution.h"
259d9cb274SAdam Nemet #include "llvm/Analysis/ScalarEvolutionAliasAnalysis.h"
269d9cb274SAdam Nemet #include "llvm/Analysis/ScalarEvolutionExpander.h"
279d9cb274SAdam Nemet #include "llvm/Analysis/ScalarEvolutionExpressions.h"
289d9cb274SAdam Nemet #include "llvm/Analysis/TargetTransformInfo.h"
299d9cb274SAdam Nemet #include "llvm/Analysis/ValueTracking.h"
309d9cb274SAdam Nemet #include "llvm/IR/CFG.h"
319d9cb274SAdam Nemet #include "llvm/IR/Dominators.h"
329d9cb274SAdam Nemet #include "llvm/IR/Function.h"
339d9cb274SAdam Nemet #include "llvm/IR/IntrinsicInst.h"
349d9cb274SAdam Nemet #include "llvm/IR/Module.h"
359d9cb274SAdam Nemet #include "llvm/Support/CommandLine.h"
369d9cb274SAdam Nemet #include "llvm/Support/Debug.h"
37885f1de4SAdam Nemet #include "llvm/Transforms/Scalar.h"
389d9cb274SAdam Nemet #include "llvm/Transforms/Utils/BasicBlockUtils.h"
399d9cb274SAdam Nemet #include "llvm/Transforms/Utils/Local.h"
409d9cb274SAdam Nemet #include "llvm/Transforms/Utils/ValueMapper.h"
419d9cb274SAdam Nemet using namespace llvm;
429d9cb274SAdam Nemet 
439d9cb274SAdam Nemet // By default, we limit this to creating 16 PHIs (which is a little over half
449d9cb274SAdam Nemet // of the allocatable register set).
459d9cb274SAdam Nemet static cl::opt<bool>
469d9cb274SAdam Nemet PrefetchWrites("loop-prefetch-writes", cl::Hidden, cl::init(false),
479d9cb274SAdam Nemet                cl::desc("Prefetch write addresses"));
489d9cb274SAdam Nemet 
491428d41fSAdam Nemet static cl::opt<unsigned>
501428d41fSAdam Nemet     PrefetchDistance("prefetch-distance",
511428d41fSAdam Nemet                      cl::desc("Number of instructions to prefetch ahead"),
521428d41fSAdam Nemet                      cl::Hidden);
531428d41fSAdam Nemet 
541428d41fSAdam Nemet static cl::opt<unsigned>
551428d41fSAdam Nemet     MinPrefetchStride("min-prefetch-stride",
561428d41fSAdam Nemet                       cl::desc("Min stride to add prefetches"), cl::Hidden);
571428d41fSAdam Nemet 
581428d41fSAdam Nemet static cl::opt<unsigned> MaxPrefetchIterationsAhead(
591428d41fSAdam Nemet     "max-prefetch-iters-ahead",
601428d41fSAdam Nemet     cl::desc("Max number of iterations to prefetch ahead"), cl::Hidden);
611428d41fSAdam Nemet 
6234785ecfSAdam Nemet STATISTIC(NumPrefetches, "Number of prefetches inserted");
6334785ecfSAdam Nemet 
649d9cb274SAdam Nemet namespace {
659d9cb274SAdam Nemet 
661eca6bc6STeresa Johnson /// Loop prefetch implementation class.
671eca6bc6STeresa Johnson class LoopDataPrefetch {
689d9cb274SAdam Nemet public:
69*aec2fa35SDaniel Jasper   LoopDataPrefetch(AssumptionCache *AC, LoopInfo *LI, ScalarEvolution *SE,
701eca6bc6STeresa Johnson                    const TargetTransformInfo *TTI,
711eca6bc6STeresa Johnson                    OptimizationRemarkEmitter *ORE)
72*aec2fa35SDaniel Jasper       : AC(AC), LI(LI), SE(SE), TTI(TTI), ORE(ORE) {}
739d9cb274SAdam Nemet 
741eca6bc6STeresa Johnson   bool run();
7585fba393SAdam Nemet 
7685fba393SAdam Nemet private:
779d9cb274SAdam Nemet   bool runOnLoop(Loop *L);
789d9cb274SAdam Nemet 
796d8beecaSAdam Nemet   /// \brief Check if the the stride of the accesses is large enough to
806d8beecaSAdam Nemet   /// warrant a prefetch.
816d8beecaSAdam Nemet   bool isStrideLargeEnough(const SCEVAddRecExpr *AR);
826d8beecaSAdam Nemet 
831428d41fSAdam Nemet   unsigned getMinPrefetchStride() {
841428d41fSAdam Nemet     if (MinPrefetchStride.getNumOccurrences() > 0)
851428d41fSAdam Nemet       return MinPrefetchStride;
861428d41fSAdam Nemet     return TTI->getMinPrefetchStride();
871428d41fSAdam Nemet   }
881428d41fSAdam Nemet 
891428d41fSAdam Nemet   unsigned getPrefetchDistance() {
901428d41fSAdam Nemet     if (PrefetchDistance.getNumOccurrences() > 0)
911428d41fSAdam Nemet       return PrefetchDistance;
921428d41fSAdam Nemet     return TTI->getPrefetchDistance();
931428d41fSAdam Nemet   }
941428d41fSAdam Nemet 
951428d41fSAdam Nemet   unsigned getMaxPrefetchIterationsAhead() {
961428d41fSAdam Nemet     if (MaxPrefetchIterationsAhead.getNumOccurrences() > 0)
971428d41fSAdam Nemet       return MaxPrefetchIterationsAhead;
981428d41fSAdam Nemet     return TTI->getMaxPrefetchIterationsAhead();
991428d41fSAdam Nemet   }
1001428d41fSAdam Nemet 
101*aec2fa35SDaniel Jasper   AssumptionCache *AC;
1029d9cb274SAdam Nemet   LoopInfo *LI;
1039d9cb274SAdam Nemet   ScalarEvolution *SE;
1049d9cb274SAdam Nemet   const TargetTransformInfo *TTI;
1059e6e63fbSAdam Nemet   OptimizationRemarkEmitter *ORE;
1069d9cb274SAdam Nemet };
1071eca6bc6STeresa Johnson 
1081eca6bc6STeresa Johnson /// Legacy class for inserting loop data prefetches.
1091eca6bc6STeresa Johnson class LoopDataPrefetchLegacyPass : public FunctionPass {
1101eca6bc6STeresa Johnson public:
1111eca6bc6STeresa Johnson   static char ID; // Pass ID, replacement for typeid
1121eca6bc6STeresa Johnson   LoopDataPrefetchLegacyPass() : FunctionPass(ID) {
1131eca6bc6STeresa Johnson     initializeLoopDataPrefetchLegacyPassPass(*PassRegistry::getPassRegistry());
1141eca6bc6STeresa Johnson   }
1151eca6bc6STeresa Johnson 
1161eca6bc6STeresa Johnson   void getAnalysisUsage(AnalysisUsage &AU) const override {
117*aec2fa35SDaniel Jasper     AU.addRequired<AssumptionCacheTracker>();
1181eca6bc6STeresa Johnson     AU.addPreserved<DominatorTreeWrapperPass>();
1191eca6bc6STeresa Johnson     AU.addRequired<LoopInfoWrapperPass>();
1201eca6bc6STeresa Johnson     AU.addPreserved<LoopInfoWrapperPass>();
1211eca6bc6STeresa Johnson     AU.addRequired<OptimizationRemarkEmitterWrapperPass>();
1221eca6bc6STeresa Johnson     AU.addRequired<ScalarEvolutionWrapperPass>();
1231eca6bc6STeresa Johnson     // FIXME: For some reason, preserving SE here breaks LSR (even if
1241eca6bc6STeresa Johnson     // this pass changes nothing).
1251eca6bc6STeresa Johnson     // AU.addPreserved<ScalarEvolutionWrapperPass>();
1261eca6bc6STeresa Johnson     AU.addRequired<TargetTransformInfoWrapperPass>();
1271eca6bc6STeresa Johnson   }
1281eca6bc6STeresa Johnson 
1291eca6bc6STeresa Johnson   bool runOnFunction(Function &F) override;
1301eca6bc6STeresa Johnson   };
1319d9cb274SAdam Nemet }
1329d9cb274SAdam Nemet 
1331eca6bc6STeresa Johnson char LoopDataPrefetchLegacyPass::ID = 0;
1341eca6bc6STeresa Johnson INITIALIZE_PASS_BEGIN(LoopDataPrefetchLegacyPass, "loop-data-prefetch",
1359d9cb274SAdam Nemet                       "Loop Data Prefetch", false, false)
136*aec2fa35SDaniel Jasper INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)
1379d9cb274SAdam Nemet INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass)
1389d9cb274SAdam Nemet INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)
1399e6e63fbSAdam Nemet INITIALIZE_PASS_DEPENDENCY(OptimizationRemarkEmitterWrapperPass)
1409d9cb274SAdam Nemet INITIALIZE_PASS_DEPENDENCY(ScalarEvolutionWrapperPass)
1411eca6bc6STeresa Johnson INITIALIZE_PASS_END(LoopDataPrefetchLegacyPass, "loop-data-prefetch",
1429d9cb274SAdam Nemet                     "Loop Data Prefetch", false, false)
1439d9cb274SAdam Nemet 
1441eca6bc6STeresa Johnson FunctionPass *llvm::createLoopDataPrefetchPass() {
1451eca6bc6STeresa Johnson   return new LoopDataPrefetchLegacyPass();
1461eca6bc6STeresa Johnson }
1479d9cb274SAdam Nemet 
1486d8beecaSAdam Nemet bool LoopDataPrefetch::isStrideLargeEnough(const SCEVAddRecExpr *AR) {
1491428d41fSAdam Nemet   unsigned TargetMinStride = getMinPrefetchStride();
1506d8beecaSAdam Nemet   // No need to check if any stride goes.
1516d8beecaSAdam Nemet   if (TargetMinStride <= 1)
1526d8beecaSAdam Nemet     return true;
1536d8beecaSAdam Nemet 
1546d8beecaSAdam Nemet   const auto *ConstStride = dyn_cast<SCEVConstant>(AR->getStepRecurrence(*SE));
1556d8beecaSAdam Nemet   // If MinStride is set, don't prefetch unless we can ensure that stride is
1566d8beecaSAdam Nemet   // larger.
1576d8beecaSAdam Nemet   if (!ConstStride)
1586d8beecaSAdam Nemet     return false;
1596d8beecaSAdam Nemet 
1606d8beecaSAdam Nemet   unsigned AbsStride = std::abs(ConstStride->getAPInt().getSExtValue());
1616d8beecaSAdam Nemet   return TargetMinStride <= AbsStride;
1626d8beecaSAdam Nemet }
1636d8beecaSAdam Nemet 
1641eca6bc6STeresa Johnson PreservedAnalyses LoopDataPrefetchPass::run(Function &F,
1651eca6bc6STeresa Johnson                                             FunctionAnalysisManager &AM) {
1661eca6bc6STeresa Johnson   LoopInfo *LI = &AM.getResult<LoopAnalysis>(F);
1671eca6bc6STeresa Johnson   ScalarEvolution *SE = &AM.getResult<ScalarEvolutionAnalysis>(F);
168*aec2fa35SDaniel Jasper   AssumptionCache *AC = &AM.getResult<AssumptionAnalysis>(F);
1691eca6bc6STeresa Johnson   OptimizationRemarkEmitter *ORE =
1701eca6bc6STeresa Johnson       &AM.getResult<OptimizationRemarkEmitterAnalysis>(F);
1711eca6bc6STeresa Johnson   const TargetTransformInfo *TTI = &AM.getResult<TargetIRAnalysis>(F);
1721eca6bc6STeresa Johnson 
173*aec2fa35SDaniel Jasper   LoopDataPrefetch LDP(AC, LI, SE, TTI, ORE);
1741eca6bc6STeresa Johnson   bool Changed = LDP.run();
1751eca6bc6STeresa Johnson 
1761eca6bc6STeresa Johnson   if (Changed) {
1771eca6bc6STeresa Johnson     PreservedAnalyses PA;
1781eca6bc6STeresa Johnson     PA.preserve<DominatorTreeAnalysis>();
1791eca6bc6STeresa Johnson     PA.preserve<LoopAnalysis>();
1801eca6bc6STeresa Johnson     return PA;
1811eca6bc6STeresa Johnson   }
1821eca6bc6STeresa Johnson 
1831eca6bc6STeresa Johnson   return PreservedAnalyses::all();
1841eca6bc6STeresa Johnson }
1851eca6bc6STeresa Johnson 
1861eca6bc6STeresa Johnson bool LoopDataPrefetchLegacyPass::runOnFunction(Function &F) {
18750271f78SAndrew Kaylor   if (skipFunction(F))
18850271f78SAndrew Kaylor     return false;
18950271f78SAndrew Kaylor 
1901eca6bc6STeresa Johnson   LoopInfo *LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
1911eca6bc6STeresa Johnson   ScalarEvolution *SE = &getAnalysis<ScalarEvolutionWrapperPass>().getSE();
192*aec2fa35SDaniel Jasper   AssumptionCache *AC =
193*aec2fa35SDaniel Jasper       &getAnalysis<AssumptionCacheTracker>().getAssumptionCache(F);
1941eca6bc6STeresa Johnson   OptimizationRemarkEmitter *ORE =
1951eca6bc6STeresa Johnson       &getAnalysis<OptimizationRemarkEmitterWrapperPass>().getORE();
1961eca6bc6STeresa Johnson   const TargetTransformInfo *TTI =
1971eca6bc6STeresa Johnson       &getAnalysis<TargetTransformInfoWrapperPass>().getTTI(F);
1989d9cb274SAdam Nemet 
199*aec2fa35SDaniel Jasper   LoopDataPrefetch LDP(AC, LI, SE, TTI, ORE);
2001eca6bc6STeresa Johnson   return LDP.run();
2011eca6bc6STeresa Johnson }
2021eca6bc6STeresa Johnson 
2031eca6bc6STeresa Johnson bool LoopDataPrefetch::run() {
204bb3680bdSAdam Nemet   // If PrefetchDistance is not set, don't run the pass.  This gives an
205bb3680bdSAdam Nemet   // opportunity for targets to run this pass for selected subtargets only
206bb3680bdSAdam Nemet   // (whose TTI sets PrefetchDistance).
2071428d41fSAdam Nemet   if (getPrefetchDistance() == 0)
208bb3680bdSAdam Nemet     return false;
2099d9cb274SAdam Nemet   assert(TTI->getCacheLineSize() && "Cache line size is not set for target");
2109d9cb274SAdam Nemet 
2119d9cb274SAdam Nemet   bool MadeChange = false;
2129d9cb274SAdam Nemet 
213135f735aSBenjamin Kramer   for (Loop *I : *LI)
214135f735aSBenjamin Kramer     for (auto L = df_begin(I), LE = df_end(I); L != LE; ++L)
2159d9cb274SAdam Nemet       MadeChange |= runOnLoop(*L);
2169d9cb274SAdam Nemet 
2179d9cb274SAdam Nemet   return MadeChange;
2189d9cb274SAdam Nemet }
2199d9cb274SAdam Nemet 
2209d9cb274SAdam Nemet bool LoopDataPrefetch::runOnLoop(Loop *L) {
2219d9cb274SAdam Nemet   bool MadeChange = false;
2229d9cb274SAdam Nemet 
2239d9cb274SAdam Nemet   // Only prefetch in the inner-most loop
2249d9cb274SAdam Nemet   if (!L->empty())
2259d9cb274SAdam Nemet     return MadeChange;
2269d9cb274SAdam Nemet 
2279d9cb274SAdam Nemet   SmallPtrSet<const Value *, 32> EphValues;
228*aec2fa35SDaniel Jasper   CodeMetrics::collectEphemeralValues(L, AC, EphValues);
2299d9cb274SAdam Nemet 
2309d9cb274SAdam Nemet   // Calculate the number of iterations ahead to prefetch
2319d9cb274SAdam Nemet   CodeMetrics Metrics;
232c6cebf72SBalaram Makam   for (const auto BB : L->blocks()) {
2339d9cb274SAdam Nemet     // If the loop already has prefetches, then assume that the user knows
2342cf5e89eSNico Weber     // what they are doing and don't add any more.
235c6cebf72SBalaram Makam     for (auto &I : *BB)
236c6cebf72SBalaram Makam       if (CallInst *CI = dyn_cast<CallInst>(&I))
2379d9cb274SAdam Nemet         if (Function *F = CI->getCalledFunction())
2389d9cb274SAdam Nemet           if (F->getIntrinsicID() == Intrinsic::prefetch)
2399d9cb274SAdam Nemet             return MadeChange;
2409d9cb274SAdam Nemet 
241c6cebf72SBalaram Makam     Metrics.analyzeBasicBlock(BB, *TTI, EphValues);
2429d9cb274SAdam Nemet   }
2439d9cb274SAdam Nemet   unsigned LoopSize = Metrics.NumInsts;
2449d9cb274SAdam Nemet   if (!LoopSize)
2459d9cb274SAdam Nemet     LoopSize = 1;
2469d9cb274SAdam Nemet 
2471428d41fSAdam Nemet   unsigned ItersAhead = getPrefetchDistance() / LoopSize;
2489d9cb274SAdam Nemet   if (!ItersAhead)
2499d9cb274SAdam Nemet     ItersAhead = 1;
2509d9cb274SAdam Nemet 
2511428d41fSAdam Nemet   if (ItersAhead > getMaxPrefetchIterationsAhead())
252709e3046SAdam Nemet     return MadeChange;
253709e3046SAdam Nemet 
25434785ecfSAdam Nemet   DEBUG(dbgs() << "Prefetching " << ItersAhead
25534785ecfSAdam Nemet                << " iterations ahead (loop size: " << LoopSize << ") in "
256eea7c267SAdam Nemet                << L->getHeader()->getParent()->getName() << ": " << *L);
25734785ecfSAdam Nemet 
2589d9cb274SAdam Nemet   SmallVector<std::pair<Instruction *, const SCEVAddRecExpr *>, 16> PrefLoads;
259c6cebf72SBalaram Makam   for (const auto BB : L->blocks()) {
260c6cebf72SBalaram Makam     for (auto &I : *BB) {
2619d9cb274SAdam Nemet       Value *PtrValue;
2629d9cb274SAdam Nemet       Instruction *MemI;
2639d9cb274SAdam Nemet 
264c6cebf72SBalaram Makam       if (LoadInst *LMemI = dyn_cast<LoadInst>(&I)) {
2659d9cb274SAdam Nemet         MemI = LMemI;
2669d9cb274SAdam Nemet         PtrValue = LMemI->getPointerOperand();
267c6cebf72SBalaram Makam       } else if (StoreInst *SMemI = dyn_cast<StoreInst>(&I)) {
2689d9cb274SAdam Nemet         if (!PrefetchWrites) continue;
2699d9cb274SAdam Nemet         MemI = SMemI;
2709d9cb274SAdam Nemet         PtrValue = SMemI->getPointerOperand();
2719d9cb274SAdam Nemet       } else continue;
2729d9cb274SAdam Nemet 
2739d9cb274SAdam Nemet       unsigned PtrAddrSpace = PtrValue->getType()->getPointerAddressSpace();
2749d9cb274SAdam Nemet       if (PtrAddrSpace)
2759d9cb274SAdam Nemet         continue;
2769d9cb274SAdam Nemet 
2779d9cb274SAdam Nemet       if (L->isLoopInvariant(PtrValue))
2789d9cb274SAdam Nemet         continue;
2799d9cb274SAdam Nemet 
2809d9cb274SAdam Nemet       const SCEV *LSCEV = SE->getSCEV(PtrValue);
2819d9cb274SAdam Nemet       const SCEVAddRecExpr *LSCEVAddRec = dyn_cast<SCEVAddRecExpr>(LSCEV);
2829d9cb274SAdam Nemet       if (!LSCEVAddRec)
2839d9cb274SAdam Nemet         continue;
2849d9cb274SAdam Nemet 
2856d8beecaSAdam Nemet       // Check if the the stride of the accesses is large enough to warrant a
2866d8beecaSAdam Nemet       // prefetch.
2876d8beecaSAdam Nemet       if (!isStrideLargeEnough(LSCEVAddRec))
2886d8beecaSAdam Nemet         continue;
2896d8beecaSAdam Nemet 
2909d9cb274SAdam Nemet       // We don't want to double prefetch individual cache lines. If this load
2919d9cb274SAdam Nemet       // is known to be within one cache line of some other load that has
2929d9cb274SAdam Nemet       // already been prefetched, then don't prefetch this one as well.
2939d9cb274SAdam Nemet       bool DupPref = false;
294135f735aSBenjamin Kramer       for (const auto &PrefLoad : PrefLoads) {
295135f735aSBenjamin Kramer         const SCEV *PtrDiff = SE->getMinusSCEV(LSCEVAddRec, PrefLoad.second);
2969d9cb274SAdam Nemet         if (const SCEVConstant *ConstPtrDiff =
2979d9cb274SAdam Nemet             dyn_cast<SCEVConstant>(PtrDiff)) {
2989d9cb274SAdam Nemet           int64_t PD = std::abs(ConstPtrDiff->getValue()->getSExtValue());
2999d9cb274SAdam Nemet           if (PD < (int64_t) TTI->getCacheLineSize()) {
3009d9cb274SAdam Nemet             DupPref = true;
3019d9cb274SAdam Nemet             break;
3029d9cb274SAdam Nemet           }
3039d9cb274SAdam Nemet         }
3049d9cb274SAdam Nemet       }
3059d9cb274SAdam Nemet       if (DupPref)
3069d9cb274SAdam Nemet         continue;
3079d9cb274SAdam Nemet 
3089d9cb274SAdam Nemet       const SCEV *NextLSCEV = SE->getAddExpr(LSCEVAddRec, SE->getMulExpr(
3099d9cb274SAdam Nemet         SE->getConstant(LSCEVAddRec->getType(), ItersAhead),
3109d9cb274SAdam Nemet         LSCEVAddRec->getStepRecurrence(*SE)));
3119d9cb274SAdam Nemet       if (!isSafeToExpand(NextLSCEV, *SE))
3129d9cb274SAdam Nemet         continue;
3139d9cb274SAdam Nemet 
3149d9cb274SAdam Nemet       PrefLoads.push_back(std::make_pair(MemI, LSCEVAddRec));
3159d9cb274SAdam Nemet 
316c6cebf72SBalaram Makam       Type *I8Ptr = Type::getInt8PtrTy(BB->getContext(), PtrAddrSpace);
317c6cebf72SBalaram Makam       SCEVExpander SCEVE(*SE, I.getModule()->getDataLayout(), "prefaddr");
3189d9cb274SAdam Nemet       Value *PrefPtrValue = SCEVE.expandCodeFor(NextLSCEV, I8Ptr, MemI);
3199d9cb274SAdam Nemet 
3209d9cb274SAdam Nemet       IRBuilder<> Builder(MemI);
321c6cebf72SBalaram Makam       Module *M = BB->getParent()->getParent();
322c6cebf72SBalaram Makam       Type *I32 = Type::getInt32Ty(BB->getContext());
3239d9cb274SAdam Nemet       Value *PrefetchFunc = Intrinsic::getDeclaration(M, Intrinsic::prefetch);
3249d9cb274SAdam Nemet       Builder.CreateCall(
3259d9cb274SAdam Nemet           PrefetchFunc,
3269d9cb274SAdam Nemet           {PrefPtrValue,
3279d9cb274SAdam Nemet            ConstantInt::get(I32, MemI->mayReadFromMemory() ? 0 : 1),
3289d9cb274SAdam Nemet            ConstantInt::get(I32, 3), ConstantInt::get(I32, 1)});
32934785ecfSAdam Nemet       ++NumPrefetches;
33034785ecfSAdam Nemet       DEBUG(dbgs() << "  Access: " << *PtrValue << ", SCEV: " << *LSCEV
33134785ecfSAdam Nemet                    << "\n");
332fce01788SAdam Nemet       ORE->emit(OptimizationRemark(DEBUG_TYPE, "Prefetched", MemI)
333fce01788SAdam Nemet                 << "prefetched memory access");
3349d9cb274SAdam Nemet 
3359d9cb274SAdam Nemet       MadeChange = true;
3369d9cb274SAdam Nemet     }
3379d9cb274SAdam Nemet   }
3389d9cb274SAdam Nemet 
3399d9cb274SAdam Nemet   return MadeChange;
3409d9cb274SAdam Nemet }
3419d9cb274SAdam Nemet 
342