19775a620SHiroshi Yamauchi //===-- ControlHeightReduction.cpp - Control Height Reduction -------------===// 29775a620SHiroshi Yamauchi // 39775a620SHiroshi Yamauchi // The LLVM Compiler Infrastructure 49775a620SHiroshi Yamauchi // 59775a620SHiroshi Yamauchi // This file is distributed under the University of Illinois Open Source 69775a620SHiroshi Yamauchi // License. See LICENSE.TXT for details. 79775a620SHiroshi Yamauchi // 89775a620SHiroshi Yamauchi //===----------------------------------------------------------------------===// 99775a620SHiroshi Yamauchi // 109775a620SHiroshi Yamauchi // This pass merges conditional blocks of code and reduces the number of 119775a620SHiroshi Yamauchi // conditional branches in the hot paths based on profiles. 129775a620SHiroshi Yamauchi // 139775a620SHiroshi Yamauchi //===----------------------------------------------------------------------===// 149775a620SHiroshi Yamauchi 159775a620SHiroshi Yamauchi #include "llvm/Transforms/Instrumentation/ControlHeightReduction.h" 169775a620SHiroshi Yamauchi #include "llvm/Transforms/Utils.h" 179775a620SHiroshi Yamauchi #include "llvm/Transforms/Utils/BasicBlockUtils.h" 189775a620SHiroshi Yamauchi #include "llvm/Transforms/Utils/Cloning.h" 199775a620SHiroshi Yamauchi #include "llvm/Transforms/Utils/ValueMapper.h" 209775a620SHiroshi Yamauchi #include "llvm/ADT/DenseMap.h" 219775a620SHiroshi Yamauchi #include "llvm/ADT/DenseSet.h" 229775a620SHiroshi Yamauchi #include "llvm/ADT/SmallVector.h" 239775a620SHiroshi Yamauchi #include "llvm/ADT/StringSet.h" 249775a620SHiroshi Yamauchi #include "llvm/Analysis/BlockFrequencyInfo.h" 259775a620SHiroshi Yamauchi #include "llvm/Analysis/ProfileSummaryInfo.h" 269775a620SHiroshi Yamauchi #include "llvm/Analysis/RegionInfo.h" 279775a620SHiroshi Yamauchi #include "llvm/Analysis/RegionIterator.h" 289775a620SHiroshi Yamauchi #include "llvm/Analysis/ValueTracking.h" 299775a620SHiroshi Yamauchi #include "llvm/IR/CFG.h" 309775a620SHiroshi Yamauchi #include "llvm/IR/Dominators.h" 319775a620SHiroshi Yamauchi #include "llvm/IR/IRBuilder.h" 329775a620SHiroshi Yamauchi #include "llvm/IR/MDBuilder.h" 339775a620SHiroshi Yamauchi #include "llvm/Support/BranchProbability.h" 349775a620SHiroshi Yamauchi #include "llvm/Support/MemoryBuffer.h" 359775a620SHiroshi Yamauchi #include "llvm/Transforms/Scalar.h" 369775a620SHiroshi Yamauchi 3772ee6d60SHiroshi Yamauchi #if !defined(_MSC_VER) 389775a620SHiroshi Yamauchi #include <cxxabi.h> 3972ee6d60SHiroshi Yamauchi #endif 409775a620SHiroshi Yamauchi #include <set> 419775a620SHiroshi Yamauchi #include <sstream> 429775a620SHiroshi Yamauchi 439775a620SHiroshi Yamauchi using namespace llvm; 449775a620SHiroshi Yamauchi 459775a620SHiroshi Yamauchi #define DEBUG_TYPE "chr" 469775a620SHiroshi Yamauchi 479775a620SHiroshi Yamauchi #define CHR_DEBUG(X) LLVM_DEBUG(X) 489775a620SHiroshi Yamauchi 499775a620SHiroshi Yamauchi static cl::opt<bool> ForceCHR("force-chr", cl::init(false), cl::Hidden, 509775a620SHiroshi Yamauchi cl::desc("Apply CHR for all functions")); 519775a620SHiroshi Yamauchi 529775a620SHiroshi Yamauchi static cl::opt<double> CHRBiasThreshold( 539775a620SHiroshi Yamauchi "chr-bias-threshold", cl::init(0.99), cl::Hidden, 549775a620SHiroshi Yamauchi cl::desc("CHR considers a branch bias greater than this ratio as biased")); 559775a620SHiroshi Yamauchi 569775a620SHiroshi Yamauchi static cl::opt<unsigned> CHRMergeThreshold( 579775a620SHiroshi Yamauchi "chr-merge-threshold", cl::init(2), cl::Hidden, 589775a620SHiroshi Yamauchi cl::desc("CHR merges a group of N branches/selects where N >= this value")); 599775a620SHiroshi Yamauchi 609775a620SHiroshi Yamauchi static cl::opt<std::string> CHRModuleList( 619775a620SHiroshi Yamauchi "chr-module-list", cl::init(""), cl::Hidden, 629775a620SHiroshi Yamauchi cl::desc("Specify file to retrieve the list of modules to apply CHR to")); 639775a620SHiroshi Yamauchi 649775a620SHiroshi Yamauchi static cl::opt<std::string> CHRFunctionList( 659775a620SHiroshi Yamauchi "chr-function-list", cl::init(""), cl::Hidden, 669775a620SHiroshi Yamauchi cl::desc("Specify file to retrieve the list of functions to apply CHR to")); 679775a620SHiroshi Yamauchi 689775a620SHiroshi Yamauchi static StringSet<> CHRModules; 699775a620SHiroshi Yamauchi static StringSet<> CHRFunctions; 709775a620SHiroshi Yamauchi 719775a620SHiroshi Yamauchi static void ParseCHRFilterFiles() { 729775a620SHiroshi Yamauchi if (!CHRModuleList.empty()) { 739775a620SHiroshi Yamauchi auto FileOrErr = MemoryBuffer::getFile(CHRModuleList); 749775a620SHiroshi Yamauchi if (!FileOrErr) { 759775a620SHiroshi Yamauchi errs() << "Error: Couldn't read the chr-module-list file " << CHRModuleList << "\n"; 769775a620SHiroshi Yamauchi std::exit(1); 779775a620SHiroshi Yamauchi } 789775a620SHiroshi Yamauchi StringRef Buf = FileOrErr->get()->getBuffer(); 799775a620SHiroshi Yamauchi SmallVector<StringRef, 0> Lines; 809775a620SHiroshi Yamauchi Buf.split(Lines, '\n'); 819775a620SHiroshi Yamauchi for (StringRef Line : Lines) { 829775a620SHiroshi Yamauchi Line = Line.trim(); 839775a620SHiroshi Yamauchi if (!Line.empty()) 849775a620SHiroshi Yamauchi CHRModules.insert(Line); 859775a620SHiroshi Yamauchi } 869775a620SHiroshi Yamauchi } 879775a620SHiroshi Yamauchi if (!CHRFunctionList.empty()) { 889775a620SHiroshi Yamauchi auto FileOrErr = MemoryBuffer::getFile(CHRFunctionList); 899775a620SHiroshi Yamauchi if (!FileOrErr) { 909775a620SHiroshi Yamauchi errs() << "Error: Couldn't read the chr-function-list file " << CHRFunctionList << "\n"; 919775a620SHiroshi Yamauchi std::exit(1); 929775a620SHiroshi Yamauchi } 939775a620SHiroshi Yamauchi StringRef Buf = FileOrErr->get()->getBuffer(); 949775a620SHiroshi Yamauchi SmallVector<StringRef, 0> Lines; 959775a620SHiroshi Yamauchi Buf.split(Lines, '\n'); 969775a620SHiroshi Yamauchi for (StringRef Line : Lines) { 979775a620SHiroshi Yamauchi Line = Line.trim(); 989775a620SHiroshi Yamauchi if (!Line.empty()) 999775a620SHiroshi Yamauchi CHRFunctions.insert(Line); 1009775a620SHiroshi Yamauchi } 1019775a620SHiroshi Yamauchi } 1029775a620SHiroshi Yamauchi } 1039775a620SHiroshi Yamauchi 1049775a620SHiroshi Yamauchi namespace { 1059775a620SHiroshi Yamauchi class ControlHeightReductionLegacyPass : public FunctionPass { 1069775a620SHiroshi Yamauchi public: 1079775a620SHiroshi Yamauchi static char ID; 1089775a620SHiroshi Yamauchi 1099775a620SHiroshi Yamauchi ControlHeightReductionLegacyPass() : FunctionPass(ID) { 1109775a620SHiroshi Yamauchi initializeControlHeightReductionLegacyPassPass( 1119775a620SHiroshi Yamauchi *PassRegistry::getPassRegistry()); 1129775a620SHiroshi Yamauchi ParseCHRFilterFiles(); 1139775a620SHiroshi Yamauchi } 1149775a620SHiroshi Yamauchi 1159775a620SHiroshi Yamauchi bool runOnFunction(Function &F) override; 1169775a620SHiroshi Yamauchi void getAnalysisUsage(AnalysisUsage &AU) const override { 1179775a620SHiroshi Yamauchi AU.addRequired<BlockFrequencyInfoWrapperPass>(); 1189775a620SHiroshi Yamauchi AU.addRequired<DominatorTreeWrapperPass>(); 1199775a620SHiroshi Yamauchi AU.addRequired<ProfileSummaryInfoWrapperPass>(); 1209775a620SHiroshi Yamauchi AU.addRequired<RegionInfoPass>(); 1219775a620SHiroshi Yamauchi AU.addPreserved<GlobalsAAWrapperPass>(); 1229775a620SHiroshi Yamauchi } 1239775a620SHiroshi Yamauchi }; 1249775a620SHiroshi Yamauchi } // end anonymous namespace 1259775a620SHiroshi Yamauchi 1269775a620SHiroshi Yamauchi char ControlHeightReductionLegacyPass::ID = 0; 1279775a620SHiroshi Yamauchi 1289775a620SHiroshi Yamauchi INITIALIZE_PASS_BEGIN(ControlHeightReductionLegacyPass, 1299775a620SHiroshi Yamauchi "chr", 1309775a620SHiroshi Yamauchi "Reduce control height in the hot paths", 1319775a620SHiroshi Yamauchi false, false) 1329775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(BlockFrequencyInfoWrapperPass) 1339775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass) 1349775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(ProfileSummaryInfoWrapperPass) 1359775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(RegionInfoPass) 1369775a620SHiroshi Yamauchi INITIALIZE_PASS_END(ControlHeightReductionLegacyPass, 1379775a620SHiroshi Yamauchi "chr", 1389775a620SHiroshi Yamauchi "Reduce control height in the hot paths", 1399775a620SHiroshi Yamauchi false, false) 1409775a620SHiroshi Yamauchi 1419775a620SHiroshi Yamauchi FunctionPass *llvm::createControlHeightReductionLegacyPass() { 1429775a620SHiroshi Yamauchi return new ControlHeightReductionLegacyPass(); 1439775a620SHiroshi Yamauchi } 1449775a620SHiroshi Yamauchi 1459775a620SHiroshi Yamauchi namespace { 1469775a620SHiroshi Yamauchi 1479775a620SHiroshi Yamauchi struct CHRStats { 1489775a620SHiroshi Yamauchi CHRStats() : NumBranches(0), NumBranchesDelta(0), 1499775a620SHiroshi Yamauchi WeightedNumBranchesDelta(0) {} 1509775a620SHiroshi Yamauchi void print(raw_ostream &OS) const { 1519775a620SHiroshi Yamauchi OS << "CHRStats: NumBranches " << NumBranches 1529775a620SHiroshi Yamauchi << " NumBranchesDelta " << NumBranchesDelta 1539775a620SHiroshi Yamauchi << " WeightedNumBranchesDelta " << WeightedNumBranchesDelta; 1549775a620SHiroshi Yamauchi } 1559775a620SHiroshi Yamauchi uint64_t NumBranches; // The original number of conditional branches / 1569775a620SHiroshi Yamauchi // selects 1579775a620SHiroshi Yamauchi uint64_t NumBranchesDelta; // The decrease of the number of conditional 1589775a620SHiroshi Yamauchi // branches / selects in the hot paths due to CHR. 1599775a620SHiroshi Yamauchi uint64_t WeightedNumBranchesDelta; // NumBranchesDelta weighted by the profile 1609775a620SHiroshi Yamauchi // count at the scope entry. 1619775a620SHiroshi Yamauchi }; 1629775a620SHiroshi Yamauchi 1639775a620SHiroshi Yamauchi inline raw_ostream &operator<<(raw_ostream &OS, const CHRStats &Stats) { 1649775a620SHiroshi Yamauchi Stats.print(OS); 1659775a620SHiroshi Yamauchi return OS; 1669775a620SHiroshi Yamauchi } 1679775a620SHiroshi Yamauchi 1689775a620SHiroshi Yamauchi // RegInfo - some properties of a Region. 1699775a620SHiroshi Yamauchi struct RegInfo { 1709775a620SHiroshi Yamauchi RegInfo() : R(nullptr), HasBranch(false) {} 1719775a620SHiroshi Yamauchi RegInfo(Region *RegionIn) : R(RegionIn), HasBranch(false) {} 1729775a620SHiroshi Yamauchi Region *R; 1739775a620SHiroshi Yamauchi bool HasBranch; 1749775a620SHiroshi Yamauchi SmallVector<SelectInst *, 8> Selects; 1759775a620SHiroshi Yamauchi }; 1769775a620SHiroshi Yamauchi 1779775a620SHiroshi Yamauchi typedef DenseMap<Region *, DenseSet<Instruction *>> HoistStopMapTy; 1789775a620SHiroshi Yamauchi 1799775a620SHiroshi Yamauchi // CHRScope - a sequence of regions to CHR together. It corresponds to a 1809775a620SHiroshi Yamauchi // sequence of conditional blocks. It can have subscopes which correspond to 1819775a620SHiroshi Yamauchi // nested conditional blocks. Nested CHRScopes form a tree. 1829775a620SHiroshi Yamauchi class CHRScope { 1839775a620SHiroshi Yamauchi public: 1849775a620SHiroshi Yamauchi CHRScope(RegInfo RI) : BranchInsertPoint(nullptr) { 1859775a620SHiroshi Yamauchi assert(RI.R && "Null RegionIn"); 1869775a620SHiroshi Yamauchi RegInfos.push_back(RI); 1879775a620SHiroshi Yamauchi } 1889775a620SHiroshi Yamauchi 1899775a620SHiroshi Yamauchi Region *getParentRegion() { 1909775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 1919775a620SHiroshi Yamauchi Region *Parent = RegInfos[0].R->getParent(); 1929775a620SHiroshi Yamauchi assert(Parent && "Unexpected to call this on the top-level region"); 1939775a620SHiroshi Yamauchi return Parent; 1949775a620SHiroshi Yamauchi } 1959775a620SHiroshi Yamauchi 1969775a620SHiroshi Yamauchi BasicBlock *getEntryBlock() { 1979775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 1989775a620SHiroshi Yamauchi return RegInfos.front().R->getEntry(); 1999775a620SHiroshi Yamauchi } 2009775a620SHiroshi Yamauchi 2019775a620SHiroshi Yamauchi BasicBlock *getExitBlock() { 2029775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 2039775a620SHiroshi Yamauchi return RegInfos.back().R->getExit(); 2049775a620SHiroshi Yamauchi } 2059775a620SHiroshi Yamauchi 2069775a620SHiroshi Yamauchi bool appendable(CHRScope *Next) { 2079775a620SHiroshi Yamauchi // The next scope is appendable only if this scope is directly connected to 2089775a620SHiroshi Yamauchi // it (which implies it post-dominates this scope) and this scope dominates 2099775a620SHiroshi Yamauchi // it (no edge to the next scope outside this scope). 2109775a620SHiroshi Yamauchi BasicBlock *NextEntry = Next->getEntryBlock(); 2119775a620SHiroshi Yamauchi if (getExitBlock() != NextEntry) 2129775a620SHiroshi Yamauchi // Not directly connected. 2139775a620SHiroshi Yamauchi return false; 2149775a620SHiroshi Yamauchi Region *LastRegion = RegInfos.back().R; 2159775a620SHiroshi Yamauchi for (BasicBlock *Pred : predecessors(NextEntry)) 2169775a620SHiroshi Yamauchi if (!LastRegion->contains(Pred)) 2179775a620SHiroshi Yamauchi // There's an edge going into the entry of the next scope from outside 2189775a620SHiroshi Yamauchi // of this scope. 2199775a620SHiroshi Yamauchi return false; 2209775a620SHiroshi Yamauchi return true; 2219775a620SHiroshi Yamauchi } 2229775a620SHiroshi Yamauchi 2239775a620SHiroshi Yamauchi void append(CHRScope *Next) { 2249775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 2259775a620SHiroshi Yamauchi assert(Next->RegInfos.size() > 0 && "Empty CHRScope"); 2269775a620SHiroshi Yamauchi assert(getParentRegion() == Next->getParentRegion() && 2279775a620SHiroshi Yamauchi "Must be siblings"); 2289775a620SHiroshi Yamauchi assert(getExitBlock() == Next->getEntryBlock() && 2299775a620SHiroshi Yamauchi "Must be adjacent"); 2309775a620SHiroshi Yamauchi for (RegInfo &RI : Next->RegInfos) 2319775a620SHiroshi Yamauchi RegInfos.push_back(RI); 2329775a620SHiroshi Yamauchi for (CHRScope *Sub : Next->Subs) 2339775a620SHiroshi Yamauchi Subs.push_back(Sub); 2349775a620SHiroshi Yamauchi } 2359775a620SHiroshi Yamauchi 2369775a620SHiroshi Yamauchi void addSub(CHRScope *SubIn) { 2379775a620SHiroshi Yamauchi #ifndef NDEBUG 2389775a620SHiroshi Yamauchi bool is_child = false; 2399775a620SHiroshi Yamauchi for (RegInfo &RI : RegInfos) 2409775a620SHiroshi Yamauchi if (RI.R == SubIn->getParentRegion()) { 2419775a620SHiroshi Yamauchi is_child = true; 2429775a620SHiroshi Yamauchi break; 2439775a620SHiroshi Yamauchi } 2449775a620SHiroshi Yamauchi assert(is_child && "Must be a child"); 2459775a620SHiroshi Yamauchi #endif 2469775a620SHiroshi Yamauchi Subs.push_back(SubIn); 2479775a620SHiroshi Yamauchi } 2489775a620SHiroshi Yamauchi 2499775a620SHiroshi Yamauchi // Split this scope at the boundary region into two, which will belong to the 2509775a620SHiroshi Yamauchi // tail and returns the tail. 2519775a620SHiroshi Yamauchi CHRScope *split(Region *Boundary) { 2529775a620SHiroshi Yamauchi assert(Boundary && "Boundary null"); 2539775a620SHiroshi Yamauchi assert(RegInfos.begin()->R != Boundary && 2549775a620SHiroshi Yamauchi "Can't be split at beginning"); 2559775a620SHiroshi Yamauchi auto BoundaryIt = std::find_if(RegInfos.begin(), RegInfos.end(), 2569775a620SHiroshi Yamauchi [&Boundary](const RegInfo& RI) { 2579775a620SHiroshi Yamauchi return Boundary == RI.R; 2589775a620SHiroshi Yamauchi }); 2599775a620SHiroshi Yamauchi if (BoundaryIt == RegInfos.end()) 2609775a620SHiroshi Yamauchi return nullptr; 2619775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> TailRegInfos; 2629775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> TailSubs; 2639775a620SHiroshi Yamauchi TailRegInfos.insert(TailRegInfos.begin(), BoundaryIt, RegInfos.end()); 2649775a620SHiroshi Yamauchi RegInfos.resize(BoundaryIt - RegInfos.begin()); 2659775a620SHiroshi Yamauchi DenseSet<Region *> TailRegionSet; 2669775a620SHiroshi Yamauchi for (RegInfo &RI : TailRegInfos) 2679775a620SHiroshi Yamauchi TailRegionSet.insert(RI.R); 2689775a620SHiroshi Yamauchi for (auto It = Subs.begin(); It != Subs.end(); ) { 2699775a620SHiroshi Yamauchi CHRScope *Sub = *It; 2709775a620SHiroshi Yamauchi assert(Sub && "null Sub"); 2719775a620SHiroshi Yamauchi Region *Parent = Sub->getParentRegion(); 2729775a620SHiroshi Yamauchi if (TailRegionSet.count(Parent)) { 2739775a620SHiroshi Yamauchi TailSubs.push_back(Sub); 2749775a620SHiroshi Yamauchi It = Subs.erase(It); 2759775a620SHiroshi Yamauchi } else { 2769775a620SHiroshi Yamauchi assert(std::find_if(RegInfos.begin(), RegInfos.end(), 2779775a620SHiroshi Yamauchi [&Parent](const RegInfo& RI) { 2789775a620SHiroshi Yamauchi return Parent == RI.R; 2799775a620SHiroshi Yamauchi }) != RegInfos.end() && 2809775a620SHiroshi Yamauchi "Must be in head"); 2819775a620SHiroshi Yamauchi ++It; 2829775a620SHiroshi Yamauchi } 2839775a620SHiroshi Yamauchi } 2849775a620SHiroshi Yamauchi assert(HoistStopMap.empty() && "MapHoistStops must be empty"); 2859775a620SHiroshi Yamauchi return new CHRScope(TailRegInfos, TailSubs); 2869775a620SHiroshi Yamauchi } 2879775a620SHiroshi Yamauchi 2889775a620SHiroshi Yamauchi bool contains(Instruction *I) const { 2899775a620SHiroshi Yamauchi BasicBlock *Parent = I->getParent(); 2909775a620SHiroshi Yamauchi for (const RegInfo &RI : RegInfos) 2919775a620SHiroshi Yamauchi if (RI.R->contains(Parent)) 2929775a620SHiroshi Yamauchi return true; 2939775a620SHiroshi Yamauchi return false; 2949775a620SHiroshi Yamauchi } 2959775a620SHiroshi Yamauchi 2969775a620SHiroshi Yamauchi void print(raw_ostream &OS) const; 2979775a620SHiroshi Yamauchi 2989775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> RegInfos; // Regions that belong to this scope 2999775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Subs; // Subscopes. 3009775a620SHiroshi Yamauchi 3019775a620SHiroshi Yamauchi // The instruction at which to insert the CHR conditional branch (and hoist 3029775a620SHiroshi Yamauchi // the dependent condition values). 3039775a620SHiroshi Yamauchi Instruction *BranchInsertPoint; 3049775a620SHiroshi Yamauchi 3059775a620SHiroshi Yamauchi // True-biased and false-biased regions (conditional blocks), 3069775a620SHiroshi Yamauchi // respectively. Used only for the outermost scope and includes regions in 3079775a620SHiroshi Yamauchi // subscopes. The rest are unbiased. 3089775a620SHiroshi Yamauchi DenseSet<Region *> TrueBiasedRegions; 3099775a620SHiroshi Yamauchi DenseSet<Region *> FalseBiasedRegions; 3109775a620SHiroshi Yamauchi // Among the biased regions, the regions that get CHRed. 3119775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> CHRRegions; 3129775a620SHiroshi Yamauchi 3139775a620SHiroshi Yamauchi // True-biased and false-biased selects, respectively. Used only for the 3149775a620SHiroshi Yamauchi // outermost scope and includes ones in subscopes. 3159775a620SHiroshi Yamauchi DenseSet<SelectInst *> TrueBiasedSelects; 3169775a620SHiroshi Yamauchi DenseSet<SelectInst *> FalseBiasedSelects; 3179775a620SHiroshi Yamauchi 3189775a620SHiroshi Yamauchi // Map from one of the above regions to the instructions to stop 3199775a620SHiroshi Yamauchi // hoisting instructions at through use-def chains. 3209775a620SHiroshi Yamauchi HoistStopMapTy HoistStopMap; 3219775a620SHiroshi Yamauchi 3229775a620SHiroshi Yamauchi private: 3239775a620SHiroshi Yamauchi CHRScope(SmallVector<RegInfo, 8> &RegInfosIn, 3249775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> &SubsIn) 3259775a620SHiroshi Yamauchi : RegInfos(RegInfosIn), Subs(SubsIn), BranchInsertPoint(nullptr) {} 3269775a620SHiroshi Yamauchi }; 3279775a620SHiroshi Yamauchi 3289775a620SHiroshi Yamauchi inline raw_ostream &operator<<(raw_ostream &OS, const CHRScope &Scope) { 3299775a620SHiroshi Yamauchi Scope.print(OS); 3309775a620SHiroshi Yamauchi return OS; 3319775a620SHiroshi Yamauchi } 3329775a620SHiroshi Yamauchi 3339775a620SHiroshi Yamauchi class CHR { 3349775a620SHiroshi Yamauchi public: 3359775a620SHiroshi Yamauchi CHR(Function &Fin, BlockFrequencyInfo &BFIin, DominatorTree &DTin, 3369775a620SHiroshi Yamauchi ProfileSummaryInfo &PSIin, RegionInfo &RIin) 3379775a620SHiroshi Yamauchi : F(Fin), BFI(BFIin), DT(DTin), PSI(PSIin), RI(RIin) {} 3389775a620SHiroshi Yamauchi 3399775a620SHiroshi Yamauchi ~CHR() { 3409775a620SHiroshi Yamauchi for (CHRScope *Scope : Scopes) { 3419775a620SHiroshi Yamauchi delete Scope; 3429775a620SHiroshi Yamauchi } 3439775a620SHiroshi Yamauchi } 3449775a620SHiroshi Yamauchi 3459775a620SHiroshi Yamauchi bool run(); 3469775a620SHiroshi Yamauchi 3479775a620SHiroshi Yamauchi private: 3489775a620SHiroshi Yamauchi // See the comments in CHR::run() for the high level flow of the algorithm and 3499775a620SHiroshi Yamauchi // what the following functions do. 3509775a620SHiroshi Yamauchi 3519775a620SHiroshi Yamauchi void findScopes(SmallVectorImpl<CHRScope *> &Output) { 3529775a620SHiroshi Yamauchi Region *R = RI.getTopLevelRegion(); 3539775a620SHiroshi Yamauchi CHRScope *Scope = findScopes(R, nullptr, nullptr, Output); 3549775a620SHiroshi Yamauchi if (Scope) { 3559775a620SHiroshi Yamauchi Output.push_back(Scope); 3569775a620SHiroshi Yamauchi } 3579775a620SHiroshi Yamauchi } 3589775a620SHiroshi Yamauchi CHRScope *findScopes(Region *R, Region *NextRegion, Region *ParentRegion, 3599775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Scopes); 3609775a620SHiroshi Yamauchi CHRScope *findScope(Region *R); 3619775a620SHiroshi Yamauchi void checkScopeHoistable(CHRScope *Scope); 3629775a620SHiroshi Yamauchi 3639775a620SHiroshi Yamauchi void splitScopes(SmallVectorImpl<CHRScope *> &Input, 3649775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3659775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> splitScope(CHRScope *Scope, 3669775a620SHiroshi Yamauchi CHRScope *Outer, 3679775a620SHiroshi Yamauchi DenseSet<Value *> *OuterConditionValues, 3689775a620SHiroshi Yamauchi Instruction *OuterInsertPoint, 3699775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output, 3709775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables); 3719775a620SHiroshi Yamauchi 3729775a620SHiroshi Yamauchi void classifyBiasedScopes(SmallVectorImpl<CHRScope *> &Scopes); 3739775a620SHiroshi Yamauchi void classifyBiasedScopes(CHRScope *Scope, CHRScope *OutermostScope); 3749775a620SHiroshi Yamauchi 3759775a620SHiroshi Yamauchi void filterScopes(SmallVectorImpl<CHRScope *> &Input, 3769775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3779775a620SHiroshi Yamauchi 3789775a620SHiroshi Yamauchi void setCHRRegions(SmallVectorImpl<CHRScope *> &Input, 3799775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3809775a620SHiroshi Yamauchi void setCHRRegions(CHRScope *Scope, CHRScope *OutermostScope); 3819775a620SHiroshi Yamauchi 3829775a620SHiroshi Yamauchi void sortScopes(SmallVectorImpl<CHRScope *> &Input, 3839775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3849775a620SHiroshi Yamauchi 3859775a620SHiroshi Yamauchi void transformScopes(SmallVectorImpl<CHRScope *> &CHRScopes); 3869775a620SHiroshi Yamauchi void transformScopes(CHRScope *Scope, DenseSet<PHINode *> &TrivialPHIs); 3879775a620SHiroshi Yamauchi void cloneScopeBlocks(CHRScope *Scope, 3889775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 3899775a620SHiroshi Yamauchi BasicBlock *ExitBlock, 3909775a620SHiroshi Yamauchi Region *LastRegion, 3919775a620SHiroshi Yamauchi ValueToValueMapTy &VMap); 3929775a620SHiroshi Yamauchi BranchInst *createMergedBranch(BasicBlock *PreEntryBlock, 3939775a620SHiroshi Yamauchi BasicBlock *EntryBlock, 3949775a620SHiroshi Yamauchi BasicBlock *NewEntryBlock, 3959775a620SHiroshi Yamauchi ValueToValueMapTy &VMap); 3969775a620SHiroshi Yamauchi void fixupBranchesAndSelects(CHRScope *Scope, 3979775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 3989775a620SHiroshi Yamauchi BranchInst *MergedBR, 3999775a620SHiroshi Yamauchi uint64_t ProfileCount); 4009775a620SHiroshi Yamauchi void fixupBranch(Region *R, 4019775a620SHiroshi Yamauchi CHRScope *Scope, 4029775a620SHiroshi Yamauchi IRBuilder<> &IRB, 4039775a620SHiroshi Yamauchi Value *&MergedCondition, BranchProbability &CHRBranchBias); 4049775a620SHiroshi Yamauchi void fixupSelect(SelectInst* SI, 4059775a620SHiroshi Yamauchi CHRScope *Scope, 4069775a620SHiroshi Yamauchi IRBuilder<> &IRB, 4079775a620SHiroshi Yamauchi Value *&MergedCondition, BranchProbability &CHRBranchBias); 4089775a620SHiroshi Yamauchi void addToMergedCondition(bool IsTrueBiased, Value *Cond, 4099775a620SHiroshi Yamauchi Instruction *BranchOrSelect, 4109775a620SHiroshi Yamauchi CHRScope *Scope, 4119775a620SHiroshi Yamauchi IRBuilder<> &IRB, 4129775a620SHiroshi Yamauchi Value *&MergedCondition); 4139775a620SHiroshi Yamauchi 4149775a620SHiroshi Yamauchi Function &F; 4159775a620SHiroshi Yamauchi BlockFrequencyInfo &BFI; 4169775a620SHiroshi Yamauchi DominatorTree &DT; 4179775a620SHiroshi Yamauchi ProfileSummaryInfo &PSI; 4189775a620SHiroshi Yamauchi RegionInfo &RI; 4199775a620SHiroshi Yamauchi CHRStats Stats; 4209775a620SHiroshi Yamauchi 4219775a620SHiroshi Yamauchi // All the true-biased regions in the function 4229775a620SHiroshi Yamauchi DenseSet<Region *> TrueBiasedRegionsGlobal; 4239775a620SHiroshi Yamauchi // All the false-biased regions in the function 4249775a620SHiroshi Yamauchi DenseSet<Region *> FalseBiasedRegionsGlobal; 4259775a620SHiroshi Yamauchi // All the true-biased selects in the function 4269775a620SHiroshi Yamauchi DenseSet<SelectInst *> TrueBiasedSelectsGlobal; 4279775a620SHiroshi Yamauchi // All the false-biased selects in the function 4289775a620SHiroshi Yamauchi DenseSet<SelectInst *> FalseBiasedSelectsGlobal; 4299775a620SHiroshi Yamauchi // A map from biased regions to their branch bias 4309775a620SHiroshi Yamauchi DenseMap<Region *, BranchProbability> BranchBiasMap; 4319775a620SHiroshi Yamauchi // A map from biased selects to their branch bias 4329775a620SHiroshi Yamauchi DenseMap<SelectInst *, BranchProbability> SelectBiasMap; 4339775a620SHiroshi Yamauchi // All the scopes. 4349775a620SHiroshi Yamauchi DenseSet<CHRScope *> Scopes; 4359775a620SHiroshi Yamauchi }; 4369775a620SHiroshi Yamauchi 4379775a620SHiroshi Yamauchi } // end anonymous namespace 4389775a620SHiroshi Yamauchi 4399775a620SHiroshi Yamauchi static bool shouldApply(Function &F, ProfileSummaryInfo& PSI) { 4409775a620SHiroshi Yamauchi if (ForceCHR) 4419775a620SHiroshi Yamauchi return true; 4429775a620SHiroshi Yamauchi 4439775a620SHiroshi Yamauchi if (!CHRModuleList.empty() || !CHRFunctionList.empty()) { 4449775a620SHiroshi Yamauchi if (CHRModules.count(F.getParent()->getName())) 4459775a620SHiroshi Yamauchi return true; 4469775a620SHiroshi Yamauchi StringRef Name = F.getName(); 4479775a620SHiroshi Yamauchi if (CHRFunctions.count(Name)) 4489775a620SHiroshi Yamauchi return true; 4499775a620SHiroshi Yamauchi const char* DemangledName = nullptr; 45072ee6d60SHiroshi Yamauchi #if !defined(_MSC_VER) 451*792a4f8aSReid Kleckner int Status = -1; 4529775a620SHiroshi Yamauchi DemangledName = abi::__cxa_demangle(Name.str().c_str(), 4539775a620SHiroshi Yamauchi nullptr, nullptr, &Status); 45472ee6d60SHiroshi Yamauchi #endif 4559775a620SHiroshi Yamauchi return DemangledName && CHRFunctions.count(DemangledName); 4569775a620SHiroshi Yamauchi } 4579775a620SHiroshi Yamauchi 4589775a620SHiroshi Yamauchi assert(PSI.hasProfileSummary() && "Empty PSI?"); 4599775a620SHiroshi Yamauchi return PSI.isFunctionEntryHot(&F); 4609775a620SHiroshi Yamauchi } 4619775a620SHiroshi Yamauchi 4629775a620SHiroshi Yamauchi static void dumpIR(Function &F, const char *Label, CHRStats *Stats) { 4639775a620SHiroshi Yamauchi std::string Name = F.getName().str(); 4649775a620SHiroshi Yamauchi const char *DemangledName = nullptr; 46572ee6d60SHiroshi Yamauchi #if !defined(_MSC_VER) 466*792a4f8aSReid Kleckner int Status = -1; 4679775a620SHiroshi Yamauchi DemangledName = abi::__cxa_demangle(Name.c_str(), 4689775a620SHiroshi Yamauchi nullptr, nullptr, &Status); 46972ee6d60SHiroshi Yamauchi #endif 4709775a620SHiroshi Yamauchi if (DemangledName == nullptr) { 4719775a620SHiroshi Yamauchi DemangledName = "<NOT-MANGLED>"; 4729775a620SHiroshi Yamauchi } 4739775a620SHiroshi Yamauchi std::string ModuleName = F.getParent()->getName().str(); 4749775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "CHR IR dump " << Label << " " << ModuleName << " " 4759775a620SHiroshi Yamauchi << Name); 4769775a620SHiroshi Yamauchi if (Stats) 4779775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << " " << *Stats); 4789775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "\n"); 4799775a620SHiroshi Yamauchi CHR_DEBUG(F.dump()); 4809775a620SHiroshi Yamauchi } 4819775a620SHiroshi Yamauchi 4829775a620SHiroshi Yamauchi 4839775a620SHiroshi Yamauchi void CHRScope::print(raw_ostream &OS) const { 4849775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 4859775a620SHiroshi Yamauchi OS << "CHRScope["; 4869775a620SHiroshi Yamauchi OS << RegInfos.size() << ", Regions["; 4879775a620SHiroshi Yamauchi for (const RegInfo &RI : RegInfos) { 4889775a620SHiroshi Yamauchi OS << RI.R->getNameStr(); 4899775a620SHiroshi Yamauchi if (RI.HasBranch) 4909775a620SHiroshi Yamauchi OS << " B"; 4919775a620SHiroshi Yamauchi if (RI.Selects.size() > 0) 4929775a620SHiroshi Yamauchi OS << " S" << RI.Selects.size(); 4939775a620SHiroshi Yamauchi OS << ", "; 4949775a620SHiroshi Yamauchi } 4959775a620SHiroshi Yamauchi if (RegInfos[0].R->getParent()) { 4969775a620SHiroshi Yamauchi OS << "], Parent " << RegInfos[0].R->getParent()->getNameStr(); 4979775a620SHiroshi Yamauchi } else { 4989775a620SHiroshi Yamauchi // top level region 4999775a620SHiroshi Yamauchi OS << "]"; 5009775a620SHiroshi Yamauchi } 5019775a620SHiroshi Yamauchi OS << ", Subs["; 5029775a620SHiroshi Yamauchi for (CHRScope *Sub : Subs) { 5039775a620SHiroshi Yamauchi OS << *Sub << ", "; 5049775a620SHiroshi Yamauchi } 5059775a620SHiroshi Yamauchi OS << "]]"; 5069775a620SHiroshi Yamauchi } 5079775a620SHiroshi Yamauchi 5089775a620SHiroshi Yamauchi // Return true if the given instruction type can be hoisted by CHR. 5099775a620SHiroshi Yamauchi static bool isHoistableInstructionType(Instruction *I) { 5109775a620SHiroshi Yamauchi return isa<BinaryOperator>(I) || isa<CastInst>(I) || isa<SelectInst>(I) || 5119775a620SHiroshi Yamauchi isa<GetElementPtrInst>(I) || isa<CmpInst>(I) || 5129775a620SHiroshi Yamauchi isa<InsertElementInst>(I) || isa<ExtractElementInst>(I) || 5139775a620SHiroshi Yamauchi isa<ShuffleVectorInst>(I) || isa<ExtractValueInst>(I) || 5149775a620SHiroshi Yamauchi isa<InsertValueInst>(I); 5159775a620SHiroshi Yamauchi } 5169775a620SHiroshi Yamauchi 5179775a620SHiroshi Yamauchi // Return true if the given instruction can be hoisted by CHR. 5189775a620SHiroshi Yamauchi static bool isHoistable(Instruction *I, DominatorTree &DT) { 5199775a620SHiroshi Yamauchi if (!isHoistableInstructionType(I)) 5209775a620SHiroshi Yamauchi return false; 5219775a620SHiroshi Yamauchi return isSafeToSpeculativelyExecute(I, nullptr, &DT); 5229775a620SHiroshi Yamauchi } 5239775a620SHiroshi Yamauchi 5249775a620SHiroshi Yamauchi // Recursively traverse the use-def chains of the given value and return a set 5259775a620SHiroshi Yamauchi // of the unhoistable base values defined within the scope (excluding the 5269775a620SHiroshi Yamauchi // first-region entry block) or the (hoistable or unhoistable) base values that 5279775a620SHiroshi Yamauchi // are defined outside (including the first-region entry block) of the 5289775a620SHiroshi Yamauchi // scope. The returned set doesn't include constants. 5299775a620SHiroshi Yamauchi static std::set<Value *> getBaseValues(Value *V, 5309775a620SHiroshi Yamauchi DominatorTree &DT) { 5319775a620SHiroshi Yamauchi std::set<Value *> Result; 5329775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 5339775a620SHiroshi Yamauchi // We don't stop at a block that's not in the Scope because we would miss some 5349775a620SHiroshi Yamauchi // instructions that are based on the same base values if we stop there. 5359775a620SHiroshi Yamauchi if (!isHoistable(I, DT)) { 5369775a620SHiroshi Yamauchi Result.insert(I); 5379775a620SHiroshi Yamauchi return Result; 5389775a620SHiroshi Yamauchi } 5399775a620SHiroshi Yamauchi // I is hoistable above the Scope. 5409775a620SHiroshi Yamauchi for (Value *Op : I->operands()) { 5419775a620SHiroshi Yamauchi std::set<Value *> OpResult = getBaseValues(Op, DT); 5429775a620SHiroshi Yamauchi Result.insert(OpResult.begin(), OpResult.end()); 5439775a620SHiroshi Yamauchi } 5449775a620SHiroshi Yamauchi return Result; 5459775a620SHiroshi Yamauchi } 5469775a620SHiroshi Yamauchi if (isa<Argument>(V)) { 5479775a620SHiroshi Yamauchi Result.insert(V); 5489775a620SHiroshi Yamauchi return Result; 5499775a620SHiroshi Yamauchi } 5509775a620SHiroshi Yamauchi // We don't include others like constants because those won't lead to any 5519775a620SHiroshi Yamauchi // chance of folding of conditions (eg two bit checks merged into one check) 5529775a620SHiroshi Yamauchi // after CHR. 5539775a620SHiroshi Yamauchi return Result; // empty 5549775a620SHiroshi Yamauchi } 5559775a620SHiroshi Yamauchi 5569775a620SHiroshi Yamauchi // Return true if V is already hoisted or can be hoisted (along with its 5579775a620SHiroshi Yamauchi // operands) above the insert point. When it returns true and HoistStops is 5589775a620SHiroshi Yamauchi // non-null, the instructions to stop hoisting at through the use-def chains are 5599775a620SHiroshi Yamauchi // inserted into HoistStops. 5609775a620SHiroshi Yamauchi static bool 5619775a620SHiroshi Yamauchi checkHoistValue(Value *V, Instruction *InsertPoint, DominatorTree &DT, 5629775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables, 5639775a620SHiroshi Yamauchi DenseSet<Instruction *> *HoistStops) { 5649775a620SHiroshi Yamauchi assert(InsertPoint && "Null InsertPoint"); 5659775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 5669775a620SHiroshi Yamauchi assert(DT.getNode(I->getParent()) && "DT must contain I's parent block"); 5679775a620SHiroshi Yamauchi assert(DT.getNode(InsertPoint->getParent()) && "DT must contain Destination"); 5689775a620SHiroshi Yamauchi if (Unhoistables.count(I)) { 5699775a620SHiroshi Yamauchi // Don't hoist if they are not to be hoisted. 5709775a620SHiroshi Yamauchi return false; 5719775a620SHiroshi Yamauchi } 5729775a620SHiroshi Yamauchi if (DT.dominates(I, InsertPoint)) { 5739775a620SHiroshi Yamauchi // We are already above the insert point. Stop here. 5749775a620SHiroshi Yamauchi if (HoistStops) 5759775a620SHiroshi Yamauchi HoistStops->insert(I); 5769775a620SHiroshi Yamauchi return true; 5779775a620SHiroshi Yamauchi } 5789775a620SHiroshi Yamauchi // We aren't not above the insert point, check if we can hoist it above the 5799775a620SHiroshi Yamauchi // insert point. 5809775a620SHiroshi Yamauchi if (isHoistable(I, DT)) { 5819775a620SHiroshi Yamauchi // Check operands first. 5829775a620SHiroshi Yamauchi DenseSet<Instruction *> OpsHoistStops; 5839775a620SHiroshi Yamauchi bool AllOpsHoisted = true; 5849775a620SHiroshi Yamauchi for (Value *Op : I->operands()) { 5859775a620SHiroshi Yamauchi if (!checkHoistValue(Op, InsertPoint, DT, Unhoistables, &OpsHoistStops)) { 5869775a620SHiroshi Yamauchi AllOpsHoisted = false; 5879775a620SHiroshi Yamauchi break; 5889775a620SHiroshi Yamauchi } 5899775a620SHiroshi Yamauchi } 5909775a620SHiroshi Yamauchi if (AllOpsHoisted) { 5919775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "checkHoistValue " << *I << "\n"); 5929775a620SHiroshi Yamauchi if (HoistStops) 5939775a620SHiroshi Yamauchi HoistStops->insert(OpsHoistStops.begin(), OpsHoistStops.end()); 5949775a620SHiroshi Yamauchi return true; 5959775a620SHiroshi Yamauchi } 5969775a620SHiroshi Yamauchi } 5979775a620SHiroshi Yamauchi return false; 5989775a620SHiroshi Yamauchi } 5999775a620SHiroshi Yamauchi // Non-instructions are considered hoistable. 6009775a620SHiroshi Yamauchi return true; 6019775a620SHiroshi Yamauchi } 6029775a620SHiroshi Yamauchi 6039775a620SHiroshi Yamauchi // Returns true and sets the true probability and false probability of an 6049775a620SHiroshi Yamauchi // MD_prof metadata if it's well-formed. 6059775a620SHiroshi Yamauchi static bool CheckMDProf(MDNode *MD, BranchProbability &TrueProb, 6069775a620SHiroshi Yamauchi BranchProbability &FalseProb) { 6079775a620SHiroshi Yamauchi if (!MD) return false; 6089775a620SHiroshi Yamauchi MDString *MDName = cast<MDString>(MD->getOperand(0)); 6099775a620SHiroshi Yamauchi if (MDName->getString() != "branch_weights" || 6109775a620SHiroshi Yamauchi MD->getNumOperands() != 3) 6119775a620SHiroshi Yamauchi return false; 6129775a620SHiroshi Yamauchi ConstantInt *TrueWeight = mdconst::extract<ConstantInt>(MD->getOperand(1)); 6139775a620SHiroshi Yamauchi ConstantInt *FalseWeight = mdconst::extract<ConstantInt>(MD->getOperand(2)); 6149775a620SHiroshi Yamauchi if (!TrueWeight || !FalseWeight) 6159775a620SHiroshi Yamauchi return false; 6169775a620SHiroshi Yamauchi APInt TrueWt = TrueWeight->getValue(); 6179775a620SHiroshi Yamauchi APInt FalseWt = FalseWeight->getValue(); 6189775a620SHiroshi Yamauchi APInt SumWt = TrueWt + FalseWt; 6199775a620SHiroshi Yamauchi TrueProb = BranchProbability::getBranchProbability(TrueWt.getZExtValue(), 6209775a620SHiroshi Yamauchi SumWt.getZExtValue()); 6219775a620SHiroshi Yamauchi FalseProb = BranchProbability::getBranchProbability(FalseWt.getZExtValue(), 6229775a620SHiroshi Yamauchi SumWt.getZExtValue()); 6239775a620SHiroshi Yamauchi return true; 6249775a620SHiroshi Yamauchi } 6259775a620SHiroshi Yamauchi 6269775a620SHiroshi Yamauchi static BranchProbability getCHRBiasThreshold() { 6279775a620SHiroshi Yamauchi return BranchProbability::getBranchProbability( 6289775a620SHiroshi Yamauchi static_cast<uint64_t>(CHRBiasThreshold * 1000000), 1000000); 6299775a620SHiroshi Yamauchi } 6309775a620SHiroshi Yamauchi 6319775a620SHiroshi Yamauchi // A helper for CheckBiasedBranch and CheckBiasedSelect. If TrueProb >= 6329775a620SHiroshi Yamauchi // CHRBiasThreshold, put Key into TrueSet and return true. If FalseProb >= 6339775a620SHiroshi Yamauchi // CHRBiasThreshold, put Key into FalseSet and return true. Otherwise, return 6349775a620SHiroshi Yamauchi // false. 6359775a620SHiroshi Yamauchi template<typename K, typename S, typename M> 6369775a620SHiroshi Yamauchi bool CheckBias(K *Key, BranchProbability TrueProb, BranchProbability FalseProb, 6379775a620SHiroshi Yamauchi S &TrueSet, S &FalseSet, M &BiasMap) { 6389775a620SHiroshi Yamauchi BranchProbability Threshold = getCHRBiasThreshold(); 6399775a620SHiroshi Yamauchi if (TrueProb >= Threshold) { 6409775a620SHiroshi Yamauchi TrueSet.insert(Key); 6419775a620SHiroshi Yamauchi BiasMap[Key] = TrueProb; 6429775a620SHiroshi Yamauchi return true; 6439775a620SHiroshi Yamauchi } else if (FalseProb >= Threshold) { 6449775a620SHiroshi Yamauchi FalseSet.insert(Key); 6459775a620SHiroshi Yamauchi BiasMap[Key] = FalseProb; 6469775a620SHiroshi Yamauchi return true; 6479775a620SHiroshi Yamauchi } 6489775a620SHiroshi Yamauchi return false; 6499775a620SHiroshi Yamauchi } 6509775a620SHiroshi Yamauchi 6519775a620SHiroshi Yamauchi // Returns true and insert a region into the right biased set and the map if the 6529775a620SHiroshi Yamauchi // branch of the region is biased. 6539775a620SHiroshi Yamauchi static bool CheckBiasedBranch(BranchInst *BI, Region *R, 6549775a620SHiroshi Yamauchi DenseSet<Region *> &TrueBiasedRegionsGlobal, 6559775a620SHiroshi Yamauchi DenseSet<Region *> &FalseBiasedRegionsGlobal, 6569775a620SHiroshi Yamauchi DenseMap<Region *, BranchProbability> &BranchBiasMap) { 6579775a620SHiroshi Yamauchi if (!BI->isConditional()) 6589775a620SHiroshi Yamauchi return false; 6599775a620SHiroshi Yamauchi BranchProbability ThenProb, ElseProb; 6609775a620SHiroshi Yamauchi if (!CheckMDProf(BI->getMetadata(LLVMContext::MD_prof), 6619775a620SHiroshi Yamauchi ThenProb, ElseProb)) 6629775a620SHiroshi Yamauchi return false; 6639775a620SHiroshi Yamauchi BasicBlock *IfThen = BI->getSuccessor(0); 6649775a620SHiroshi Yamauchi BasicBlock *IfElse = BI->getSuccessor(1); 6659775a620SHiroshi Yamauchi assert((IfThen == R->getExit() || IfElse == R->getExit()) && 6669775a620SHiroshi Yamauchi IfThen != IfElse && 6679775a620SHiroshi Yamauchi "Invariant from findScopes"); 6689775a620SHiroshi Yamauchi if (IfThen == R->getExit()) { 6699775a620SHiroshi Yamauchi // Swap them so that IfThen/ThenProb means going into the conditional code 6709775a620SHiroshi Yamauchi // and IfElse/ElseProb means skipping it. 6719775a620SHiroshi Yamauchi std::swap(IfThen, IfElse); 6729775a620SHiroshi Yamauchi std::swap(ThenProb, ElseProb); 6739775a620SHiroshi Yamauchi } 6749775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI " << *BI << " "); 6759775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "ThenProb " << ThenProb << " "); 6769775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "ElseProb " << ElseProb << "\n"); 6779775a620SHiroshi Yamauchi return CheckBias(R, ThenProb, ElseProb, 6789775a620SHiroshi Yamauchi TrueBiasedRegionsGlobal, FalseBiasedRegionsGlobal, 6799775a620SHiroshi Yamauchi BranchBiasMap); 6809775a620SHiroshi Yamauchi } 6819775a620SHiroshi Yamauchi 6829775a620SHiroshi Yamauchi // Returns true and insert a select into the right biased set and the map if the 6839775a620SHiroshi Yamauchi // select is biased. 6849775a620SHiroshi Yamauchi static bool CheckBiasedSelect( 6859775a620SHiroshi Yamauchi SelectInst *SI, Region *R, 6869775a620SHiroshi Yamauchi DenseSet<SelectInst *> &TrueBiasedSelectsGlobal, 6879775a620SHiroshi Yamauchi DenseSet<SelectInst *> &FalseBiasedSelectsGlobal, 6889775a620SHiroshi Yamauchi DenseMap<SelectInst *, BranchProbability> &SelectBiasMap) { 6899775a620SHiroshi Yamauchi BranchProbability TrueProb, FalseProb; 6909775a620SHiroshi Yamauchi if (!CheckMDProf(SI->getMetadata(LLVMContext::MD_prof), 6919775a620SHiroshi Yamauchi TrueProb, FalseProb)) 6929775a620SHiroshi Yamauchi return false; 6939775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "SI " << *SI << " "); 6949775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "TrueProb " << TrueProb << " "); 6959775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "FalseProb " << FalseProb << "\n"); 6969775a620SHiroshi Yamauchi return CheckBias(SI, TrueProb, FalseProb, 6979775a620SHiroshi Yamauchi TrueBiasedSelectsGlobal, FalseBiasedSelectsGlobal, 6989775a620SHiroshi Yamauchi SelectBiasMap); 6999775a620SHiroshi Yamauchi } 7009775a620SHiroshi Yamauchi 7019775a620SHiroshi Yamauchi // Returns the instruction at which to hoist the dependent condition values and 7029775a620SHiroshi Yamauchi // insert the CHR branch for a region. This is the terminator branch in the 7039775a620SHiroshi Yamauchi // entry block or the first select in the entry block, if any. 7049775a620SHiroshi Yamauchi static Instruction* getBranchInsertPoint(RegInfo &RI) { 7059775a620SHiroshi Yamauchi Region *R = RI.R; 7069775a620SHiroshi Yamauchi BasicBlock *EntryBB = R->getEntry(); 7079775a620SHiroshi Yamauchi // The hoist point is by default the terminator of the entry block, which is 7089775a620SHiroshi Yamauchi // the same as the branch instruction if RI.HasBranch is true. 7099775a620SHiroshi Yamauchi Instruction *HoistPoint = EntryBB->getTerminator(); 7109775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 7119775a620SHiroshi Yamauchi if (SI->getParent() == EntryBB) { 7129775a620SHiroshi Yamauchi // Pick the first select in Selects in the entry block. Note Selects is 7139775a620SHiroshi Yamauchi // sorted in the instruction order within a block (asserted below). 7149775a620SHiroshi Yamauchi HoistPoint = SI; 7159775a620SHiroshi Yamauchi break; 7169775a620SHiroshi Yamauchi } 7179775a620SHiroshi Yamauchi } 7189775a620SHiroshi Yamauchi assert(HoistPoint && "Null HoistPoint"); 7199775a620SHiroshi Yamauchi #ifndef NDEBUG 7209775a620SHiroshi Yamauchi // Check that HoistPoint is the first one in Selects in the entry block, 7219775a620SHiroshi Yamauchi // if any. 7229775a620SHiroshi Yamauchi DenseSet<Instruction *> EntryBlockSelectSet; 7239775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 7249775a620SHiroshi Yamauchi if (SI->getParent() == EntryBB) { 7259775a620SHiroshi Yamauchi EntryBlockSelectSet.insert(SI); 7269775a620SHiroshi Yamauchi } 7279775a620SHiroshi Yamauchi } 7289775a620SHiroshi Yamauchi for (Instruction &I : *EntryBB) { 7299775a620SHiroshi Yamauchi if (EntryBlockSelectSet.count(&I) > 0) { 7309775a620SHiroshi Yamauchi assert(&I == HoistPoint && 7319775a620SHiroshi Yamauchi "HoistPoint must be the first one in Selects"); 7329775a620SHiroshi Yamauchi break; 7339775a620SHiroshi Yamauchi } 7349775a620SHiroshi Yamauchi } 7359775a620SHiroshi Yamauchi #endif 7369775a620SHiroshi Yamauchi return HoistPoint; 7379775a620SHiroshi Yamauchi } 7389775a620SHiroshi Yamauchi 7399775a620SHiroshi Yamauchi // Find a CHR scope in the given region. 7409775a620SHiroshi Yamauchi CHRScope * CHR::findScope(Region *R) { 7419775a620SHiroshi Yamauchi CHRScope *Result = nullptr; 7429775a620SHiroshi Yamauchi BasicBlock *Entry = R->getEntry(); 7439775a620SHiroshi Yamauchi BasicBlock *Exit = R->getExit(); // null if top level. 7449775a620SHiroshi Yamauchi assert(Entry && "Entry must not be null"); 7459775a620SHiroshi Yamauchi assert((Exit == nullptr) == (R->isTopLevelRegion()) && 7469775a620SHiroshi Yamauchi "Only top level region has a null exit"); 7479775a620SHiroshi Yamauchi if (Entry) 7489775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Entry " << Entry->getName() << "\n"); 7499775a620SHiroshi Yamauchi else 7509775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Entry null\n"); 7519775a620SHiroshi Yamauchi if (Exit) 7529775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Exit " << Exit->getName() << "\n"); 7539775a620SHiroshi Yamauchi else 7549775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Exit null\n"); 7559775a620SHiroshi Yamauchi // Exclude cases where Entry is part of a subregion (hence it doesn't belong 7569775a620SHiroshi Yamauchi // to this region). 7579775a620SHiroshi Yamauchi bool EntryInSubregion = RI.getRegionFor(Entry) != R; 7589775a620SHiroshi Yamauchi if (EntryInSubregion) 7599775a620SHiroshi Yamauchi return nullptr; 7609775a620SHiroshi Yamauchi // Exclude loops 7619775a620SHiroshi Yamauchi for (BasicBlock *Pred : predecessors(Entry)) 7629775a620SHiroshi Yamauchi if (R->contains(Pred)) 7639775a620SHiroshi Yamauchi return nullptr; 7649775a620SHiroshi Yamauchi if (Exit) { 7659775a620SHiroshi Yamauchi // Try to find an if-then block (check if R is an if-then). 7669775a620SHiroshi Yamauchi // if (cond) { 7679775a620SHiroshi Yamauchi // ... 7689775a620SHiroshi Yamauchi // } 7699775a620SHiroshi Yamauchi auto *BI = dyn_cast<BranchInst>(Entry->getTerminator()); 7709775a620SHiroshi Yamauchi if (BI) 7719775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI.isConditional " << BI->isConditional() << "\n"); 7729775a620SHiroshi Yamauchi else 7739775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI null\n"); 7749775a620SHiroshi Yamauchi if (BI && BI->isConditional()) { 7759775a620SHiroshi Yamauchi BasicBlock *S0 = BI->getSuccessor(0); 7769775a620SHiroshi Yamauchi BasicBlock *S1 = BI->getSuccessor(1); 7779775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "S0 " << S0->getName() << "\n"); 7789775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "S1 " << S1->getName() << "\n"); 7799775a620SHiroshi Yamauchi if (S0 != S1 && (S0 == Exit || S1 == Exit)) { 7809775a620SHiroshi Yamauchi RegInfo RI(R); 7819775a620SHiroshi Yamauchi RI.HasBranch = CheckBiasedBranch( 7829775a620SHiroshi Yamauchi BI, R, TrueBiasedRegionsGlobal, FalseBiasedRegionsGlobal, 7839775a620SHiroshi Yamauchi BranchBiasMap); 7849775a620SHiroshi Yamauchi Result = new CHRScope(RI); 7859775a620SHiroshi Yamauchi Scopes.insert(Result); 7869775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Found a region with a branch\n"); 7879775a620SHiroshi Yamauchi ++Stats.NumBranches; 7889775a620SHiroshi Yamauchi } 7899775a620SHiroshi Yamauchi } 7909775a620SHiroshi Yamauchi } 7919775a620SHiroshi Yamauchi { 7929775a620SHiroshi Yamauchi // Try to look for selects in the direct child blocks (as opposed to in 7939775a620SHiroshi Yamauchi // subregions) of R. 7949775a620SHiroshi Yamauchi // ... 7959775a620SHiroshi Yamauchi // if (..) { // Some subregion 7969775a620SHiroshi Yamauchi // ... 7979775a620SHiroshi Yamauchi // } 7989775a620SHiroshi Yamauchi // if (..) { // Some subregion 7999775a620SHiroshi Yamauchi // ... 8009775a620SHiroshi Yamauchi // } 8019775a620SHiroshi Yamauchi // ... 8029775a620SHiroshi Yamauchi // a = cond ? b : c; 8039775a620SHiroshi Yamauchi // ... 8049775a620SHiroshi Yamauchi SmallVector<SelectInst *, 8> Selects; 8059775a620SHiroshi Yamauchi for (RegionNode *E : R->elements()) { 8069775a620SHiroshi Yamauchi if (E->isSubRegion()) 8079775a620SHiroshi Yamauchi continue; 8089775a620SHiroshi Yamauchi // This returns the basic block of E if E is a direct child of R (not a 8099775a620SHiroshi Yamauchi // subregion.) 8109775a620SHiroshi Yamauchi BasicBlock *BB = E->getEntry(); 8119775a620SHiroshi Yamauchi // Need to push in the order to make it easier to find the first Select 8129775a620SHiroshi Yamauchi // later. 8139775a620SHiroshi Yamauchi for (Instruction &I : *BB) { 8149775a620SHiroshi Yamauchi if (auto *SI = dyn_cast<SelectInst>(&I)) { 8159775a620SHiroshi Yamauchi Selects.push_back(SI); 8169775a620SHiroshi Yamauchi ++Stats.NumBranches; 8179775a620SHiroshi Yamauchi } 8189775a620SHiroshi Yamauchi } 8199775a620SHiroshi Yamauchi } 8209775a620SHiroshi Yamauchi if (Selects.size() > 0) { 8219775a620SHiroshi Yamauchi auto AddSelects = [&](RegInfo &RI) { 8229775a620SHiroshi Yamauchi for (auto *SI : Selects) 8239775a620SHiroshi Yamauchi if (CheckBiasedSelect(SI, RI.R, 8249775a620SHiroshi Yamauchi TrueBiasedSelectsGlobal, 8259775a620SHiroshi Yamauchi FalseBiasedSelectsGlobal, 8269775a620SHiroshi Yamauchi SelectBiasMap)) 8279775a620SHiroshi Yamauchi RI.Selects.push_back(SI); 8289775a620SHiroshi Yamauchi }; 8299775a620SHiroshi Yamauchi if (!Result) { 8309775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Found a select-only region\n"); 8319775a620SHiroshi Yamauchi RegInfo RI(R); 8329775a620SHiroshi Yamauchi AddSelects(RI); 8339775a620SHiroshi Yamauchi Result = new CHRScope(RI); 8349775a620SHiroshi Yamauchi Scopes.insert(Result); 8359775a620SHiroshi Yamauchi } else { 8369775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Found select(s) in a region with a branch\n"); 8379775a620SHiroshi Yamauchi AddSelects(Result->RegInfos[0]); 8389775a620SHiroshi Yamauchi } 8399775a620SHiroshi Yamauchi } 8409775a620SHiroshi Yamauchi } 8419775a620SHiroshi Yamauchi 8429775a620SHiroshi Yamauchi if (Result) { 8439775a620SHiroshi Yamauchi checkScopeHoistable(Result); 8449775a620SHiroshi Yamauchi } 8459775a620SHiroshi Yamauchi return Result; 8469775a620SHiroshi Yamauchi } 8479775a620SHiroshi Yamauchi 8489775a620SHiroshi Yamauchi // Check that any of the branch and the selects in the region could be 8499775a620SHiroshi Yamauchi // hoisted above the the CHR branch insert point (the most dominating of 8509775a620SHiroshi Yamauchi // them, either the branch (at the end of the first block) or the first 8519775a620SHiroshi Yamauchi // select in the first block). If the branch can't be hoisted, drop the 8529775a620SHiroshi Yamauchi // selects in the first blocks. 8539775a620SHiroshi Yamauchi // 8549775a620SHiroshi Yamauchi // For example, for the following scope/region with selects, we want to insert 8559775a620SHiroshi Yamauchi // the merged branch right before the first select in the first/entry block by 8569775a620SHiroshi Yamauchi // hoisting c1, c2, c3, and c4. 8579775a620SHiroshi Yamauchi // 8589775a620SHiroshi Yamauchi // // Branch insert point here. 8599775a620SHiroshi Yamauchi // a = c1 ? b : c; // Select 1 8609775a620SHiroshi Yamauchi // d = c2 ? e : f; // Select 2 8619775a620SHiroshi Yamauchi // if (c3) { // Branch 8629775a620SHiroshi Yamauchi // ... 8639775a620SHiroshi Yamauchi // c4 = foo() // A call. 8649775a620SHiroshi Yamauchi // g = c4 ? h : i; // Select 3 8659775a620SHiroshi Yamauchi // } 8669775a620SHiroshi Yamauchi // 8679775a620SHiroshi Yamauchi // But suppose we can't hoist c4 because it's dependent on the preceding 8689775a620SHiroshi Yamauchi // call. Then, we drop Select 3. Furthermore, if we can't hoist c2, we also drop 8699775a620SHiroshi Yamauchi // Select 2. If we can't hoist c3, we drop Selects 1 & 2. 8709775a620SHiroshi Yamauchi void CHR::checkScopeHoistable(CHRScope *Scope) { 8719775a620SHiroshi Yamauchi RegInfo &RI = Scope->RegInfos[0]; 8729775a620SHiroshi Yamauchi Region *R = RI.R; 8739775a620SHiroshi Yamauchi BasicBlock *EntryBB = R->getEntry(); 8749775a620SHiroshi Yamauchi auto *Branch = RI.HasBranch ? 8759775a620SHiroshi Yamauchi cast<BranchInst>(EntryBB->getTerminator()) : nullptr; 8769775a620SHiroshi Yamauchi SmallVector<SelectInst *, 8> &Selects = RI.Selects; 8779775a620SHiroshi Yamauchi if (RI.HasBranch || !Selects.empty()) { 8789775a620SHiroshi Yamauchi Instruction *InsertPoint = getBranchInsertPoint(RI); 8799775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "InsertPoint " << *InsertPoint << "\n"); 8809775a620SHiroshi Yamauchi // Avoid a data dependence from a select or a branch to a(nother) 8819775a620SHiroshi Yamauchi // select. Note no instruction can't data-depend on a branch (a branch 8829775a620SHiroshi Yamauchi // instruction doesn't produce a value). 8839775a620SHiroshi Yamauchi DenseSet<Instruction *> Unhoistables; 8849775a620SHiroshi Yamauchi // Initialize Unhoistables with the selects. 8859775a620SHiroshi Yamauchi for (SelectInst *SI : Selects) { 8869775a620SHiroshi Yamauchi Unhoistables.insert(SI); 8879775a620SHiroshi Yamauchi } 8889775a620SHiroshi Yamauchi // Remove Selects that can't be hoisted. 8899775a620SHiroshi Yamauchi for (auto it = Selects.begin(); it != Selects.end(); ) { 8909775a620SHiroshi Yamauchi SelectInst *SI = *it; 8919775a620SHiroshi Yamauchi if (SI == InsertPoint) { 8929775a620SHiroshi Yamauchi ++it; 8939775a620SHiroshi Yamauchi continue; 8949775a620SHiroshi Yamauchi } 8959775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(SI->getCondition(), InsertPoint, 8969775a620SHiroshi Yamauchi DT, Unhoistables, nullptr); 8979775a620SHiroshi Yamauchi if (!IsHoistable) { 8989775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Dropping select " << *SI << "\n"); 8999775a620SHiroshi Yamauchi it = Selects.erase(it); 9009775a620SHiroshi Yamauchi // Since we are dropping the select here, we also drop it from 9019775a620SHiroshi Yamauchi // Unhoistables. 9029775a620SHiroshi Yamauchi Unhoistables.erase(SI); 9039775a620SHiroshi Yamauchi } else 9049775a620SHiroshi Yamauchi ++it; 9059775a620SHiroshi Yamauchi } 9069775a620SHiroshi Yamauchi // Update InsertPoint after potentially removing selects. 9079775a620SHiroshi Yamauchi InsertPoint = getBranchInsertPoint(RI); 9089775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "InsertPoint " << *InsertPoint << "\n"); 9099775a620SHiroshi Yamauchi if (RI.HasBranch && InsertPoint != Branch) { 9109775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(Branch->getCondition(), InsertPoint, 9119775a620SHiroshi Yamauchi DT, Unhoistables, nullptr); 9129775a620SHiroshi Yamauchi if (!IsHoistable) { 9139775a620SHiroshi Yamauchi // If the branch isn't hoistable, drop the selects in the entry 9149775a620SHiroshi Yamauchi // block, preferring the branch, which makes the branch the hoist 9159775a620SHiroshi Yamauchi // point. 9169775a620SHiroshi Yamauchi assert(InsertPoint != Branch && "Branch must not be the hoist point"); 9179775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Dropping selects in entry block \n"); 9189775a620SHiroshi Yamauchi CHR_DEBUG( 9199775a620SHiroshi Yamauchi for (SelectInst *SI : Selects) { 9209775a620SHiroshi Yamauchi dbgs() << "SI " << *SI << "\n"; 9219775a620SHiroshi Yamauchi }); 9229775a620SHiroshi Yamauchi Selects.erase(std::remove_if(Selects.begin(), Selects.end(), 9239775a620SHiroshi Yamauchi [EntryBB](SelectInst *SI) { 9249775a620SHiroshi Yamauchi return SI->getParent() == EntryBB; 9259775a620SHiroshi Yamauchi }), Selects.end()); 9269775a620SHiroshi Yamauchi Unhoistables.clear(); 9279775a620SHiroshi Yamauchi InsertPoint = Branch; 9289775a620SHiroshi Yamauchi } 9299775a620SHiroshi Yamauchi } 9309775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "InsertPoint " << *InsertPoint << "\n"); 9319775a620SHiroshi Yamauchi #ifndef NDEBUG 9329775a620SHiroshi Yamauchi if (RI.HasBranch) { 9339775a620SHiroshi Yamauchi assert(!DT.dominates(Branch, InsertPoint) && 9349775a620SHiroshi Yamauchi "Branch can't be already above the hoist point"); 9359775a620SHiroshi Yamauchi assert(checkHoistValue(Branch->getCondition(), InsertPoint, 9369775a620SHiroshi Yamauchi DT, Unhoistables, nullptr) && 9379775a620SHiroshi Yamauchi "checkHoistValue for branch"); 9389775a620SHiroshi Yamauchi } 9399775a620SHiroshi Yamauchi for (auto *SI : Selects) { 9409775a620SHiroshi Yamauchi assert(!DT.dominates(SI, InsertPoint) && 9419775a620SHiroshi Yamauchi "SI can't be already above the hoist point"); 9429775a620SHiroshi Yamauchi assert(checkHoistValue(SI->getCondition(), InsertPoint, DT, 9439775a620SHiroshi Yamauchi Unhoistables, nullptr) && 9449775a620SHiroshi Yamauchi "checkHoistValue for selects"); 9459775a620SHiroshi Yamauchi } 9469775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Result\n"); 9479775a620SHiroshi Yamauchi if (RI.HasBranch) { 9489775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI " << *Branch << "\n"); 9499775a620SHiroshi Yamauchi } 9509775a620SHiroshi Yamauchi for (auto *SI : Selects) { 9519775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "SI " << *SI << "\n"); 9529775a620SHiroshi Yamauchi } 9539775a620SHiroshi Yamauchi #endif 9549775a620SHiroshi Yamauchi } 9559775a620SHiroshi Yamauchi } 9569775a620SHiroshi Yamauchi 9579775a620SHiroshi Yamauchi // Traverse the region tree, find all nested scopes and merge them if possible. 9589775a620SHiroshi Yamauchi CHRScope * CHR::findScopes(Region *R, Region *NextRegion, Region *ParentRegion, 9599775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Scopes) { 9609775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "findScopes " << R->getNameStr() << "\n"); 9619775a620SHiroshi Yamauchi CHRScope *Result = findScope(R); 9629775a620SHiroshi Yamauchi // Visit subscopes. 9639775a620SHiroshi Yamauchi CHRScope *ConsecutiveSubscope = nullptr; 9649775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Subscopes; 9659775a620SHiroshi Yamauchi for (auto It = R->begin(); It != R->end(); ++It) { 9669775a620SHiroshi Yamauchi const std::unique_ptr<Region> &SubR = *It; 9679775a620SHiroshi Yamauchi auto Next_It = std::next(It); 9689775a620SHiroshi Yamauchi Region *NextSubR = Next_It != R->end() ? Next_It->get() : nullptr; 9699775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Looking at subregion " << SubR.get()->getNameStr() 9709775a620SHiroshi Yamauchi << "\n"); 9719775a620SHiroshi Yamauchi CHRScope *SubCHRScope = findScopes(SubR.get(), NextSubR, R, Scopes); 9729775a620SHiroshi Yamauchi if (SubCHRScope) { 9739775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Subregion Scope " << *SubCHRScope << "\n"); 9749775a620SHiroshi Yamauchi } else { 9759775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Subregion Scope null\n"); 9769775a620SHiroshi Yamauchi } 9779775a620SHiroshi Yamauchi if (SubCHRScope) { 9789775a620SHiroshi Yamauchi if (!ConsecutiveSubscope) 9799775a620SHiroshi Yamauchi ConsecutiveSubscope = SubCHRScope; 9809775a620SHiroshi Yamauchi else if (!ConsecutiveSubscope->appendable(SubCHRScope)) { 9819775a620SHiroshi Yamauchi Subscopes.push_back(ConsecutiveSubscope); 9829775a620SHiroshi Yamauchi ConsecutiveSubscope = SubCHRScope; 9839775a620SHiroshi Yamauchi } else 9849775a620SHiroshi Yamauchi ConsecutiveSubscope->append(SubCHRScope); 9859775a620SHiroshi Yamauchi } else { 9869775a620SHiroshi Yamauchi if (ConsecutiveSubscope) { 9879775a620SHiroshi Yamauchi Subscopes.push_back(ConsecutiveSubscope); 9889775a620SHiroshi Yamauchi } 9899775a620SHiroshi Yamauchi ConsecutiveSubscope = nullptr; 9909775a620SHiroshi Yamauchi } 9919775a620SHiroshi Yamauchi } 9929775a620SHiroshi Yamauchi if (ConsecutiveSubscope) { 9939775a620SHiroshi Yamauchi Subscopes.push_back(ConsecutiveSubscope); 9949775a620SHiroshi Yamauchi } 9959775a620SHiroshi Yamauchi for (CHRScope *Sub : Subscopes) { 9969775a620SHiroshi Yamauchi if (Result) { 9979775a620SHiroshi Yamauchi // Combine it with the parent. 9989775a620SHiroshi Yamauchi Result->addSub(Sub); 9999775a620SHiroshi Yamauchi } else { 10009775a620SHiroshi Yamauchi // Push Subscopes as they won't be combined with the parent. 10019775a620SHiroshi Yamauchi Scopes.push_back(Sub); 10029775a620SHiroshi Yamauchi } 10039775a620SHiroshi Yamauchi } 10049775a620SHiroshi Yamauchi return Result; 10059775a620SHiroshi Yamauchi } 10069775a620SHiroshi Yamauchi 10079775a620SHiroshi Yamauchi static DenseSet<Value *> getCHRConditionValuesForRegion(RegInfo &RI) { 10089775a620SHiroshi Yamauchi DenseSet<Value *> ConditionValues; 10099775a620SHiroshi Yamauchi if (RI.HasBranch) { 10109775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(RI.R->getEntry()->getTerminator()); 10119775a620SHiroshi Yamauchi ConditionValues.insert(BI->getCondition()); 10129775a620SHiroshi Yamauchi } 10139775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 10149775a620SHiroshi Yamauchi ConditionValues.insert(SI->getCondition()); 10159775a620SHiroshi Yamauchi } 10169775a620SHiroshi Yamauchi return ConditionValues; 10179775a620SHiroshi Yamauchi } 10189775a620SHiroshi Yamauchi 10199775a620SHiroshi Yamauchi 10209775a620SHiroshi Yamauchi // Determine whether to split a scope depending on the sets of the branch 10219775a620SHiroshi Yamauchi // condition values of the previous region and the current region. We split 10229775a620SHiroshi Yamauchi // (return true) it if 1) the condition values of the inner/lower scope can't be 10239775a620SHiroshi Yamauchi // hoisted up to the outer/upper scope, or 2) the two sets of the condition 10249775a620SHiroshi Yamauchi // values have an empty intersection (because the combined branch conditions 10259775a620SHiroshi Yamauchi // won't probably lead to a simpler combined condition). 10269775a620SHiroshi Yamauchi static bool shouldSplit(Instruction *InsertPoint, 10279775a620SHiroshi Yamauchi DenseSet<Value *> &PrevConditionValues, 10289775a620SHiroshi Yamauchi DenseSet<Value *> &ConditionValues, 10299775a620SHiroshi Yamauchi DominatorTree &DT, 10309775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables) { 10319775a620SHiroshi Yamauchi CHR_DEBUG( 10329775a620SHiroshi Yamauchi dbgs() << "shouldSplit " << *InsertPoint << " PrevConditionValues "; 10339775a620SHiroshi Yamauchi for (Value *V : PrevConditionValues) { 10349775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10359775a620SHiroshi Yamauchi } 10369775a620SHiroshi Yamauchi dbgs() << " ConditionValues "; 10379775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 10389775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10399775a620SHiroshi Yamauchi } 10409775a620SHiroshi Yamauchi dbgs() << "\n"); 10419775a620SHiroshi Yamauchi assert(InsertPoint && "Null InsertPoint"); 10429775a620SHiroshi Yamauchi // If any of Bases isn't hoistable to the hoist point, split. 10439775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 10449775a620SHiroshi Yamauchi if (!checkHoistValue(V, InsertPoint, DT, Unhoistables, nullptr)) { 10459775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Split. checkHoistValue false " << *V << "\n"); 10469775a620SHiroshi Yamauchi return true; // Not hoistable, split. 10479775a620SHiroshi Yamauchi } 10489775a620SHiroshi Yamauchi } 10499775a620SHiroshi Yamauchi // If PrevConditionValues or ConditionValues is empty, don't split to avoid 10509775a620SHiroshi Yamauchi // unnecessary splits at scopes with no branch/selects. If 10519775a620SHiroshi Yamauchi // PrevConditionValues and ConditionValues don't intersect at all, split. 10529775a620SHiroshi Yamauchi if (!PrevConditionValues.empty() && !ConditionValues.empty()) { 10539775a620SHiroshi Yamauchi // Use std::set as DenseSet doesn't work with set_intersection. 10549775a620SHiroshi Yamauchi std::set<Value *> PrevBases, Bases; 10559775a620SHiroshi Yamauchi for (Value *V : PrevConditionValues) { 10569775a620SHiroshi Yamauchi std::set<Value *> BaseValues = getBaseValues(V, DT); 10579775a620SHiroshi Yamauchi PrevBases.insert(BaseValues.begin(), BaseValues.end()); 10589775a620SHiroshi Yamauchi } 10599775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 10609775a620SHiroshi Yamauchi std::set<Value *> BaseValues = getBaseValues(V, DT); 10619775a620SHiroshi Yamauchi Bases.insert(BaseValues.begin(), BaseValues.end()); 10629775a620SHiroshi Yamauchi } 10639775a620SHiroshi Yamauchi CHR_DEBUG( 10649775a620SHiroshi Yamauchi dbgs() << "PrevBases "; 10659775a620SHiroshi Yamauchi for (Value *V : PrevBases) { 10669775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10679775a620SHiroshi Yamauchi } 10689775a620SHiroshi Yamauchi dbgs() << " Bases "; 10699775a620SHiroshi Yamauchi for (Value *V : Bases) { 10709775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10719775a620SHiroshi Yamauchi } 10729775a620SHiroshi Yamauchi dbgs() << "\n"); 10739775a620SHiroshi Yamauchi std::set<Value *> Intersection; 10749775a620SHiroshi Yamauchi std::set_intersection(PrevBases.begin(), PrevBases.end(), 10759775a620SHiroshi Yamauchi Bases.begin(), Bases.end(), 10769775a620SHiroshi Yamauchi std::inserter(Intersection, Intersection.begin())); 10779775a620SHiroshi Yamauchi if (Intersection.empty()) { 10789775a620SHiroshi Yamauchi // Empty intersection, split. 10799775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Split. Intersection empty\n"); 10809775a620SHiroshi Yamauchi return true; 10819775a620SHiroshi Yamauchi } 10829775a620SHiroshi Yamauchi } 10839775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "No split\n"); 10849775a620SHiroshi Yamauchi return false; // Don't split. 10859775a620SHiroshi Yamauchi } 10869775a620SHiroshi Yamauchi 10879775a620SHiroshi Yamauchi static void GetSelectsInScope(CHRScope *Scope, 10889775a620SHiroshi Yamauchi DenseSet<Instruction *> &Output) { 10899775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 10909775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 10919775a620SHiroshi Yamauchi Output.insert(SI); 10929775a620SHiroshi Yamauchi } 10939775a620SHiroshi Yamauchi } 10949775a620SHiroshi Yamauchi for (CHRScope *Sub : Scope->Subs) { 10959775a620SHiroshi Yamauchi GetSelectsInScope(Sub, Output); 10969775a620SHiroshi Yamauchi } 10979775a620SHiroshi Yamauchi } 10989775a620SHiroshi Yamauchi 10999775a620SHiroshi Yamauchi void CHR::splitScopes(SmallVectorImpl<CHRScope *> &Input, 11009775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 11019775a620SHiroshi Yamauchi for (CHRScope *Scope : Input) { 11029775a620SHiroshi Yamauchi assert(!Scope->BranchInsertPoint && 11039775a620SHiroshi Yamauchi "BranchInsertPoint must not be set"); 11049775a620SHiroshi Yamauchi DenseSet<Instruction *> Unhoistables; 11059775a620SHiroshi Yamauchi GetSelectsInScope(Scope, Unhoistables); 11069775a620SHiroshi Yamauchi splitScope(Scope, nullptr, nullptr, nullptr, Output, Unhoistables); 11079775a620SHiroshi Yamauchi } 11089775a620SHiroshi Yamauchi #ifndef NDEBUG 11099775a620SHiroshi Yamauchi for (CHRScope *Scope : Output) { 11109775a620SHiroshi Yamauchi assert(Scope->BranchInsertPoint && "BranchInsertPoint must be set"); 11119775a620SHiroshi Yamauchi } 11129775a620SHiroshi Yamauchi #endif 11139775a620SHiroshi Yamauchi } 11149775a620SHiroshi Yamauchi 11159775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> CHR::splitScope( 11169775a620SHiroshi Yamauchi CHRScope *Scope, 11179775a620SHiroshi Yamauchi CHRScope *Outer, 11189775a620SHiroshi Yamauchi DenseSet<Value *> *OuterConditionValues, 11199775a620SHiroshi Yamauchi Instruction *OuterInsertPoint, 11209775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output, 11219775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables) { 11229775a620SHiroshi Yamauchi if (Outer) { 11239775a620SHiroshi Yamauchi assert(OuterConditionValues && "Null OuterConditionValues"); 11249775a620SHiroshi Yamauchi assert(OuterInsertPoint && "Null OuterInsertPoint"); 11259775a620SHiroshi Yamauchi } 11269775a620SHiroshi Yamauchi bool PrevSplitFromOuter = true; 11279775a620SHiroshi Yamauchi DenseSet<Value *> PrevConditionValues; 11289775a620SHiroshi Yamauchi Instruction *PrevInsertPoint = nullptr; 11299775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Splits; 11309775a620SHiroshi Yamauchi SmallVector<bool, 8> SplitsSplitFromOuter; 11319775a620SHiroshi Yamauchi SmallVector<DenseSet<Value *>, 8> SplitsConditionValues; 11329775a620SHiroshi Yamauchi SmallVector<Instruction *, 8> SplitsInsertPoints; 11339775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> RegInfos(Scope->RegInfos); // Copy 11349775a620SHiroshi Yamauchi for (RegInfo &RI : RegInfos) { 11359775a620SHiroshi Yamauchi Instruction *InsertPoint = getBranchInsertPoint(RI); 11369775a620SHiroshi Yamauchi DenseSet<Value *> ConditionValues = getCHRConditionValuesForRegion(RI); 11379775a620SHiroshi Yamauchi CHR_DEBUG( 11389775a620SHiroshi Yamauchi dbgs() << "ConditionValues "; 11399775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 11409775a620SHiroshi Yamauchi dbgs() << *V << ", "; 11419775a620SHiroshi Yamauchi } 11429775a620SHiroshi Yamauchi dbgs() << "\n"); 11439775a620SHiroshi Yamauchi if (RI.R == RegInfos[0].R) { 11449775a620SHiroshi Yamauchi // First iteration. Check to see if we should split from the outer. 11459775a620SHiroshi Yamauchi if (Outer) { 11469775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Outer " << *Outer << "\n"); 11479775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Should split from outer at " 11489775a620SHiroshi Yamauchi << RI.R->getNameStr() << "\n"); 11499775a620SHiroshi Yamauchi if (shouldSplit(OuterInsertPoint, *OuterConditionValues, 11509775a620SHiroshi Yamauchi ConditionValues, DT, Unhoistables)) { 11519775a620SHiroshi Yamauchi PrevConditionValues = ConditionValues; 11529775a620SHiroshi Yamauchi PrevInsertPoint = InsertPoint; 11539775a620SHiroshi Yamauchi } else { 11549775a620SHiroshi Yamauchi // Not splitting from the outer. Use the outer bases and insert 11559775a620SHiroshi Yamauchi // point. Union the bases. 11569775a620SHiroshi Yamauchi PrevSplitFromOuter = false; 11579775a620SHiroshi Yamauchi PrevConditionValues = *OuterConditionValues; 11589775a620SHiroshi Yamauchi PrevConditionValues.insert(ConditionValues.begin(), 11599775a620SHiroshi Yamauchi ConditionValues.end()); 11609775a620SHiroshi Yamauchi PrevInsertPoint = OuterInsertPoint; 11619775a620SHiroshi Yamauchi } 11629775a620SHiroshi Yamauchi } else { 11639775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Outer null\n"); 11649775a620SHiroshi Yamauchi PrevConditionValues = ConditionValues; 11659775a620SHiroshi Yamauchi PrevInsertPoint = InsertPoint; 11669775a620SHiroshi Yamauchi } 11679775a620SHiroshi Yamauchi } else { 11689775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Should split from prev at " 11699775a620SHiroshi Yamauchi << RI.R->getNameStr() << "\n"); 11709775a620SHiroshi Yamauchi if (shouldSplit(PrevInsertPoint, PrevConditionValues, ConditionValues, 11719775a620SHiroshi Yamauchi DT, Unhoistables)) { 11729775a620SHiroshi Yamauchi CHRScope *Tail = Scope->split(RI.R); 11739775a620SHiroshi Yamauchi Scopes.insert(Tail); 11749775a620SHiroshi Yamauchi Splits.push_back(Scope); 11759775a620SHiroshi Yamauchi SplitsSplitFromOuter.push_back(PrevSplitFromOuter); 11769775a620SHiroshi Yamauchi SplitsConditionValues.push_back(PrevConditionValues); 11779775a620SHiroshi Yamauchi SplitsInsertPoints.push_back(PrevInsertPoint); 11789775a620SHiroshi Yamauchi Scope = Tail; 11799775a620SHiroshi Yamauchi PrevConditionValues = ConditionValues; 11809775a620SHiroshi Yamauchi PrevInsertPoint = InsertPoint; 11819775a620SHiroshi Yamauchi PrevSplitFromOuter = true; 11829775a620SHiroshi Yamauchi } else { 11839775a620SHiroshi Yamauchi // Not splitting. Union the bases. Keep the hoist point. 11849775a620SHiroshi Yamauchi PrevConditionValues.insert(ConditionValues.begin(), ConditionValues.end()); 11859775a620SHiroshi Yamauchi } 11869775a620SHiroshi Yamauchi } 11879775a620SHiroshi Yamauchi } 11889775a620SHiroshi Yamauchi Splits.push_back(Scope); 11899775a620SHiroshi Yamauchi SplitsSplitFromOuter.push_back(PrevSplitFromOuter); 11909775a620SHiroshi Yamauchi SplitsConditionValues.push_back(PrevConditionValues); 11919775a620SHiroshi Yamauchi assert(PrevInsertPoint && "Null PrevInsertPoint"); 11929775a620SHiroshi Yamauchi SplitsInsertPoints.push_back(PrevInsertPoint); 11939775a620SHiroshi Yamauchi assert(Splits.size() == SplitsConditionValues.size() && 11949775a620SHiroshi Yamauchi Splits.size() == SplitsSplitFromOuter.size() && 11959775a620SHiroshi Yamauchi Splits.size() == SplitsInsertPoints.size() && "Mismatching sizes"); 11969775a620SHiroshi Yamauchi for (size_t I = 0; I < Splits.size(); ++I) { 11979775a620SHiroshi Yamauchi CHRScope *Split = Splits[I]; 11989775a620SHiroshi Yamauchi DenseSet<Value *> &SplitConditionValues = SplitsConditionValues[I]; 11999775a620SHiroshi Yamauchi Instruction *SplitInsertPoint = SplitsInsertPoints[I]; 12009775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> NewSubs; 12019775a620SHiroshi Yamauchi DenseSet<Instruction *> SplitUnhoistables; 12029775a620SHiroshi Yamauchi GetSelectsInScope(Split, SplitUnhoistables); 12039775a620SHiroshi Yamauchi for (CHRScope *Sub : Split->Subs) { 12049775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SubSplits = splitScope( 12059775a620SHiroshi Yamauchi Sub, Split, &SplitConditionValues, SplitInsertPoint, Output, 12069775a620SHiroshi Yamauchi SplitUnhoistables); 12079775a620SHiroshi Yamauchi NewSubs.insert(NewSubs.end(), SubSplits.begin(), SubSplits.end()); 12089775a620SHiroshi Yamauchi } 12099775a620SHiroshi Yamauchi Split->Subs = NewSubs; 12109775a620SHiroshi Yamauchi } 12119775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Result; 12129775a620SHiroshi Yamauchi for (size_t I = 0; I < Splits.size(); ++I) { 12139775a620SHiroshi Yamauchi CHRScope *Split = Splits[I]; 12149775a620SHiroshi Yamauchi if (SplitsSplitFromOuter[I]) { 12159775a620SHiroshi Yamauchi // Split from the outer. 12169775a620SHiroshi Yamauchi Output.push_back(Split); 12179775a620SHiroshi Yamauchi Split->BranchInsertPoint = SplitsInsertPoints[I]; 12189775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BranchInsertPoint " << *SplitsInsertPoints[I] 12199775a620SHiroshi Yamauchi << "\n"); 12209775a620SHiroshi Yamauchi } else { 12219775a620SHiroshi Yamauchi // Connected to the outer. 12229775a620SHiroshi Yamauchi Result.push_back(Split); 12239775a620SHiroshi Yamauchi } 12249775a620SHiroshi Yamauchi } 12259775a620SHiroshi Yamauchi if (!Outer) 12269775a620SHiroshi Yamauchi assert(Result.empty() && 12279775a620SHiroshi Yamauchi "If no outer (top-level), must return no nested ones"); 12289775a620SHiroshi Yamauchi return Result; 12299775a620SHiroshi Yamauchi } 12309775a620SHiroshi Yamauchi 12319775a620SHiroshi Yamauchi void CHR::classifyBiasedScopes(SmallVectorImpl<CHRScope *> &Scopes) { 12329775a620SHiroshi Yamauchi for (CHRScope *Scope : Scopes) { 12339775a620SHiroshi Yamauchi assert(Scope->TrueBiasedRegions.empty() && Scope->FalseBiasedRegions.empty() && "Empty"); 12349775a620SHiroshi Yamauchi classifyBiasedScopes(Scope, Scope); 12359775a620SHiroshi Yamauchi CHR_DEBUG( 12369775a620SHiroshi Yamauchi dbgs() << "classifyBiasedScopes " << *Scope << "\n"; 12379775a620SHiroshi Yamauchi dbgs() << "TrueBiasedRegions "; 12389775a620SHiroshi Yamauchi for (Region *R : Scope->TrueBiasedRegions) { 12399775a620SHiroshi Yamauchi dbgs() << R->getNameStr() << ", "; 12409775a620SHiroshi Yamauchi } 12419775a620SHiroshi Yamauchi dbgs() << "\n"; 12429775a620SHiroshi Yamauchi dbgs() << "FalseBiasedRegions "; 12439775a620SHiroshi Yamauchi for (Region *R : Scope->FalseBiasedRegions) { 12449775a620SHiroshi Yamauchi dbgs() << R->getNameStr() << ", "; 12459775a620SHiroshi Yamauchi } 12469775a620SHiroshi Yamauchi dbgs() << "\n"; 12479775a620SHiroshi Yamauchi dbgs() << "TrueBiasedSelects "; 12489775a620SHiroshi Yamauchi for (SelectInst *SI : Scope->TrueBiasedSelects) { 12499775a620SHiroshi Yamauchi dbgs() << *SI << ", "; 12509775a620SHiroshi Yamauchi } 12519775a620SHiroshi Yamauchi dbgs() << "\n"; 12529775a620SHiroshi Yamauchi dbgs() << "FalseBiasedSelects "; 12539775a620SHiroshi Yamauchi for (SelectInst *SI : Scope->FalseBiasedSelects) { 12549775a620SHiroshi Yamauchi dbgs() << *SI << ", "; 12559775a620SHiroshi Yamauchi } 12569775a620SHiroshi Yamauchi dbgs() << "\n";); 12579775a620SHiroshi Yamauchi } 12589775a620SHiroshi Yamauchi } 12599775a620SHiroshi Yamauchi 12609775a620SHiroshi Yamauchi void CHR::classifyBiasedScopes(CHRScope *Scope, CHRScope *OutermostScope) { 12619775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 12629775a620SHiroshi Yamauchi if (RI.HasBranch) { 12639775a620SHiroshi Yamauchi Region *R = RI.R; 12649775a620SHiroshi Yamauchi if (TrueBiasedRegionsGlobal.count(R) > 0) 12659775a620SHiroshi Yamauchi OutermostScope->TrueBiasedRegions.insert(R); 12669775a620SHiroshi Yamauchi else if (FalseBiasedRegionsGlobal.count(R) > 0) 12679775a620SHiroshi Yamauchi OutermostScope->FalseBiasedRegions.insert(R); 12689775a620SHiroshi Yamauchi else 12699775a620SHiroshi Yamauchi llvm_unreachable("Must be biased"); 12709775a620SHiroshi Yamauchi } 12719775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 12729775a620SHiroshi Yamauchi if (TrueBiasedSelectsGlobal.count(SI) > 0) 12739775a620SHiroshi Yamauchi OutermostScope->TrueBiasedSelects.insert(SI); 12749775a620SHiroshi Yamauchi else if (FalseBiasedSelectsGlobal.count(SI) > 0) 12759775a620SHiroshi Yamauchi OutermostScope->FalseBiasedSelects.insert(SI); 12769775a620SHiroshi Yamauchi else 12779775a620SHiroshi Yamauchi llvm_unreachable("Must be biased"); 12789775a620SHiroshi Yamauchi } 12799775a620SHiroshi Yamauchi } 12809775a620SHiroshi Yamauchi for (CHRScope *Sub : Scope->Subs) { 12819775a620SHiroshi Yamauchi classifyBiasedScopes(Sub, OutermostScope); 12829775a620SHiroshi Yamauchi } 12839775a620SHiroshi Yamauchi } 12849775a620SHiroshi Yamauchi 12859775a620SHiroshi Yamauchi static bool hasAtLeastTwoBiasedBranches(CHRScope *Scope) { 12869775a620SHiroshi Yamauchi unsigned NumBiased = Scope->TrueBiasedRegions.size() + 12879775a620SHiroshi Yamauchi Scope->FalseBiasedRegions.size() + 12889775a620SHiroshi Yamauchi Scope->TrueBiasedSelects.size() + 12899775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.size(); 12909775a620SHiroshi Yamauchi return NumBiased >= CHRMergeThreshold; 12919775a620SHiroshi Yamauchi } 12929775a620SHiroshi Yamauchi 12939775a620SHiroshi Yamauchi void CHR::filterScopes(SmallVectorImpl<CHRScope *> &Input, 12949775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 12959775a620SHiroshi Yamauchi for (CHRScope *Scope : Input) { 12969775a620SHiroshi Yamauchi // Filter out the ones with only one region and no subs. 12979775a620SHiroshi Yamauchi if (!hasAtLeastTwoBiasedBranches(Scope)) { 12989775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Filtered out by biased branches truthy-regions " 12999775a620SHiroshi Yamauchi << Scope->TrueBiasedRegions.size() 13009775a620SHiroshi Yamauchi << " falsy-regions " << Scope->FalseBiasedRegions.size() 13019775a620SHiroshi Yamauchi << " true-selects " << Scope->TrueBiasedSelects.size() 13029775a620SHiroshi Yamauchi << " false-selects " << Scope->FalseBiasedSelects.size() << "\n"); 13039775a620SHiroshi Yamauchi continue; 13049775a620SHiroshi Yamauchi } 13059775a620SHiroshi Yamauchi Output.push_back(Scope); 13069775a620SHiroshi Yamauchi } 13079775a620SHiroshi Yamauchi } 13089775a620SHiroshi Yamauchi 13099775a620SHiroshi Yamauchi void CHR::setCHRRegions(SmallVectorImpl<CHRScope *> &Input, 13109775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 13119775a620SHiroshi Yamauchi for (CHRScope *Scope : Input) { 13129775a620SHiroshi Yamauchi assert(Scope->HoistStopMap.empty() && Scope->CHRRegions.empty() && 13139775a620SHiroshi Yamauchi "Empty"); 13149775a620SHiroshi Yamauchi setCHRRegions(Scope, Scope); 13159775a620SHiroshi Yamauchi Output.push_back(Scope); 13169775a620SHiroshi Yamauchi CHR_DEBUG( 13179775a620SHiroshi Yamauchi dbgs() << "setCHRRegions HoistStopMap " << *Scope << "\n"; 13189775a620SHiroshi Yamauchi for (auto pair : Scope->HoistStopMap) { 13199775a620SHiroshi Yamauchi Region *R = pair.first; 13209775a620SHiroshi Yamauchi dbgs() << "Region " << R->getNameStr() << "\n"; 13219775a620SHiroshi Yamauchi for (Instruction *I : pair.second) { 13229775a620SHiroshi Yamauchi dbgs() << "HoistStop " << *I << "\n"; 13239775a620SHiroshi Yamauchi } 13249775a620SHiroshi Yamauchi } 13259775a620SHiroshi Yamauchi dbgs() << "CHRRegions" << "\n"; 13269775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 13279775a620SHiroshi Yamauchi dbgs() << RI.R->getNameStr() << "\n"; 13289775a620SHiroshi Yamauchi }); 13299775a620SHiroshi Yamauchi } 13309775a620SHiroshi Yamauchi } 13319775a620SHiroshi Yamauchi 13329775a620SHiroshi Yamauchi void CHR::setCHRRegions(CHRScope *Scope, CHRScope *OutermostScope) { 13339775a620SHiroshi Yamauchi DenseSet<Instruction *> Unhoistables; 13349775a620SHiroshi Yamauchi // Put the biased selects in Unhoistables because they should stay where they 13359775a620SHiroshi Yamauchi // are and constant-folded after CHR (in case one biased select or a branch 13369775a620SHiroshi Yamauchi // can depend on another biased select.) 13379775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 13389775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 13399775a620SHiroshi Yamauchi Unhoistables.insert(SI); 13409775a620SHiroshi Yamauchi } 13419775a620SHiroshi Yamauchi } 13429775a620SHiroshi Yamauchi Instruction *InsertPoint = OutermostScope->BranchInsertPoint; 13439775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 13449775a620SHiroshi Yamauchi Region *R = RI.R; 13459775a620SHiroshi Yamauchi DenseSet<Instruction *> HoistStops; 13469775a620SHiroshi Yamauchi bool IsHoisted = false; 13479775a620SHiroshi Yamauchi if (RI.HasBranch) { 13489775a620SHiroshi Yamauchi assert((OutermostScope->TrueBiasedRegions.count(R) > 0 || 13499775a620SHiroshi Yamauchi OutermostScope->FalseBiasedRegions.count(R) > 0) && 13509775a620SHiroshi Yamauchi "Must be truthy or falsy"); 13519775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 13529775a620SHiroshi Yamauchi // Note checkHoistValue fills in HoistStops. 13539775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(BI->getCondition(), InsertPoint, DT, 13549775a620SHiroshi Yamauchi Unhoistables, &HoistStops); 13559775a620SHiroshi Yamauchi assert(IsHoistable && "Must be hoistable"); 13569775a620SHiroshi Yamauchi (void)(IsHoistable); // Unused in release build 13579775a620SHiroshi Yamauchi IsHoisted = true; 13589775a620SHiroshi Yamauchi } 13599775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 13609775a620SHiroshi Yamauchi assert((OutermostScope->TrueBiasedSelects.count(SI) > 0 || 13619775a620SHiroshi Yamauchi OutermostScope->FalseBiasedSelects.count(SI) > 0) && 13629775a620SHiroshi Yamauchi "Must be true or false biased"); 13639775a620SHiroshi Yamauchi // Note checkHoistValue fills in HoistStops. 13649775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(SI->getCondition(), InsertPoint, DT, 13659775a620SHiroshi Yamauchi Unhoistables, &HoistStops); 13669775a620SHiroshi Yamauchi assert(IsHoistable && "Must be hoistable"); 13679775a620SHiroshi Yamauchi (void)(IsHoistable); // Unused in release build 13689775a620SHiroshi Yamauchi IsHoisted = true; 13699775a620SHiroshi Yamauchi } 13709775a620SHiroshi Yamauchi if (IsHoisted) { 13719775a620SHiroshi Yamauchi OutermostScope->CHRRegions.push_back(RI); 13729775a620SHiroshi Yamauchi OutermostScope->HoistStopMap[R] = HoistStops; 13739775a620SHiroshi Yamauchi } 13749775a620SHiroshi Yamauchi } 13759775a620SHiroshi Yamauchi for (CHRScope *Sub : Scope->Subs) 13769775a620SHiroshi Yamauchi setCHRRegions(Sub, OutermostScope); 13779775a620SHiroshi Yamauchi } 13789775a620SHiroshi Yamauchi 13799775a620SHiroshi Yamauchi bool CHRScopeSorter(CHRScope *Scope1, CHRScope *Scope2) { 13809775a620SHiroshi Yamauchi return Scope1->RegInfos[0].R->getDepth() < Scope2->RegInfos[0].R->getDepth(); 13819775a620SHiroshi Yamauchi } 13829775a620SHiroshi Yamauchi 13839775a620SHiroshi Yamauchi void CHR::sortScopes(SmallVectorImpl<CHRScope *> &Input, 13849775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 13859775a620SHiroshi Yamauchi Output.resize(Input.size()); 13869775a620SHiroshi Yamauchi std::copy(Input.begin(), Input.end(), Output.begin()); 13879775a620SHiroshi Yamauchi std::stable_sort(Output.begin(), Output.end(), CHRScopeSorter); 13889775a620SHiroshi Yamauchi } 13899775a620SHiroshi Yamauchi 13909775a620SHiroshi Yamauchi // Return true if V is already hoisted or was hoisted (along with its operands) 13919775a620SHiroshi Yamauchi // to the insert point. 13929775a620SHiroshi Yamauchi static void hoistValue(Value *V, Instruction *HoistPoint, Region *R, 13939775a620SHiroshi Yamauchi HoistStopMapTy &HoistStopMap, 13949775a620SHiroshi Yamauchi DenseSet<Instruction *> &HoistedSet, 13959775a620SHiroshi Yamauchi DenseSet<PHINode *> &TrivialPHIs) { 13969775a620SHiroshi Yamauchi auto IT = HoistStopMap.find(R); 13979775a620SHiroshi Yamauchi assert(IT != HoistStopMap.end() && "Region must be in hoist stop map"); 13989775a620SHiroshi Yamauchi DenseSet<Instruction *> &HoistStops = IT->second; 13999775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 14009775a620SHiroshi Yamauchi if (I == HoistPoint) 14019775a620SHiroshi Yamauchi return; 14029775a620SHiroshi Yamauchi if (HoistStops.count(I)) 14039775a620SHiroshi Yamauchi return; 14049775a620SHiroshi Yamauchi if (auto *PN = dyn_cast<PHINode>(I)) 14059775a620SHiroshi Yamauchi if (TrivialPHIs.count(PN)) 14069775a620SHiroshi Yamauchi // The trivial phi inserted by the previous CHR scope could replace a 14079775a620SHiroshi Yamauchi // non-phi in HoistStops. Note that since this phi is at the exit of a 14089775a620SHiroshi Yamauchi // previous CHR scope, which dominates this scope, it's safe to stop 14099775a620SHiroshi Yamauchi // hoisting there. 14109775a620SHiroshi Yamauchi return; 14119775a620SHiroshi Yamauchi if (HoistedSet.count(I)) 14129775a620SHiroshi Yamauchi // Already hoisted, return. 14139775a620SHiroshi Yamauchi return; 14149775a620SHiroshi Yamauchi assert(isHoistableInstructionType(I) && "Unhoistable instruction type"); 14159775a620SHiroshi Yamauchi for (Value *Op : I->operands()) { 14169775a620SHiroshi Yamauchi hoistValue(Op, HoistPoint, R, HoistStopMap, HoistedSet, TrivialPHIs); 14179775a620SHiroshi Yamauchi } 14189775a620SHiroshi Yamauchi I->moveBefore(HoistPoint); 14199775a620SHiroshi Yamauchi HoistedSet.insert(I); 14209775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "hoistValue " << *I << "\n"); 14219775a620SHiroshi Yamauchi } 14229775a620SHiroshi Yamauchi } 14239775a620SHiroshi Yamauchi 14249775a620SHiroshi Yamauchi // Hoist the dependent condition values of the branches and the selects in the 14259775a620SHiroshi Yamauchi // scope to the insert point. 14269775a620SHiroshi Yamauchi static void hoistScopeConditions(CHRScope *Scope, Instruction *HoistPoint, 14279775a620SHiroshi Yamauchi DenseSet<PHINode *> &TrivialPHIs) { 14289775a620SHiroshi Yamauchi DenseSet<Instruction *> HoistedSet; 14299775a620SHiroshi Yamauchi for (const RegInfo &RI : Scope->CHRRegions) { 14309775a620SHiroshi Yamauchi Region *R = RI.R; 14319775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedRegions.count(R); 14329775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedRegions.count(R); 14339775a620SHiroshi Yamauchi if (RI.HasBranch && (IsTrueBiased || IsFalseBiased)) { 14349775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 14359775a620SHiroshi Yamauchi hoistValue(BI->getCondition(), HoistPoint, R, Scope->HoistStopMap, 14369775a620SHiroshi Yamauchi HoistedSet, TrivialPHIs); 14379775a620SHiroshi Yamauchi } 14389775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 14399775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedSelects.count(SI); 14409775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedSelects.count(SI); 14419775a620SHiroshi Yamauchi if (!(IsTrueBiased || IsFalseBiased)) 14429775a620SHiroshi Yamauchi continue; 14439775a620SHiroshi Yamauchi hoistValue(SI->getCondition(), HoistPoint, R, Scope->HoistStopMap, 14449775a620SHiroshi Yamauchi HoistedSet, TrivialPHIs); 14459775a620SHiroshi Yamauchi } 14469775a620SHiroshi Yamauchi } 14479775a620SHiroshi Yamauchi } 14489775a620SHiroshi Yamauchi 14499775a620SHiroshi Yamauchi // Negate the predicate if an ICmp if it's used only by branches or selects by 14509775a620SHiroshi Yamauchi // swapping the operands of the branches or the selects. Returns true if success. 14519775a620SHiroshi Yamauchi static bool NegateICmpIfUsedByBranchOrSelectOnly(ICmpInst *ICmp, 14529775a620SHiroshi Yamauchi Instruction *ExcludedUser, 14539775a620SHiroshi Yamauchi CHRScope *Scope) { 14549775a620SHiroshi Yamauchi for (User *U : ICmp->users()) { 14559775a620SHiroshi Yamauchi if (U == ExcludedUser) 14569775a620SHiroshi Yamauchi continue; 14579775a620SHiroshi Yamauchi if (isa<BranchInst>(U) && cast<BranchInst>(U)->isConditional()) 14589775a620SHiroshi Yamauchi continue; 14599775a620SHiroshi Yamauchi if (isa<SelectInst>(U) && cast<SelectInst>(U)->getCondition() == ICmp) 14609775a620SHiroshi Yamauchi continue; 14619775a620SHiroshi Yamauchi return false; 14629775a620SHiroshi Yamauchi } 14639775a620SHiroshi Yamauchi for (User *U : ICmp->users()) { 14649775a620SHiroshi Yamauchi if (U == ExcludedUser) 14659775a620SHiroshi Yamauchi continue; 14669775a620SHiroshi Yamauchi if (auto *BI = dyn_cast<BranchInst>(U)) { 14679775a620SHiroshi Yamauchi assert(BI->isConditional() && "Must be conditional"); 14689775a620SHiroshi Yamauchi BI->swapSuccessors(); 14699775a620SHiroshi Yamauchi // Don't need to swap this in terms of 14709775a620SHiroshi Yamauchi // TrueBiasedRegions/FalseBiasedRegions because true-based/false-based 14719775a620SHiroshi Yamauchi // mean whehter the branch is likely go into the if-then rather than 14729775a620SHiroshi Yamauchi // successor0/successor1 and because we can tell which edge is the then or 14739775a620SHiroshi Yamauchi // the else one by comparing the destination to the region exit block. 14749775a620SHiroshi Yamauchi continue; 14759775a620SHiroshi Yamauchi } 14769775a620SHiroshi Yamauchi if (auto *SI = dyn_cast<SelectInst>(U)) { 14779775a620SHiroshi Yamauchi // Swap operands 14789775a620SHiroshi Yamauchi Value *TrueValue = SI->getTrueValue(); 14799775a620SHiroshi Yamauchi Value *FalseValue = SI->getFalseValue(); 14809775a620SHiroshi Yamauchi SI->setTrueValue(FalseValue); 14819775a620SHiroshi Yamauchi SI->setFalseValue(TrueValue); 14829775a620SHiroshi Yamauchi SI->swapProfMetadata(); 14839775a620SHiroshi Yamauchi if (Scope->TrueBiasedSelects.count(SI)) { 14849775a620SHiroshi Yamauchi assert(Scope->FalseBiasedSelects.count(SI) == 0 && 14859775a620SHiroshi Yamauchi "Must not be already in"); 14869775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.insert(SI); 14879775a620SHiroshi Yamauchi } else if (Scope->FalseBiasedSelects.count(SI)) { 14889775a620SHiroshi Yamauchi assert(Scope->TrueBiasedSelects.count(SI) == 0 && 14899775a620SHiroshi Yamauchi "Must not be already in"); 14909775a620SHiroshi Yamauchi Scope->TrueBiasedSelects.insert(SI); 14919775a620SHiroshi Yamauchi } 14929775a620SHiroshi Yamauchi continue; 14939775a620SHiroshi Yamauchi } 14949775a620SHiroshi Yamauchi llvm_unreachable("Must be a branch or a select"); 14959775a620SHiroshi Yamauchi } 14969775a620SHiroshi Yamauchi ICmp->setPredicate(CmpInst::getInversePredicate(ICmp->getPredicate())); 14979775a620SHiroshi Yamauchi return true; 14989775a620SHiroshi Yamauchi } 14999775a620SHiroshi Yamauchi 15009775a620SHiroshi Yamauchi // A helper for transformScopes. Insert a trivial phi at the scope exit block 15019775a620SHiroshi Yamauchi // for a value that's defined in the scope but used outside it (meaning it's 15029775a620SHiroshi Yamauchi // alive at the exit block). 15039775a620SHiroshi Yamauchi static void insertTrivialPHIs(CHRScope *Scope, 15049775a620SHiroshi Yamauchi BasicBlock *EntryBlock, BasicBlock *ExitBlock, 15059775a620SHiroshi Yamauchi DenseSet<PHINode *> &TrivialPHIs) { 15069775a620SHiroshi Yamauchi DenseSet<BasicBlock *> BlocksInScopeSet; 15079775a620SHiroshi Yamauchi SmallVector<BasicBlock *, 8> BlocksInScopeVec; 15089775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 15099775a620SHiroshi Yamauchi for (BasicBlock *BB : RI.R->blocks()) { // This includes the blocks in the 15109775a620SHiroshi Yamauchi // sub-Scopes. 15119775a620SHiroshi Yamauchi BlocksInScopeSet.insert(BB); 15129775a620SHiroshi Yamauchi BlocksInScopeVec.push_back(BB); 15139775a620SHiroshi Yamauchi } 15149775a620SHiroshi Yamauchi } 15159775a620SHiroshi Yamauchi CHR_DEBUG( 15169775a620SHiroshi Yamauchi dbgs() << "Inserting redudant phis\n"; 15179775a620SHiroshi Yamauchi for (BasicBlock *BB : BlocksInScopeVec) { 15189775a620SHiroshi Yamauchi dbgs() << "BlockInScope " << BB->getName() << "\n"; 15199775a620SHiroshi Yamauchi }); 15209775a620SHiroshi Yamauchi for (BasicBlock *BB : BlocksInScopeVec) { 15219775a620SHiroshi Yamauchi for (Instruction &I : *BB) { 15229775a620SHiroshi Yamauchi SmallVector<Instruction *, 8> Users; 15239775a620SHiroshi Yamauchi for (User *U : I.users()) { 15249775a620SHiroshi Yamauchi if (auto *UI = dyn_cast<Instruction>(U)) { 15259775a620SHiroshi Yamauchi if (BlocksInScopeSet.count(UI->getParent()) == 0 && 15269775a620SHiroshi Yamauchi // Unless there's already a phi for I at the exit block. 15279775a620SHiroshi Yamauchi !(isa<PHINode>(UI) && UI->getParent() == ExitBlock)) { 15289775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "V " << I << "\n"); 15299775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Used outside scope by user " << *UI << "\n"); 15309775a620SHiroshi Yamauchi Users.push_back(UI); 15319775a620SHiroshi Yamauchi } else if (UI->getParent() == EntryBlock && isa<PHINode>(UI)) { 15329775a620SHiroshi Yamauchi // There's a loop backedge from a block that's dominated by this 15339775a620SHiroshi Yamauchi // scope to the entry block. 15349775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "V " << I << "\n"); 15359775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() 15369775a620SHiroshi Yamauchi << "Used at entry block (for a back edge) by a phi user " 15379775a620SHiroshi Yamauchi << *UI << "\n"); 15389775a620SHiroshi Yamauchi Users.push_back(UI); 15399775a620SHiroshi Yamauchi } 15409775a620SHiroshi Yamauchi } 15419775a620SHiroshi Yamauchi } 15429775a620SHiroshi Yamauchi if (Users.size() > 0) { 15439775a620SHiroshi Yamauchi // Insert a trivial phi for I (phi [&I, P0], [&I, P1], ...) at 15449775a620SHiroshi Yamauchi // ExitBlock. Replace I with the new phi in UI unless UI is another 15459775a620SHiroshi Yamauchi // phi at ExitBlock. 15469775a620SHiroshi Yamauchi unsigned PredCount = std::distance(pred_begin(ExitBlock), 15479775a620SHiroshi Yamauchi pred_end(ExitBlock)); 15489775a620SHiroshi Yamauchi PHINode *PN = PHINode::Create(I.getType(), PredCount, "", 15499775a620SHiroshi Yamauchi &ExitBlock->front()); 15509775a620SHiroshi Yamauchi for (BasicBlock *Pred : predecessors(ExitBlock)) { 15519775a620SHiroshi Yamauchi PN->addIncoming(&I, Pred); 15529775a620SHiroshi Yamauchi } 15539775a620SHiroshi Yamauchi TrivialPHIs.insert(PN); 15549775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Insert phi " << *PN << "\n"); 15559775a620SHiroshi Yamauchi for (Instruction *UI : Users) { 15569775a620SHiroshi Yamauchi for (unsigned J = 0, NumOps = UI->getNumOperands(); J < NumOps; ++J) { 15579775a620SHiroshi Yamauchi if (UI->getOperand(J) == &I) { 15589775a620SHiroshi Yamauchi UI->setOperand(J, PN); 15599775a620SHiroshi Yamauchi } 15609775a620SHiroshi Yamauchi } 15619775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Updated user " << *UI << "\n"); 15629775a620SHiroshi Yamauchi } 15639775a620SHiroshi Yamauchi } 15649775a620SHiroshi Yamauchi } 15659775a620SHiroshi Yamauchi } 15669775a620SHiroshi Yamauchi } 15679775a620SHiroshi Yamauchi 15689775a620SHiroshi Yamauchi // Assert that all the CHR regions of the scope have a biased branch or select. 15699775a620SHiroshi Yamauchi static void assertCHRRegionsHaveBiasedBranchOrSelect(CHRScope *Scope) { 15709775a620SHiroshi Yamauchi #ifndef NDEBUG 15719775a620SHiroshi Yamauchi auto HasBiasedBranchOrSelect = [](RegInfo &RI, CHRScope *Scope) { 15729775a620SHiroshi Yamauchi if (Scope->TrueBiasedRegions.count(RI.R) || 15739775a620SHiroshi Yamauchi Scope->FalseBiasedRegions.count(RI.R)) 15749775a620SHiroshi Yamauchi return true; 15759775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) 15769775a620SHiroshi Yamauchi if (Scope->TrueBiasedSelects.count(SI) || 15779775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.count(SI)) 15789775a620SHiroshi Yamauchi return true; 15799775a620SHiroshi Yamauchi return false; 15809775a620SHiroshi Yamauchi }; 15819775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 15829775a620SHiroshi Yamauchi assert(HasBiasedBranchOrSelect(RI, Scope) && 15839775a620SHiroshi Yamauchi "Must have biased branch or select"); 15849775a620SHiroshi Yamauchi } 15859775a620SHiroshi Yamauchi #endif 15869775a620SHiroshi Yamauchi } 15879775a620SHiroshi Yamauchi 15889775a620SHiroshi Yamauchi // Assert that all the condition values of the biased branches and selects have 15899775a620SHiroshi Yamauchi // been hoisted to the pre-entry block or outside of the scope. 15909775a620SHiroshi Yamauchi static void assertBranchOrSelectConditionHoisted(CHRScope *Scope, 15919775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock) { 15929775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Biased regions condition values \n"); 15939775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 15949775a620SHiroshi Yamauchi Region *R = RI.R; 15959775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedRegions.count(R); 15969775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedRegions.count(R); 15979775a620SHiroshi Yamauchi if (RI.HasBranch && (IsTrueBiased || IsFalseBiased)) { 15989775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 15999775a620SHiroshi Yamauchi Value *V = BI->getCondition(); 16009775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << *V << "\n"); 16019775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 160272ee6d60SHiroshi Yamauchi (void)(I); // Unused in release build. 16039775a620SHiroshi Yamauchi assert((I->getParent() == PreEntryBlock || 16049775a620SHiroshi Yamauchi !Scope->contains(I)) && 16059775a620SHiroshi Yamauchi "Must have been hoisted to PreEntryBlock or outside the scope"); 16069775a620SHiroshi Yamauchi } 16079775a620SHiroshi Yamauchi } 16089775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 16099775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedSelects.count(SI); 16109775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedSelects.count(SI); 16119775a620SHiroshi Yamauchi if (!(IsTrueBiased || IsFalseBiased)) 16129775a620SHiroshi Yamauchi continue; 16139775a620SHiroshi Yamauchi Value *V = SI->getCondition(); 16149775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << *V << "\n"); 16159775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 161672ee6d60SHiroshi Yamauchi (void)(I); // Unused in release build. 16179775a620SHiroshi Yamauchi assert((I->getParent() == PreEntryBlock || 16189775a620SHiroshi Yamauchi !Scope->contains(I)) && 16199775a620SHiroshi Yamauchi "Must have been hoisted to PreEntryBlock or outside the scope"); 16209775a620SHiroshi Yamauchi } 16219775a620SHiroshi Yamauchi } 16229775a620SHiroshi Yamauchi } 16239775a620SHiroshi Yamauchi } 16249775a620SHiroshi Yamauchi 16259775a620SHiroshi Yamauchi void CHR::transformScopes(CHRScope *Scope, DenseSet<PHINode *> &TrivialPHIs) { 16269775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "transformScopes " << *Scope << "\n"); 16279775a620SHiroshi Yamauchi 16289775a620SHiroshi Yamauchi assert(Scope->RegInfos.size() >= 1 && "Should have at least one Region"); 16299775a620SHiroshi Yamauchi Region *FirstRegion = Scope->RegInfos[0].R; 16309775a620SHiroshi Yamauchi BasicBlock *EntryBlock = FirstRegion->getEntry(); 16319775a620SHiroshi Yamauchi Region *LastRegion = Scope->RegInfos[Scope->RegInfos.size() - 1].R; 16329775a620SHiroshi Yamauchi BasicBlock *ExitBlock = LastRegion->getExit(); 16339775a620SHiroshi Yamauchi Optional<uint64_t> ProfileCount = BFI.getBlockProfileCount(EntryBlock); 16349775a620SHiroshi Yamauchi 16359775a620SHiroshi Yamauchi if (ExitBlock) { 16369775a620SHiroshi Yamauchi // Insert a trivial phi at the exit block (where the CHR hot path and the 16379775a620SHiroshi Yamauchi // cold path merges) for a value that's defined in the scope but used 16389775a620SHiroshi Yamauchi // outside it (meaning it's alive at the exit block). We will add the 16399775a620SHiroshi Yamauchi // incoming values for the CHR cold paths to it below. Without this, we'd 16409775a620SHiroshi Yamauchi // miss updating phi's for such values unless there happens to already be a 16419775a620SHiroshi Yamauchi // phi for that value there. 16429775a620SHiroshi Yamauchi insertTrivialPHIs(Scope, EntryBlock, ExitBlock, TrivialPHIs); 16439775a620SHiroshi Yamauchi } 16449775a620SHiroshi Yamauchi 16459775a620SHiroshi Yamauchi // Split the entry block of the first region. The new block becomes the new 16469775a620SHiroshi Yamauchi // entry block of the first region. The old entry block becomes the block to 16479775a620SHiroshi Yamauchi // insert the CHR branch into. Note DT gets updated. Since DT gets updated 16489775a620SHiroshi Yamauchi // through the split, we update the entry of the first region after the split, 16499775a620SHiroshi Yamauchi // and Region only points to the entry and the exit blocks, rather than 16509775a620SHiroshi Yamauchi // keeping everything in a list or set, the blocks membership and the 16519775a620SHiroshi Yamauchi // entry/exit blocks of the region are still valid after the split. 16529775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Splitting entry block " << EntryBlock->getName() 16539775a620SHiroshi Yamauchi << " at " << *Scope->BranchInsertPoint << "\n"); 16549775a620SHiroshi Yamauchi BasicBlock *NewEntryBlock = 16559775a620SHiroshi Yamauchi SplitBlock(EntryBlock, Scope->BranchInsertPoint, &DT); 16569775a620SHiroshi Yamauchi assert(NewEntryBlock->getSinglePredecessor() == EntryBlock && 16579775a620SHiroshi Yamauchi "NewEntryBlock's only pred must be EntryBlock"); 16589775a620SHiroshi Yamauchi FirstRegion->replaceEntryRecursive(NewEntryBlock); 16599775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock = EntryBlock; 16609775a620SHiroshi Yamauchi 16619775a620SHiroshi Yamauchi ValueToValueMapTy VMap; 16629775a620SHiroshi Yamauchi // Clone the blocks in the scope (excluding the PreEntryBlock) to split into a 16639775a620SHiroshi Yamauchi // hot path (originals) and a cold path (clones) and update the PHIs at the 16649775a620SHiroshi Yamauchi // exit block. 16659775a620SHiroshi Yamauchi cloneScopeBlocks(Scope, PreEntryBlock, ExitBlock, LastRegion, VMap); 16669775a620SHiroshi Yamauchi 16679775a620SHiroshi Yamauchi // Replace the old (placeholder) branch with the new (merged) conditional 16689775a620SHiroshi Yamauchi // branch. 16699775a620SHiroshi Yamauchi BranchInst *MergedBr = createMergedBranch(PreEntryBlock, EntryBlock, 16709775a620SHiroshi Yamauchi NewEntryBlock, VMap); 16719775a620SHiroshi Yamauchi 16729775a620SHiroshi Yamauchi #ifndef NDEBUG 16739775a620SHiroshi Yamauchi assertCHRRegionsHaveBiasedBranchOrSelect(Scope); 16749775a620SHiroshi Yamauchi #endif 16759775a620SHiroshi Yamauchi 16769775a620SHiroshi Yamauchi // Hoist the conditional values of the branches/selects. 16779775a620SHiroshi Yamauchi hoistScopeConditions(Scope, PreEntryBlock->getTerminator(), TrivialPHIs); 16789775a620SHiroshi Yamauchi 16799775a620SHiroshi Yamauchi #ifndef NDEBUG 16809775a620SHiroshi Yamauchi assertBranchOrSelectConditionHoisted(Scope, PreEntryBlock); 16819775a620SHiroshi Yamauchi #endif 16829775a620SHiroshi Yamauchi 16839775a620SHiroshi Yamauchi // Create the combined branch condition and constant-fold the branches/selects 16849775a620SHiroshi Yamauchi // in the hot path. 16859775a620SHiroshi Yamauchi fixupBranchesAndSelects(Scope, PreEntryBlock, MergedBr, 16869775a620SHiroshi Yamauchi ProfileCount ? ProfileCount.getValue() : 0); 16879775a620SHiroshi Yamauchi } 16889775a620SHiroshi Yamauchi 16899775a620SHiroshi Yamauchi // A helper for transformScopes. Clone the blocks in the scope (excluding the 16909775a620SHiroshi Yamauchi // PreEntryBlock) to split into a hot path and a cold path and update the PHIs 16919775a620SHiroshi Yamauchi // at the exit block. 16929775a620SHiroshi Yamauchi void CHR::cloneScopeBlocks(CHRScope *Scope, 16939775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 16949775a620SHiroshi Yamauchi BasicBlock *ExitBlock, 16959775a620SHiroshi Yamauchi Region *LastRegion, 16969775a620SHiroshi Yamauchi ValueToValueMapTy &VMap) { 16979775a620SHiroshi Yamauchi // Clone all the blocks. The original blocks will be the hot-path 16989775a620SHiroshi Yamauchi // CHR-optimized code and the cloned blocks will be the original unoptimized 16999775a620SHiroshi Yamauchi // code. This is so that the block pointers from the 17009775a620SHiroshi Yamauchi // CHRScope/Region/RegionInfo can stay valid in pointing to the hot-path code 17019775a620SHiroshi Yamauchi // which CHR should apply to. 17029775a620SHiroshi Yamauchi SmallVector<BasicBlock*, 8> NewBlocks; 17039775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) 17049775a620SHiroshi Yamauchi for (BasicBlock *BB : RI.R->blocks()) { // This includes the blocks in the 17059775a620SHiroshi Yamauchi // sub-Scopes. 17069775a620SHiroshi Yamauchi assert(BB != PreEntryBlock && "Don't copy the preetntry block"); 17079775a620SHiroshi Yamauchi BasicBlock *NewBB = CloneBasicBlock(BB, VMap, ".nonchr", &F); 17089775a620SHiroshi Yamauchi NewBlocks.push_back(NewBB); 17099775a620SHiroshi Yamauchi VMap[BB] = NewBB; 17109775a620SHiroshi Yamauchi } 17119775a620SHiroshi Yamauchi 17129775a620SHiroshi Yamauchi // Place the cloned blocks right after the original blocks (right before the 17139775a620SHiroshi Yamauchi // exit block of.) 17149775a620SHiroshi Yamauchi if (ExitBlock) 17159775a620SHiroshi Yamauchi F.getBasicBlockList().splice(ExitBlock->getIterator(), 17169775a620SHiroshi Yamauchi F.getBasicBlockList(), 17179775a620SHiroshi Yamauchi NewBlocks[0]->getIterator(), F.end()); 17189775a620SHiroshi Yamauchi 17199775a620SHiroshi Yamauchi // Update the cloned blocks/instructions to refer to themselves. 17209775a620SHiroshi Yamauchi for (unsigned i = 0, e = NewBlocks.size(); i != e; ++i) 17219775a620SHiroshi Yamauchi for (Instruction &I : *NewBlocks[i]) 17229775a620SHiroshi Yamauchi RemapInstruction(&I, VMap, 17239775a620SHiroshi Yamauchi RF_NoModuleLevelChanges | RF_IgnoreMissingLocals); 17249775a620SHiroshi Yamauchi 17259775a620SHiroshi Yamauchi // Add the cloned blocks to the PHIs of the exit blocks. ExitBlock is null for 17269775a620SHiroshi Yamauchi // the top-level region but we don't need to add PHIs. The trivial PHIs 17279775a620SHiroshi Yamauchi // inserted above will be updated here. 17289775a620SHiroshi Yamauchi if (ExitBlock) 17299775a620SHiroshi Yamauchi for (PHINode &PN : ExitBlock->phis()) 17309775a620SHiroshi Yamauchi for (unsigned I = 0, NumOps = PN.getNumIncomingValues(); I < NumOps; 17319775a620SHiroshi Yamauchi ++I) { 17329775a620SHiroshi Yamauchi BasicBlock *Pred = PN.getIncomingBlock(I); 17339775a620SHiroshi Yamauchi if (LastRegion->contains(Pred)) { 17349775a620SHiroshi Yamauchi Value *V = PN.getIncomingValue(I); 17359775a620SHiroshi Yamauchi auto It = VMap.find(V); 17369775a620SHiroshi Yamauchi if (It != VMap.end()) V = It->second; 17379775a620SHiroshi Yamauchi assert(VMap.find(Pred) != VMap.end() && "Pred must have been cloned"); 17389775a620SHiroshi Yamauchi PN.addIncoming(V, cast<BasicBlock>(VMap[Pred])); 17399775a620SHiroshi Yamauchi } 17409775a620SHiroshi Yamauchi } 17419775a620SHiroshi Yamauchi } 17429775a620SHiroshi Yamauchi 17439775a620SHiroshi Yamauchi // A helper for transformScope. Replace the old (placeholder) branch with the 17449775a620SHiroshi Yamauchi // new (merged) conditional branch. 17459775a620SHiroshi Yamauchi BranchInst *CHR::createMergedBranch(BasicBlock *PreEntryBlock, 17469775a620SHiroshi Yamauchi BasicBlock *EntryBlock, 17479775a620SHiroshi Yamauchi BasicBlock *NewEntryBlock, 17489775a620SHiroshi Yamauchi ValueToValueMapTy &VMap) { 17499775a620SHiroshi Yamauchi BranchInst *OldBR = cast<BranchInst>(PreEntryBlock->getTerminator()); 17509775a620SHiroshi Yamauchi assert(OldBR->isUnconditional() && OldBR->getSuccessor(0) == NewEntryBlock && 17519775a620SHiroshi Yamauchi "SplitBlock did not work correctly!"); 17529775a620SHiroshi Yamauchi assert(NewEntryBlock->getSinglePredecessor() == EntryBlock && 17539775a620SHiroshi Yamauchi "NewEntryBlock's only pred must be EntryBlock"); 17549775a620SHiroshi Yamauchi assert(VMap.find(NewEntryBlock) != VMap.end() && 17559775a620SHiroshi Yamauchi "NewEntryBlock must have been copied"); 17569775a620SHiroshi Yamauchi OldBR->removeFromParent(); 17579775a620SHiroshi Yamauchi OldBR->dropAllReferences(); 17589775a620SHiroshi Yamauchi // The true predicate is a placeholder. It will be replaced later in 17599775a620SHiroshi Yamauchi // fixupBranchesAndSelects(). 17609775a620SHiroshi Yamauchi BranchInst *NewBR = BranchInst::Create(NewEntryBlock, 17619775a620SHiroshi Yamauchi cast<BasicBlock>(VMap[NewEntryBlock]), 17629775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext())); 17639775a620SHiroshi Yamauchi PreEntryBlock->getInstList().push_back(NewBR); 17649775a620SHiroshi Yamauchi assert(NewEntryBlock->getSinglePredecessor() == EntryBlock && 17659775a620SHiroshi Yamauchi "NewEntryBlock's only pred must be EntryBlock"); 17669775a620SHiroshi Yamauchi return NewBR; 17679775a620SHiroshi Yamauchi } 17689775a620SHiroshi Yamauchi 17699775a620SHiroshi Yamauchi // A helper for transformScopes. Create the combined branch condition and 17709775a620SHiroshi Yamauchi // constant-fold the branches/selects in the hot path. 17719775a620SHiroshi Yamauchi void CHR::fixupBranchesAndSelects(CHRScope *Scope, 17729775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 17739775a620SHiroshi Yamauchi BranchInst *MergedBR, 17749775a620SHiroshi Yamauchi uint64_t ProfileCount) { 17759775a620SHiroshi Yamauchi Value *MergedCondition = ConstantInt::getTrue(F.getContext()); 17769775a620SHiroshi Yamauchi BranchProbability CHRBranchBias(1, 1); 17779775a620SHiroshi Yamauchi uint64_t NumCHRedBranches = 0; 17789775a620SHiroshi Yamauchi IRBuilder<> IRB(PreEntryBlock->getTerminator()); 17799775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 17809775a620SHiroshi Yamauchi Region *R = RI.R; 17819775a620SHiroshi Yamauchi if (RI.HasBranch) { 17829775a620SHiroshi Yamauchi fixupBranch(R, Scope, IRB, MergedCondition, CHRBranchBias); 17839775a620SHiroshi Yamauchi ++NumCHRedBranches; 17849775a620SHiroshi Yamauchi } 17859775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 17869775a620SHiroshi Yamauchi fixupSelect(SI, Scope, IRB, MergedCondition, CHRBranchBias); 17879775a620SHiroshi Yamauchi ++NumCHRedBranches; 17889775a620SHiroshi Yamauchi } 17899775a620SHiroshi Yamauchi } 17909775a620SHiroshi Yamauchi Stats.NumBranchesDelta += NumCHRedBranches - 1; 17919775a620SHiroshi Yamauchi Stats.WeightedNumBranchesDelta += (NumCHRedBranches - 1) * ProfileCount; 17929775a620SHiroshi Yamauchi MergedBR->setCondition(MergedCondition); 17939775a620SHiroshi Yamauchi SmallVector<uint32_t, 2> Weights; 17949775a620SHiroshi Yamauchi Weights.push_back(static_cast<uint32_t>(CHRBranchBias.scale(1000))); 17959775a620SHiroshi Yamauchi Weights.push_back(static_cast<uint32_t>(CHRBranchBias.getCompl().scale(1000))); 17969775a620SHiroshi Yamauchi MDBuilder MDB(F.getContext()); 17979775a620SHiroshi Yamauchi MergedBR->setMetadata(LLVMContext::MD_prof, MDB.createBranchWeights(Weights)); 17989775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "CHR branch bias " << Weights[0] << ":" << Weights[1] 17999775a620SHiroshi Yamauchi << "\n"); 18009775a620SHiroshi Yamauchi } 18019775a620SHiroshi Yamauchi 18029775a620SHiroshi Yamauchi // A helper for fixupBranchesAndSelects. Add to the combined branch condition 18039775a620SHiroshi Yamauchi // and constant-fold a branch in the hot path. 18049775a620SHiroshi Yamauchi void CHR::fixupBranch(Region *R, CHRScope *Scope, 18059775a620SHiroshi Yamauchi IRBuilder<> &IRB, 18069775a620SHiroshi Yamauchi Value *&MergedCondition, 18079775a620SHiroshi Yamauchi BranchProbability &CHRBranchBias) { 18089775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedRegions.count(R); 18099775a620SHiroshi Yamauchi assert((IsTrueBiased || Scope->FalseBiasedRegions.count(R)) && 18109775a620SHiroshi Yamauchi "Must be truthy or falsy"); 18119775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 18129775a620SHiroshi Yamauchi assert(BranchBiasMap.find(R) != BranchBiasMap.end() && 18139775a620SHiroshi Yamauchi "Must be in the bias map"); 18149775a620SHiroshi Yamauchi BranchProbability Bias = BranchBiasMap[R]; 18159775a620SHiroshi Yamauchi assert(Bias >= getCHRBiasThreshold() && "Must be highly biased"); 18169775a620SHiroshi Yamauchi // Take the min. 18179775a620SHiroshi Yamauchi if (CHRBranchBias > Bias) 18189775a620SHiroshi Yamauchi CHRBranchBias = Bias; 18199775a620SHiroshi Yamauchi BasicBlock *IfThen = BI->getSuccessor(1); 18209775a620SHiroshi Yamauchi BasicBlock *IfElse = BI->getSuccessor(0); 18219775a620SHiroshi Yamauchi BasicBlock *RegionExitBlock = R->getExit(); 18229775a620SHiroshi Yamauchi assert(RegionExitBlock && "Null ExitBlock"); 18239775a620SHiroshi Yamauchi assert((IfThen == RegionExitBlock || IfElse == RegionExitBlock) && 18249775a620SHiroshi Yamauchi IfThen != IfElse && "Invariant from findScopes"); 18259775a620SHiroshi Yamauchi if (IfThen == RegionExitBlock) { 18269775a620SHiroshi Yamauchi // Swap them so that IfThen means going into it and IfElse means skipping 18279775a620SHiroshi Yamauchi // it. 18289775a620SHiroshi Yamauchi std::swap(IfThen, IfElse); 18299775a620SHiroshi Yamauchi } 18309775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "IfThen " << IfThen->getName() 18319775a620SHiroshi Yamauchi << " IfElse " << IfElse->getName() << "\n"); 18329775a620SHiroshi Yamauchi Value *Cond = BI->getCondition(); 18339775a620SHiroshi Yamauchi BasicBlock *HotTarget = IsTrueBiased ? IfThen : IfElse; 18349775a620SHiroshi Yamauchi bool ConditionTrue = HotTarget == BI->getSuccessor(0); 18359775a620SHiroshi Yamauchi addToMergedCondition(ConditionTrue, Cond, BI, Scope, IRB, 18369775a620SHiroshi Yamauchi MergedCondition); 18379775a620SHiroshi Yamauchi // Constant-fold the branch at ClonedEntryBlock. 18389775a620SHiroshi Yamauchi assert(ConditionTrue == (HotTarget == BI->getSuccessor(0)) && 18399775a620SHiroshi Yamauchi "The successor shouldn't change"); 18409775a620SHiroshi Yamauchi Value *NewCondition = ConditionTrue ? 18419775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext()) : 18429775a620SHiroshi Yamauchi ConstantInt::getFalse(F.getContext()); 18439775a620SHiroshi Yamauchi BI->setCondition(NewCondition); 18449775a620SHiroshi Yamauchi } 18459775a620SHiroshi Yamauchi 18469775a620SHiroshi Yamauchi // A helper for fixupBranchesAndSelects. Add to the combined branch condition 18479775a620SHiroshi Yamauchi // and constant-fold a select in the hot path. 18489775a620SHiroshi Yamauchi void CHR::fixupSelect(SelectInst *SI, CHRScope *Scope, 18499775a620SHiroshi Yamauchi IRBuilder<> &IRB, 18509775a620SHiroshi Yamauchi Value *&MergedCondition, 18519775a620SHiroshi Yamauchi BranchProbability &CHRBranchBias) { 18529775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedSelects.count(SI); 18539775a620SHiroshi Yamauchi assert((IsTrueBiased || 18549775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.count(SI)) && "Must be biased"); 18559775a620SHiroshi Yamauchi assert(SelectBiasMap.find(SI) != SelectBiasMap.end() && 18569775a620SHiroshi Yamauchi "Must be in the bias map"); 18579775a620SHiroshi Yamauchi BranchProbability Bias = SelectBiasMap[SI]; 18589775a620SHiroshi Yamauchi assert(Bias >= getCHRBiasThreshold() && "Must be highly biased"); 18599775a620SHiroshi Yamauchi // Take the min. 18609775a620SHiroshi Yamauchi if (CHRBranchBias > Bias) 18619775a620SHiroshi Yamauchi CHRBranchBias = Bias; 18629775a620SHiroshi Yamauchi Value *Cond = SI->getCondition(); 18639775a620SHiroshi Yamauchi addToMergedCondition(IsTrueBiased, Cond, SI, Scope, IRB, 18649775a620SHiroshi Yamauchi MergedCondition); 18659775a620SHiroshi Yamauchi Value *NewCondition = IsTrueBiased ? 18669775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext()) : 18679775a620SHiroshi Yamauchi ConstantInt::getFalse(F.getContext()); 18689775a620SHiroshi Yamauchi SI->setCondition(NewCondition); 18699775a620SHiroshi Yamauchi } 18709775a620SHiroshi Yamauchi 18719775a620SHiroshi Yamauchi // A helper for fixupBranch/fixupSelect. Add a branch condition to the merged 18729775a620SHiroshi Yamauchi // condition. 18739775a620SHiroshi Yamauchi void CHR::addToMergedCondition(bool IsTrueBiased, Value *Cond, 18749775a620SHiroshi Yamauchi Instruction *BranchOrSelect, 18759775a620SHiroshi Yamauchi CHRScope *Scope, 18769775a620SHiroshi Yamauchi IRBuilder<> &IRB, 18779775a620SHiroshi Yamauchi Value *&MergedCondition) { 18789775a620SHiroshi Yamauchi if (IsTrueBiased) { 18799775a620SHiroshi Yamauchi MergedCondition = IRB.CreateAnd(MergedCondition, Cond); 18809775a620SHiroshi Yamauchi } else { 18819775a620SHiroshi Yamauchi // If Cond is an icmp and all users of V except for BranchOrSelect is a 18829775a620SHiroshi Yamauchi // branch, negate the icmp predicate and swap the branch targets and avoid 18839775a620SHiroshi Yamauchi // inserting an Xor to negate Cond. 18849775a620SHiroshi Yamauchi bool Done = false; 18859775a620SHiroshi Yamauchi if (auto *ICmp = dyn_cast<ICmpInst>(Cond)) 18869775a620SHiroshi Yamauchi if (NegateICmpIfUsedByBranchOrSelectOnly(ICmp, BranchOrSelect, Scope)) { 18879775a620SHiroshi Yamauchi MergedCondition = IRB.CreateAnd(MergedCondition, Cond); 18889775a620SHiroshi Yamauchi Done = true; 18899775a620SHiroshi Yamauchi } 18909775a620SHiroshi Yamauchi if (!Done) { 18919775a620SHiroshi Yamauchi Value *Negate = IRB.CreateXor( 18929775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext()), Cond); 18939775a620SHiroshi Yamauchi MergedCondition = IRB.CreateAnd(MergedCondition, Negate); 18949775a620SHiroshi Yamauchi } 18959775a620SHiroshi Yamauchi } 18969775a620SHiroshi Yamauchi } 18979775a620SHiroshi Yamauchi 18989775a620SHiroshi Yamauchi void CHR::transformScopes(SmallVectorImpl<CHRScope *> &CHRScopes) { 18999775a620SHiroshi Yamauchi unsigned i = 0; 19009775a620SHiroshi Yamauchi (void)(i); // Unused in release build. 19019775a620SHiroshi Yamauchi DenseSet<PHINode *> TrivialPHIs; 19029775a620SHiroshi Yamauchi for (CHRScope *Scope : CHRScopes) { 19039775a620SHiroshi Yamauchi transformScopes(Scope, TrivialPHIs); 19049775a620SHiroshi Yamauchi CHR_DEBUG( 19059775a620SHiroshi Yamauchi std::ostringstream oss; 19069775a620SHiroshi Yamauchi oss << " after transformScopes " << i++; 19079775a620SHiroshi Yamauchi dumpIR(F, oss.str().c_str(), nullptr)); 19089775a620SHiroshi Yamauchi } 19099775a620SHiroshi Yamauchi } 19109775a620SHiroshi Yamauchi 19119775a620SHiroshi Yamauchi static void dumpScopes(SmallVectorImpl<CHRScope *> &Scopes, const char * Label) { 19129775a620SHiroshi Yamauchi dbgs() << Label << " " << Scopes.size() << "\n"; 19139775a620SHiroshi Yamauchi for (CHRScope *Scope : Scopes) { 19149775a620SHiroshi Yamauchi dbgs() << *Scope << "\n"; 19159775a620SHiroshi Yamauchi } 19169775a620SHiroshi Yamauchi } 19179775a620SHiroshi Yamauchi 19189775a620SHiroshi Yamauchi bool CHR::run() { 19199775a620SHiroshi Yamauchi if (!shouldApply(F, PSI)) 19209775a620SHiroshi Yamauchi return false; 19219775a620SHiroshi Yamauchi 19229775a620SHiroshi Yamauchi CHR_DEBUG(dumpIR(F, "before", nullptr)); 19239775a620SHiroshi Yamauchi 19249775a620SHiroshi Yamauchi bool Changed = false; 19259775a620SHiroshi Yamauchi { 19269775a620SHiroshi Yamauchi CHR_DEBUG( 19279775a620SHiroshi Yamauchi dbgs() << "RegionInfo:\n"; 19289775a620SHiroshi Yamauchi RI.print(dbgs())); 19299775a620SHiroshi Yamauchi 19309775a620SHiroshi Yamauchi // Recursively traverse the region tree and find regions that have biased 19319775a620SHiroshi Yamauchi // branches and/or selects and create scopes. 19329775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> AllScopes; 19339775a620SHiroshi Yamauchi findScopes(AllScopes); 19349775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(AllScopes, "All scopes")); 19359775a620SHiroshi Yamauchi 19369775a620SHiroshi Yamauchi // Split the scopes if 1) the conditiona values of the biased 19379775a620SHiroshi Yamauchi // branches/selects of the inner/lower scope can't be hoisted up to the 19389775a620SHiroshi Yamauchi // outermost/uppermost scope entry, or 2) the condition values of the biased 19399775a620SHiroshi Yamauchi // branches/selects in a scope (including subscopes) don't share at least 19409775a620SHiroshi Yamauchi // one common value. 19419775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SplitScopes; 19429775a620SHiroshi Yamauchi splitScopes(AllScopes, SplitScopes); 19439775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(SplitScopes, "Split scopes")); 19449775a620SHiroshi Yamauchi 19459775a620SHiroshi Yamauchi // After splitting, set the biased regions and selects of a scope (a tree 19469775a620SHiroshi Yamauchi // root) that include those of the subscopes. 19479775a620SHiroshi Yamauchi classifyBiasedScopes(SplitScopes); 19489775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Set per-scope bias " << SplitScopes.size() << "\n"); 19499775a620SHiroshi Yamauchi 19509775a620SHiroshi Yamauchi // Filter out the scopes that has only one biased region or select (CHR 19519775a620SHiroshi Yamauchi // isn't useful in such a case). 19529775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> FilteredScopes; 19539775a620SHiroshi Yamauchi filterScopes(SplitScopes, FilteredScopes); 19549775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(FilteredScopes, "Filtered scopes")); 19559775a620SHiroshi Yamauchi 19569775a620SHiroshi Yamauchi // Set the regions to be CHR'ed and their hoist stops for each scope. 19579775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SetScopes; 19589775a620SHiroshi Yamauchi setCHRRegions(FilteredScopes, SetScopes); 19599775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(SetScopes, "Set CHR regions")); 19609775a620SHiroshi Yamauchi 19619775a620SHiroshi Yamauchi // Sort CHRScopes by the depth so that outer CHRScopes comes before inner 19629775a620SHiroshi Yamauchi // ones. We need to apply CHR from outer to inner so that we apply CHR only 19639775a620SHiroshi Yamauchi // to the hot path, rather than both hot and cold paths. 19649775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SortedScopes; 19659775a620SHiroshi Yamauchi sortScopes(SetScopes, SortedScopes); 19669775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(SortedScopes, "Sorted scopes")); 19679775a620SHiroshi Yamauchi 19689775a620SHiroshi Yamauchi CHR_DEBUG( 19699775a620SHiroshi Yamauchi dbgs() << "RegionInfo:\n"; 19709775a620SHiroshi Yamauchi RI.print(dbgs())); 19719775a620SHiroshi Yamauchi 19729775a620SHiroshi Yamauchi // Apply the CHR transformation. 19739775a620SHiroshi Yamauchi if (!SortedScopes.empty()) { 19749775a620SHiroshi Yamauchi transformScopes(SortedScopes); 19759775a620SHiroshi Yamauchi Changed = true; 19769775a620SHiroshi Yamauchi } 19779775a620SHiroshi Yamauchi } 19789775a620SHiroshi Yamauchi 19799775a620SHiroshi Yamauchi if (Changed) 19809775a620SHiroshi Yamauchi CHR_DEBUG(dumpIR(F, "after", &Stats)); 19819775a620SHiroshi Yamauchi 19829775a620SHiroshi Yamauchi return Changed; 19839775a620SHiroshi Yamauchi } 19849775a620SHiroshi Yamauchi 19859775a620SHiroshi Yamauchi bool ControlHeightReductionLegacyPass::runOnFunction(Function &F) { 19869775a620SHiroshi Yamauchi BlockFrequencyInfo &BFI = 19879775a620SHiroshi Yamauchi getAnalysis<BlockFrequencyInfoWrapperPass>().getBFI(); 19889775a620SHiroshi Yamauchi DominatorTree &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree(); 19899775a620SHiroshi Yamauchi ProfileSummaryInfo &PSI = 19909775a620SHiroshi Yamauchi *getAnalysis<ProfileSummaryInfoWrapperPass>().getPSI(); 19919775a620SHiroshi Yamauchi RegionInfo &RI = getAnalysis<RegionInfoPass>().getRegionInfo(); 19929775a620SHiroshi Yamauchi return CHR(F, BFI, DT, PSI, RI).run(); 19939775a620SHiroshi Yamauchi } 19949775a620SHiroshi Yamauchi 19959775a620SHiroshi Yamauchi namespace llvm { 19969775a620SHiroshi Yamauchi 19979775a620SHiroshi Yamauchi ControlHeightReductionPass::ControlHeightReductionPass() { 19989775a620SHiroshi Yamauchi ParseCHRFilterFiles(); 19999775a620SHiroshi Yamauchi } 20009775a620SHiroshi Yamauchi 20019775a620SHiroshi Yamauchi PreservedAnalyses ControlHeightReductionPass::run( 20029775a620SHiroshi Yamauchi Function &F, 20039775a620SHiroshi Yamauchi FunctionAnalysisManager &FAM) { 20049775a620SHiroshi Yamauchi auto &BFI = FAM.getResult<BlockFrequencyAnalysis>(F); 20059775a620SHiroshi Yamauchi auto &DT = FAM.getResult<DominatorTreeAnalysis>(F); 20069775a620SHiroshi Yamauchi auto &MAMProxy = FAM.getResult<ModuleAnalysisManagerFunctionProxy>(F); 20079775a620SHiroshi Yamauchi auto &MAM = MAMProxy.getManager(); 20089775a620SHiroshi Yamauchi auto &PSI = *MAM.getCachedResult<ProfileSummaryAnalysis>(*F.getParent()); 20099775a620SHiroshi Yamauchi auto &RI = FAM.getResult<RegionInfoAnalysis>(F); 20109775a620SHiroshi Yamauchi bool Changed = CHR(F, BFI, DT, PSI, RI).run(); 20119775a620SHiroshi Yamauchi if (!Changed) 20129775a620SHiroshi Yamauchi return PreservedAnalyses::all(); 20139775a620SHiroshi Yamauchi auto PA = PreservedAnalyses(); 20149775a620SHiroshi Yamauchi PA.preserve<GlobalsAA>(); 20159775a620SHiroshi Yamauchi return PA; 20169775a620SHiroshi Yamauchi } 20179775a620SHiroshi Yamauchi 20189775a620SHiroshi Yamauchi } // namespace llvm 2019