19775a620SHiroshi Yamauchi //===-- ControlHeightReduction.cpp - Control Height Reduction -------------===// 29775a620SHiroshi Yamauchi // 39775a620SHiroshi Yamauchi // The LLVM Compiler Infrastructure 49775a620SHiroshi Yamauchi // 59775a620SHiroshi Yamauchi // This file is distributed under the University of Illinois Open Source 69775a620SHiroshi Yamauchi // License. See LICENSE.TXT for details. 79775a620SHiroshi Yamauchi // 89775a620SHiroshi Yamauchi //===----------------------------------------------------------------------===// 99775a620SHiroshi Yamauchi // 109775a620SHiroshi Yamauchi // This pass merges conditional blocks of code and reduces the number of 119775a620SHiroshi Yamauchi // conditional branches in the hot paths based on profiles. 129775a620SHiroshi Yamauchi // 139775a620SHiroshi Yamauchi //===----------------------------------------------------------------------===// 149775a620SHiroshi Yamauchi 159775a620SHiroshi Yamauchi #include "llvm/Transforms/Instrumentation/ControlHeightReduction.h" 169775a620SHiroshi Yamauchi #include "llvm/Transforms/Utils.h" 179775a620SHiroshi Yamauchi #include "llvm/Transforms/Utils/BasicBlockUtils.h" 189775a620SHiroshi Yamauchi #include "llvm/Transforms/Utils/Cloning.h" 199775a620SHiroshi Yamauchi #include "llvm/Transforms/Utils/ValueMapper.h" 209775a620SHiroshi Yamauchi #include "llvm/ADT/DenseMap.h" 219775a620SHiroshi Yamauchi #include "llvm/ADT/DenseSet.h" 229775a620SHiroshi Yamauchi #include "llvm/ADT/SmallVector.h" 239775a620SHiroshi Yamauchi #include "llvm/ADT/StringSet.h" 249775a620SHiroshi Yamauchi #include "llvm/Analysis/BlockFrequencyInfo.h" 259775a620SHiroshi Yamauchi #include "llvm/Analysis/ProfileSummaryInfo.h" 269775a620SHiroshi Yamauchi #include "llvm/Analysis/RegionInfo.h" 279775a620SHiroshi Yamauchi #include "llvm/Analysis/RegionIterator.h" 289775a620SHiroshi Yamauchi #include "llvm/Analysis/ValueTracking.h" 299775a620SHiroshi Yamauchi #include "llvm/IR/CFG.h" 309775a620SHiroshi Yamauchi #include "llvm/IR/Dominators.h" 319775a620SHiroshi Yamauchi #include "llvm/IR/IRBuilder.h" 329775a620SHiroshi Yamauchi #include "llvm/IR/MDBuilder.h" 339775a620SHiroshi Yamauchi #include "llvm/Support/BranchProbability.h" 349775a620SHiroshi Yamauchi #include "llvm/Support/MemoryBuffer.h" 359775a620SHiroshi Yamauchi #include "llvm/Transforms/Scalar.h" 369775a620SHiroshi Yamauchi 3772ee6d60SHiroshi Yamauchi #if !defined(_MSC_VER) 389775a620SHiroshi Yamauchi #include <cxxabi.h> 3972ee6d60SHiroshi Yamauchi #endif 409775a620SHiroshi Yamauchi #include <set> 419775a620SHiroshi Yamauchi #include <sstream> 429775a620SHiroshi Yamauchi 439775a620SHiroshi Yamauchi using namespace llvm; 449775a620SHiroshi Yamauchi 459775a620SHiroshi Yamauchi #define DEBUG_TYPE "chr" 469775a620SHiroshi Yamauchi 479775a620SHiroshi Yamauchi #define CHR_DEBUG(X) LLVM_DEBUG(X) 489775a620SHiroshi Yamauchi 499775a620SHiroshi Yamauchi static cl::opt<bool> ForceCHR("force-chr", cl::init(false), cl::Hidden, 509775a620SHiroshi Yamauchi cl::desc("Apply CHR for all functions")); 519775a620SHiroshi Yamauchi 529775a620SHiroshi Yamauchi static cl::opt<double> CHRBiasThreshold( 539775a620SHiroshi Yamauchi "chr-bias-threshold", cl::init(0.99), cl::Hidden, 549775a620SHiroshi Yamauchi cl::desc("CHR considers a branch bias greater than this ratio as biased")); 559775a620SHiroshi Yamauchi 569775a620SHiroshi Yamauchi static cl::opt<unsigned> CHRMergeThreshold( 579775a620SHiroshi Yamauchi "chr-merge-threshold", cl::init(2), cl::Hidden, 589775a620SHiroshi Yamauchi cl::desc("CHR merges a group of N branches/selects where N >= this value")); 599775a620SHiroshi Yamauchi 609775a620SHiroshi Yamauchi static cl::opt<std::string> CHRModuleList( 619775a620SHiroshi Yamauchi "chr-module-list", cl::init(""), cl::Hidden, 629775a620SHiroshi Yamauchi cl::desc("Specify file to retrieve the list of modules to apply CHR to")); 639775a620SHiroshi Yamauchi 649775a620SHiroshi Yamauchi static cl::opt<std::string> CHRFunctionList( 659775a620SHiroshi Yamauchi "chr-function-list", cl::init(""), cl::Hidden, 669775a620SHiroshi Yamauchi cl::desc("Specify file to retrieve the list of functions to apply CHR to")); 679775a620SHiroshi Yamauchi 689775a620SHiroshi Yamauchi static StringSet<> CHRModules; 699775a620SHiroshi Yamauchi static StringSet<> CHRFunctions; 709775a620SHiroshi Yamauchi 719775a620SHiroshi Yamauchi static void ParseCHRFilterFiles() { 729775a620SHiroshi Yamauchi if (!CHRModuleList.empty()) { 739775a620SHiroshi Yamauchi auto FileOrErr = MemoryBuffer::getFile(CHRModuleList); 749775a620SHiroshi Yamauchi if (!FileOrErr) { 759775a620SHiroshi Yamauchi errs() << "Error: Couldn't read the chr-module-list file " << CHRModuleList << "\n"; 769775a620SHiroshi Yamauchi std::exit(1); 779775a620SHiroshi Yamauchi } 789775a620SHiroshi Yamauchi StringRef Buf = FileOrErr->get()->getBuffer(); 799775a620SHiroshi Yamauchi SmallVector<StringRef, 0> Lines; 809775a620SHiroshi Yamauchi Buf.split(Lines, '\n'); 819775a620SHiroshi Yamauchi for (StringRef Line : Lines) { 829775a620SHiroshi Yamauchi Line = Line.trim(); 839775a620SHiroshi Yamauchi if (!Line.empty()) 849775a620SHiroshi Yamauchi CHRModules.insert(Line); 859775a620SHiroshi Yamauchi } 869775a620SHiroshi Yamauchi } 879775a620SHiroshi Yamauchi if (!CHRFunctionList.empty()) { 889775a620SHiroshi Yamauchi auto FileOrErr = MemoryBuffer::getFile(CHRFunctionList); 899775a620SHiroshi Yamauchi if (!FileOrErr) { 909775a620SHiroshi Yamauchi errs() << "Error: Couldn't read the chr-function-list file " << CHRFunctionList << "\n"; 919775a620SHiroshi Yamauchi std::exit(1); 929775a620SHiroshi Yamauchi } 939775a620SHiroshi Yamauchi StringRef Buf = FileOrErr->get()->getBuffer(); 949775a620SHiroshi Yamauchi SmallVector<StringRef, 0> Lines; 959775a620SHiroshi Yamauchi Buf.split(Lines, '\n'); 969775a620SHiroshi Yamauchi for (StringRef Line : Lines) { 979775a620SHiroshi Yamauchi Line = Line.trim(); 989775a620SHiroshi Yamauchi if (!Line.empty()) 999775a620SHiroshi Yamauchi CHRFunctions.insert(Line); 1009775a620SHiroshi Yamauchi } 1019775a620SHiroshi Yamauchi } 1029775a620SHiroshi Yamauchi } 1039775a620SHiroshi Yamauchi 1049775a620SHiroshi Yamauchi namespace { 1059775a620SHiroshi Yamauchi class ControlHeightReductionLegacyPass : public FunctionPass { 1069775a620SHiroshi Yamauchi public: 1079775a620SHiroshi Yamauchi static char ID; 1089775a620SHiroshi Yamauchi 1099775a620SHiroshi Yamauchi ControlHeightReductionLegacyPass() : FunctionPass(ID) { 1109775a620SHiroshi Yamauchi initializeControlHeightReductionLegacyPassPass( 1119775a620SHiroshi Yamauchi *PassRegistry::getPassRegistry()); 1129775a620SHiroshi Yamauchi ParseCHRFilterFiles(); 1139775a620SHiroshi Yamauchi } 1149775a620SHiroshi Yamauchi 1159775a620SHiroshi Yamauchi bool runOnFunction(Function &F) override; 1169775a620SHiroshi Yamauchi void getAnalysisUsage(AnalysisUsage &AU) const override { 1179775a620SHiroshi Yamauchi AU.addRequired<BlockFrequencyInfoWrapperPass>(); 1189775a620SHiroshi Yamauchi AU.addRequired<DominatorTreeWrapperPass>(); 1199775a620SHiroshi Yamauchi AU.addRequired<ProfileSummaryInfoWrapperPass>(); 1209775a620SHiroshi Yamauchi AU.addRequired<RegionInfoPass>(); 1219775a620SHiroshi Yamauchi AU.addPreserved<GlobalsAAWrapperPass>(); 1229775a620SHiroshi Yamauchi } 1239775a620SHiroshi Yamauchi }; 1249775a620SHiroshi Yamauchi } // end anonymous namespace 1259775a620SHiroshi Yamauchi 1269775a620SHiroshi Yamauchi char ControlHeightReductionLegacyPass::ID = 0; 1279775a620SHiroshi Yamauchi 1289775a620SHiroshi Yamauchi INITIALIZE_PASS_BEGIN(ControlHeightReductionLegacyPass, 1299775a620SHiroshi Yamauchi "chr", 1309775a620SHiroshi Yamauchi "Reduce control height in the hot paths", 1319775a620SHiroshi Yamauchi false, false) 1329775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(BlockFrequencyInfoWrapperPass) 1339775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass) 1349775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(ProfileSummaryInfoWrapperPass) 1359775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(RegionInfoPass) 1369775a620SHiroshi Yamauchi INITIALIZE_PASS_END(ControlHeightReductionLegacyPass, 1379775a620SHiroshi Yamauchi "chr", 1389775a620SHiroshi Yamauchi "Reduce control height in the hot paths", 1399775a620SHiroshi Yamauchi false, false) 1409775a620SHiroshi Yamauchi 1419775a620SHiroshi Yamauchi FunctionPass *llvm::createControlHeightReductionLegacyPass() { 1429775a620SHiroshi Yamauchi return new ControlHeightReductionLegacyPass(); 1439775a620SHiroshi Yamauchi } 1449775a620SHiroshi Yamauchi 1459775a620SHiroshi Yamauchi namespace { 1469775a620SHiroshi Yamauchi 1479775a620SHiroshi Yamauchi struct CHRStats { 1489775a620SHiroshi Yamauchi CHRStats() : NumBranches(0), NumBranchesDelta(0), 1499775a620SHiroshi Yamauchi WeightedNumBranchesDelta(0) {} 1509775a620SHiroshi Yamauchi void print(raw_ostream &OS) const { 1519775a620SHiroshi Yamauchi OS << "CHRStats: NumBranches " << NumBranches 1529775a620SHiroshi Yamauchi << " NumBranchesDelta " << NumBranchesDelta 1539775a620SHiroshi Yamauchi << " WeightedNumBranchesDelta " << WeightedNumBranchesDelta; 1549775a620SHiroshi Yamauchi } 1559775a620SHiroshi Yamauchi uint64_t NumBranches; // The original number of conditional branches / 1569775a620SHiroshi Yamauchi // selects 1579775a620SHiroshi Yamauchi uint64_t NumBranchesDelta; // The decrease of the number of conditional 1589775a620SHiroshi Yamauchi // branches / selects in the hot paths due to CHR. 1599775a620SHiroshi Yamauchi uint64_t WeightedNumBranchesDelta; // NumBranchesDelta weighted by the profile 1609775a620SHiroshi Yamauchi // count at the scope entry. 1619775a620SHiroshi Yamauchi }; 1629775a620SHiroshi Yamauchi 163*c8f348cbSFangrui Song inline raw_ostream LLVM_ATTRIBUTE_UNUSED &operator<<(raw_ostream &OS, 164*c8f348cbSFangrui Song const CHRStats &Stats) { 1659775a620SHiroshi Yamauchi Stats.print(OS); 1669775a620SHiroshi Yamauchi return OS; 1679775a620SHiroshi Yamauchi } 1689775a620SHiroshi Yamauchi 1699775a620SHiroshi Yamauchi // RegInfo - some properties of a Region. 1709775a620SHiroshi Yamauchi struct RegInfo { 1719775a620SHiroshi Yamauchi RegInfo() : R(nullptr), HasBranch(false) {} 1729775a620SHiroshi Yamauchi RegInfo(Region *RegionIn) : R(RegionIn), HasBranch(false) {} 1739775a620SHiroshi Yamauchi Region *R; 1749775a620SHiroshi Yamauchi bool HasBranch; 1759775a620SHiroshi Yamauchi SmallVector<SelectInst *, 8> Selects; 1769775a620SHiroshi Yamauchi }; 1779775a620SHiroshi Yamauchi 1789775a620SHiroshi Yamauchi typedef DenseMap<Region *, DenseSet<Instruction *>> HoistStopMapTy; 1799775a620SHiroshi Yamauchi 1809775a620SHiroshi Yamauchi // CHRScope - a sequence of regions to CHR together. It corresponds to a 1819775a620SHiroshi Yamauchi // sequence of conditional blocks. It can have subscopes which correspond to 1829775a620SHiroshi Yamauchi // nested conditional blocks. Nested CHRScopes form a tree. 1839775a620SHiroshi Yamauchi class CHRScope { 1849775a620SHiroshi Yamauchi public: 1859775a620SHiroshi Yamauchi CHRScope(RegInfo RI) : BranchInsertPoint(nullptr) { 1869775a620SHiroshi Yamauchi assert(RI.R && "Null RegionIn"); 1879775a620SHiroshi Yamauchi RegInfos.push_back(RI); 1889775a620SHiroshi Yamauchi } 1899775a620SHiroshi Yamauchi 1909775a620SHiroshi Yamauchi Region *getParentRegion() { 1919775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 1929775a620SHiroshi Yamauchi Region *Parent = RegInfos[0].R->getParent(); 1939775a620SHiroshi Yamauchi assert(Parent && "Unexpected to call this on the top-level region"); 1949775a620SHiroshi Yamauchi return Parent; 1959775a620SHiroshi Yamauchi } 1969775a620SHiroshi Yamauchi 1979775a620SHiroshi Yamauchi BasicBlock *getEntryBlock() { 1989775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 1999775a620SHiroshi Yamauchi return RegInfos.front().R->getEntry(); 2009775a620SHiroshi Yamauchi } 2019775a620SHiroshi Yamauchi 2029775a620SHiroshi Yamauchi BasicBlock *getExitBlock() { 2039775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 2049775a620SHiroshi Yamauchi return RegInfos.back().R->getExit(); 2059775a620SHiroshi Yamauchi } 2069775a620SHiroshi Yamauchi 2079775a620SHiroshi Yamauchi bool appendable(CHRScope *Next) { 2089775a620SHiroshi Yamauchi // The next scope is appendable only if this scope is directly connected to 2099775a620SHiroshi Yamauchi // it (which implies it post-dominates this scope) and this scope dominates 2109775a620SHiroshi Yamauchi // it (no edge to the next scope outside this scope). 2119775a620SHiroshi Yamauchi BasicBlock *NextEntry = Next->getEntryBlock(); 2129775a620SHiroshi Yamauchi if (getExitBlock() != NextEntry) 2139775a620SHiroshi Yamauchi // Not directly connected. 2149775a620SHiroshi Yamauchi return false; 2159775a620SHiroshi Yamauchi Region *LastRegion = RegInfos.back().R; 2169775a620SHiroshi Yamauchi for (BasicBlock *Pred : predecessors(NextEntry)) 2179775a620SHiroshi Yamauchi if (!LastRegion->contains(Pred)) 2189775a620SHiroshi Yamauchi // There's an edge going into the entry of the next scope from outside 2199775a620SHiroshi Yamauchi // of this scope. 2209775a620SHiroshi Yamauchi return false; 2219775a620SHiroshi Yamauchi return true; 2229775a620SHiroshi Yamauchi } 2239775a620SHiroshi Yamauchi 2249775a620SHiroshi Yamauchi void append(CHRScope *Next) { 2259775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 2269775a620SHiroshi Yamauchi assert(Next->RegInfos.size() > 0 && "Empty CHRScope"); 2279775a620SHiroshi Yamauchi assert(getParentRegion() == Next->getParentRegion() && 2289775a620SHiroshi Yamauchi "Must be siblings"); 2299775a620SHiroshi Yamauchi assert(getExitBlock() == Next->getEntryBlock() && 2309775a620SHiroshi Yamauchi "Must be adjacent"); 2319775a620SHiroshi Yamauchi for (RegInfo &RI : Next->RegInfos) 2329775a620SHiroshi Yamauchi RegInfos.push_back(RI); 2339775a620SHiroshi Yamauchi for (CHRScope *Sub : Next->Subs) 2349775a620SHiroshi Yamauchi Subs.push_back(Sub); 2359775a620SHiroshi Yamauchi } 2369775a620SHiroshi Yamauchi 2379775a620SHiroshi Yamauchi void addSub(CHRScope *SubIn) { 2389775a620SHiroshi Yamauchi #ifndef NDEBUG 2399775a620SHiroshi Yamauchi bool is_child = false; 2409775a620SHiroshi Yamauchi for (RegInfo &RI : RegInfos) 2419775a620SHiroshi Yamauchi if (RI.R == SubIn->getParentRegion()) { 2429775a620SHiroshi Yamauchi is_child = true; 2439775a620SHiroshi Yamauchi break; 2449775a620SHiroshi Yamauchi } 2459775a620SHiroshi Yamauchi assert(is_child && "Must be a child"); 2469775a620SHiroshi Yamauchi #endif 2479775a620SHiroshi Yamauchi Subs.push_back(SubIn); 2489775a620SHiroshi Yamauchi } 2499775a620SHiroshi Yamauchi 2509775a620SHiroshi Yamauchi // Split this scope at the boundary region into two, which will belong to the 2519775a620SHiroshi Yamauchi // tail and returns the tail. 2529775a620SHiroshi Yamauchi CHRScope *split(Region *Boundary) { 2539775a620SHiroshi Yamauchi assert(Boundary && "Boundary null"); 2549775a620SHiroshi Yamauchi assert(RegInfos.begin()->R != Boundary && 2559775a620SHiroshi Yamauchi "Can't be split at beginning"); 2569775a620SHiroshi Yamauchi auto BoundaryIt = std::find_if(RegInfos.begin(), RegInfos.end(), 2579775a620SHiroshi Yamauchi [&Boundary](const RegInfo& RI) { 2589775a620SHiroshi Yamauchi return Boundary == RI.R; 2599775a620SHiroshi Yamauchi }); 2609775a620SHiroshi Yamauchi if (BoundaryIt == RegInfos.end()) 2619775a620SHiroshi Yamauchi return nullptr; 2629775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> TailRegInfos; 2639775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> TailSubs; 2649775a620SHiroshi Yamauchi TailRegInfos.insert(TailRegInfos.begin(), BoundaryIt, RegInfos.end()); 2659775a620SHiroshi Yamauchi RegInfos.resize(BoundaryIt - RegInfos.begin()); 2669775a620SHiroshi Yamauchi DenseSet<Region *> TailRegionSet; 2679775a620SHiroshi Yamauchi for (RegInfo &RI : TailRegInfos) 2689775a620SHiroshi Yamauchi TailRegionSet.insert(RI.R); 2699775a620SHiroshi Yamauchi for (auto It = Subs.begin(); It != Subs.end(); ) { 2709775a620SHiroshi Yamauchi CHRScope *Sub = *It; 2719775a620SHiroshi Yamauchi assert(Sub && "null Sub"); 2729775a620SHiroshi Yamauchi Region *Parent = Sub->getParentRegion(); 2739775a620SHiroshi Yamauchi if (TailRegionSet.count(Parent)) { 2749775a620SHiroshi Yamauchi TailSubs.push_back(Sub); 2759775a620SHiroshi Yamauchi It = Subs.erase(It); 2769775a620SHiroshi Yamauchi } else { 2779775a620SHiroshi Yamauchi assert(std::find_if(RegInfos.begin(), RegInfos.end(), 2789775a620SHiroshi Yamauchi [&Parent](const RegInfo& RI) { 2799775a620SHiroshi Yamauchi return Parent == RI.R; 2809775a620SHiroshi Yamauchi }) != RegInfos.end() && 2819775a620SHiroshi Yamauchi "Must be in head"); 2829775a620SHiroshi Yamauchi ++It; 2839775a620SHiroshi Yamauchi } 2849775a620SHiroshi Yamauchi } 2859775a620SHiroshi Yamauchi assert(HoistStopMap.empty() && "MapHoistStops must be empty"); 2869775a620SHiroshi Yamauchi return new CHRScope(TailRegInfos, TailSubs); 2879775a620SHiroshi Yamauchi } 2889775a620SHiroshi Yamauchi 2899775a620SHiroshi Yamauchi bool contains(Instruction *I) const { 2909775a620SHiroshi Yamauchi BasicBlock *Parent = I->getParent(); 2919775a620SHiroshi Yamauchi for (const RegInfo &RI : RegInfos) 2929775a620SHiroshi Yamauchi if (RI.R->contains(Parent)) 2939775a620SHiroshi Yamauchi return true; 2949775a620SHiroshi Yamauchi return false; 2959775a620SHiroshi Yamauchi } 2969775a620SHiroshi Yamauchi 2979775a620SHiroshi Yamauchi void print(raw_ostream &OS) const; 2989775a620SHiroshi Yamauchi 2999775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> RegInfos; // Regions that belong to this scope 3009775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Subs; // Subscopes. 3019775a620SHiroshi Yamauchi 3029775a620SHiroshi Yamauchi // The instruction at which to insert the CHR conditional branch (and hoist 3039775a620SHiroshi Yamauchi // the dependent condition values). 3049775a620SHiroshi Yamauchi Instruction *BranchInsertPoint; 3059775a620SHiroshi Yamauchi 3069775a620SHiroshi Yamauchi // True-biased and false-biased regions (conditional blocks), 3079775a620SHiroshi Yamauchi // respectively. Used only for the outermost scope and includes regions in 3089775a620SHiroshi Yamauchi // subscopes. The rest are unbiased. 3099775a620SHiroshi Yamauchi DenseSet<Region *> TrueBiasedRegions; 3109775a620SHiroshi Yamauchi DenseSet<Region *> FalseBiasedRegions; 3119775a620SHiroshi Yamauchi // Among the biased regions, the regions that get CHRed. 3129775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> CHRRegions; 3139775a620SHiroshi Yamauchi 3149775a620SHiroshi Yamauchi // True-biased and false-biased selects, respectively. Used only for the 3159775a620SHiroshi Yamauchi // outermost scope and includes ones in subscopes. 3169775a620SHiroshi Yamauchi DenseSet<SelectInst *> TrueBiasedSelects; 3179775a620SHiroshi Yamauchi DenseSet<SelectInst *> FalseBiasedSelects; 3189775a620SHiroshi Yamauchi 3199775a620SHiroshi Yamauchi // Map from one of the above regions to the instructions to stop 3209775a620SHiroshi Yamauchi // hoisting instructions at through use-def chains. 3219775a620SHiroshi Yamauchi HoistStopMapTy HoistStopMap; 3229775a620SHiroshi Yamauchi 3239775a620SHiroshi Yamauchi private: 3249775a620SHiroshi Yamauchi CHRScope(SmallVector<RegInfo, 8> &RegInfosIn, 3259775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> &SubsIn) 3269775a620SHiroshi Yamauchi : RegInfos(RegInfosIn), Subs(SubsIn), BranchInsertPoint(nullptr) {} 3279775a620SHiroshi Yamauchi }; 3289775a620SHiroshi Yamauchi 3299775a620SHiroshi Yamauchi inline raw_ostream &operator<<(raw_ostream &OS, const CHRScope &Scope) { 3309775a620SHiroshi Yamauchi Scope.print(OS); 3319775a620SHiroshi Yamauchi return OS; 3329775a620SHiroshi Yamauchi } 3339775a620SHiroshi Yamauchi 3349775a620SHiroshi Yamauchi class CHR { 3359775a620SHiroshi Yamauchi public: 3369775a620SHiroshi Yamauchi CHR(Function &Fin, BlockFrequencyInfo &BFIin, DominatorTree &DTin, 3379775a620SHiroshi Yamauchi ProfileSummaryInfo &PSIin, RegionInfo &RIin) 3389775a620SHiroshi Yamauchi : F(Fin), BFI(BFIin), DT(DTin), PSI(PSIin), RI(RIin) {} 3399775a620SHiroshi Yamauchi 3409775a620SHiroshi Yamauchi ~CHR() { 3419775a620SHiroshi Yamauchi for (CHRScope *Scope : Scopes) { 3429775a620SHiroshi Yamauchi delete Scope; 3439775a620SHiroshi Yamauchi } 3449775a620SHiroshi Yamauchi } 3459775a620SHiroshi Yamauchi 3469775a620SHiroshi Yamauchi bool run(); 3479775a620SHiroshi Yamauchi 3489775a620SHiroshi Yamauchi private: 3499775a620SHiroshi Yamauchi // See the comments in CHR::run() for the high level flow of the algorithm and 3509775a620SHiroshi Yamauchi // what the following functions do. 3519775a620SHiroshi Yamauchi 3529775a620SHiroshi Yamauchi void findScopes(SmallVectorImpl<CHRScope *> &Output) { 3539775a620SHiroshi Yamauchi Region *R = RI.getTopLevelRegion(); 3549775a620SHiroshi Yamauchi CHRScope *Scope = findScopes(R, nullptr, nullptr, Output); 3559775a620SHiroshi Yamauchi if (Scope) { 3569775a620SHiroshi Yamauchi Output.push_back(Scope); 3579775a620SHiroshi Yamauchi } 3589775a620SHiroshi Yamauchi } 3599775a620SHiroshi Yamauchi CHRScope *findScopes(Region *R, Region *NextRegion, Region *ParentRegion, 3609775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Scopes); 3619775a620SHiroshi Yamauchi CHRScope *findScope(Region *R); 3629775a620SHiroshi Yamauchi void checkScopeHoistable(CHRScope *Scope); 3639775a620SHiroshi Yamauchi 3649775a620SHiroshi Yamauchi void splitScopes(SmallVectorImpl<CHRScope *> &Input, 3659775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3669775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> splitScope(CHRScope *Scope, 3679775a620SHiroshi Yamauchi CHRScope *Outer, 3689775a620SHiroshi Yamauchi DenseSet<Value *> *OuterConditionValues, 3699775a620SHiroshi Yamauchi Instruction *OuterInsertPoint, 3709775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output, 3719775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables); 3729775a620SHiroshi Yamauchi 3739775a620SHiroshi Yamauchi void classifyBiasedScopes(SmallVectorImpl<CHRScope *> &Scopes); 3749775a620SHiroshi Yamauchi void classifyBiasedScopes(CHRScope *Scope, CHRScope *OutermostScope); 3759775a620SHiroshi Yamauchi 3769775a620SHiroshi Yamauchi void filterScopes(SmallVectorImpl<CHRScope *> &Input, 3779775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3789775a620SHiroshi Yamauchi 3799775a620SHiroshi Yamauchi void setCHRRegions(SmallVectorImpl<CHRScope *> &Input, 3809775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3819775a620SHiroshi Yamauchi void setCHRRegions(CHRScope *Scope, CHRScope *OutermostScope); 3829775a620SHiroshi Yamauchi 3839775a620SHiroshi Yamauchi void sortScopes(SmallVectorImpl<CHRScope *> &Input, 3849775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3859775a620SHiroshi Yamauchi 3869775a620SHiroshi Yamauchi void transformScopes(SmallVectorImpl<CHRScope *> &CHRScopes); 3879775a620SHiroshi Yamauchi void transformScopes(CHRScope *Scope, DenseSet<PHINode *> &TrivialPHIs); 3889775a620SHiroshi Yamauchi void cloneScopeBlocks(CHRScope *Scope, 3899775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 3909775a620SHiroshi Yamauchi BasicBlock *ExitBlock, 3919775a620SHiroshi Yamauchi Region *LastRegion, 3929775a620SHiroshi Yamauchi ValueToValueMapTy &VMap); 3939775a620SHiroshi Yamauchi BranchInst *createMergedBranch(BasicBlock *PreEntryBlock, 3949775a620SHiroshi Yamauchi BasicBlock *EntryBlock, 3959775a620SHiroshi Yamauchi BasicBlock *NewEntryBlock, 3969775a620SHiroshi Yamauchi ValueToValueMapTy &VMap); 3979775a620SHiroshi Yamauchi void fixupBranchesAndSelects(CHRScope *Scope, 3989775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 3999775a620SHiroshi Yamauchi BranchInst *MergedBR, 4009775a620SHiroshi Yamauchi uint64_t ProfileCount); 4019775a620SHiroshi Yamauchi void fixupBranch(Region *R, 4029775a620SHiroshi Yamauchi CHRScope *Scope, 4039775a620SHiroshi Yamauchi IRBuilder<> &IRB, 4049775a620SHiroshi Yamauchi Value *&MergedCondition, BranchProbability &CHRBranchBias); 4059775a620SHiroshi Yamauchi void fixupSelect(SelectInst* SI, 4069775a620SHiroshi Yamauchi CHRScope *Scope, 4079775a620SHiroshi Yamauchi IRBuilder<> &IRB, 4089775a620SHiroshi Yamauchi Value *&MergedCondition, BranchProbability &CHRBranchBias); 4099775a620SHiroshi Yamauchi void addToMergedCondition(bool IsTrueBiased, Value *Cond, 4109775a620SHiroshi Yamauchi Instruction *BranchOrSelect, 4119775a620SHiroshi Yamauchi CHRScope *Scope, 4129775a620SHiroshi Yamauchi IRBuilder<> &IRB, 4139775a620SHiroshi Yamauchi Value *&MergedCondition); 4149775a620SHiroshi Yamauchi 4159775a620SHiroshi Yamauchi Function &F; 4169775a620SHiroshi Yamauchi BlockFrequencyInfo &BFI; 4179775a620SHiroshi Yamauchi DominatorTree &DT; 4189775a620SHiroshi Yamauchi ProfileSummaryInfo &PSI; 4199775a620SHiroshi Yamauchi RegionInfo &RI; 4209775a620SHiroshi Yamauchi CHRStats Stats; 4219775a620SHiroshi Yamauchi 4229775a620SHiroshi Yamauchi // All the true-biased regions in the function 4239775a620SHiroshi Yamauchi DenseSet<Region *> TrueBiasedRegionsGlobal; 4249775a620SHiroshi Yamauchi // All the false-biased regions in the function 4259775a620SHiroshi Yamauchi DenseSet<Region *> FalseBiasedRegionsGlobal; 4269775a620SHiroshi Yamauchi // All the true-biased selects in the function 4279775a620SHiroshi Yamauchi DenseSet<SelectInst *> TrueBiasedSelectsGlobal; 4289775a620SHiroshi Yamauchi // All the false-biased selects in the function 4299775a620SHiroshi Yamauchi DenseSet<SelectInst *> FalseBiasedSelectsGlobal; 4309775a620SHiroshi Yamauchi // A map from biased regions to their branch bias 4319775a620SHiroshi Yamauchi DenseMap<Region *, BranchProbability> BranchBiasMap; 4329775a620SHiroshi Yamauchi // A map from biased selects to their branch bias 4339775a620SHiroshi Yamauchi DenseMap<SelectInst *, BranchProbability> SelectBiasMap; 4349775a620SHiroshi Yamauchi // All the scopes. 4359775a620SHiroshi Yamauchi DenseSet<CHRScope *> Scopes; 4369775a620SHiroshi Yamauchi }; 4379775a620SHiroshi Yamauchi 4389775a620SHiroshi Yamauchi } // end anonymous namespace 4399775a620SHiroshi Yamauchi 4409775a620SHiroshi Yamauchi static bool shouldApply(Function &F, ProfileSummaryInfo& PSI) { 4419775a620SHiroshi Yamauchi if (ForceCHR) 4429775a620SHiroshi Yamauchi return true; 4439775a620SHiroshi Yamauchi 4449775a620SHiroshi Yamauchi if (!CHRModuleList.empty() || !CHRFunctionList.empty()) { 4459775a620SHiroshi Yamauchi if (CHRModules.count(F.getParent()->getName())) 4469775a620SHiroshi Yamauchi return true; 4479775a620SHiroshi Yamauchi StringRef Name = F.getName(); 4489775a620SHiroshi Yamauchi if (CHRFunctions.count(Name)) 4499775a620SHiroshi Yamauchi return true; 4509775a620SHiroshi Yamauchi const char* DemangledName = nullptr; 45172ee6d60SHiroshi Yamauchi #if !defined(_MSC_VER) 452792a4f8aSReid Kleckner int Status = -1; 4539775a620SHiroshi Yamauchi DemangledName = abi::__cxa_demangle(Name.str().c_str(), 4549775a620SHiroshi Yamauchi nullptr, nullptr, &Status); 45572ee6d60SHiroshi Yamauchi #endif 4569775a620SHiroshi Yamauchi return DemangledName && CHRFunctions.count(DemangledName); 4579775a620SHiroshi Yamauchi } 4589775a620SHiroshi Yamauchi 4599775a620SHiroshi Yamauchi assert(PSI.hasProfileSummary() && "Empty PSI?"); 4609775a620SHiroshi Yamauchi return PSI.isFunctionEntryHot(&F); 4619775a620SHiroshi Yamauchi } 4629775a620SHiroshi Yamauchi 463*c8f348cbSFangrui Song static void LLVM_ATTRIBUTE_UNUSED dumpIR(Function &F, const char *Label, 464*c8f348cbSFangrui Song CHRStats *Stats) { 4659775a620SHiroshi Yamauchi std::string Name = F.getName().str(); 4669775a620SHiroshi Yamauchi const char *DemangledName = nullptr; 46772ee6d60SHiroshi Yamauchi #if !defined(_MSC_VER) 468792a4f8aSReid Kleckner int Status = -1; 4699775a620SHiroshi Yamauchi DemangledName = abi::__cxa_demangle(Name.c_str(), 4709775a620SHiroshi Yamauchi nullptr, nullptr, &Status); 47172ee6d60SHiroshi Yamauchi #endif 4729775a620SHiroshi Yamauchi if (DemangledName == nullptr) { 4739775a620SHiroshi Yamauchi DemangledName = "<NOT-MANGLED>"; 4749775a620SHiroshi Yamauchi } 4759775a620SHiroshi Yamauchi std::string ModuleName = F.getParent()->getName().str(); 4769775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "CHR IR dump " << Label << " " << ModuleName << " " 4779775a620SHiroshi Yamauchi << Name); 4789775a620SHiroshi Yamauchi if (Stats) 4799775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << " " << *Stats); 4809775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "\n"); 4819775a620SHiroshi Yamauchi CHR_DEBUG(F.dump()); 4829775a620SHiroshi Yamauchi } 4839775a620SHiroshi Yamauchi 4849775a620SHiroshi Yamauchi void CHRScope::print(raw_ostream &OS) const { 4859775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 4869775a620SHiroshi Yamauchi OS << "CHRScope["; 4879775a620SHiroshi Yamauchi OS << RegInfos.size() << ", Regions["; 4889775a620SHiroshi Yamauchi for (const RegInfo &RI : RegInfos) { 4899775a620SHiroshi Yamauchi OS << RI.R->getNameStr(); 4909775a620SHiroshi Yamauchi if (RI.HasBranch) 4919775a620SHiroshi Yamauchi OS << " B"; 4929775a620SHiroshi Yamauchi if (RI.Selects.size() > 0) 4939775a620SHiroshi Yamauchi OS << " S" << RI.Selects.size(); 4949775a620SHiroshi Yamauchi OS << ", "; 4959775a620SHiroshi Yamauchi } 4969775a620SHiroshi Yamauchi if (RegInfos[0].R->getParent()) { 4979775a620SHiroshi Yamauchi OS << "], Parent " << RegInfos[0].R->getParent()->getNameStr(); 4989775a620SHiroshi Yamauchi } else { 4999775a620SHiroshi Yamauchi // top level region 5009775a620SHiroshi Yamauchi OS << "]"; 5019775a620SHiroshi Yamauchi } 5029775a620SHiroshi Yamauchi OS << ", Subs["; 5039775a620SHiroshi Yamauchi for (CHRScope *Sub : Subs) { 5049775a620SHiroshi Yamauchi OS << *Sub << ", "; 5059775a620SHiroshi Yamauchi } 5069775a620SHiroshi Yamauchi OS << "]]"; 5079775a620SHiroshi Yamauchi } 5089775a620SHiroshi Yamauchi 5099775a620SHiroshi Yamauchi // Return true if the given instruction type can be hoisted by CHR. 5109775a620SHiroshi Yamauchi static bool isHoistableInstructionType(Instruction *I) { 5119775a620SHiroshi Yamauchi return isa<BinaryOperator>(I) || isa<CastInst>(I) || isa<SelectInst>(I) || 5129775a620SHiroshi Yamauchi isa<GetElementPtrInst>(I) || isa<CmpInst>(I) || 5139775a620SHiroshi Yamauchi isa<InsertElementInst>(I) || isa<ExtractElementInst>(I) || 5149775a620SHiroshi Yamauchi isa<ShuffleVectorInst>(I) || isa<ExtractValueInst>(I) || 5159775a620SHiroshi Yamauchi isa<InsertValueInst>(I); 5169775a620SHiroshi Yamauchi } 5179775a620SHiroshi Yamauchi 5189775a620SHiroshi Yamauchi // Return true if the given instruction can be hoisted by CHR. 5199775a620SHiroshi Yamauchi static bool isHoistable(Instruction *I, DominatorTree &DT) { 5209775a620SHiroshi Yamauchi if (!isHoistableInstructionType(I)) 5219775a620SHiroshi Yamauchi return false; 5229775a620SHiroshi Yamauchi return isSafeToSpeculativelyExecute(I, nullptr, &DT); 5239775a620SHiroshi Yamauchi } 5249775a620SHiroshi Yamauchi 5259775a620SHiroshi Yamauchi // Recursively traverse the use-def chains of the given value and return a set 5269775a620SHiroshi Yamauchi // of the unhoistable base values defined within the scope (excluding the 5279775a620SHiroshi Yamauchi // first-region entry block) or the (hoistable or unhoistable) base values that 5289775a620SHiroshi Yamauchi // are defined outside (including the first-region entry block) of the 5299775a620SHiroshi Yamauchi // scope. The returned set doesn't include constants. 5309775a620SHiroshi Yamauchi static std::set<Value *> getBaseValues(Value *V, 5319775a620SHiroshi Yamauchi DominatorTree &DT) { 5329775a620SHiroshi Yamauchi std::set<Value *> Result; 5339775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 5349775a620SHiroshi Yamauchi // We don't stop at a block that's not in the Scope because we would miss some 5359775a620SHiroshi Yamauchi // instructions that are based on the same base values if we stop there. 5369775a620SHiroshi Yamauchi if (!isHoistable(I, DT)) { 5379775a620SHiroshi Yamauchi Result.insert(I); 5389775a620SHiroshi Yamauchi return Result; 5399775a620SHiroshi Yamauchi } 5409775a620SHiroshi Yamauchi // I is hoistable above the Scope. 5419775a620SHiroshi Yamauchi for (Value *Op : I->operands()) { 5429775a620SHiroshi Yamauchi std::set<Value *> OpResult = getBaseValues(Op, DT); 5439775a620SHiroshi Yamauchi Result.insert(OpResult.begin(), OpResult.end()); 5449775a620SHiroshi Yamauchi } 5459775a620SHiroshi Yamauchi return Result; 5469775a620SHiroshi Yamauchi } 5479775a620SHiroshi Yamauchi if (isa<Argument>(V)) { 5489775a620SHiroshi Yamauchi Result.insert(V); 5499775a620SHiroshi Yamauchi return Result; 5509775a620SHiroshi Yamauchi } 5519775a620SHiroshi Yamauchi // We don't include others like constants because those won't lead to any 5529775a620SHiroshi Yamauchi // chance of folding of conditions (eg two bit checks merged into one check) 5539775a620SHiroshi Yamauchi // after CHR. 5549775a620SHiroshi Yamauchi return Result; // empty 5559775a620SHiroshi Yamauchi } 5569775a620SHiroshi Yamauchi 5579775a620SHiroshi Yamauchi // Return true if V is already hoisted or can be hoisted (along with its 5589775a620SHiroshi Yamauchi // operands) above the insert point. When it returns true and HoistStops is 5599775a620SHiroshi Yamauchi // non-null, the instructions to stop hoisting at through the use-def chains are 5609775a620SHiroshi Yamauchi // inserted into HoistStops. 5619775a620SHiroshi Yamauchi static bool 5629775a620SHiroshi Yamauchi checkHoistValue(Value *V, Instruction *InsertPoint, DominatorTree &DT, 5639775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables, 5649775a620SHiroshi Yamauchi DenseSet<Instruction *> *HoistStops) { 5659775a620SHiroshi Yamauchi assert(InsertPoint && "Null InsertPoint"); 5669775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 5679775a620SHiroshi Yamauchi assert(DT.getNode(I->getParent()) && "DT must contain I's parent block"); 5689775a620SHiroshi Yamauchi assert(DT.getNode(InsertPoint->getParent()) && "DT must contain Destination"); 5699775a620SHiroshi Yamauchi if (Unhoistables.count(I)) { 5709775a620SHiroshi Yamauchi // Don't hoist if they are not to be hoisted. 5719775a620SHiroshi Yamauchi return false; 5729775a620SHiroshi Yamauchi } 5739775a620SHiroshi Yamauchi if (DT.dominates(I, InsertPoint)) { 5749775a620SHiroshi Yamauchi // We are already above the insert point. Stop here. 5759775a620SHiroshi Yamauchi if (HoistStops) 5769775a620SHiroshi Yamauchi HoistStops->insert(I); 5779775a620SHiroshi Yamauchi return true; 5789775a620SHiroshi Yamauchi } 5799775a620SHiroshi Yamauchi // We aren't not above the insert point, check if we can hoist it above the 5809775a620SHiroshi Yamauchi // insert point. 5819775a620SHiroshi Yamauchi if (isHoistable(I, DT)) { 5829775a620SHiroshi Yamauchi // Check operands first. 5839775a620SHiroshi Yamauchi DenseSet<Instruction *> OpsHoistStops; 5849775a620SHiroshi Yamauchi bool AllOpsHoisted = true; 5859775a620SHiroshi Yamauchi for (Value *Op : I->operands()) { 5869775a620SHiroshi Yamauchi if (!checkHoistValue(Op, InsertPoint, DT, Unhoistables, &OpsHoistStops)) { 5879775a620SHiroshi Yamauchi AllOpsHoisted = false; 5889775a620SHiroshi Yamauchi break; 5899775a620SHiroshi Yamauchi } 5909775a620SHiroshi Yamauchi } 5919775a620SHiroshi Yamauchi if (AllOpsHoisted) { 5929775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "checkHoistValue " << *I << "\n"); 5939775a620SHiroshi Yamauchi if (HoistStops) 5949775a620SHiroshi Yamauchi HoistStops->insert(OpsHoistStops.begin(), OpsHoistStops.end()); 5959775a620SHiroshi Yamauchi return true; 5969775a620SHiroshi Yamauchi } 5979775a620SHiroshi Yamauchi } 5989775a620SHiroshi Yamauchi return false; 5999775a620SHiroshi Yamauchi } 6009775a620SHiroshi Yamauchi // Non-instructions are considered hoistable. 6019775a620SHiroshi Yamauchi return true; 6029775a620SHiroshi Yamauchi } 6039775a620SHiroshi Yamauchi 6049775a620SHiroshi Yamauchi // Returns true and sets the true probability and false probability of an 6059775a620SHiroshi Yamauchi // MD_prof metadata if it's well-formed. 6069775a620SHiroshi Yamauchi static bool CheckMDProf(MDNode *MD, BranchProbability &TrueProb, 6079775a620SHiroshi Yamauchi BranchProbability &FalseProb) { 6089775a620SHiroshi Yamauchi if (!MD) return false; 6099775a620SHiroshi Yamauchi MDString *MDName = cast<MDString>(MD->getOperand(0)); 6109775a620SHiroshi Yamauchi if (MDName->getString() != "branch_weights" || 6119775a620SHiroshi Yamauchi MD->getNumOperands() != 3) 6129775a620SHiroshi Yamauchi return false; 6139775a620SHiroshi Yamauchi ConstantInt *TrueWeight = mdconst::extract<ConstantInt>(MD->getOperand(1)); 6149775a620SHiroshi Yamauchi ConstantInt *FalseWeight = mdconst::extract<ConstantInt>(MD->getOperand(2)); 6159775a620SHiroshi Yamauchi if (!TrueWeight || !FalseWeight) 6169775a620SHiroshi Yamauchi return false; 6179775a620SHiroshi Yamauchi APInt TrueWt = TrueWeight->getValue(); 6189775a620SHiroshi Yamauchi APInt FalseWt = FalseWeight->getValue(); 6199775a620SHiroshi Yamauchi APInt SumWt = TrueWt + FalseWt; 6209775a620SHiroshi Yamauchi TrueProb = BranchProbability::getBranchProbability(TrueWt.getZExtValue(), 6219775a620SHiroshi Yamauchi SumWt.getZExtValue()); 6229775a620SHiroshi Yamauchi FalseProb = BranchProbability::getBranchProbability(FalseWt.getZExtValue(), 6239775a620SHiroshi Yamauchi SumWt.getZExtValue()); 6249775a620SHiroshi Yamauchi return true; 6259775a620SHiroshi Yamauchi } 6269775a620SHiroshi Yamauchi 6279775a620SHiroshi Yamauchi static BranchProbability getCHRBiasThreshold() { 6289775a620SHiroshi Yamauchi return BranchProbability::getBranchProbability( 6299775a620SHiroshi Yamauchi static_cast<uint64_t>(CHRBiasThreshold * 1000000), 1000000); 6309775a620SHiroshi Yamauchi } 6319775a620SHiroshi Yamauchi 6329775a620SHiroshi Yamauchi // A helper for CheckBiasedBranch and CheckBiasedSelect. If TrueProb >= 6339775a620SHiroshi Yamauchi // CHRBiasThreshold, put Key into TrueSet and return true. If FalseProb >= 6349775a620SHiroshi Yamauchi // CHRBiasThreshold, put Key into FalseSet and return true. Otherwise, return 6359775a620SHiroshi Yamauchi // false. 6369775a620SHiroshi Yamauchi template<typename K, typename S, typename M> 6379775a620SHiroshi Yamauchi bool CheckBias(K *Key, BranchProbability TrueProb, BranchProbability FalseProb, 6389775a620SHiroshi Yamauchi S &TrueSet, S &FalseSet, M &BiasMap) { 6399775a620SHiroshi Yamauchi BranchProbability Threshold = getCHRBiasThreshold(); 6409775a620SHiroshi Yamauchi if (TrueProb >= Threshold) { 6419775a620SHiroshi Yamauchi TrueSet.insert(Key); 6429775a620SHiroshi Yamauchi BiasMap[Key] = TrueProb; 6439775a620SHiroshi Yamauchi return true; 6449775a620SHiroshi Yamauchi } else if (FalseProb >= Threshold) { 6459775a620SHiroshi Yamauchi FalseSet.insert(Key); 6469775a620SHiroshi Yamauchi BiasMap[Key] = FalseProb; 6479775a620SHiroshi Yamauchi return true; 6489775a620SHiroshi Yamauchi } 6499775a620SHiroshi Yamauchi return false; 6509775a620SHiroshi Yamauchi } 6519775a620SHiroshi Yamauchi 6529775a620SHiroshi Yamauchi // Returns true and insert a region into the right biased set and the map if the 6539775a620SHiroshi Yamauchi // branch of the region is biased. 6549775a620SHiroshi Yamauchi static bool CheckBiasedBranch(BranchInst *BI, Region *R, 6559775a620SHiroshi Yamauchi DenseSet<Region *> &TrueBiasedRegionsGlobal, 6569775a620SHiroshi Yamauchi DenseSet<Region *> &FalseBiasedRegionsGlobal, 6579775a620SHiroshi Yamauchi DenseMap<Region *, BranchProbability> &BranchBiasMap) { 6589775a620SHiroshi Yamauchi if (!BI->isConditional()) 6599775a620SHiroshi Yamauchi return false; 6609775a620SHiroshi Yamauchi BranchProbability ThenProb, ElseProb; 6619775a620SHiroshi Yamauchi if (!CheckMDProf(BI->getMetadata(LLVMContext::MD_prof), 6629775a620SHiroshi Yamauchi ThenProb, ElseProb)) 6639775a620SHiroshi Yamauchi return false; 6649775a620SHiroshi Yamauchi BasicBlock *IfThen = BI->getSuccessor(0); 6659775a620SHiroshi Yamauchi BasicBlock *IfElse = BI->getSuccessor(1); 6669775a620SHiroshi Yamauchi assert((IfThen == R->getExit() || IfElse == R->getExit()) && 6679775a620SHiroshi Yamauchi IfThen != IfElse && 6689775a620SHiroshi Yamauchi "Invariant from findScopes"); 6699775a620SHiroshi Yamauchi if (IfThen == R->getExit()) { 6709775a620SHiroshi Yamauchi // Swap them so that IfThen/ThenProb means going into the conditional code 6719775a620SHiroshi Yamauchi // and IfElse/ElseProb means skipping it. 6729775a620SHiroshi Yamauchi std::swap(IfThen, IfElse); 6739775a620SHiroshi Yamauchi std::swap(ThenProb, ElseProb); 6749775a620SHiroshi Yamauchi } 6759775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI " << *BI << " "); 6769775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "ThenProb " << ThenProb << " "); 6779775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "ElseProb " << ElseProb << "\n"); 6789775a620SHiroshi Yamauchi return CheckBias(R, ThenProb, ElseProb, 6799775a620SHiroshi Yamauchi TrueBiasedRegionsGlobal, FalseBiasedRegionsGlobal, 6809775a620SHiroshi Yamauchi BranchBiasMap); 6819775a620SHiroshi Yamauchi } 6829775a620SHiroshi Yamauchi 6839775a620SHiroshi Yamauchi // Returns true and insert a select into the right biased set and the map if the 6849775a620SHiroshi Yamauchi // select is biased. 6859775a620SHiroshi Yamauchi static bool CheckBiasedSelect( 6869775a620SHiroshi Yamauchi SelectInst *SI, Region *R, 6879775a620SHiroshi Yamauchi DenseSet<SelectInst *> &TrueBiasedSelectsGlobal, 6889775a620SHiroshi Yamauchi DenseSet<SelectInst *> &FalseBiasedSelectsGlobal, 6899775a620SHiroshi Yamauchi DenseMap<SelectInst *, BranchProbability> &SelectBiasMap) { 6909775a620SHiroshi Yamauchi BranchProbability TrueProb, FalseProb; 6919775a620SHiroshi Yamauchi if (!CheckMDProf(SI->getMetadata(LLVMContext::MD_prof), 6929775a620SHiroshi Yamauchi TrueProb, FalseProb)) 6939775a620SHiroshi Yamauchi return false; 6949775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "SI " << *SI << " "); 6959775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "TrueProb " << TrueProb << " "); 6969775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "FalseProb " << FalseProb << "\n"); 6979775a620SHiroshi Yamauchi return CheckBias(SI, TrueProb, FalseProb, 6989775a620SHiroshi Yamauchi TrueBiasedSelectsGlobal, FalseBiasedSelectsGlobal, 6999775a620SHiroshi Yamauchi SelectBiasMap); 7009775a620SHiroshi Yamauchi } 7019775a620SHiroshi Yamauchi 7029775a620SHiroshi Yamauchi // Returns the instruction at which to hoist the dependent condition values and 7039775a620SHiroshi Yamauchi // insert the CHR branch for a region. This is the terminator branch in the 7049775a620SHiroshi Yamauchi // entry block or the first select in the entry block, if any. 7059775a620SHiroshi Yamauchi static Instruction* getBranchInsertPoint(RegInfo &RI) { 7069775a620SHiroshi Yamauchi Region *R = RI.R; 7079775a620SHiroshi Yamauchi BasicBlock *EntryBB = R->getEntry(); 7089775a620SHiroshi Yamauchi // The hoist point is by default the terminator of the entry block, which is 7099775a620SHiroshi Yamauchi // the same as the branch instruction if RI.HasBranch is true. 7109775a620SHiroshi Yamauchi Instruction *HoistPoint = EntryBB->getTerminator(); 7119775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 7129775a620SHiroshi Yamauchi if (SI->getParent() == EntryBB) { 7139775a620SHiroshi Yamauchi // Pick the first select in Selects in the entry block. Note Selects is 7149775a620SHiroshi Yamauchi // sorted in the instruction order within a block (asserted below). 7159775a620SHiroshi Yamauchi HoistPoint = SI; 7169775a620SHiroshi Yamauchi break; 7179775a620SHiroshi Yamauchi } 7189775a620SHiroshi Yamauchi } 7199775a620SHiroshi Yamauchi assert(HoistPoint && "Null HoistPoint"); 7209775a620SHiroshi Yamauchi #ifndef NDEBUG 7219775a620SHiroshi Yamauchi // Check that HoistPoint is the first one in Selects in the entry block, 7229775a620SHiroshi Yamauchi // if any. 7239775a620SHiroshi Yamauchi DenseSet<Instruction *> EntryBlockSelectSet; 7249775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 7259775a620SHiroshi Yamauchi if (SI->getParent() == EntryBB) { 7269775a620SHiroshi Yamauchi EntryBlockSelectSet.insert(SI); 7279775a620SHiroshi Yamauchi } 7289775a620SHiroshi Yamauchi } 7299775a620SHiroshi Yamauchi for (Instruction &I : *EntryBB) { 7309775a620SHiroshi Yamauchi if (EntryBlockSelectSet.count(&I) > 0) { 7319775a620SHiroshi Yamauchi assert(&I == HoistPoint && 7329775a620SHiroshi Yamauchi "HoistPoint must be the first one in Selects"); 7339775a620SHiroshi Yamauchi break; 7349775a620SHiroshi Yamauchi } 7359775a620SHiroshi Yamauchi } 7369775a620SHiroshi Yamauchi #endif 7379775a620SHiroshi Yamauchi return HoistPoint; 7389775a620SHiroshi Yamauchi } 7399775a620SHiroshi Yamauchi 7409775a620SHiroshi Yamauchi // Find a CHR scope in the given region. 7419775a620SHiroshi Yamauchi CHRScope * CHR::findScope(Region *R) { 7429775a620SHiroshi Yamauchi CHRScope *Result = nullptr; 7439775a620SHiroshi Yamauchi BasicBlock *Entry = R->getEntry(); 7449775a620SHiroshi Yamauchi BasicBlock *Exit = R->getExit(); // null if top level. 7459775a620SHiroshi Yamauchi assert(Entry && "Entry must not be null"); 7469775a620SHiroshi Yamauchi assert((Exit == nullptr) == (R->isTopLevelRegion()) && 7479775a620SHiroshi Yamauchi "Only top level region has a null exit"); 7489775a620SHiroshi Yamauchi if (Entry) 7499775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Entry " << Entry->getName() << "\n"); 7509775a620SHiroshi Yamauchi else 7519775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Entry null\n"); 7529775a620SHiroshi Yamauchi if (Exit) 7539775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Exit " << Exit->getName() << "\n"); 7549775a620SHiroshi Yamauchi else 7559775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Exit null\n"); 7569775a620SHiroshi Yamauchi // Exclude cases where Entry is part of a subregion (hence it doesn't belong 7579775a620SHiroshi Yamauchi // to this region). 7589775a620SHiroshi Yamauchi bool EntryInSubregion = RI.getRegionFor(Entry) != R; 7599775a620SHiroshi Yamauchi if (EntryInSubregion) 7609775a620SHiroshi Yamauchi return nullptr; 7619775a620SHiroshi Yamauchi // Exclude loops 7629775a620SHiroshi Yamauchi for (BasicBlock *Pred : predecessors(Entry)) 7639775a620SHiroshi Yamauchi if (R->contains(Pred)) 7649775a620SHiroshi Yamauchi return nullptr; 7659775a620SHiroshi Yamauchi if (Exit) { 7669775a620SHiroshi Yamauchi // Try to find an if-then block (check if R is an if-then). 7679775a620SHiroshi Yamauchi // if (cond) { 7689775a620SHiroshi Yamauchi // ... 7699775a620SHiroshi Yamauchi // } 7709775a620SHiroshi Yamauchi auto *BI = dyn_cast<BranchInst>(Entry->getTerminator()); 7719775a620SHiroshi Yamauchi if (BI) 7729775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI.isConditional " << BI->isConditional() << "\n"); 7739775a620SHiroshi Yamauchi else 7749775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI null\n"); 7759775a620SHiroshi Yamauchi if (BI && BI->isConditional()) { 7769775a620SHiroshi Yamauchi BasicBlock *S0 = BI->getSuccessor(0); 7779775a620SHiroshi Yamauchi BasicBlock *S1 = BI->getSuccessor(1); 7789775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "S0 " << S0->getName() << "\n"); 7799775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "S1 " << S1->getName() << "\n"); 7809775a620SHiroshi Yamauchi if (S0 != S1 && (S0 == Exit || S1 == Exit)) { 7819775a620SHiroshi Yamauchi RegInfo RI(R); 7829775a620SHiroshi Yamauchi RI.HasBranch = CheckBiasedBranch( 7839775a620SHiroshi Yamauchi BI, R, TrueBiasedRegionsGlobal, FalseBiasedRegionsGlobal, 7849775a620SHiroshi Yamauchi BranchBiasMap); 7859775a620SHiroshi Yamauchi Result = new CHRScope(RI); 7869775a620SHiroshi Yamauchi Scopes.insert(Result); 7879775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Found a region with a branch\n"); 7889775a620SHiroshi Yamauchi ++Stats.NumBranches; 7899775a620SHiroshi Yamauchi } 7909775a620SHiroshi Yamauchi } 7919775a620SHiroshi Yamauchi } 7929775a620SHiroshi Yamauchi { 7939775a620SHiroshi Yamauchi // Try to look for selects in the direct child blocks (as opposed to in 7949775a620SHiroshi Yamauchi // subregions) of R. 7959775a620SHiroshi Yamauchi // ... 7969775a620SHiroshi Yamauchi // if (..) { // Some subregion 7979775a620SHiroshi Yamauchi // ... 7989775a620SHiroshi Yamauchi // } 7999775a620SHiroshi Yamauchi // if (..) { // Some subregion 8009775a620SHiroshi Yamauchi // ... 8019775a620SHiroshi Yamauchi // } 8029775a620SHiroshi Yamauchi // ... 8039775a620SHiroshi Yamauchi // a = cond ? b : c; 8049775a620SHiroshi Yamauchi // ... 8059775a620SHiroshi Yamauchi SmallVector<SelectInst *, 8> Selects; 8069775a620SHiroshi Yamauchi for (RegionNode *E : R->elements()) { 8079775a620SHiroshi Yamauchi if (E->isSubRegion()) 8089775a620SHiroshi Yamauchi continue; 8099775a620SHiroshi Yamauchi // This returns the basic block of E if E is a direct child of R (not a 8109775a620SHiroshi Yamauchi // subregion.) 8119775a620SHiroshi Yamauchi BasicBlock *BB = E->getEntry(); 8129775a620SHiroshi Yamauchi // Need to push in the order to make it easier to find the first Select 8139775a620SHiroshi Yamauchi // later. 8149775a620SHiroshi Yamauchi for (Instruction &I : *BB) { 8159775a620SHiroshi Yamauchi if (auto *SI = dyn_cast<SelectInst>(&I)) { 8169775a620SHiroshi Yamauchi Selects.push_back(SI); 8179775a620SHiroshi Yamauchi ++Stats.NumBranches; 8189775a620SHiroshi Yamauchi } 8199775a620SHiroshi Yamauchi } 8209775a620SHiroshi Yamauchi } 8219775a620SHiroshi Yamauchi if (Selects.size() > 0) { 8229775a620SHiroshi Yamauchi auto AddSelects = [&](RegInfo &RI) { 8239775a620SHiroshi Yamauchi for (auto *SI : Selects) 8249775a620SHiroshi Yamauchi if (CheckBiasedSelect(SI, RI.R, 8259775a620SHiroshi Yamauchi TrueBiasedSelectsGlobal, 8269775a620SHiroshi Yamauchi FalseBiasedSelectsGlobal, 8279775a620SHiroshi Yamauchi SelectBiasMap)) 8289775a620SHiroshi Yamauchi RI.Selects.push_back(SI); 8299775a620SHiroshi Yamauchi }; 8309775a620SHiroshi Yamauchi if (!Result) { 8319775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Found a select-only region\n"); 8329775a620SHiroshi Yamauchi RegInfo RI(R); 8339775a620SHiroshi Yamauchi AddSelects(RI); 8349775a620SHiroshi Yamauchi Result = new CHRScope(RI); 8359775a620SHiroshi Yamauchi Scopes.insert(Result); 8369775a620SHiroshi Yamauchi } else { 8379775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Found select(s) in a region with a branch\n"); 8389775a620SHiroshi Yamauchi AddSelects(Result->RegInfos[0]); 8399775a620SHiroshi Yamauchi } 8409775a620SHiroshi Yamauchi } 8419775a620SHiroshi Yamauchi } 8429775a620SHiroshi Yamauchi 8439775a620SHiroshi Yamauchi if (Result) { 8449775a620SHiroshi Yamauchi checkScopeHoistable(Result); 8459775a620SHiroshi Yamauchi } 8469775a620SHiroshi Yamauchi return Result; 8479775a620SHiroshi Yamauchi } 8489775a620SHiroshi Yamauchi 8499775a620SHiroshi Yamauchi // Check that any of the branch and the selects in the region could be 8509775a620SHiroshi Yamauchi // hoisted above the the CHR branch insert point (the most dominating of 8519775a620SHiroshi Yamauchi // them, either the branch (at the end of the first block) or the first 8529775a620SHiroshi Yamauchi // select in the first block). If the branch can't be hoisted, drop the 8539775a620SHiroshi Yamauchi // selects in the first blocks. 8549775a620SHiroshi Yamauchi // 8559775a620SHiroshi Yamauchi // For example, for the following scope/region with selects, we want to insert 8569775a620SHiroshi Yamauchi // the merged branch right before the first select in the first/entry block by 8579775a620SHiroshi Yamauchi // hoisting c1, c2, c3, and c4. 8589775a620SHiroshi Yamauchi // 8599775a620SHiroshi Yamauchi // // Branch insert point here. 8609775a620SHiroshi Yamauchi // a = c1 ? b : c; // Select 1 8619775a620SHiroshi Yamauchi // d = c2 ? e : f; // Select 2 8629775a620SHiroshi Yamauchi // if (c3) { // Branch 8639775a620SHiroshi Yamauchi // ... 8649775a620SHiroshi Yamauchi // c4 = foo() // A call. 8659775a620SHiroshi Yamauchi // g = c4 ? h : i; // Select 3 8669775a620SHiroshi Yamauchi // } 8679775a620SHiroshi Yamauchi // 8689775a620SHiroshi Yamauchi // But suppose we can't hoist c4 because it's dependent on the preceding 8699775a620SHiroshi Yamauchi // call. Then, we drop Select 3. Furthermore, if we can't hoist c2, we also drop 8709775a620SHiroshi Yamauchi // Select 2. If we can't hoist c3, we drop Selects 1 & 2. 8719775a620SHiroshi Yamauchi void CHR::checkScopeHoistable(CHRScope *Scope) { 8729775a620SHiroshi Yamauchi RegInfo &RI = Scope->RegInfos[0]; 8739775a620SHiroshi Yamauchi Region *R = RI.R; 8749775a620SHiroshi Yamauchi BasicBlock *EntryBB = R->getEntry(); 8759775a620SHiroshi Yamauchi auto *Branch = RI.HasBranch ? 8769775a620SHiroshi Yamauchi cast<BranchInst>(EntryBB->getTerminator()) : nullptr; 8779775a620SHiroshi Yamauchi SmallVector<SelectInst *, 8> &Selects = RI.Selects; 8789775a620SHiroshi Yamauchi if (RI.HasBranch || !Selects.empty()) { 8799775a620SHiroshi Yamauchi Instruction *InsertPoint = getBranchInsertPoint(RI); 8809775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "InsertPoint " << *InsertPoint << "\n"); 8819775a620SHiroshi Yamauchi // Avoid a data dependence from a select or a branch to a(nother) 8829775a620SHiroshi Yamauchi // select. Note no instruction can't data-depend on a branch (a branch 8839775a620SHiroshi Yamauchi // instruction doesn't produce a value). 8849775a620SHiroshi Yamauchi DenseSet<Instruction *> Unhoistables; 8859775a620SHiroshi Yamauchi // Initialize Unhoistables with the selects. 8869775a620SHiroshi Yamauchi for (SelectInst *SI : Selects) { 8879775a620SHiroshi Yamauchi Unhoistables.insert(SI); 8889775a620SHiroshi Yamauchi } 8899775a620SHiroshi Yamauchi // Remove Selects that can't be hoisted. 8909775a620SHiroshi Yamauchi for (auto it = Selects.begin(); it != Selects.end(); ) { 8919775a620SHiroshi Yamauchi SelectInst *SI = *it; 8929775a620SHiroshi Yamauchi if (SI == InsertPoint) { 8939775a620SHiroshi Yamauchi ++it; 8949775a620SHiroshi Yamauchi continue; 8959775a620SHiroshi Yamauchi } 8969775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(SI->getCondition(), InsertPoint, 8979775a620SHiroshi Yamauchi DT, Unhoistables, nullptr); 8989775a620SHiroshi Yamauchi if (!IsHoistable) { 8999775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Dropping select " << *SI << "\n"); 9009775a620SHiroshi Yamauchi it = Selects.erase(it); 9019775a620SHiroshi Yamauchi // Since we are dropping the select here, we also drop it from 9029775a620SHiroshi Yamauchi // Unhoistables. 9039775a620SHiroshi Yamauchi Unhoistables.erase(SI); 9049775a620SHiroshi Yamauchi } else 9059775a620SHiroshi Yamauchi ++it; 9069775a620SHiroshi Yamauchi } 9079775a620SHiroshi Yamauchi // Update InsertPoint after potentially removing selects. 9089775a620SHiroshi Yamauchi InsertPoint = getBranchInsertPoint(RI); 9099775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "InsertPoint " << *InsertPoint << "\n"); 9109775a620SHiroshi Yamauchi if (RI.HasBranch && InsertPoint != Branch) { 9119775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(Branch->getCondition(), InsertPoint, 9129775a620SHiroshi Yamauchi DT, Unhoistables, nullptr); 9139775a620SHiroshi Yamauchi if (!IsHoistable) { 9149775a620SHiroshi Yamauchi // If the branch isn't hoistable, drop the selects in the entry 9159775a620SHiroshi Yamauchi // block, preferring the branch, which makes the branch the hoist 9169775a620SHiroshi Yamauchi // point. 9179775a620SHiroshi Yamauchi assert(InsertPoint != Branch && "Branch must not be the hoist point"); 9189775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Dropping selects in entry block \n"); 9199775a620SHiroshi Yamauchi CHR_DEBUG( 9209775a620SHiroshi Yamauchi for (SelectInst *SI : Selects) { 9219775a620SHiroshi Yamauchi dbgs() << "SI " << *SI << "\n"; 9229775a620SHiroshi Yamauchi }); 9239775a620SHiroshi Yamauchi Selects.erase(std::remove_if(Selects.begin(), Selects.end(), 9249775a620SHiroshi Yamauchi [EntryBB](SelectInst *SI) { 9259775a620SHiroshi Yamauchi return SI->getParent() == EntryBB; 9269775a620SHiroshi Yamauchi }), Selects.end()); 9279775a620SHiroshi Yamauchi Unhoistables.clear(); 9289775a620SHiroshi Yamauchi InsertPoint = Branch; 9299775a620SHiroshi Yamauchi } 9309775a620SHiroshi Yamauchi } 9319775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "InsertPoint " << *InsertPoint << "\n"); 9329775a620SHiroshi Yamauchi #ifndef NDEBUG 9339775a620SHiroshi Yamauchi if (RI.HasBranch) { 9349775a620SHiroshi Yamauchi assert(!DT.dominates(Branch, InsertPoint) && 9359775a620SHiroshi Yamauchi "Branch can't be already above the hoist point"); 9369775a620SHiroshi Yamauchi assert(checkHoistValue(Branch->getCondition(), InsertPoint, 9379775a620SHiroshi Yamauchi DT, Unhoistables, nullptr) && 9389775a620SHiroshi Yamauchi "checkHoistValue for branch"); 9399775a620SHiroshi Yamauchi } 9409775a620SHiroshi Yamauchi for (auto *SI : Selects) { 9419775a620SHiroshi Yamauchi assert(!DT.dominates(SI, InsertPoint) && 9429775a620SHiroshi Yamauchi "SI can't be already above the hoist point"); 9439775a620SHiroshi Yamauchi assert(checkHoistValue(SI->getCondition(), InsertPoint, DT, 9449775a620SHiroshi Yamauchi Unhoistables, nullptr) && 9459775a620SHiroshi Yamauchi "checkHoistValue for selects"); 9469775a620SHiroshi Yamauchi } 9479775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Result\n"); 9489775a620SHiroshi Yamauchi if (RI.HasBranch) { 9499775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI " << *Branch << "\n"); 9509775a620SHiroshi Yamauchi } 9519775a620SHiroshi Yamauchi for (auto *SI : Selects) { 9529775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "SI " << *SI << "\n"); 9539775a620SHiroshi Yamauchi } 9549775a620SHiroshi Yamauchi #endif 9559775a620SHiroshi Yamauchi } 9569775a620SHiroshi Yamauchi } 9579775a620SHiroshi Yamauchi 9589775a620SHiroshi Yamauchi // Traverse the region tree, find all nested scopes and merge them if possible. 9599775a620SHiroshi Yamauchi CHRScope * CHR::findScopes(Region *R, Region *NextRegion, Region *ParentRegion, 9609775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Scopes) { 9619775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "findScopes " << R->getNameStr() << "\n"); 9629775a620SHiroshi Yamauchi CHRScope *Result = findScope(R); 9639775a620SHiroshi Yamauchi // Visit subscopes. 9649775a620SHiroshi Yamauchi CHRScope *ConsecutiveSubscope = nullptr; 9659775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Subscopes; 9669775a620SHiroshi Yamauchi for (auto It = R->begin(); It != R->end(); ++It) { 9679775a620SHiroshi Yamauchi const std::unique_ptr<Region> &SubR = *It; 9689775a620SHiroshi Yamauchi auto Next_It = std::next(It); 9699775a620SHiroshi Yamauchi Region *NextSubR = Next_It != R->end() ? Next_It->get() : nullptr; 9709775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Looking at subregion " << SubR.get()->getNameStr() 9719775a620SHiroshi Yamauchi << "\n"); 9729775a620SHiroshi Yamauchi CHRScope *SubCHRScope = findScopes(SubR.get(), NextSubR, R, Scopes); 9739775a620SHiroshi Yamauchi if (SubCHRScope) { 9749775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Subregion Scope " << *SubCHRScope << "\n"); 9759775a620SHiroshi Yamauchi } else { 9769775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Subregion Scope null\n"); 9779775a620SHiroshi Yamauchi } 9789775a620SHiroshi Yamauchi if (SubCHRScope) { 9799775a620SHiroshi Yamauchi if (!ConsecutiveSubscope) 9809775a620SHiroshi Yamauchi ConsecutiveSubscope = SubCHRScope; 9819775a620SHiroshi Yamauchi else if (!ConsecutiveSubscope->appendable(SubCHRScope)) { 9829775a620SHiroshi Yamauchi Subscopes.push_back(ConsecutiveSubscope); 9839775a620SHiroshi Yamauchi ConsecutiveSubscope = SubCHRScope; 9849775a620SHiroshi Yamauchi } else 9859775a620SHiroshi Yamauchi ConsecutiveSubscope->append(SubCHRScope); 9869775a620SHiroshi Yamauchi } else { 9879775a620SHiroshi Yamauchi if (ConsecutiveSubscope) { 9889775a620SHiroshi Yamauchi Subscopes.push_back(ConsecutiveSubscope); 9899775a620SHiroshi Yamauchi } 9909775a620SHiroshi Yamauchi ConsecutiveSubscope = nullptr; 9919775a620SHiroshi Yamauchi } 9929775a620SHiroshi Yamauchi } 9939775a620SHiroshi Yamauchi if (ConsecutiveSubscope) { 9949775a620SHiroshi Yamauchi Subscopes.push_back(ConsecutiveSubscope); 9959775a620SHiroshi Yamauchi } 9969775a620SHiroshi Yamauchi for (CHRScope *Sub : Subscopes) { 9979775a620SHiroshi Yamauchi if (Result) { 9989775a620SHiroshi Yamauchi // Combine it with the parent. 9999775a620SHiroshi Yamauchi Result->addSub(Sub); 10009775a620SHiroshi Yamauchi } else { 10019775a620SHiroshi Yamauchi // Push Subscopes as they won't be combined with the parent. 10029775a620SHiroshi Yamauchi Scopes.push_back(Sub); 10039775a620SHiroshi Yamauchi } 10049775a620SHiroshi Yamauchi } 10059775a620SHiroshi Yamauchi return Result; 10069775a620SHiroshi Yamauchi } 10079775a620SHiroshi Yamauchi 10089775a620SHiroshi Yamauchi static DenseSet<Value *> getCHRConditionValuesForRegion(RegInfo &RI) { 10099775a620SHiroshi Yamauchi DenseSet<Value *> ConditionValues; 10109775a620SHiroshi Yamauchi if (RI.HasBranch) { 10119775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(RI.R->getEntry()->getTerminator()); 10129775a620SHiroshi Yamauchi ConditionValues.insert(BI->getCondition()); 10139775a620SHiroshi Yamauchi } 10149775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 10159775a620SHiroshi Yamauchi ConditionValues.insert(SI->getCondition()); 10169775a620SHiroshi Yamauchi } 10179775a620SHiroshi Yamauchi return ConditionValues; 10189775a620SHiroshi Yamauchi } 10199775a620SHiroshi Yamauchi 10209775a620SHiroshi Yamauchi 10219775a620SHiroshi Yamauchi // Determine whether to split a scope depending on the sets of the branch 10229775a620SHiroshi Yamauchi // condition values of the previous region and the current region. We split 10239775a620SHiroshi Yamauchi // (return true) it if 1) the condition values of the inner/lower scope can't be 10249775a620SHiroshi Yamauchi // hoisted up to the outer/upper scope, or 2) the two sets of the condition 10259775a620SHiroshi Yamauchi // values have an empty intersection (because the combined branch conditions 10269775a620SHiroshi Yamauchi // won't probably lead to a simpler combined condition). 10279775a620SHiroshi Yamauchi static bool shouldSplit(Instruction *InsertPoint, 10289775a620SHiroshi Yamauchi DenseSet<Value *> &PrevConditionValues, 10299775a620SHiroshi Yamauchi DenseSet<Value *> &ConditionValues, 10309775a620SHiroshi Yamauchi DominatorTree &DT, 10319775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables) { 10329775a620SHiroshi Yamauchi CHR_DEBUG( 10339775a620SHiroshi Yamauchi dbgs() << "shouldSplit " << *InsertPoint << " PrevConditionValues "; 10349775a620SHiroshi Yamauchi for (Value *V : PrevConditionValues) { 10359775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10369775a620SHiroshi Yamauchi } 10379775a620SHiroshi Yamauchi dbgs() << " ConditionValues "; 10389775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 10399775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10409775a620SHiroshi Yamauchi } 10419775a620SHiroshi Yamauchi dbgs() << "\n"); 10429775a620SHiroshi Yamauchi assert(InsertPoint && "Null InsertPoint"); 10439775a620SHiroshi Yamauchi // If any of Bases isn't hoistable to the hoist point, split. 10449775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 10459775a620SHiroshi Yamauchi if (!checkHoistValue(V, InsertPoint, DT, Unhoistables, nullptr)) { 10469775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Split. checkHoistValue false " << *V << "\n"); 10479775a620SHiroshi Yamauchi return true; // Not hoistable, split. 10489775a620SHiroshi Yamauchi } 10499775a620SHiroshi Yamauchi } 10509775a620SHiroshi Yamauchi // If PrevConditionValues or ConditionValues is empty, don't split to avoid 10519775a620SHiroshi Yamauchi // unnecessary splits at scopes with no branch/selects. If 10529775a620SHiroshi Yamauchi // PrevConditionValues and ConditionValues don't intersect at all, split. 10539775a620SHiroshi Yamauchi if (!PrevConditionValues.empty() && !ConditionValues.empty()) { 10549775a620SHiroshi Yamauchi // Use std::set as DenseSet doesn't work with set_intersection. 10559775a620SHiroshi Yamauchi std::set<Value *> PrevBases, Bases; 10569775a620SHiroshi Yamauchi for (Value *V : PrevConditionValues) { 10579775a620SHiroshi Yamauchi std::set<Value *> BaseValues = getBaseValues(V, DT); 10589775a620SHiroshi Yamauchi PrevBases.insert(BaseValues.begin(), BaseValues.end()); 10599775a620SHiroshi Yamauchi } 10609775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 10619775a620SHiroshi Yamauchi std::set<Value *> BaseValues = getBaseValues(V, DT); 10629775a620SHiroshi Yamauchi Bases.insert(BaseValues.begin(), BaseValues.end()); 10639775a620SHiroshi Yamauchi } 10649775a620SHiroshi Yamauchi CHR_DEBUG( 10659775a620SHiroshi Yamauchi dbgs() << "PrevBases "; 10669775a620SHiroshi Yamauchi for (Value *V : PrevBases) { 10679775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10689775a620SHiroshi Yamauchi } 10699775a620SHiroshi Yamauchi dbgs() << " Bases "; 10709775a620SHiroshi Yamauchi for (Value *V : Bases) { 10719775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10729775a620SHiroshi Yamauchi } 10739775a620SHiroshi Yamauchi dbgs() << "\n"); 10749775a620SHiroshi Yamauchi std::set<Value *> Intersection; 10759775a620SHiroshi Yamauchi std::set_intersection(PrevBases.begin(), PrevBases.end(), 10769775a620SHiroshi Yamauchi Bases.begin(), Bases.end(), 10779775a620SHiroshi Yamauchi std::inserter(Intersection, Intersection.begin())); 10789775a620SHiroshi Yamauchi if (Intersection.empty()) { 10799775a620SHiroshi Yamauchi // Empty intersection, split. 10809775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Split. Intersection empty\n"); 10819775a620SHiroshi Yamauchi return true; 10829775a620SHiroshi Yamauchi } 10839775a620SHiroshi Yamauchi } 10849775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "No split\n"); 10859775a620SHiroshi Yamauchi return false; // Don't split. 10869775a620SHiroshi Yamauchi } 10879775a620SHiroshi Yamauchi 10889775a620SHiroshi Yamauchi static void GetSelectsInScope(CHRScope *Scope, 10899775a620SHiroshi Yamauchi DenseSet<Instruction *> &Output) { 10909775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 10919775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 10929775a620SHiroshi Yamauchi Output.insert(SI); 10939775a620SHiroshi Yamauchi } 10949775a620SHiroshi Yamauchi } 10959775a620SHiroshi Yamauchi for (CHRScope *Sub : Scope->Subs) { 10969775a620SHiroshi Yamauchi GetSelectsInScope(Sub, Output); 10979775a620SHiroshi Yamauchi } 10989775a620SHiroshi Yamauchi } 10999775a620SHiroshi Yamauchi 11009775a620SHiroshi Yamauchi void CHR::splitScopes(SmallVectorImpl<CHRScope *> &Input, 11019775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 11029775a620SHiroshi Yamauchi for (CHRScope *Scope : Input) { 11039775a620SHiroshi Yamauchi assert(!Scope->BranchInsertPoint && 11049775a620SHiroshi Yamauchi "BranchInsertPoint must not be set"); 11059775a620SHiroshi Yamauchi DenseSet<Instruction *> Unhoistables; 11069775a620SHiroshi Yamauchi GetSelectsInScope(Scope, Unhoistables); 11079775a620SHiroshi Yamauchi splitScope(Scope, nullptr, nullptr, nullptr, Output, Unhoistables); 11089775a620SHiroshi Yamauchi } 11099775a620SHiroshi Yamauchi #ifndef NDEBUG 11109775a620SHiroshi Yamauchi for (CHRScope *Scope : Output) { 11119775a620SHiroshi Yamauchi assert(Scope->BranchInsertPoint && "BranchInsertPoint must be set"); 11129775a620SHiroshi Yamauchi } 11139775a620SHiroshi Yamauchi #endif 11149775a620SHiroshi Yamauchi } 11159775a620SHiroshi Yamauchi 11169775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> CHR::splitScope( 11179775a620SHiroshi Yamauchi CHRScope *Scope, 11189775a620SHiroshi Yamauchi CHRScope *Outer, 11199775a620SHiroshi Yamauchi DenseSet<Value *> *OuterConditionValues, 11209775a620SHiroshi Yamauchi Instruction *OuterInsertPoint, 11219775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output, 11229775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables) { 11239775a620SHiroshi Yamauchi if (Outer) { 11249775a620SHiroshi Yamauchi assert(OuterConditionValues && "Null OuterConditionValues"); 11259775a620SHiroshi Yamauchi assert(OuterInsertPoint && "Null OuterInsertPoint"); 11269775a620SHiroshi Yamauchi } 11279775a620SHiroshi Yamauchi bool PrevSplitFromOuter = true; 11289775a620SHiroshi Yamauchi DenseSet<Value *> PrevConditionValues; 11299775a620SHiroshi Yamauchi Instruction *PrevInsertPoint = nullptr; 11309775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Splits; 11319775a620SHiroshi Yamauchi SmallVector<bool, 8> SplitsSplitFromOuter; 11329775a620SHiroshi Yamauchi SmallVector<DenseSet<Value *>, 8> SplitsConditionValues; 11339775a620SHiroshi Yamauchi SmallVector<Instruction *, 8> SplitsInsertPoints; 11349775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> RegInfos(Scope->RegInfos); // Copy 11359775a620SHiroshi Yamauchi for (RegInfo &RI : RegInfos) { 11369775a620SHiroshi Yamauchi Instruction *InsertPoint = getBranchInsertPoint(RI); 11379775a620SHiroshi Yamauchi DenseSet<Value *> ConditionValues = getCHRConditionValuesForRegion(RI); 11389775a620SHiroshi Yamauchi CHR_DEBUG( 11399775a620SHiroshi Yamauchi dbgs() << "ConditionValues "; 11409775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 11419775a620SHiroshi Yamauchi dbgs() << *V << ", "; 11429775a620SHiroshi Yamauchi } 11439775a620SHiroshi Yamauchi dbgs() << "\n"); 11449775a620SHiroshi Yamauchi if (RI.R == RegInfos[0].R) { 11459775a620SHiroshi Yamauchi // First iteration. Check to see if we should split from the outer. 11469775a620SHiroshi Yamauchi if (Outer) { 11479775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Outer " << *Outer << "\n"); 11489775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Should split from outer at " 11499775a620SHiroshi Yamauchi << RI.R->getNameStr() << "\n"); 11509775a620SHiroshi Yamauchi if (shouldSplit(OuterInsertPoint, *OuterConditionValues, 11519775a620SHiroshi Yamauchi ConditionValues, DT, Unhoistables)) { 11529775a620SHiroshi Yamauchi PrevConditionValues = ConditionValues; 11539775a620SHiroshi Yamauchi PrevInsertPoint = InsertPoint; 11549775a620SHiroshi Yamauchi } else { 11559775a620SHiroshi Yamauchi // Not splitting from the outer. Use the outer bases and insert 11569775a620SHiroshi Yamauchi // point. Union the bases. 11579775a620SHiroshi Yamauchi PrevSplitFromOuter = false; 11589775a620SHiroshi Yamauchi PrevConditionValues = *OuterConditionValues; 11599775a620SHiroshi Yamauchi PrevConditionValues.insert(ConditionValues.begin(), 11609775a620SHiroshi Yamauchi ConditionValues.end()); 11619775a620SHiroshi Yamauchi PrevInsertPoint = OuterInsertPoint; 11629775a620SHiroshi Yamauchi } 11639775a620SHiroshi Yamauchi } else { 11649775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Outer null\n"); 11659775a620SHiroshi Yamauchi PrevConditionValues = ConditionValues; 11669775a620SHiroshi Yamauchi PrevInsertPoint = InsertPoint; 11679775a620SHiroshi Yamauchi } 11689775a620SHiroshi Yamauchi } else { 11699775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Should split from prev at " 11709775a620SHiroshi Yamauchi << RI.R->getNameStr() << "\n"); 11719775a620SHiroshi Yamauchi if (shouldSplit(PrevInsertPoint, PrevConditionValues, ConditionValues, 11729775a620SHiroshi Yamauchi DT, Unhoistables)) { 11739775a620SHiroshi Yamauchi CHRScope *Tail = Scope->split(RI.R); 11749775a620SHiroshi Yamauchi Scopes.insert(Tail); 11759775a620SHiroshi Yamauchi Splits.push_back(Scope); 11769775a620SHiroshi Yamauchi SplitsSplitFromOuter.push_back(PrevSplitFromOuter); 11779775a620SHiroshi Yamauchi SplitsConditionValues.push_back(PrevConditionValues); 11789775a620SHiroshi Yamauchi SplitsInsertPoints.push_back(PrevInsertPoint); 11799775a620SHiroshi Yamauchi Scope = Tail; 11809775a620SHiroshi Yamauchi PrevConditionValues = ConditionValues; 11819775a620SHiroshi Yamauchi PrevInsertPoint = InsertPoint; 11829775a620SHiroshi Yamauchi PrevSplitFromOuter = true; 11839775a620SHiroshi Yamauchi } else { 11849775a620SHiroshi Yamauchi // Not splitting. Union the bases. Keep the hoist point. 11859775a620SHiroshi Yamauchi PrevConditionValues.insert(ConditionValues.begin(), ConditionValues.end()); 11869775a620SHiroshi Yamauchi } 11879775a620SHiroshi Yamauchi } 11889775a620SHiroshi Yamauchi } 11899775a620SHiroshi Yamauchi Splits.push_back(Scope); 11909775a620SHiroshi Yamauchi SplitsSplitFromOuter.push_back(PrevSplitFromOuter); 11919775a620SHiroshi Yamauchi SplitsConditionValues.push_back(PrevConditionValues); 11929775a620SHiroshi Yamauchi assert(PrevInsertPoint && "Null PrevInsertPoint"); 11939775a620SHiroshi Yamauchi SplitsInsertPoints.push_back(PrevInsertPoint); 11949775a620SHiroshi Yamauchi assert(Splits.size() == SplitsConditionValues.size() && 11959775a620SHiroshi Yamauchi Splits.size() == SplitsSplitFromOuter.size() && 11969775a620SHiroshi Yamauchi Splits.size() == SplitsInsertPoints.size() && "Mismatching sizes"); 11979775a620SHiroshi Yamauchi for (size_t I = 0; I < Splits.size(); ++I) { 11989775a620SHiroshi Yamauchi CHRScope *Split = Splits[I]; 11999775a620SHiroshi Yamauchi DenseSet<Value *> &SplitConditionValues = SplitsConditionValues[I]; 12009775a620SHiroshi Yamauchi Instruction *SplitInsertPoint = SplitsInsertPoints[I]; 12019775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> NewSubs; 12029775a620SHiroshi Yamauchi DenseSet<Instruction *> SplitUnhoistables; 12039775a620SHiroshi Yamauchi GetSelectsInScope(Split, SplitUnhoistables); 12049775a620SHiroshi Yamauchi for (CHRScope *Sub : Split->Subs) { 12059775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SubSplits = splitScope( 12069775a620SHiroshi Yamauchi Sub, Split, &SplitConditionValues, SplitInsertPoint, Output, 12079775a620SHiroshi Yamauchi SplitUnhoistables); 12089775a620SHiroshi Yamauchi NewSubs.insert(NewSubs.end(), SubSplits.begin(), SubSplits.end()); 12099775a620SHiroshi Yamauchi } 12109775a620SHiroshi Yamauchi Split->Subs = NewSubs; 12119775a620SHiroshi Yamauchi } 12129775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Result; 12139775a620SHiroshi Yamauchi for (size_t I = 0; I < Splits.size(); ++I) { 12149775a620SHiroshi Yamauchi CHRScope *Split = Splits[I]; 12159775a620SHiroshi Yamauchi if (SplitsSplitFromOuter[I]) { 12169775a620SHiroshi Yamauchi // Split from the outer. 12179775a620SHiroshi Yamauchi Output.push_back(Split); 12189775a620SHiroshi Yamauchi Split->BranchInsertPoint = SplitsInsertPoints[I]; 12199775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BranchInsertPoint " << *SplitsInsertPoints[I] 12209775a620SHiroshi Yamauchi << "\n"); 12219775a620SHiroshi Yamauchi } else { 12229775a620SHiroshi Yamauchi // Connected to the outer. 12239775a620SHiroshi Yamauchi Result.push_back(Split); 12249775a620SHiroshi Yamauchi } 12259775a620SHiroshi Yamauchi } 12269775a620SHiroshi Yamauchi if (!Outer) 12279775a620SHiroshi Yamauchi assert(Result.empty() && 12289775a620SHiroshi Yamauchi "If no outer (top-level), must return no nested ones"); 12299775a620SHiroshi Yamauchi return Result; 12309775a620SHiroshi Yamauchi } 12319775a620SHiroshi Yamauchi 12329775a620SHiroshi Yamauchi void CHR::classifyBiasedScopes(SmallVectorImpl<CHRScope *> &Scopes) { 12339775a620SHiroshi Yamauchi for (CHRScope *Scope : Scopes) { 12349775a620SHiroshi Yamauchi assert(Scope->TrueBiasedRegions.empty() && Scope->FalseBiasedRegions.empty() && "Empty"); 12359775a620SHiroshi Yamauchi classifyBiasedScopes(Scope, Scope); 12369775a620SHiroshi Yamauchi CHR_DEBUG( 12379775a620SHiroshi Yamauchi dbgs() << "classifyBiasedScopes " << *Scope << "\n"; 12389775a620SHiroshi Yamauchi dbgs() << "TrueBiasedRegions "; 12399775a620SHiroshi Yamauchi for (Region *R : Scope->TrueBiasedRegions) { 12409775a620SHiroshi Yamauchi dbgs() << R->getNameStr() << ", "; 12419775a620SHiroshi Yamauchi } 12429775a620SHiroshi Yamauchi dbgs() << "\n"; 12439775a620SHiroshi Yamauchi dbgs() << "FalseBiasedRegions "; 12449775a620SHiroshi Yamauchi for (Region *R : Scope->FalseBiasedRegions) { 12459775a620SHiroshi Yamauchi dbgs() << R->getNameStr() << ", "; 12469775a620SHiroshi Yamauchi } 12479775a620SHiroshi Yamauchi dbgs() << "\n"; 12489775a620SHiroshi Yamauchi dbgs() << "TrueBiasedSelects "; 12499775a620SHiroshi Yamauchi for (SelectInst *SI : Scope->TrueBiasedSelects) { 12509775a620SHiroshi Yamauchi dbgs() << *SI << ", "; 12519775a620SHiroshi Yamauchi } 12529775a620SHiroshi Yamauchi dbgs() << "\n"; 12539775a620SHiroshi Yamauchi dbgs() << "FalseBiasedSelects "; 12549775a620SHiroshi Yamauchi for (SelectInst *SI : Scope->FalseBiasedSelects) { 12559775a620SHiroshi Yamauchi dbgs() << *SI << ", "; 12569775a620SHiroshi Yamauchi } 12579775a620SHiroshi Yamauchi dbgs() << "\n";); 12589775a620SHiroshi Yamauchi } 12599775a620SHiroshi Yamauchi } 12609775a620SHiroshi Yamauchi 12619775a620SHiroshi Yamauchi void CHR::classifyBiasedScopes(CHRScope *Scope, CHRScope *OutermostScope) { 12629775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 12639775a620SHiroshi Yamauchi if (RI.HasBranch) { 12649775a620SHiroshi Yamauchi Region *R = RI.R; 12659775a620SHiroshi Yamauchi if (TrueBiasedRegionsGlobal.count(R) > 0) 12669775a620SHiroshi Yamauchi OutermostScope->TrueBiasedRegions.insert(R); 12679775a620SHiroshi Yamauchi else if (FalseBiasedRegionsGlobal.count(R) > 0) 12689775a620SHiroshi Yamauchi OutermostScope->FalseBiasedRegions.insert(R); 12699775a620SHiroshi Yamauchi else 12709775a620SHiroshi Yamauchi llvm_unreachable("Must be biased"); 12719775a620SHiroshi Yamauchi } 12729775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 12739775a620SHiroshi Yamauchi if (TrueBiasedSelectsGlobal.count(SI) > 0) 12749775a620SHiroshi Yamauchi OutermostScope->TrueBiasedSelects.insert(SI); 12759775a620SHiroshi Yamauchi else if (FalseBiasedSelectsGlobal.count(SI) > 0) 12769775a620SHiroshi Yamauchi OutermostScope->FalseBiasedSelects.insert(SI); 12779775a620SHiroshi Yamauchi else 12789775a620SHiroshi Yamauchi llvm_unreachable("Must be biased"); 12799775a620SHiroshi Yamauchi } 12809775a620SHiroshi Yamauchi } 12819775a620SHiroshi Yamauchi for (CHRScope *Sub : Scope->Subs) { 12829775a620SHiroshi Yamauchi classifyBiasedScopes(Sub, OutermostScope); 12839775a620SHiroshi Yamauchi } 12849775a620SHiroshi Yamauchi } 12859775a620SHiroshi Yamauchi 12869775a620SHiroshi Yamauchi static bool hasAtLeastTwoBiasedBranches(CHRScope *Scope) { 12879775a620SHiroshi Yamauchi unsigned NumBiased = Scope->TrueBiasedRegions.size() + 12889775a620SHiroshi Yamauchi Scope->FalseBiasedRegions.size() + 12899775a620SHiroshi Yamauchi Scope->TrueBiasedSelects.size() + 12909775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.size(); 12919775a620SHiroshi Yamauchi return NumBiased >= CHRMergeThreshold; 12929775a620SHiroshi Yamauchi } 12939775a620SHiroshi Yamauchi 12949775a620SHiroshi Yamauchi void CHR::filterScopes(SmallVectorImpl<CHRScope *> &Input, 12959775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 12969775a620SHiroshi Yamauchi for (CHRScope *Scope : Input) { 12979775a620SHiroshi Yamauchi // Filter out the ones with only one region and no subs. 12989775a620SHiroshi Yamauchi if (!hasAtLeastTwoBiasedBranches(Scope)) { 12999775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Filtered out by biased branches truthy-regions " 13009775a620SHiroshi Yamauchi << Scope->TrueBiasedRegions.size() 13019775a620SHiroshi Yamauchi << " falsy-regions " << Scope->FalseBiasedRegions.size() 13029775a620SHiroshi Yamauchi << " true-selects " << Scope->TrueBiasedSelects.size() 13039775a620SHiroshi Yamauchi << " false-selects " << Scope->FalseBiasedSelects.size() << "\n"); 13049775a620SHiroshi Yamauchi continue; 13059775a620SHiroshi Yamauchi } 13069775a620SHiroshi Yamauchi Output.push_back(Scope); 13079775a620SHiroshi Yamauchi } 13089775a620SHiroshi Yamauchi } 13099775a620SHiroshi Yamauchi 13109775a620SHiroshi Yamauchi void CHR::setCHRRegions(SmallVectorImpl<CHRScope *> &Input, 13119775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 13129775a620SHiroshi Yamauchi for (CHRScope *Scope : Input) { 13139775a620SHiroshi Yamauchi assert(Scope->HoistStopMap.empty() && Scope->CHRRegions.empty() && 13149775a620SHiroshi Yamauchi "Empty"); 13159775a620SHiroshi Yamauchi setCHRRegions(Scope, Scope); 13169775a620SHiroshi Yamauchi Output.push_back(Scope); 13179775a620SHiroshi Yamauchi CHR_DEBUG( 13189775a620SHiroshi Yamauchi dbgs() << "setCHRRegions HoistStopMap " << *Scope << "\n"; 13199775a620SHiroshi Yamauchi for (auto pair : Scope->HoistStopMap) { 13209775a620SHiroshi Yamauchi Region *R = pair.first; 13219775a620SHiroshi Yamauchi dbgs() << "Region " << R->getNameStr() << "\n"; 13229775a620SHiroshi Yamauchi for (Instruction *I : pair.second) { 13239775a620SHiroshi Yamauchi dbgs() << "HoistStop " << *I << "\n"; 13249775a620SHiroshi Yamauchi } 13259775a620SHiroshi Yamauchi } 13269775a620SHiroshi Yamauchi dbgs() << "CHRRegions" << "\n"; 13279775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 13289775a620SHiroshi Yamauchi dbgs() << RI.R->getNameStr() << "\n"; 13299775a620SHiroshi Yamauchi }); 13309775a620SHiroshi Yamauchi } 13319775a620SHiroshi Yamauchi } 13329775a620SHiroshi Yamauchi 13339775a620SHiroshi Yamauchi void CHR::setCHRRegions(CHRScope *Scope, CHRScope *OutermostScope) { 13349775a620SHiroshi Yamauchi DenseSet<Instruction *> Unhoistables; 13359775a620SHiroshi Yamauchi // Put the biased selects in Unhoistables because they should stay where they 13369775a620SHiroshi Yamauchi // are and constant-folded after CHR (in case one biased select or a branch 13379775a620SHiroshi Yamauchi // can depend on another biased select.) 13389775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 13399775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 13409775a620SHiroshi Yamauchi Unhoistables.insert(SI); 13419775a620SHiroshi Yamauchi } 13429775a620SHiroshi Yamauchi } 13439775a620SHiroshi Yamauchi Instruction *InsertPoint = OutermostScope->BranchInsertPoint; 13449775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 13459775a620SHiroshi Yamauchi Region *R = RI.R; 13469775a620SHiroshi Yamauchi DenseSet<Instruction *> HoistStops; 13479775a620SHiroshi Yamauchi bool IsHoisted = false; 13489775a620SHiroshi Yamauchi if (RI.HasBranch) { 13499775a620SHiroshi Yamauchi assert((OutermostScope->TrueBiasedRegions.count(R) > 0 || 13509775a620SHiroshi Yamauchi OutermostScope->FalseBiasedRegions.count(R) > 0) && 13519775a620SHiroshi Yamauchi "Must be truthy or falsy"); 13529775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 13539775a620SHiroshi Yamauchi // Note checkHoistValue fills in HoistStops. 13549775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(BI->getCondition(), InsertPoint, DT, 13559775a620SHiroshi Yamauchi Unhoistables, &HoistStops); 13569775a620SHiroshi Yamauchi assert(IsHoistable && "Must be hoistable"); 13579775a620SHiroshi Yamauchi (void)(IsHoistable); // Unused in release build 13589775a620SHiroshi Yamauchi IsHoisted = true; 13599775a620SHiroshi Yamauchi } 13609775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 13619775a620SHiroshi Yamauchi assert((OutermostScope->TrueBiasedSelects.count(SI) > 0 || 13629775a620SHiroshi Yamauchi OutermostScope->FalseBiasedSelects.count(SI) > 0) && 13639775a620SHiroshi Yamauchi "Must be true or false biased"); 13649775a620SHiroshi Yamauchi // Note checkHoistValue fills in HoistStops. 13659775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(SI->getCondition(), InsertPoint, DT, 13669775a620SHiroshi Yamauchi Unhoistables, &HoistStops); 13679775a620SHiroshi Yamauchi assert(IsHoistable && "Must be hoistable"); 13689775a620SHiroshi Yamauchi (void)(IsHoistable); // Unused in release build 13699775a620SHiroshi Yamauchi IsHoisted = true; 13709775a620SHiroshi Yamauchi } 13719775a620SHiroshi Yamauchi if (IsHoisted) { 13729775a620SHiroshi Yamauchi OutermostScope->CHRRegions.push_back(RI); 13739775a620SHiroshi Yamauchi OutermostScope->HoistStopMap[R] = HoistStops; 13749775a620SHiroshi Yamauchi } 13759775a620SHiroshi Yamauchi } 13769775a620SHiroshi Yamauchi for (CHRScope *Sub : Scope->Subs) 13779775a620SHiroshi Yamauchi setCHRRegions(Sub, OutermostScope); 13789775a620SHiroshi Yamauchi } 13799775a620SHiroshi Yamauchi 13809775a620SHiroshi Yamauchi bool CHRScopeSorter(CHRScope *Scope1, CHRScope *Scope2) { 13819775a620SHiroshi Yamauchi return Scope1->RegInfos[0].R->getDepth() < Scope2->RegInfos[0].R->getDepth(); 13829775a620SHiroshi Yamauchi } 13839775a620SHiroshi Yamauchi 13849775a620SHiroshi Yamauchi void CHR::sortScopes(SmallVectorImpl<CHRScope *> &Input, 13859775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 13869775a620SHiroshi Yamauchi Output.resize(Input.size()); 13879775a620SHiroshi Yamauchi std::copy(Input.begin(), Input.end(), Output.begin()); 13889775a620SHiroshi Yamauchi std::stable_sort(Output.begin(), Output.end(), CHRScopeSorter); 13899775a620SHiroshi Yamauchi } 13909775a620SHiroshi Yamauchi 13919775a620SHiroshi Yamauchi // Return true if V is already hoisted or was hoisted (along with its operands) 13929775a620SHiroshi Yamauchi // to the insert point. 13939775a620SHiroshi Yamauchi static void hoistValue(Value *V, Instruction *HoistPoint, Region *R, 13949775a620SHiroshi Yamauchi HoistStopMapTy &HoistStopMap, 13959775a620SHiroshi Yamauchi DenseSet<Instruction *> &HoistedSet, 13969775a620SHiroshi Yamauchi DenseSet<PHINode *> &TrivialPHIs) { 13979775a620SHiroshi Yamauchi auto IT = HoistStopMap.find(R); 13989775a620SHiroshi Yamauchi assert(IT != HoistStopMap.end() && "Region must be in hoist stop map"); 13999775a620SHiroshi Yamauchi DenseSet<Instruction *> &HoistStops = IT->second; 14009775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 14019775a620SHiroshi Yamauchi if (I == HoistPoint) 14029775a620SHiroshi Yamauchi return; 14039775a620SHiroshi Yamauchi if (HoistStops.count(I)) 14049775a620SHiroshi Yamauchi return; 14059775a620SHiroshi Yamauchi if (auto *PN = dyn_cast<PHINode>(I)) 14069775a620SHiroshi Yamauchi if (TrivialPHIs.count(PN)) 14079775a620SHiroshi Yamauchi // The trivial phi inserted by the previous CHR scope could replace a 14089775a620SHiroshi Yamauchi // non-phi in HoistStops. Note that since this phi is at the exit of a 14099775a620SHiroshi Yamauchi // previous CHR scope, which dominates this scope, it's safe to stop 14109775a620SHiroshi Yamauchi // hoisting there. 14119775a620SHiroshi Yamauchi return; 14129775a620SHiroshi Yamauchi if (HoistedSet.count(I)) 14139775a620SHiroshi Yamauchi // Already hoisted, return. 14149775a620SHiroshi Yamauchi return; 14159775a620SHiroshi Yamauchi assert(isHoistableInstructionType(I) && "Unhoistable instruction type"); 14169775a620SHiroshi Yamauchi for (Value *Op : I->operands()) { 14179775a620SHiroshi Yamauchi hoistValue(Op, HoistPoint, R, HoistStopMap, HoistedSet, TrivialPHIs); 14189775a620SHiroshi Yamauchi } 14199775a620SHiroshi Yamauchi I->moveBefore(HoistPoint); 14209775a620SHiroshi Yamauchi HoistedSet.insert(I); 14219775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "hoistValue " << *I << "\n"); 14229775a620SHiroshi Yamauchi } 14239775a620SHiroshi Yamauchi } 14249775a620SHiroshi Yamauchi 14259775a620SHiroshi Yamauchi // Hoist the dependent condition values of the branches and the selects in the 14269775a620SHiroshi Yamauchi // scope to the insert point. 14279775a620SHiroshi Yamauchi static void hoistScopeConditions(CHRScope *Scope, Instruction *HoistPoint, 14289775a620SHiroshi Yamauchi DenseSet<PHINode *> &TrivialPHIs) { 14299775a620SHiroshi Yamauchi DenseSet<Instruction *> HoistedSet; 14309775a620SHiroshi Yamauchi for (const RegInfo &RI : Scope->CHRRegions) { 14319775a620SHiroshi Yamauchi Region *R = RI.R; 14329775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedRegions.count(R); 14339775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedRegions.count(R); 14349775a620SHiroshi Yamauchi if (RI.HasBranch && (IsTrueBiased || IsFalseBiased)) { 14359775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 14369775a620SHiroshi Yamauchi hoistValue(BI->getCondition(), HoistPoint, R, Scope->HoistStopMap, 14379775a620SHiroshi Yamauchi HoistedSet, TrivialPHIs); 14389775a620SHiroshi Yamauchi } 14399775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 14409775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedSelects.count(SI); 14419775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedSelects.count(SI); 14429775a620SHiroshi Yamauchi if (!(IsTrueBiased || IsFalseBiased)) 14439775a620SHiroshi Yamauchi continue; 14449775a620SHiroshi Yamauchi hoistValue(SI->getCondition(), HoistPoint, R, Scope->HoistStopMap, 14459775a620SHiroshi Yamauchi HoistedSet, TrivialPHIs); 14469775a620SHiroshi Yamauchi } 14479775a620SHiroshi Yamauchi } 14489775a620SHiroshi Yamauchi } 14499775a620SHiroshi Yamauchi 14509775a620SHiroshi Yamauchi // Negate the predicate if an ICmp if it's used only by branches or selects by 14519775a620SHiroshi Yamauchi // swapping the operands of the branches or the selects. Returns true if success. 14529775a620SHiroshi Yamauchi static bool NegateICmpIfUsedByBranchOrSelectOnly(ICmpInst *ICmp, 14539775a620SHiroshi Yamauchi Instruction *ExcludedUser, 14549775a620SHiroshi Yamauchi CHRScope *Scope) { 14559775a620SHiroshi Yamauchi for (User *U : ICmp->users()) { 14569775a620SHiroshi Yamauchi if (U == ExcludedUser) 14579775a620SHiroshi Yamauchi continue; 14589775a620SHiroshi Yamauchi if (isa<BranchInst>(U) && cast<BranchInst>(U)->isConditional()) 14599775a620SHiroshi Yamauchi continue; 14609775a620SHiroshi Yamauchi if (isa<SelectInst>(U) && cast<SelectInst>(U)->getCondition() == ICmp) 14619775a620SHiroshi Yamauchi continue; 14629775a620SHiroshi Yamauchi return false; 14639775a620SHiroshi Yamauchi } 14649775a620SHiroshi Yamauchi for (User *U : ICmp->users()) { 14659775a620SHiroshi Yamauchi if (U == ExcludedUser) 14669775a620SHiroshi Yamauchi continue; 14679775a620SHiroshi Yamauchi if (auto *BI = dyn_cast<BranchInst>(U)) { 14689775a620SHiroshi Yamauchi assert(BI->isConditional() && "Must be conditional"); 14699775a620SHiroshi Yamauchi BI->swapSuccessors(); 14709775a620SHiroshi Yamauchi // Don't need to swap this in terms of 14719775a620SHiroshi Yamauchi // TrueBiasedRegions/FalseBiasedRegions because true-based/false-based 14729775a620SHiroshi Yamauchi // mean whehter the branch is likely go into the if-then rather than 14739775a620SHiroshi Yamauchi // successor0/successor1 and because we can tell which edge is the then or 14749775a620SHiroshi Yamauchi // the else one by comparing the destination to the region exit block. 14759775a620SHiroshi Yamauchi continue; 14769775a620SHiroshi Yamauchi } 14779775a620SHiroshi Yamauchi if (auto *SI = dyn_cast<SelectInst>(U)) { 14789775a620SHiroshi Yamauchi // Swap operands 14799775a620SHiroshi Yamauchi Value *TrueValue = SI->getTrueValue(); 14809775a620SHiroshi Yamauchi Value *FalseValue = SI->getFalseValue(); 14819775a620SHiroshi Yamauchi SI->setTrueValue(FalseValue); 14829775a620SHiroshi Yamauchi SI->setFalseValue(TrueValue); 14839775a620SHiroshi Yamauchi SI->swapProfMetadata(); 14849775a620SHiroshi Yamauchi if (Scope->TrueBiasedSelects.count(SI)) { 14859775a620SHiroshi Yamauchi assert(Scope->FalseBiasedSelects.count(SI) == 0 && 14869775a620SHiroshi Yamauchi "Must not be already in"); 14879775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.insert(SI); 14889775a620SHiroshi Yamauchi } else if (Scope->FalseBiasedSelects.count(SI)) { 14899775a620SHiroshi Yamauchi assert(Scope->TrueBiasedSelects.count(SI) == 0 && 14909775a620SHiroshi Yamauchi "Must not be already in"); 14919775a620SHiroshi Yamauchi Scope->TrueBiasedSelects.insert(SI); 14929775a620SHiroshi Yamauchi } 14939775a620SHiroshi Yamauchi continue; 14949775a620SHiroshi Yamauchi } 14959775a620SHiroshi Yamauchi llvm_unreachable("Must be a branch or a select"); 14969775a620SHiroshi Yamauchi } 14979775a620SHiroshi Yamauchi ICmp->setPredicate(CmpInst::getInversePredicate(ICmp->getPredicate())); 14989775a620SHiroshi Yamauchi return true; 14999775a620SHiroshi Yamauchi } 15009775a620SHiroshi Yamauchi 15019775a620SHiroshi Yamauchi // A helper for transformScopes. Insert a trivial phi at the scope exit block 15029775a620SHiroshi Yamauchi // for a value that's defined in the scope but used outside it (meaning it's 15039775a620SHiroshi Yamauchi // alive at the exit block). 15049775a620SHiroshi Yamauchi static void insertTrivialPHIs(CHRScope *Scope, 15059775a620SHiroshi Yamauchi BasicBlock *EntryBlock, BasicBlock *ExitBlock, 15069775a620SHiroshi Yamauchi DenseSet<PHINode *> &TrivialPHIs) { 15079775a620SHiroshi Yamauchi DenseSet<BasicBlock *> BlocksInScopeSet; 15089775a620SHiroshi Yamauchi SmallVector<BasicBlock *, 8> BlocksInScopeVec; 15099775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 15109775a620SHiroshi Yamauchi for (BasicBlock *BB : RI.R->blocks()) { // This includes the blocks in the 15119775a620SHiroshi Yamauchi // sub-Scopes. 15129775a620SHiroshi Yamauchi BlocksInScopeSet.insert(BB); 15139775a620SHiroshi Yamauchi BlocksInScopeVec.push_back(BB); 15149775a620SHiroshi Yamauchi } 15159775a620SHiroshi Yamauchi } 15169775a620SHiroshi Yamauchi CHR_DEBUG( 15179775a620SHiroshi Yamauchi dbgs() << "Inserting redudant phis\n"; 15189775a620SHiroshi Yamauchi for (BasicBlock *BB : BlocksInScopeVec) { 15199775a620SHiroshi Yamauchi dbgs() << "BlockInScope " << BB->getName() << "\n"; 15209775a620SHiroshi Yamauchi }); 15219775a620SHiroshi Yamauchi for (BasicBlock *BB : BlocksInScopeVec) { 15229775a620SHiroshi Yamauchi for (Instruction &I : *BB) { 15239775a620SHiroshi Yamauchi SmallVector<Instruction *, 8> Users; 15249775a620SHiroshi Yamauchi for (User *U : I.users()) { 15259775a620SHiroshi Yamauchi if (auto *UI = dyn_cast<Instruction>(U)) { 15269775a620SHiroshi Yamauchi if (BlocksInScopeSet.count(UI->getParent()) == 0 && 15279775a620SHiroshi Yamauchi // Unless there's already a phi for I at the exit block. 15289775a620SHiroshi Yamauchi !(isa<PHINode>(UI) && UI->getParent() == ExitBlock)) { 15299775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "V " << I << "\n"); 15309775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Used outside scope by user " << *UI << "\n"); 15319775a620SHiroshi Yamauchi Users.push_back(UI); 15329775a620SHiroshi Yamauchi } else if (UI->getParent() == EntryBlock && isa<PHINode>(UI)) { 15339775a620SHiroshi Yamauchi // There's a loop backedge from a block that's dominated by this 15349775a620SHiroshi Yamauchi // scope to the entry block. 15359775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "V " << I << "\n"); 15369775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() 15379775a620SHiroshi Yamauchi << "Used at entry block (for a back edge) by a phi user " 15389775a620SHiroshi Yamauchi << *UI << "\n"); 15399775a620SHiroshi Yamauchi Users.push_back(UI); 15409775a620SHiroshi Yamauchi } 15419775a620SHiroshi Yamauchi } 15429775a620SHiroshi Yamauchi } 15439775a620SHiroshi Yamauchi if (Users.size() > 0) { 15449775a620SHiroshi Yamauchi // Insert a trivial phi for I (phi [&I, P0], [&I, P1], ...) at 15459775a620SHiroshi Yamauchi // ExitBlock. Replace I with the new phi in UI unless UI is another 15469775a620SHiroshi Yamauchi // phi at ExitBlock. 15479775a620SHiroshi Yamauchi unsigned PredCount = std::distance(pred_begin(ExitBlock), 15489775a620SHiroshi Yamauchi pred_end(ExitBlock)); 15499775a620SHiroshi Yamauchi PHINode *PN = PHINode::Create(I.getType(), PredCount, "", 15509775a620SHiroshi Yamauchi &ExitBlock->front()); 15519775a620SHiroshi Yamauchi for (BasicBlock *Pred : predecessors(ExitBlock)) { 15529775a620SHiroshi Yamauchi PN->addIncoming(&I, Pred); 15539775a620SHiroshi Yamauchi } 15549775a620SHiroshi Yamauchi TrivialPHIs.insert(PN); 15559775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Insert phi " << *PN << "\n"); 15569775a620SHiroshi Yamauchi for (Instruction *UI : Users) { 15579775a620SHiroshi Yamauchi for (unsigned J = 0, NumOps = UI->getNumOperands(); J < NumOps; ++J) { 15589775a620SHiroshi Yamauchi if (UI->getOperand(J) == &I) { 15599775a620SHiroshi Yamauchi UI->setOperand(J, PN); 15609775a620SHiroshi Yamauchi } 15619775a620SHiroshi Yamauchi } 15629775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Updated user " << *UI << "\n"); 15639775a620SHiroshi Yamauchi } 15649775a620SHiroshi Yamauchi } 15659775a620SHiroshi Yamauchi } 15669775a620SHiroshi Yamauchi } 15679775a620SHiroshi Yamauchi } 15689775a620SHiroshi Yamauchi 15699775a620SHiroshi Yamauchi // Assert that all the CHR regions of the scope have a biased branch or select. 1570*c8f348cbSFangrui Song static void LLVM_ATTRIBUTE_UNUSED 1571*c8f348cbSFangrui Song assertCHRRegionsHaveBiasedBranchOrSelect(CHRScope *Scope) { 15729775a620SHiroshi Yamauchi #ifndef NDEBUG 15739775a620SHiroshi Yamauchi auto HasBiasedBranchOrSelect = [](RegInfo &RI, CHRScope *Scope) { 15749775a620SHiroshi Yamauchi if (Scope->TrueBiasedRegions.count(RI.R) || 15759775a620SHiroshi Yamauchi Scope->FalseBiasedRegions.count(RI.R)) 15769775a620SHiroshi Yamauchi return true; 15779775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) 15789775a620SHiroshi Yamauchi if (Scope->TrueBiasedSelects.count(SI) || 15799775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.count(SI)) 15809775a620SHiroshi Yamauchi return true; 15819775a620SHiroshi Yamauchi return false; 15829775a620SHiroshi Yamauchi }; 15839775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 15849775a620SHiroshi Yamauchi assert(HasBiasedBranchOrSelect(RI, Scope) && 15859775a620SHiroshi Yamauchi "Must have biased branch or select"); 15869775a620SHiroshi Yamauchi } 15879775a620SHiroshi Yamauchi #endif 15889775a620SHiroshi Yamauchi } 15899775a620SHiroshi Yamauchi 15909775a620SHiroshi Yamauchi // Assert that all the condition values of the biased branches and selects have 15919775a620SHiroshi Yamauchi // been hoisted to the pre-entry block or outside of the scope. 1592*c8f348cbSFangrui Song static void LLVM_ATTRIBUTE_UNUSED assertBranchOrSelectConditionHoisted( 1593*c8f348cbSFangrui Song CHRScope *Scope, BasicBlock *PreEntryBlock) { 15949775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Biased regions condition values \n"); 15959775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 15969775a620SHiroshi Yamauchi Region *R = RI.R; 15979775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedRegions.count(R); 15989775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedRegions.count(R); 15999775a620SHiroshi Yamauchi if (RI.HasBranch && (IsTrueBiased || IsFalseBiased)) { 16009775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 16019775a620SHiroshi Yamauchi Value *V = BI->getCondition(); 16029775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << *V << "\n"); 16039775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 160472ee6d60SHiroshi Yamauchi (void)(I); // Unused in release build. 16059775a620SHiroshi Yamauchi assert((I->getParent() == PreEntryBlock || 16069775a620SHiroshi Yamauchi !Scope->contains(I)) && 16079775a620SHiroshi Yamauchi "Must have been hoisted to PreEntryBlock or outside the scope"); 16089775a620SHiroshi Yamauchi } 16099775a620SHiroshi Yamauchi } 16109775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 16119775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedSelects.count(SI); 16129775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedSelects.count(SI); 16139775a620SHiroshi Yamauchi if (!(IsTrueBiased || IsFalseBiased)) 16149775a620SHiroshi Yamauchi continue; 16159775a620SHiroshi Yamauchi Value *V = SI->getCondition(); 16169775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << *V << "\n"); 16179775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 161872ee6d60SHiroshi Yamauchi (void)(I); // Unused in release build. 16199775a620SHiroshi Yamauchi assert((I->getParent() == PreEntryBlock || 16209775a620SHiroshi Yamauchi !Scope->contains(I)) && 16219775a620SHiroshi Yamauchi "Must have been hoisted to PreEntryBlock or outside the scope"); 16229775a620SHiroshi Yamauchi } 16239775a620SHiroshi Yamauchi } 16249775a620SHiroshi Yamauchi } 16259775a620SHiroshi Yamauchi } 16269775a620SHiroshi Yamauchi 16279775a620SHiroshi Yamauchi void CHR::transformScopes(CHRScope *Scope, DenseSet<PHINode *> &TrivialPHIs) { 16289775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "transformScopes " << *Scope << "\n"); 16299775a620SHiroshi Yamauchi 16309775a620SHiroshi Yamauchi assert(Scope->RegInfos.size() >= 1 && "Should have at least one Region"); 16319775a620SHiroshi Yamauchi Region *FirstRegion = Scope->RegInfos[0].R; 16329775a620SHiroshi Yamauchi BasicBlock *EntryBlock = FirstRegion->getEntry(); 16339775a620SHiroshi Yamauchi Region *LastRegion = Scope->RegInfos[Scope->RegInfos.size() - 1].R; 16349775a620SHiroshi Yamauchi BasicBlock *ExitBlock = LastRegion->getExit(); 16359775a620SHiroshi Yamauchi Optional<uint64_t> ProfileCount = BFI.getBlockProfileCount(EntryBlock); 16369775a620SHiroshi Yamauchi 16379775a620SHiroshi Yamauchi if (ExitBlock) { 16389775a620SHiroshi Yamauchi // Insert a trivial phi at the exit block (where the CHR hot path and the 16399775a620SHiroshi Yamauchi // cold path merges) for a value that's defined in the scope but used 16409775a620SHiroshi Yamauchi // outside it (meaning it's alive at the exit block). We will add the 16419775a620SHiroshi Yamauchi // incoming values for the CHR cold paths to it below. Without this, we'd 16429775a620SHiroshi Yamauchi // miss updating phi's for such values unless there happens to already be a 16439775a620SHiroshi Yamauchi // phi for that value there. 16449775a620SHiroshi Yamauchi insertTrivialPHIs(Scope, EntryBlock, ExitBlock, TrivialPHIs); 16459775a620SHiroshi Yamauchi } 16469775a620SHiroshi Yamauchi 16479775a620SHiroshi Yamauchi // Split the entry block of the first region. The new block becomes the new 16489775a620SHiroshi Yamauchi // entry block of the first region. The old entry block becomes the block to 16499775a620SHiroshi Yamauchi // insert the CHR branch into. Note DT gets updated. Since DT gets updated 16509775a620SHiroshi Yamauchi // through the split, we update the entry of the first region after the split, 16519775a620SHiroshi Yamauchi // and Region only points to the entry and the exit blocks, rather than 16529775a620SHiroshi Yamauchi // keeping everything in a list or set, the blocks membership and the 16539775a620SHiroshi Yamauchi // entry/exit blocks of the region are still valid after the split. 16549775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Splitting entry block " << EntryBlock->getName() 16559775a620SHiroshi Yamauchi << " at " << *Scope->BranchInsertPoint << "\n"); 16569775a620SHiroshi Yamauchi BasicBlock *NewEntryBlock = 16579775a620SHiroshi Yamauchi SplitBlock(EntryBlock, Scope->BranchInsertPoint, &DT); 16589775a620SHiroshi Yamauchi assert(NewEntryBlock->getSinglePredecessor() == EntryBlock && 16599775a620SHiroshi Yamauchi "NewEntryBlock's only pred must be EntryBlock"); 16609775a620SHiroshi Yamauchi FirstRegion->replaceEntryRecursive(NewEntryBlock); 16619775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock = EntryBlock; 16629775a620SHiroshi Yamauchi 16639775a620SHiroshi Yamauchi ValueToValueMapTy VMap; 16649775a620SHiroshi Yamauchi // Clone the blocks in the scope (excluding the PreEntryBlock) to split into a 16659775a620SHiroshi Yamauchi // hot path (originals) and a cold path (clones) and update the PHIs at the 16669775a620SHiroshi Yamauchi // exit block. 16679775a620SHiroshi Yamauchi cloneScopeBlocks(Scope, PreEntryBlock, ExitBlock, LastRegion, VMap); 16689775a620SHiroshi Yamauchi 16699775a620SHiroshi Yamauchi // Replace the old (placeholder) branch with the new (merged) conditional 16709775a620SHiroshi Yamauchi // branch. 16719775a620SHiroshi Yamauchi BranchInst *MergedBr = createMergedBranch(PreEntryBlock, EntryBlock, 16729775a620SHiroshi Yamauchi NewEntryBlock, VMap); 16739775a620SHiroshi Yamauchi 16749775a620SHiroshi Yamauchi #ifndef NDEBUG 16759775a620SHiroshi Yamauchi assertCHRRegionsHaveBiasedBranchOrSelect(Scope); 16769775a620SHiroshi Yamauchi #endif 16779775a620SHiroshi Yamauchi 16789775a620SHiroshi Yamauchi // Hoist the conditional values of the branches/selects. 16799775a620SHiroshi Yamauchi hoistScopeConditions(Scope, PreEntryBlock->getTerminator(), TrivialPHIs); 16809775a620SHiroshi Yamauchi 16819775a620SHiroshi Yamauchi #ifndef NDEBUG 16829775a620SHiroshi Yamauchi assertBranchOrSelectConditionHoisted(Scope, PreEntryBlock); 16839775a620SHiroshi Yamauchi #endif 16849775a620SHiroshi Yamauchi 16859775a620SHiroshi Yamauchi // Create the combined branch condition and constant-fold the branches/selects 16869775a620SHiroshi Yamauchi // in the hot path. 16879775a620SHiroshi Yamauchi fixupBranchesAndSelects(Scope, PreEntryBlock, MergedBr, 16889775a620SHiroshi Yamauchi ProfileCount ? ProfileCount.getValue() : 0); 16899775a620SHiroshi Yamauchi } 16909775a620SHiroshi Yamauchi 16919775a620SHiroshi Yamauchi // A helper for transformScopes. Clone the blocks in the scope (excluding the 16929775a620SHiroshi Yamauchi // PreEntryBlock) to split into a hot path and a cold path and update the PHIs 16939775a620SHiroshi Yamauchi // at the exit block. 16949775a620SHiroshi Yamauchi void CHR::cloneScopeBlocks(CHRScope *Scope, 16959775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 16969775a620SHiroshi Yamauchi BasicBlock *ExitBlock, 16979775a620SHiroshi Yamauchi Region *LastRegion, 16989775a620SHiroshi Yamauchi ValueToValueMapTy &VMap) { 16999775a620SHiroshi Yamauchi // Clone all the blocks. The original blocks will be the hot-path 17009775a620SHiroshi Yamauchi // CHR-optimized code and the cloned blocks will be the original unoptimized 17019775a620SHiroshi Yamauchi // code. This is so that the block pointers from the 17029775a620SHiroshi Yamauchi // CHRScope/Region/RegionInfo can stay valid in pointing to the hot-path code 17039775a620SHiroshi Yamauchi // which CHR should apply to. 17049775a620SHiroshi Yamauchi SmallVector<BasicBlock*, 8> NewBlocks; 17059775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) 17069775a620SHiroshi Yamauchi for (BasicBlock *BB : RI.R->blocks()) { // This includes the blocks in the 17079775a620SHiroshi Yamauchi // sub-Scopes. 17089775a620SHiroshi Yamauchi assert(BB != PreEntryBlock && "Don't copy the preetntry block"); 17099775a620SHiroshi Yamauchi BasicBlock *NewBB = CloneBasicBlock(BB, VMap, ".nonchr", &F); 17109775a620SHiroshi Yamauchi NewBlocks.push_back(NewBB); 17119775a620SHiroshi Yamauchi VMap[BB] = NewBB; 17129775a620SHiroshi Yamauchi } 17139775a620SHiroshi Yamauchi 17149775a620SHiroshi Yamauchi // Place the cloned blocks right after the original blocks (right before the 17159775a620SHiroshi Yamauchi // exit block of.) 17169775a620SHiroshi Yamauchi if (ExitBlock) 17179775a620SHiroshi Yamauchi F.getBasicBlockList().splice(ExitBlock->getIterator(), 17189775a620SHiroshi Yamauchi F.getBasicBlockList(), 17199775a620SHiroshi Yamauchi NewBlocks[0]->getIterator(), F.end()); 17209775a620SHiroshi Yamauchi 17219775a620SHiroshi Yamauchi // Update the cloned blocks/instructions to refer to themselves. 17229775a620SHiroshi Yamauchi for (unsigned i = 0, e = NewBlocks.size(); i != e; ++i) 17239775a620SHiroshi Yamauchi for (Instruction &I : *NewBlocks[i]) 17249775a620SHiroshi Yamauchi RemapInstruction(&I, VMap, 17259775a620SHiroshi Yamauchi RF_NoModuleLevelChanges | RF_IgnoreMissingLocals); 17269775a620SHiroshi Yamauchi 17279775a620SHiroshi Yamauchi // Add the cloned blocks to the PHIs of the exit blocks. ExitBlock is null for 17289775a620SHiroshi Yamauchi // the top-level region but we don't need to add PHIs. The trivial PHIs 17299775a620SHiroshi Yamauchi // inserted above will be updated here. 17309775a620SHiroshi Yamauchi if (ExitBlock) 17319775a620SHiroshi Yamauchi for (PHINode &PN : ExitBlock->phis()) 17329775a620SHiroshi Yamauchi for (unsigned I = 0, NumOps = PN.getNumIncomingValues(); I < NumOps; 17339775a620SHiroshi Yamauchi ++I) { 17349775a620SHiroshi Yamauchi BasicBlock *Pred = PN.getIncomingBlock(I); 17359775a620SHiroshi Yamauchi if (LastRegion->contains(Pred)) { 17369775a620SHiroshi Yamauchi Value *V = PN.getIncomingValue(I); 17379775a620SHiroshi Yamauchi auto It = VMap.find(V); 17389775a620SHiroshi Yamauchi if (It != VMap.end()) V = It->second; 17399775a620SHiroshi Yamauchi assert(VMap.find(Pred) != VMap.end() && "Pred must have been cloned"); 17409775a620SHiroshi Yamauchi PN.addIncoming(V, cast<BasicBlock>(VMap[Pred])); 17419775a620SHiroshi Yamauchi } 17429775a620SHiroshi Yamauchi } 17439775a620SHiroshi Yamauchi } 17449775a620SHiroshi Yamauchi 17459775a620SHiroshi Yamauchi // A helper for transformScope. Replace the old (placeholder) branch with the 17469775a620SHiroshi Yamauchi // new (merged) conditional branch. 17479775a620SHiroshi Yamauchi BranchInst *CHR::createMergedBranch(BasicBlock *PreEntryBlock, 17489775a620SHiroshi Yamauchi BasicBlock *EntryBlock, 17499775a620SHiroshi Yamauchi BasicBlock *NewEntryBlock, 17509775a620SHiroshi Yamauchi ValueToValueMapTy &VMap) { 17519775a620SHiroshi Yamauchi BranchInst *OldBR = cast<BranchInst>(PreEntryBlock->getTerminator()); 17529775a620SHiroshi Yamauchi assert(OldBR->isUnconditional() && OldBR->getSuccessor(0) == NewEntryBlock && 17539775a620SHiroshi Yamauchi "SplitBlock did not work correctly!"); 17549775a620SHiroshi Yamauchi assert(NewEntryBlock->getSinglePredecessor() == EntryBlock && 17559775a620SHiroshi Yamauchi "NewEntryBlock's only pred must be EntryBlock"); 17569775a620SHiroshi Yamauchi assert(VMap.find(NewEntryBlock) != VMap.end() && 17579775a620SHiroshi Yamauchi "NewEntryBlock must have been copied"); 17589775a620SHiroshi Yamauchi OldBR->dropAllReferences(); 1759bd897a02SHiroshi Yamauchi OldBR->eraseFromParent(); 17609775a620SHiroshi Yamauchi // The true predicate is a placeholder. It will be replaced later in 17619775a620SHiroshi Yamauchi // fixupBranchesAndSelects(). 17629775a620SHiroshi Yamauchi BranchInst *NewBR = BranchInst::Create(NewEntryBlock, 17639775a620SHiroshi Yamauchi cast<BasicBlock>(VMap[NewEntryBlock]), 17649775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext())); 17659775a620SHiroshi Yamauchi PreEntryBlock->getInstList().push_back(NewBR); 17669775a620SHiroshi Yamauchi assert(NewEntryBlock->getSinglePredecessor() == EntryBlock && 17679775a620SHiroshi Yamauchi "NewEntryBlock's only pred must be EntryBlock"); 17689775a620SHiroshi Yamauchi return NewBR; 17699775a620SHiroshi Yamauchi } 17709775a620SHiroshi Yamauchi 17719775a620SHiroshi Yamauchi // A helper for transformScopes. Create the combined branch condition and 17729775a620SHiroshi Yamauchi // constant-fold the branches/selects in the hot path. 17739775a620SHiroshi Yamauchi void CHR::fixupBranchesAndSelects(CHRScope *Scope, 17749775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 17759775a620SHiroshi Yamauchi BranchInst *MergedBR, 17769775a620SHiroshi Yamauchi uint64_t ProfileCount) { 17779775a620SHiroshi Yamauchi Value *MergedCondition = ConstantInt::getTrue(F.getContext()); 17789775a620SHiroshi Yamauchi BranchProbability CHRBranchBias(1, 1); 17799775a620SHiroshi Yamauchi uint64_t NumCHRedBranches = 0; 17809775a620SHiroshi Yamauchi IRBuilder<> IRB(PreEntryBlock->getTerminator()); 17819775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 17829775a620SHiroshi Yamauchi Region *R = RI.R; 17839775a620SHiroshi Yamauchi if (RI.HasBranch) { 17849775a620SHiroshi Yamauchi fixupBranch(R, Scope, IRB, MergedCondition, CHRBranchBias); 17859775a620SHiroshi Yamauchi ++NumCHRedBranches; 17869775a620SHiroshi Yamauchi } 17879775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 17889775a620SHiroshi Yamauchi fixupSelect(SI, Scope, IRB, MergedCondition, CHRBranchBias); 17899775a620SHiroshi Yamauchi ++NumCHRedBranches; 17909775a620SHiroshi Yamauchi } 17919775a620SHiroshi Yamauchi } 17929775a620SHiroshi Yamauchi Stats.NumBranchesDelta += NumCHRedBranches - 1; 17939775a620SHiroshi Yamauchi Stats.WeightedNumBranchesDelta += (NumCHRedBranches - 1) * ProfileCount; 17949775a620SHiroshi Yamauchi MergedBR->setCondition(MergedCondition); 17959775a620SHiroshi Yamauchi SmallVector<uint32_t, 2> Weights; 17969775a620SHiroshi Yamauchi Weights.push_back(static_cast<uint32_t>(CHRBranchBias.scale(1000))); 17979775a620SHiroshi Yamauchi Weights.push_back(static_cast<uint32_t>(CHRBranchBias.getCompl().scale(1000))); 17989775a620SHiroshi Yamauchi MDBuilder MDB(F.getContext()); 17999775a620SHiroshi Yamauchi MergedBR->setMetadata(LLVMContext::MD_prof, MDB.createBranchWeights(Weights)); 18009775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "CHR branch bias " << Weights[0] << ":" << Weights[1] 18019775a620SHiroshi Yamauchi << "\n"); 18029775a620SHiroshi Yamauchi } 18039775a620SHiroshi Yamauchi 18049775a620SHiroshi Yamauchi // A helper for fixupBranchesAndSelects. Add to the combined branch condition 18059775a620SHiroshi Yamauchi // and constant-fold a branch in the hot path. 18069775a620SHiroshi Yamauchi void CHR::fixupBranch(Region *R, CHRScope *Scope, 18079775a620SHiroshi Yamauchi IRBuilder<> &IRB, 18089775a620SHiroshi Yamauchi Value *&MergedCondition, 18099775a620SHiroshi Yamauchi BranchProbability &CHRBranchBias) { 18109775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedRegions.count(R); 18119775a620SHiroshi Yamauchi assert((IsTrueBiased || Scope->FalseBiasedRegions.count(R)) && 18129775a620SHiroshi Yamauchi "Must be truthy or falsy"); 18139775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 18149775a620SHiroshi Yamauchi assert(BranchBiasMap.find(R) != BranchBiasMap.end() && 18159775a620SHiroshi Yamauchi "Must be in the bias map"); 18169775a620SHiroshi Yamauchi BranchProbability Bias = BranchBiasMap[R]; 18179775a620SHiroshi Yamauchi assert(Bias >= getCHRBiasThreshold() && "Must be highly biased"); 18189775a620SHiroshi Yamauchi // Take the min. 18199775a620SHiroshi Yamauchi if (CHRBranchBias > Bias) 18209775a620SHiroshi Yamauchi CHRBranchBias = Bias; 18219775a620SHiroshi Yamauchi BasicBlock *IfThen = BI->getSuccessor(1); 18229775a620SHiroshi Yamauchi BasicBlock *IfElse = BI->getSuccessor(0); 18239775a620SHiroshi Yamauchi BasicBlock *RegionExitBlock = R->getExit(); 18249775a620SHiroshi Yamauchi assert(RegionExitBlock && "Null ExitBlock"); 18259775a620SHiroshi Yamauchi assert((IfThen == RegionExitBlock || IfElse == RegionExitBlock) && 18269775a620SHiroshi Yamauchi IfThen != IfElse && "Invariant from findScopes"); 18279775a620SHiroshi Yamauchi if (IfThen == RegionExitBlock) { 18289775a620SHiroshi Yamauchi // Swap them so that IfThen means going into it and IfElse means skipping 18299775a620SHiroshi Yamauchi // it. 18309775a620SHiroshi Yamauchi std::swap(IfThen, IfElse); 18319775a620SHiroshi Yamauchi } 18329775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "IfThen " << IfThen->getName() 18339775a620SHiroshi Yamauchi << " IfElse " << IfElse->getName() << "\n"); 18349775a620SHiroshi Yamauchi Value *Cond = BI->getCondition(); 18359775a620SHiroshi Yamauchi BasicBlock *HotTarget = IsTrueBiased ? IfThen : IfElse; 18369775a620SHiroshi Yamauchi bool ConditionTrue = HotTarget == BI->getSuccessor(0); 18379775a620SHiroshi Yamauchi addToMergedCondition(ConditionTrue, Cond, BI, Scope, IRB, 18389775a620SHiroshi Yamauchi MergedCondition); 18399775a620SHiroshi Yamauchi // Constant-fold the branch at ClonedEntryBlock. 18409775a620SHiroshi Yamauchi assert(ConditionTrue == (HotTarget == BI->getSuccessor(0)) && 18419775a620SHiroshi Yamauchi "The successor shouldn't change"); 18429775a620SHiroshi Yamauchi Value *NewCondition = ConditionTrue ? 18439775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext()) : 18449775a620SHiroshi Yamauchi ConstantInt::getFalse(F.getContext()); 18459775a620SHiroshi Yamauchi BI->setCondition(NewCondition); 18469775a620SHiroshi Yamauchi } 18479775a620SHiroshi Yamauchi 18489775a620SHiroshi Yamauchi // A helper for fixupBranchesAndSelects. Add to the combined branch condition 18499775a620SHiroshi Yamauchi // and constant-fold a select in the hot path. 18509775a620SHiroshi Yamauchi void CHR::fixupSelect(SelectInst *SI, CHRScope *Scope, 18519775a620SHiroshi Yamauchi IRBuilder<> &IRB, 18529775a620SHiroshi Yamauchi Value *&MergedCondition, 18539775a620SHiroshi Yamauchi BranchProbability &CHRBranchBias) { 18549775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedSelects.count(SI); 18559775a620SHiroshi Yamauchi assert((IsTrueBiased || 18569775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.count(SI)) && "Must be biased"); 18579775a620SHiroshi Yamauchi assert(SelectBiasMap.find(SI) != SelectBiasMap.end() && 18589775a620SHiroshi Yamauchi "Must be in the bias map"); 18599775a620SHiroshi Yamauchi BranchProbability Bias = SelectBiasMap[SI]; 18609775a620SHiroshi Yamauchi assert(Bias >= getCHRBiasThreshold() && "Must be highly biased"); 18619775a620SHiroshi Yamauchi // Take the min. 18629775a620SHiroshi Yamauchi if (CHRBranchBias > Bias) 18639775a620SHiroshi Yamauchi CHRBranchBias = Bias; 18649775a620SHiroshi Yamauchi Value *Cond = SI->getCondition(); 18659775a620SHiroshi Yamauchi addToMergedCondition(IsTrueBiased, Cond, SI, Scope, IRB, 18669775a620SHiroshi Yamauchi MergedCondition); 18679775a620SHiroshi Yamauchi Value *NewCondition = IsTrueBiased ? 18689775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext()) : 18699775a620SHiroshi Yamauchi ConstantInt::getFalse(F.getContext()); 18709775a620SHiroshi Yamauchi SI->setCondition(NewCondition); 18719775a620SHiroshi Yamauchi } 18729775a620SHiroshi Yamauchi 18739775a620SHiroshi Yamauchi // A helper for fixupBranch/fixupSelect. Add a branch condition to the merged 18749775a620SHiroshi Yamauchi // condition. 18759775a620SHiroshi Yamauchi void CHR::addToMergedCondition(bool IsTrueBiased, Value *Cond, 18769775a620SHiroshi Yamauchi Instruction *BranchOrSelect, 18779775a620SHiroshi Yamauchi CHRScope *Scope, 18789775a620SHiroshi Yamauchi IRBuilder<> &IRB, 18799775a620SHiroshi Yamauchi Value *&MergedCondition) { 18809775a620SHiroshi Yamauchi if (IsTrueBiased) { 18819775a620SHiroshi Yamauchi MergedCondition = IRB.CreateAnd(MergedCondition, Cond); 18829775a620SHiroshi Yamauchi } else { 18839775a620SHiroshi Yamauchi // If Cond is an icmp and all users of V except for BranchOrSelect is a 18849775a620SHiroshi Yamauchi // branch, negate the icmp predicate and swap the branch targets and avoid 18859775a620SHiroshi Yamauchi // inserting an Xor to negate Cond. 18869775a620SHiroshi Yamauchi bool Done = false; 18879775a620SHiroshi Yamauchi if (auto *ICmp = dyn_cast<ICmpInst>(Cond)) 18889775a620SHiroshi Yamauchi if (NegateICmpIfUsedByBranchOrSelectOnly(ICmp, BranchOrSelect, Scope)) { 18899775a620SHiroshi Yamauchi MergedCondition = IRB.CreateAnd(MergedCondition, Cond); 18909775a620SHiroshi Yamauchi Done = true; 18919775a620SHiroshi Yamauchi } 18929775a620SHiroshi Yamauchi if (!Done) { 18939775a620SHiroshi Yamauchi Value *Negate = IRB.CreateXor( 18949775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext()), Cond); 18959775a620SHiroshi Yamauchi MergedCondition = IRB.CreateAnd(MergedCondition, Negate); 18969775a620SHiroshi Yamauchi } 18979775a620SHiroshi Yamauchi } 18989775a620SHiroshi Yamauchi } 18999775a620SHiroshi Yamauchi 19009775a620SHiroshi Yamauchi void CHR::transformScopes(SmallVectorImpl<CHRScope *> &CHRScopes) { 19019775a620SHiroshi Yamauchi unsigned i = 0; 19029775a620SHiroshi Yamauchi (void)(i); // Unused in release build. 19039775a620SHiroshi Yamauchi DenseSet<PHINode *> TrivialPHIs; 19049775a620SHiroshi Yamauchi for (CHRScope *Scope : CHRScopes) { 19059775a620SHiroshi Yamauchi transformScopes(Scope, TrivialPHIs); 19069775a620SHiroshi Yamauchi CHR_DEBUG( 19079775a620SHiroshi Yamauchi std::ostringstream oss; 19089775a620SHiroshi Yamauchi oss << " after transformScopes " << i++; 19099775a620SHiroshi Yamauchi dumpIR(F, oss.str().c_str(), nullptr)); 19109775a620SHiroshi Yamauchi } 19119775a620SHiroshi Yamauchi } 19129775a620SHiroshi Yamauchi 1913*c8f348cbSFangrui Song static void LLVM_ATTRIBUTE_UNUSED 1914*c8f348cbSFangrui Song dumpScopes(SmallVectorImpl<CHRScope *> &Scopes, const char *Label) { 19159775a620SHiroshi Yamauchi dbgs() << Label << " " << Scopes.size() << "\n"; 19169775a620SHiroshi Yamauchi for (CHRScope *Scope : Scopes) { 19179775a620SHiroshi Yamauchi dbgs() << *Scope << "\n"; 19189775a620SHiroshi Yamauchi } 19199775a620SHiroshi Yamauchi } 19209775a620SHiroshi Yamauchi 19219775a620SHiroshi Yamauchi bool CHR::run() { 19229775a620SHiroshi Yamauchi if (!shouldApply(F, PSI)) 19239775a620SHiroshi Yamauchi return false; 19249775a620SHiroshi Yamauchi 19259775a620SHiroshi Yamauchi CHR_DEBUG(dumpIR(F, "before", nullptr)); 19269775a620SHiroshi Yamauchi 19279775a620SHiroshi Yamauchi bool Changed = false; 19289775a620SHiroshi Yamauchi { 19299775a620SHiroshi Yamauchi CHR_DEBUG( 19309775a620SHiroshi Yamauchi dbgs() << "RegionInfo:\n"; 19319775a620SHiroshi Yamauchi RI.print(dbgs())); 19329775a620SHiroshi Yamauchi 19339775a620SHiroshi Yamauchi // Recursively traverse the region tree and find regions that have biased 19349775a620SHiroshi Yamauchi // branches and/or selects and create scopes. 19359775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> AllScopes; 19369775a620SHiroshi Yamauchi findScopes(AllScopes); 19379775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(AllScopes, "All scopes")); 19389775a620SHiroshi Yamauchi 19399775a620SHiroshi Yamauchi // Split the scopes if 1) the conditiona values of the biased 19409775a620SHiroshi Yamauchi // branches/selects of the inner/lower scope can't be hoisted up to the 19419775a620SHiroshi Yamauchi // outermost/uppermost scope entry, or 2) the condition values of the biased 19429775a620SHiroshi Yamauchi // branches/selects in a scope (including subscopes) don't share at least 19439775a620SHiroshi Yamauchi // one common value. 19449775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SplitScopes; 19459775a620SHiroshi Yamauchi splitScopes(AllScopes, SplitScopes); 19469775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(SplitScopes, "Split scopes")); 19479775a620SHiroshi Yamauchi 19489775a620SHiroshi Yamauchi // After splitting, set the biased regions and selects of a scope (a tree 19499775a620SHiroshi Yamauchi // root) that include those of the subscopes. 19509775a620SHiroshi Yamauchi classifyBiasedScopes(SplitScopes); 19519775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Set per-scope bias " << SplitScopes.size() << "\n"); 19529775a620SHiroshi Yamauchi 19539775a620SHiroshi Yamauchi // Filter out the scopes that has only one biased region or select (CHR 19549775a620SHiroshi Yamauchi // isn't useful in such a case). 19559775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> FilteredScopes; 19569775a620SHiroshi Yamauchi filterScopes(SplitScopes, FilteredScopes); 19579775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(FilteredScopes, "Filtered scopes")); 19589775a620SHiroshi Yamauchi 19599775a620SHiroshi Yamauchi // Set the regions to be CHR'ed and their hoist stops for each scope. 19609775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SetScopes; 19619775a620SHiroshi Yamauchi setCHRRegions(FilteredScopes, SetScopes); 19629775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(SetScopes, "Set CHR regions")); 19639775a620SHiroshi Yamauchi 19649775a620SHiroshi Yamauchi // Sort CHRScopes by the depth so that outer CHRScopes comes before inner 19659775a620SHiroshi Yamauchi // ones. We need to apply CHR from outer to inner so that we apply CHR only 19669775a620SHiroshi Yamauchi // to the hot path, rather than both hot and cold paths. 19679775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SortedScopes; 19689775a620SHiroshi Yamauchi sortScopes(SetScopes, SortedScopes); 19699775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(SortedScopes, "Sorted scopes")); 19709775a620SHiroshi Yamauchi 19719775a620SHiroshi Yamauchi CHR_DEBUG( 19729775a620SHiroshi Yamauchi dbgs() << "RegionInfo:\n"; 19739775a620SHiroshi Yamauchi RI.print(dbgs())); 19749775a620SHiroshi Yamauchi 19759775a620SHiroshi Yamauchi // Apply the CHR transformation. 19769775a620SHiroshi Yamauchi if (!SortedScopes.empty()) { 19779775a620SHiroshi Yamauchi transformScopes(SortedScopes); 19789775a620SHiroshi Yamauchi Changed = true; 19799775a620SHiroshi Yamauchi } 19809775a620SHiroshi Yamauchi } 19819775a620SHiroshi Yamauchi 19829775a620SHiroshi Yamauchi if (Changed) 19839775a620SHiroshi Yamauchi CHR_DEBUG(dumpIR(F, "after", &Stats)); 19849775a620SHiroshi Yamauchi 19859775a620SHiroshi Yamauchi return Changed; 19869775a620SHiroshi Yamauchi } 19879775a620SHiroshi Yamauchi 19889775a620SHiroshi Yamauchi bool ControlHeightReductionLegacyPass::runOnFunction(Function &F) { 19899775a620SHiroshi Yamauchi BlockFrequencyInfo &BFI = 19909775a620SHiroshi Yamauchi getAnalysis<BlockFrequencyInfoWrapperPass>().getBFI(); 19919775a620SHiroshi Yamauchi DominatorTree &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree(); 19929775a620SHiroshi Yamauchi ProfileSummaryInfo &PSI = 19939775a620SHiroshi Yamauchi *getAnalysis<ProfileSummaryInfoWrapperPass>().getPSI(); 19949775a620SHiroshi Yamauchi RegionInfo &RI = getAnalysis<RegionInfoPass>().getRegionInfo(); 19959775a620SHiroshi Yamauchi return CHR(F, BFI, DT, PSI, RI).run(); 19969775a620SHiroshi Yamauchi } 19979775a620SHiroshi Yamauchi 19989775a620SHiroshi Yamauchi namespace llvm { 19999775a620SHiroshi Yamauchi 20009775a620SHiroshi Yamauchi ControlHeightReductionPass::ControlHeightReductionPass() { 20019775a620SHiroshi Yamauchi ParseCHRFilterFiles(); 20029775a620SHiroshi Yamauchi } 20039775a620SHiroshi Yamauchi 20049775a620SHiroshi Yamauchi PreservedAnalyses ControlHeightReductionPass::run( 20059775a620SHiroshi Yamauchi Function &F, 20069775a620SHiroshi Yamauchi FunctionAnalysisManager &FAM) { 20079775a620SHiroshi Yamauchi auto &BFI = FAM.getResult<BlockFrequencyAnalysis>(F); 20089775a620SHiroshi Yamauchi auto &DT = FAM.getResult<DominatorTreeAnalysis>(F); 20099775a620SHiroshi Yamauchi auto &MAMProxy = FAM.getResult<ModuleAnalysisManagerFunctionProxy>(F); 20109775a620SHiroshi Yamauchi auto &MAM = MAMProxy.getManager(); 20119775a620SHiroshi Yamauchi auto &PSI = *MAM.getCachedResult<ProfileSummaryAnalysis>(*F.getParent()); 20129775a620SHiroshi Yamauchi auto &RI = FAM.getResult<RegionInfoAnalysis>(F); 20139775a620SHiroshi Yamauchi bool Changed = CHR(F, BFI, DT, PSI, RI).run(); 20149775a620SHiroshi Yamauchi if (!Changed) 20159775a620SHiroshi Yamauchi return PreservedAnalyses::all(); 20169775a620SHiroshi Yamauchi auto PA = PreservedAnalyses(); 20179775a620SHiroshi Yamauchi PA.preserve<GlobalsAA>(); 20189775a620SHiroshi Yamauchi return PA; 20199775a620SHiroshi Yamauchi } 20209775a620SHiroshi Yamauchi 20219775a620SHiroshi Yamauchi } // namespace llvm 2022