19775a620SHiroshi Yamauchi //===-- ControlHeightReduction.cpp - Control Height Reduction -------------===// 29775a620SHiroshi Yamauchi // 32946cd70SChandler Carruth // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 42946cd70SChandler Carruth // See https://llvm.org/LICENSE.txt for license information. 52946cd70SChandler Carruth // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 69775a620SHiroshi Yamauchi // 79775a620SHiroshi Yamauchi //===----------------------------------------------------------------------===// 89775a620SHiroshi Yamauchi // 99775a620SHiroshi Yamauchi // This pass merges conditional blocks of code and reduces the number of 109775a620SHiroshi Yamauchi // conditional branches in the hot paths based on profiles. 119775a620SHiroshi Yamauchi // 129775a620SHiroshi Yamauchi //===----------------------------------------------------------------------===// 139775a620SHiroshi Yamauchi 149775a620SHiroshi Yamauchi #include "llvm/Transforms/Instrumentation/ControlHeightReduction.h" 159775a620SHiroshi Yamauchi #include "llvm/ADT/DenseMap.h" 169775a620SHiroshi Yamauchi #include "llvm/ADT/DenseSet.h" 179775a620SHiroshi Yamauchi #include "llvm/ADT/SmallVector.h" 189775a620SHiroshi Yamauchi #include "llvm/ADT/StringSet.h" 199775a620SHiroshi Yamauchi #include "llvm/Analysis/BlockFrequencyInfo.h" 209abad481SBenjamin Kramer #include "llvm/Analysis/GlobalsModRef.h" 21fd2c699dSHiroshi Yamauchi #include "llvm/Analysis/OptimizationRemarkEmitter.h" 229775a620SHiroshi Yamauchi #include "llvm/Analysis/ProfileSummaryInfo.h" 239775a620SHiroshi Yamauchi #include "llvm/Analysis/RegionInfo.h" 249775a620SHiroshi Yamauchi #include "llvm/Analysis/RegionIterator.h" 259775a620SHiroshi Yamauchi #include "llvm/Analysis/ValueTracking.h" 269775a620SHiroshi Yamauchi #include "llvm/IR/CFG.h" 279775a620SHiroshi Yamauchi #include "llvm/IR/Dominators.h" 289775a620SHiroshi Yamauchi #include "llvm/IR/IRBuilder.h" 299775a620SHiroshi Yamauchi #include "llvm/IR/MDBuilder.h" 309775a620SHiroshi Yamauchi #include "llvm/Support/BranchProbability.h" 319775a620SHiroshi Yamauchi #include "llvm/Support/MemoryBuffer.h" 329abad481SBenjamin Kramer #include "llvm/Transforms/Utils.h" 339abad481SBenjamin Kramer #include "llvm/Transforms/Utils/BasicBlockUtils.h" 349abad481SBenjamin Kramer #include "llvm/Transforms/Utils/Cloning.h" 359abad481SBenjamin Kramer #include "llvm/Transforms/Utils/ValueMapper.h" 369775a620SHiroshi Yamauchi 379775a620SHiroshi Yamauchi #include <set> 389775a620SHiroshi Yamauchi #include <sstream> 399775a620SHiroshi Yamauchi 409775a620SHiroshi Yamauchi using namespace llvm; 419775a620SHiroshi Yamauchi 429775a620SHiroshi Yamauchi #define DEBUG_TYPE "chr" 439775a620SHiroshi Yamauchi 449775a620SHiroshi Yamauchi #define CHR_DEBUG(X) LLVM_DEBUG(X) 459775a620SHiroshi Yamauchi 469775a620SHiroshi Yamauchi static cl::opt<bool> ForceCHR("force-chr", cl::init(false), cl::Hidden, 479775a620SHiroshi Yamauchi cl::desc("Apply CHR for all functions")); 489775a620SHiroshi Yamauchi 499775a620SHiroshi Yamauchi static cl::opt<double> CHRBiasThreshold( 509775a620SHiroshi Yamauchi "chr-bias-threshold", cl::init(0.99), cl::Hidden, 519775a620SHiroshi Yamauchi cl::desc("CHR considers a branch bias greater than this ratio as biased")); 529775a620SHiroshi Yamauchi 539775a620SHiroshi Yamauchi static cl::opt<unsigned> CHRMergeThreshold( 549775a620SHiroshi Yamauchi "chr-merge-threshold", cl::init(2), cl::Hidden, 559775a620SHiroshi Yamauchi cl::desc("CHR merges a group of N branches/selects where N >= this value")); 569775a620SHiroshi Yamauchi 579775a620SHiroshi Yamauchi static cl::opt<std::string> CHRModuleList( 589775a620SHiroshi Yamauchi "chr-module-list", cl::init(""), cl::Hidden, 599775a620SHiroshi Yamauchi cl::desc("Specify file to retrieve the list of modules to apply CHR to")); 609775a620SHiroshi Yamauchi 619775a620SHiroshi Yamauchi static cl::opt<std::string> CHRFunctionList( 629775a620SHiroshi Yamauchi "chr-function-list", cl::init(""), cl::Hidden, 639775a620SHiroshi Yamauchi cl::desc("Specify file to retrieve the list of functions to apply CHR to")); 649775a620SHiroshi Yamauchi 659775a620SHiroshi Yamauchi static StringSet<> CHRModules; 669775a620SHiroshi Yamauchi static StringSet<> CHRFunctions; 679775a620SHiroshi Yamauchi 68b3b61de0SFangrui Song static void parseCHRFilterFiles() { 699775a620SHiroshi Yamauchi if (!CHRModuleList.empty()) { 709775a620SHiroshi Yamauchi auto FileOrErr = MemoryBuffer::getFile(CHRModuleList); 719775a620SHiroshi Yamauchi if (!FileOrErr) { 729775a620SHiroshi Yamauchi errs() << "Error: Couldn't read the chr-module-list file " << CHRModuleList << "\n"; 739775a620SHiroshi Yamauchi std::exit(1); 749775a620SHiroshi Yamauchi } 759775a620SHiroshi Yamauchi StringRef Buf = FileOrErr->get()->getBuffer(); 769775a620SHiroshi Yamauchi SmallVector<StringRef, 0> Lines; 779775a620SHiroshi Yamauchi Buf.split(Lines, '\n'); 789775a620SHiroshi Yamauchi for (StringRef Line : Lines) { 799775a620SHiroshi Yamauchi Line = Line.trim(); 809775a620SHiroshi Yamauchi if (!Line.empty()) 819775a620SHiroshi Yamauchi CHRModules.insert(Line); 829775a620SHiroshi Yamauchi } 839775a620SHiroshi Yamauchi } 849775a620SHiroshi Yamauchi if (!CHRFunctionList.empty()) { 859775a620SHiroshi Yamauchi auto FileOrErr = MemoryBuffer::getFile(CHRFunctionList); 869775a620SHiroshi Yamauchi if (!FileOrErr) { 879775a620SHiroshi Yamauchi errs() << "Error: Couldn't read the chr-function-list file " << CHRFunctionList << "\n"; 889775a620SHiroshi Yamauchi std::exit(1); 899775a620SHiroshi Yamauchi } 909775a620SHiroshi Yamauchi StringRef Buf = FileOrErr->get()->getBuffer(); 919775a620SHiroshi Yamauchi SmallVector<StringRef, 0> Lines; 929775a620SHiroshi Yamauchi Buf.split(Lines, '\n'); 939775a620SHiroshi Yamauchi for (StringRef Line : Lines) { 949775a620SHiroshi Yamauchi Line = Line.trim(); 959775a620SHiroshi Yamauchi if (!Line.empty()) 969775a620SHiroshi Yamauchi CHRFunctions.insert(Line); 979775a620SHiroshi Yamauchi } 989775a620SHiroshi Yamauchi } 999775a620SHiroshi Yamauchi } 1009775a620SHiroshi Yamauchi 1019775a620SHiroshi Yamauchi namespace { 1029775a620SHiroshi Yamauchi class ControlHeightReductionLegacyPass : public FunctionPass { 1039775a620SHiroshi Yamauchi public: 1049775a620SHiroshi Yamauchi static char ID; 1059775a620SHiroshi Yamauchi 1069775a620SHiroshi Yamauchi ControlHeightReductionLegacyPass() : FunctionPass(ID) { 1079775a620SHiroshi Yamauchi initializeControlHeightReductionLegacyPassPass( 1089775a620SHiroshi Yamauchi *PassRegistry::getPassRegistry()); 109b3b61de0SFangrui Song parseCHRFilterFiles(); 1109775a620SHiroshi Yamauchi } 1119775a620SHiroshi Yamauchi 1129775a620SHiroshi Yamauchi bool runOnFunction(Function &F) override; 1139775a620SHiroshi Yamauchi void getAnalysisUsage(AnalysisUsage &AU) const override { 1149775a620SHiroshi Yamauchi AU.addRequired<BlockFrequencyInfoWrapperPass>(); 1159775a620SHiroshi Yamauchi AU.addRequired<DominatorTreeWrapperPass>(); 1169775a620SHiroshi Yamauchi AU.addRequired<ProfileSummaryInfoWrapperPass>(); 1179775a620SHiroshi Yamauchi AU.addRequired<RegionInfoPass>(); 1189775a620SHiroshi Yamauchi AU.addPreserved<GlobalsAAWrapperPass>(); 1199775a620SHiroshi Yamauchi } 1209775a620SHiroshi Yamauchi }; 1219775a620SHiroshi Yamauchi } // end anonymous namespace 1229775a620SHiroshi Yamauchi 1239775a620SHiroshi Yamauchi char ControlHeightReductionLegacyPass::ID = 0; 1249775a620SHiroshi Yamauchi 1259775a620SHiroshi Yamauchi INITIALIZE_PASS_BEGIN(ControlHeightReductionLegacyPass, 1269775a620SHiroshi Yamauchi "chr", 1279775a620SHiroshi Yamauchi "Reduce control height in the hot paths", 1289775a620SHiroshi Yamauchi false, false) 1299775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(BlockFrequencyInfoWrapperPass) 1309775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass) 1319775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(ProfileSummaryInfoWrapperPass) 1329775a620SHiroshi Yamauchi INITIALIZE_PASS_DEPENDENCY(RegionInfoPass) 1339775a620SHiroshi Yamauchi INITIALIZE_PASS_END(ControlHeightReductionLegacyPass, 1349775a620SHiroshi Yamauchi "chr", 1359775a620SHiroshi Yamauchi "Reduce control height in the hot paths", 1369775a620SHiroshi Yamauchi false, false) 1379775a620SHiroshi Yamauchi 1389775a620SHiroshi Yamauchi FunctionPass *llvm::createControlHeightReductionLegacyPass() { 1399775a620SHiroshi Yamauchi return new ControlHeightReductionLegacyPass(); 1409775a620SHiroshi Yamauchi } 1419775a620SHiroshi Yamauchi 1429775a620SHiroshi Yamauchi namespace { 1439775a620SHiroshi Yamauchi 1449775a620SHiroshi Yamauchi struct CHRStats { 1459775a620SHiroshi Yamauchi CHRStats() : NumBranches(0), NumBranchesDelta(0), 1469775a620SHiroshi Yamauchi WeightedNumBranchesDelta(0) {} 1479775a620SHiroshi Yamauchi void print(raw_ostream &OS) const { 1489775a620SHiroshi Yamauchi OS << "CHRStats: NumBranches " << NumBranches 1499775a620SHiroshi Yamauchi << " NumBranchesDelta " << NumBranchesDelta 1509775a620SHiroshi Yamauchi << " WeightedNumBranchesDelta " << WeightedNumBranchesDelta; 1519775a620SHiroshi Yamauchi } 1529775a620SHiroshi Yamauchi uint64_t NumBranches; // The original number of conditional branches / 1539775a620SHiroshi Yamauchi // selects 1549775a620SHiroshi Yamauchi uint64_t NumBranchesDelta; // The decrease of the number of conditional 1559775a620SHiroshi Yamauchi // branches / selects in the hot paths due to CHR. 1569775a620SHiroshi Yamauchi uint64_t WeightedNumBranchesDelta; // NumBranchesDelta weighted by the profile 1579775a620SHiroshi Yamauchi // count at the scope entry. 1589775a620SHiroshi Yamauchi }; 1599775a620SHiroshi Yamauchi 1609775a620SHiroshi Yamauchi // RegInfo - some properties of a Region. 1619775a620SHiroshi Yamauchi struct RegInfo { 1629775a620SHiroshi Yamauchi RegInfo() : R(nullptr), HasBranch(false) {} 1639775a620SHiroshi Yamauchi RegInfo(Region *RegionIn) : R(RegionIn), HasBranch(false) {} 1649775a620SHiroshi Yamauchi Region *R; 1659775a620SHiroshi Yamauchi bool HasBranch; 1669775a620SHiroshi Yamauchi SmallVector<SelectInst *, 8> Selects; 1679775a620SHiroshi Yamauchi }; 1689775a620SHiroshi Yamauchi 1699775a620SHiroshi Yamauchi typedef DenseMap<Region *, DenseSet<Instruction *>> HoistStopMapTy; 1709775a620SHiroshi Yamauchi 1719775a620SHiroshi Yamauchi // CHRScope - a sequence of regions to CHR together. It corresponds to a 1729775a620SHiroshi Yamauchi // sequence of conditional blocks. It can have subscopes which correspond to 1739775a620SHiroshi Yamauchi // nested conditional blocks. Nested CHRScopes form a tree. 1749775a620SHiroshi Yamauchi class CHRScope { 1759775a620SHiroshi Yamauchi public: 1769775a620SHiroshi Yamauchi CHRScope(RegInfo RI) : BranchInsertPoint(nullptr) { 1779775a620SHiroshi Yamauchi assert(RI.R && "Null RegionIn"); 1789775a620SHiroshi Yamauchi RegInfos.push_back(RI); 1799775a620SHiroshi Yamauchi } 1809775a620SHiroshi Yamauchi 1819775a620SHiroshi Yamauchi Region *getParentRegion() { 1829775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 1839775a620SHiroshi Yamauchi Region *Parent = RegInfos[0].R->getParent(); 1849775a620SHiroshi Yamauchi assert(Parent && "Unexpected to call this on the top-level region"); 1859775a620SHiroshi Yamauchi return Parent; 1869775a620SHiroshi Yamauchi } 1879775a620SHiroshi Yamauchi 1889775a620SHiroshi Yamauchi BasicBlock *getEntryBlock() { 1899775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 1909775a620SHiroshi Yamauchi return RegInfos.front().R->getEntry(); 1919775a620SHiroshi Yamauchi } 1929775a620SHiroshi Yamauchi 1939775a620SHiroshi Yamauchi BasicBlock *getExitBlock() { 1949775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 1959775a620SHiroshi Yamauchi return RegInfos.back().R->getExit(); 1969775a620SHiroshi Yamauchi } 1979775a620SHiroshi Yamauchi 1989775a620SHiroshi Yamauchi bool appendable(CHRScope *Next) { 1999775a620SHiroshi Yamauchi // The next scope is appendable only if this scope is directly connected to 2009775a620SHiroshi Yamauchi // it (which implies it post-dominates this scope) and this scope dominates 2019775a620SHiroshi Yamauchi // it (no edge to the next scope outside this scope). 2029775a620SHiroshi Yamauchi BasicBlock *NextEntry = Next->getEntryBlock(); 2039775a620SHiroshi Yamauchi if (getExitBlock() != NextEntry) 2049775a620SHiroshi Yamauchi // Not directly connected. 2059775a620SHiroshi Yamauchi return false; 2069775a620SHiroshi Yamauchi Region *LastRegion = RegInfos.back().R; 2079775a620SHiroshi Yamauchi for (BasicBlock *Pred : predecessors(NextEntry)) 2089775a620SHiroshi Yamauchi if (!LastRegion->contains(Pred)) 2099775a620SHiroshi Yamauchi // There's an edge going into the entry of the next scope from outside 2109775a620SHiroshi Yamauchi // of this scope. 2119775a620SHiroshi Yamauchi return false; 2129775a620SHiroshi Yamauchi return true; 2139775a620SHiroshi Yamauchi } 2149775a620SHiroshi Yamauchi 2159775a620SHiroshi Yamauchi void append(CHRScope *Next) { 2169775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 2179775a620SHiroshi Yamauchi assert(Next->RegInfos.size() > 0 && "Empty CHRScope"); 2189775a620SHiroshi Yamauchi assert(getParentRegion() == Next->getParentRegion() && 2199775a620SHiroshi Yamauchi "Must be siblings"); 2209775a620SHiroshi Yamauchi assert(getExitBlock() == Next->getEntryBlock() && 2219775a620SHiroshi Yamauchi "Must be adjacent"); 2229775a620SHiroshi Yamauchi for (RegInfo &RI : Next->RegInfos) 2239775a620SHiroshi Yamauchi RegInfos.push_back(RI); 2249775a620SHiroshi Yamauchi for (CHRScope *Sub : Next->Subs) 2259775a620SHiroshi Yamauchi Subs.push_back(Sub); 2269775a620SHiroshi Yamauchi } 2279775a620SHiroshi Yamauchi 2289775a620SHiroshi Yamauchi void addSub(CHRScope *SubIn) { 2299775a620SHiroshi Yamauchi #ifndef NDEBUG 230b3b61de0SFangrui Song bool IsChild = false; 2319775a620SHiroshi Yamauchi for (RegInfo &RI : RegInfos) 2329775a620SHiroshi Yamauchi if (RI.R == SubIn->getParentRegion()) { 233b3b61de0SFangrui Song IsChild = true; 2349775a620SHiroshi Yamauchi break; 2359775a620SHiroshi Yamauchi } 236b3b61de0SFangrui Song assert(IsChild && "Must be a child"); 2379775a620SHiroshi Yamauchi #endif 2389775a620SHiroshi Yamauchi Subs.push_back(SubIn); 2399775a620SHiroshi Yamauchi } 2409775a620SHiroshi Yamauchi 2419775a620SHiroshi Yamauchi // Split this scope at the boundary region into two, which will belong to the 2429775a620SHiroshi Yamauchi // tail and returns the tail. 2439775a620SHiroshi Yamauchi CHRScope *split(Region *Boundary) { 2449775a620SHiroshi Yamauchi assert(Boundary && "Boundary null"); 2459775a620SHiroshi Yamauchi assert(RegInfos.begin()->R != Boundary && 2469775a620SHiroshi Yamauchi "Can't be split at beginning"); 2479775a620SHiroshi Yamauchi auto BoundaryIt = std::find_if(RegInfos.begin(), RegInfos.end(), 2489775a620SHiroshi Yamauchi [&Boundary](const RegInfo& RI) { 2499775a620SHiroshi Yamauchi return Boundary == RI.R; 2509775a620SHiroshi Yamauchi }); 2519775a620SHiroshi Yamauchi if (BoundaryIt == RegInfos.end()) 2529775a620SHiroshi Yamauchi return nullptr; 2539775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> TailRegInfos; 2549775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> TailSubs; 2559775a620SHiroshi Yamauchi TailRegInfos.insert(TailRegInfos.begin(), BoundaryIt, RegInfos.end()); 2569775a620SHiroshi Yamauchi RegInfos.resize(BoundaryIt - RegInfos.begin()); 2579775a620SHiroshi Yamauchi DenseSet<Region *> TailRegionSet; 2589775a620SHiroshi Yamauchi for (RegInfo &RI : TailRegInfos) 2599775a620SHiroshi Yamauchi TailRegionSet.insert(RI.R); 2609775a620SHiroshi Yamauchi for (auto It = Subs.begin(); It != Subs.end(); ) { 2619775a620SHiroshi Yamauchi CHRScope *Sub = *It; 2629775a620SHiroshi Yamauchi assert(Sub && "null Sub"); 2639775a620SHiroshi Yamauchi Region *Parent = Sub->getParentRegion(); 2649775a620SHiroshi Yamauchi if (TailRegionSet.count(Parent)) { 2659775a620SHiroshi Yamauchi TailSubs.push_back(Sub); 2669775a620SHiroshi Yamauchi It = Subs.erase(It); 2679775a620SHiroshi Yamauchi } else { 2689775a620SHiroshi Yamauchi assert(std::find_if(RegInfos.begin(), RegInfos.end(), 2699775a620SHiroshi Yamauchi [&Parent](const RegInfo& RI) { 2709775a620SHiroshi Yamauchi return Parent == RI.R; 2719775a620SHiroshi Yamauchi }) != RegInfos.end() && 2729775a620SHiroshi Yamauchi "Must be in head"); 2739775a620SHiroshi Yamauchi ++It; 2749775a620SHiroshi Yamauchi } 2759775a620SHiroshi Yamauchi } 2769775a620SHiroshi Yamauchi assert(HoistStopMap.empty() && "MapHoistStops must be empty"); 2779775a620SHiroshi Yamauchi return new CHRScope(TailRegInfos, TailSubs); 2789775a620SHiroshi Yamauchi } 2799775a620SHiroshi Yamauchi 2809775a620SHiroshi Yamauchi bool contains(Instruction *I) const { 2819775a620SHiroshi Yamauchi BasicBlock *Parent = I->getParent(); 2829775a620SHiroshi Yamauchi for (const RegInfo &RI : RegInfos) 2839775a620SHiroshi Yamauchi if (RI.R->contains(Parent)) 2849775a620SHiroshi Yamauchi return true; 2859775a620SHiroshi Yamauchi return false; 2869775a620SHiroshi Yamauchi } 2879775a620SHiroshi Yamauchi 2889775a620SHiroshi Yamauchi void print(raw_ostream &OS) const; 2899775a620SHiroshi Yamauchi 2909775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> RegInfos; // Regions that belong to this scope 2919775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Subs; // Subscopes. 2929775a620SHiroshi Yamauchi 2939775a620SHiroshi Yamauchi // The instruction at which to insert the CHR conditional branch (and hoist 2949775a620SHiroshi Yamauchi // the dependent condition values). 2959775a620SHiroshi Yamauchi Instruction *BranchInsertPoint; 2969775a620SHiroshi Yamauchi 2979775a620SHiroshi Yamauchi // True-biased and false-biased regions (conditional blocks), 2989775a620SHiroshi Yamauchi // respectively. Used only for the outermost scope and includes regions in 2999775a620SHiroshi Yamauchi // subscopes. The rest are unbiased. 3009775a620SHiroshi Yamauchi DenseSet<Region *> TrueBiasedRegions; 3019775a620SHiroshi Yamauchi DenseSet<Region *> FalseBiasedRegions; 3029775a620SHiroshi Yamauchi // Among the biased regions, the regions that get CHRed. 3039775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> CHRRegions; 3049775a620SHiroshi Yamauchi 3059775a620SHiroshi Yamauchi // True-biased and false-biased selects, respectively. Used only for the 3069775a620SHiroshi Yamauchi // outermost scope and includes ones in subscopes. 3079775a620SHiroshi Yamauchi DenseSet<SelectInst *> TrueBiasedSelects; 3089775a620SHiroshi Yamauchi DenseSet<SelectInst *> FalseBiasedSelects; 3099775a620SHiroshi Yamauchi 3109775a620SHiroshi Yamauchi // Map from one of the above regions to the instructions to stop 3119775a620SHiroshi Yamauchi // hoisting instructions at through use-def chains. 3129775a620SHiroshi Yamauchi HoistStopMapTy HoistStopMap; 3139775a620SHiroshi Yamauchi 3149775a620SHiroshi Yamauchi private: 3159775a620SHiroshi Yamauchi CHRScope(SmallVector<RegInfo, 8> &RegInfosIn, 3169775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> &SubsIn) 3179775a620SHiroshi Yamauchi : RegInfos(RegInfosIn), Subs(SubsIn), BranchInsertPoint(nullptr) {} 3189775a620SHiroshi Yamauchi }; 3199775a620SHiroshi Yamauchi 3209775a620SHiroshi Yamauchi class CHR { 3219775a620SHiroshi Yamauchi public: 3229775a620SHiroshi Yamauchi CHR(Function &Fin, BlockFrequencyInfo &BFIin, DominatorTree &DTin, 323fd2c699dSHiroshi Yamauchi ProfileSummaryInfo &PSIin, RegionInfo &RIin, 324fd2c699dSHiroshi Yamauchi OptimizationRemarkEmitter &OREin) 325fd2c699dSHiroshi Yamauchi : F(Fin), BFI(BFIin), DT(DTin), PSI(PSIin), RI(RIin), ORE(OREin) {} 3269775a620SHiroshi Yamauchi 3279775a620SHiroshi Yamauchi ~CHR() { 3289775a620SHiroshi Yamauchi for (CHRScope *Scope : Scopes) { 3299775a620SHiroshi Yamauchi delete Scope; 3309775a620SHiroshi Yamauchi } 3319775a620SHiroshi Yamauchi } 3329775a620SHiroshi Yamauchi 3339775a620SHiroshi Yamauchi bool run(); 3349775a620SHiroshi Yamauchi 3359775a620SHiroshi Yamauchi private: 3369775a620SHiroshi Yamauchi // See the comments in CHR::run() for the high level flow of the algorithm and 3379775a620SHiroshi Yamauchi // what the following functions do. 3389775a620SHiroshi Yamauchi 3399775a620SHiroshi Yamauchi void findScopes(SmallVectorImpl<CHRScope *> &Output) { 3409775a620SHiroshi Yamauchi Region *R = RI.getTopLevelRegion(); 3419775a620SHiroshi Yamauchi CHRScope *Scope = findScopes(R, nullptr, nullptr, Output); 3429775a620SHiroshi Yamauchi if (Scope) { 3439775a620SHiroshi Yamauchi Output.push_back(Scope); 3449775a620SHiroshi Yamauchi } 3459775a620SHiroshi Yamauchi } 3469775a620SHiroshi Yamauchi CHRScope *findScopes(Region *R, Region *NextRegion, Region *ParentRegion, 3479775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Scopes); 3489775a620SHiroshi Yamauchi CHRScope *findScope(Region *R); 3499775a620SHiroshi Yamauchi void checkScopeHoistable(CHRScope *Scope); 3509775a620SHiroshi Yamauchi 3519775a620SHiroshi Yamauchi void splitScopes(SmallVectorImpl<CHRScope *> &Input, 3529775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3539775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> splitScope(CHRScope *Scope, 3549775a620SHiroshi Yamauchi CHRScope *Outer, 3559775a620SHiroshi Yamauchi DenseSet<Value *> *OuterConditionValues, 3569775a620SHiroshi Yamauchi Instruction *OuterInsertPoint, 3579775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output, 3589775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables); 3599775a620SHiroshi Yamauchi 3609775a620SHiroshi Yamauchi void classifyBiasedScopes(SmallVectorImpl<CHRScope *> &Scopes); 3619775a620SHiroshi Yamauchi void classifyBiasedScopes(CHRScope *Scope, CHRScope *OutermostScope); 3629775a620SHiroshi Yamauchi 3639775a620SHiroshi Yamauchi void filterScopes(SmallVectorImpl<CHRScope *> &Input, 3649775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3659775a620SHiroshi Yamauchi 3669775a620SHiroshi Yamauchi void setCHRRegions(SmallVectorImpl<CHRScope *> &Input, 3679775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3689775a620SHiroshi Yamauchi void setCHRRegions(CHRScope *Scope, CHRScope *OutermostScope); 3699775a620SHiroshi Yamauchi 3709775a620SHiroshi Yamauchi void sortScopes(SmallVectorImpl<CHRScope *> &Input, 3719775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output); 3729775a620SHiroshi Yamauchi 3739775a620SHiroshi Yamauchi void transformScopes(SmallVectorImpl<CHRScope *> &CHRScopes); 3749775a620SHiroshi Yamauchi void transformScopes(CHRScope *Scope, DenseSet<PHINode *> &TrivialPHIs); 3759775a620SHiroshi Yamauchi void cloneScopeBlocks(CHRScope *Scope, 3769775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 3779775a620SHiroshi Yamauchi BasicBlock *ExitBlock, 3789775a620SHiroshi Yamauchi Region *LastRegion, 3799775a620SHiroshi Yamauchi ValueToValueMapTy &VMap); 3809775a620SHiroshi Yamauchi BranchInst *createMergedBranch(BasicBlock *PreEntryBlock, 3819775a620SHiroshi Yamauchi BasicBlock *EntryBlock, 3829775a620SHiroshi Yamauchi BasicBlock *NewEntryBlock, 3839775a620SHiroshi Yamauchi ValueToValueMapTy &VMap); 3849775a620SHiroshi Yamauchi void fixupBranchesAndSelects(CHRScope *Scope, 3859775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 3869775a620SHiroshi Yamauchi BranchInst *MergedBR, 3879775a620SHiroshi Yamauchi uint64_t ProfileCount); 3889775a620SHiroshi Yamauchi void fixupBranch(Region *R, 3899775a620SHiroshi Yamauchi CHRScope *Scope, 3909775a620SHiroshi Yamauchi IRBuilder<> &IRB, 3919775a620SHiroshi Yamauchi Value *&MergedCondition, BranchProbability &CHRBranchBias); 3929775a620SHiroshi Yamauchi void fixupSelect(SelectInst* SI, 3939775a620SHiroshi Yamauchi CHRScope *Scope, 3949775a620SHiroshi Yamauchi IRBuilder<> &IRB, 3959775a620SHiroshi Yamauchi Value *&MergedCondition, BranchProbability &CHRBranchBias); 3969775a620SHiroshi Yamauchi void addToMergedCondition(bool IsTrueBiased, Value *Cond, 3979775a620SHiroshi Yamauchi Instruction *BranchOrSelect, 3989775a620SHiroshi Yamauchi CHRScope *Scope, 3999775a620SHiroshi Yamauchi IRBuilder<> &IRB, 4009775a620SHiroshi Yamauchi Value *&MergedCondition); 4019775a620SHiroshi Yamauchi 4029775a620SHiroshi Yamauchi Function &F; 4039775a620SHiroshi Yamauchi BlockFrequencyInfo &BFI; 4049775a620SHiroshi Yamauchi DominatorTree &DT; 4059775a620SHiroshi Yamauchi ProfileSummaryInfo &PSI; 4069775a620SHiroshi Yamauchi RegionInfo &RI; 407fd2c699dSHiroshi Yamauchi OptimizationRemarkEmitter &ORE; 4089775a620SHiroshi Yamauchi CHRStats Stats; 4099775a620SHiroshi Yamauchi 4109775a620SHiroshi Yamauchi // All the true-biased regions in the function 4119775a620SHiroshi Yamauchi DenseSet<Region *> TrueBiasedRegionsGlobal; 4129775a620SHiroshi Yamauchi // All the false-biased regions in the function 4139775a620SHiroshi Yamauchi DenseSet<Region *> FalseBiasedRegionsGlobal; 4149775a620SHiroshi Yamauchi // All the true-biased selects in the function 4159775a620SHiroshi Yamauchi DenseSet<SelectInst *> TrueBiasedSelectsGlobal; 4169775a620SHiroshi Yamauchi // All the false-biased selects in the function 4179775a620SHiroshi Yamauchi DenseSet<SelectInst *> FalseBiasedSelectsGlobal; 4189775a620SHiroshi Yamauchi // A map from biased regions to their branch bias 4199775a620SHiroshi Yamauchi DenseMap<Region *, BranchProbability> BranchBiasMap; 4209775a620SHiroshi Yamauchi // A map from biased selects to their branch bias 4219775a620SHiroshi Yamauchi DenseMap<SelectInst *, BranchProbability> SelectBiasMap; 4229775a620SHiroshi Yamauchi // All the scopes. 4239775a620SHiroshi Yamauchi DenseSet<CHRScope *> Scopes; 4249775a620SHiroshi Yamauchi }; 4259775a620SHiroshi Yamauchi 4269775a620SHiroshi Yamauchi } // end anonymous namespace 4279775a620SHiroshi Yamauchi 4285fb509b7SHiroshi Yamauchi static inline 4295fb509b7SHiroshi Yamauchi raw_ostream LLVM_ATTRIBUTE_UNUSED &operator<<(raw_ostream &OS, 4305fb509b7SHiroshi Yamauchi const CHRStats &Stats) { 4315fb509b7SHiroshi Yamauchi Stats.print(OS); 4325fb509b7SHiroshi Yamauchi return OS; 4335fb509b7SHiroshi Yamauchi } 4345fb509b7SHiroshi Yamauchi 4355fb509b7SHiroshi Yamauchi static inline 4365fb509b7SHiroshi Yamauchi raw_ostream &operator<<(raw_ostream &OS, const CHRScope &Scope) { 4375fb509b7SHiroshi Yamauchi Scope.print(OS); 4385fb509b7SHiroshi Yamauchi return OS; 4395fb509b7SHiroshi Yamauchi } 4405fb509b7SHiroshi Yamauchi 4419775a620SHiroshi Yamauchi static bool shouldApply(Function &F, ProfileSummaryInfo& PSI) { 4429775a620SHiroshi Yamauchi if (ForceCHR) 4439775a620SHiroshi Yamauchi return true; 4449775a620SHiroshi Yamauchi 4459775a620SHiroshi Yamauchi if (!CHRModuleList.empty() || !CHRFunctionList.empty()) { 4469775a620SHiroshi Yamauchi if (CHRModules.count(F.getParent()->getName())) 4479775a620SHiroshi Yamauchi return true; 4485fb509b7SHiroshi Yamauchi return CHRFunctions.count(F.getName()); 4499775a620SHiroshi Yamauchi } 4509775a620SHiroshi Yamauchi 4519775a620SHiroshi Yamauchi assert(PSI.hasProfileSummary() && "Empty PSI?"); 4529775a620SHiroshi Yamauchi return PSI.isFunctionEntryHot(&F); 4539775a620SHiroshi Yamauchi } 4549775a620SHiroshi Yamauchi 455c8f348cbSFangrui Song static void LLVM_ATTRIBUTE_UNUSED dumpIR(Function &F, const char *Label, 456c8f348cbSFangrui Song CHRStats *Stats) { 4575fb509b7SHiroshi Yamauchi StringRef FuncName = F.getName(); 4585fb509b7SHiroshi Yamauchi StringRef ModuleName = F.getParent()->getName(); 45906650941SHiroshi Yamauchi (void)(FuncName); // Unused in release build. 46006650941SHiroshi Yamauchi (void)(ModuleName); // Unused in release build. 4619775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "CHR IR dump " << Label << " " << ModuleName << " " 4625fb509b7SHiroshi Yamauchi << FuncName); 4639775a620SHiroshi Yamauchi if (Stats) 4649775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << " " << *Stats); 4659775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "\n"); 4669775a620SHiroshi Yamauchi CHR_DEBUG(F.dump()); 4679775a620SHiroshi Yamauchi } 4689775a620SHiroshi Yamauchi 4699775a620SHiroshi Yamauchi void CHRScope::print(raw_ostream &OS) const { 4709775a620SHiroshi Yamauchi assert(RegInfos.size() > 0 && "Empty CHRScope"); 4719775a620SHiroshi Yamauchi OS << "CHRScope["; 4729775a620SHiroshi Yamauchi OS << RegInfos.size() << ", Regions["; 4739775a620SHiroshi Yamauchi for (const RegInfo &RI : RegInfos) { 4749775a620SHiroshi Yamauchi OS << RI.R->getNameStr(); 4759775a620SHiroshi Yamauchi if (RI.HasBranch) 4769775a620SHiroshi Yamauchi OS << " B"; 4779775a620SHiroshi Yamauchi if (RI.Selects.size() > 0) 4789775a620SHiroshi Yamauchi OS << " S" << RI.Selects.size(); 4799775a620SHiroshi Yamauchi OS << ", "; 4809775a620SHiroshi Yamauchi } 4819775a620SHiroshi Yamauchi if (RegInfos[0].R->getParent()) { 4829775a620SHiroshi Yamauchi OS << "], Parent " << RegInfos[0].R->getParent()->getNameStr(); 4839775a620SHiroshi Yamauchi } else { 4849775a620SHiroshi Yamauchi // top level region 4859775a620SHiroshi Yamauchi OS << "]"; 4869775a620SHiroshi Yamauchi } 4879775a620SHiroshi Yamauchi OS << ", Subs["; 4889775a620SHiroshi Yamauchi for (CHRScope *Sub : Subs) { 4899775a620SHiroshi Yamauchi OS << *Sub << ", "; 4909775a620SHiroshi Yamauchi } 4919775a620SHiroshi Yamauchi OS << "]]"; 4929775a620SHiroshi Yamauchi } 4939775a620SHiroshi Yamauchi 4949775a620SHiroshi Yamauchi // Return true if the given instruction type can be hoisted by CHR. 4959775a620SHiroshi Yamauchi static bool isHoistableInstructionType(Instruction *I) { 4969775a620SHiroshi Yamauchi return isa<BinaryOperator>(I) || isa<CastInst>(I) || isa<SelectInst>(I) || 4979775a620SHiroshi Yamauchi isa<GetElementPtrInst>(I) || isa<CmpInst>(I) || 4989775a620SHiroshi Yamauchi isa<InsertElementInst>(I) || isa<ExtractElementInst>(I) || 4999775a620SHiroshi Yamauchi isa<ShuffleVectorInst>(I) || isa<ExtractValueInst>(I) || 5009775a620SHiroshi Yamauchi isa<InsertValueInst>(I); 5019775a620SHiroshi Yamauchi } 5029775a620SHiroshi Yamauchi 5039775a620SHiroshi Yamauchi // Return true if the given instruction can be hoisted by CHR. 5049775a620SHiroshi Yamauchi static bool isHoistable(Instruction *I, DominatorTree &DT) { 5059775a620SHiroshi Yamauchi if (!isHoistableInstructionType(I)) 5069775a620SHiroshi Yamauchi return false; 5079775a620SHiroshi Yamauchi return isSafeToSpeculativelyExecute(I, nullptr, &DT); 5089775a620SHiroshi Yamauchi } 5099775a620SHiroshi Yamauchi 5109775a620SHiroshi Yamauchi // Recursively traverse the use-def chains of the given value and return a set 5119775a620SHiroshi Yamauchi // of the unhoistable base values defined within the scope (excluding the 5129775a620SHiroshi Yamauchi // first-region entry block) or the (hoistable or unhoistable) base values that 5139775a620SHiroshi Yamauchi // are defined outside (including the first-region entry block) of the 5149775a620SHiroshi Yamauchi // scope. The returned set doesn't include constants. 5159775a620SHiroshi Yamauchi static std::set<Value *> getBaseValues(Value *V, 5169775a620SHiroshi Yamauchi DominatorTree &DT) { 5179775a620SHiroshi Yamauchi std::set<Value *> Result; 5189775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 5199775a620SHiroshi Yamauchi // We don't stop at a block that's not in the Scope because we would miss some 5209775a620SHiroshi Yamauchi // instructions that are based on the same base values if we stop there. 5219775a620SHiroshi Yamauchi if (!isHoistable(I, DT)) { 5229775a620SHiroshi Yamauchi Result.insert(I); 5239775a620SHiroshi Yamauchi return Result; 5249775a620SHiroshi Yamauchi } 5259775a620SHiroshi Yamauchi // I is hoistable above the Scope. 5269775a620SHiroshi Yamauchi for (Value *Op : I->operands()) { 5279775a620SHiroshi Yamauchi std::set<Value *> OpResult = getBaseValues(Op, DT); 5289775a620SHiroshi Yamauchi Result.insert(OpResult.begin(), OpResult.end()); 5299775a620SHiroshi Yamauchi } 5309775a620SHiroshi Yamauchi return Result; 5319775a620SHiroshi Yamauchi } 5329775a620SHiroshi Yamauchi if (isa<Argument>(V)) { 5339775a620SHiroshi Yamauchi Result.insert(V); 5349775a620SHiroshi Yamauchi return Result; 5359775a620SHiroshi Yamauchi } 5369775a620SHiroshi Yamauchi // We don't include others like constants because those won't lead to any 5379775a620SHiroshi Yamauchi // chance of folding of conditions (eg two bit checks merged into one check) 5389775a620SHiroshi Yamauchi // after CHR. 5399775a620SHiroshi Yamauchi return Result; // empty 5409775a620SHiroshi Yamauchi } 5419775a620SHiroshi Yamauchi 5429775a620SHiroshi Yamauchi // Return true if V is already hoisted or can be hoisted (along with its 5439775a620SHiroshi Yamauchi // operands) above the insert point. When it returns true and HoistStops is 5449775a620SHiroshi Yamauchi // non-null, the instructions to stop hoisting at through the use-def chains are 5459775a620SHiroshi Yamauchi // inserted into HoistStops. 5469775a620SHiroshi Yamauchi static bool 5479775a620SHiroshi Yamauchi checkHoistValue(Value *V, Instruction *InsertPoint, DominatorTree &DT, 5489775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables, 549dfeb7974SHiroshi Yamauchi DenseSet<Instruction *> *HoistStops, 550dfeb7974SHiroshi Yamauchi DenseMap<Instruction *, bool> &Visited) { 5519775a620SHiroshi Yamauchi assert(InsertPoint && "Null InsertPoint"); 5529775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 553dfeb7974SHiroshi Yamauchi if (Visited.count(I)) { 554dfeb7974SHiroshi Yamauchi return Visited[I]; 555dfeb7974SHiroshi Yamauchi } 5569775a620SHiroshi Yamauchi assert(DT.getNode(I->getParent()) && "DT must contain I's parent block"); 5579775a620SHiroshi Yamauchi assert(DT.getNode(InsertPoint->getParent()) && "DT must contain Destination"); 5589775a620SHiroshi Yamauchi if (Unhoistables.count(I)) { 5599775a620SHiroshi Yamauchi // Don't hoist if they are not to be hoisted. 560dfeb7974SHiroshi Yamauchi Visited[I] = false; 5619775a620SHiroshi Yamauchi return false; 5629775a620SHiroshi Yamauchi } 5639775a620SHiroshi Yamauchi if (DT.dominates(I, InsertPoint)) { 5649775a620SHiroshi Yamauchi // We are already above the insert point. Stop here. 5659775a620SHiroshi Yamauchi if (HoistStops) 5669775a620SHiroshi Yamauchi HoistStops->insert(I); 567dfeb7974SHiroshi Yamauchi Visited[I] = true; 5689775a620SHiroshi Yamauchi return true; 5699775a620SHiroshi Yamauchi } 5709775a620SHiroshi Yamauchi // We aren't not above the insert point, check if we can hoist it above the 5719775a620SHiroshi Yamauchi // insert point. 5729775a620SHiroshi Yamauchi if (isHoistable(I, DT)) { 5739775a620SHiroshi Yamauchi // Check operands first. 5749775a620SHiroshi Yamauchi DenseSet<Instruction *> OpsHoistStops; 5759775a620SHiroshi Yamauchi bool AllOpsHoisted = true; 5769775a620SHiroshi Yamauchi for (Value *Op : I->operands()) { 577dfeb7974SHiroshi Yamauchi if (!checkHoistValue(Op, InsertPoint, DT, Unhoistables, &OpsHoistStops, 578dfeb7974SHiroshi Yamauchi Visited)) { 5799775a620SHiroshi Yamauchi AllOpsHoisted = false; 5809775a620SHiroshi Yamauchi break; 5819775a620SHiroshi Yamauchi } 5829775a620SHiroshi Yamauchi } 5839775a620SHiroshi Yamauchi if (AllOpsHoisted) { 5849775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "checkHoistValue " << *I << "\n"); 5859775a620SHiroshi Yamauchi if (HoistStops) 5869775a620SHiroshi Yamauchi HoistStops->insert(OpsHoistStops.begin(), OpsHoistStops.end()); 587dfeb7974SHiroshi Yamauchi Visited[I] = true; 5889775a620SHiroshi Yamauchi return true; 5899775a620SHiroshi Yamauchi } 5909775a620SHiroshi Yamauchi } 591dfeb7974SHiroshi Yamauchi Visited[I] = false; 5929775a620SHiroshi Yamauchi return false; 5939775a620SHiroshi Yamauchi } 5949775a620SHiroshi Yamauchi // Non-instructions are considered hoistable. 5959775a620SHiroshi Yamauchi return true; 5969775a620SHiroshi Yamauchi } 5979775a620SHiroshi Yamauchi 5989775a620SHiroshi Yamauchi // Returns true and sets the true probability and false probability of an 5999775a620SHiroshi Yamauchi // MD_prof metadata if it's well-formed. 600b3b61de0SFangrui Song static bool checkMDProf(MDNode *MD, BranchProbability &TrueProb, 6019775a620SHiroshi Yamauchi BranchProbability &FalseProb) { 6029775a620SHiroshi Yamauchi if (!MD) return false; 6039775a620SHiroshi Yamauchi MDString *MDName = cast<MDString>(MD->getOperand(0)); 6049775a620SHiroshi Yamauchi if (MDName->getString() != "branch_weights" || 6059775a620SHiroshi Yamauchi MD->getNumOperands() != 3) 6069775a620SHiroshi Yamauchi return false; 6079775a620SHiroshi Yamauchi ConstantInt *TrueWeight = mdconst::extract<ConstantInt>(MD->getOperand(1)); 6089775a620SHiroshi Yamauchi ConstantInt *FalseWeight = mdconst::extract<ConstantInt>(MD->getOperand(2)); 6099775a620SHiroshi Yamauchi if (!TrueWeight || !FalseWeight) 6109775a620SHiroshi Yamauchi return false; 61147c2bc58SRichard Trieu uint64_t TrueWt = TrueWeight->getValue().getZExtValue(); 61247c2bc58SRichard Trieu uint64_t FalseWt = FalseWeight->getValue().getZExtValue(); 61347c2bc58SRichard Trieu uint64_t SumWt = TrueWt + FalseWt; 61447c2bc58SRichard Trieu 61547c2bc58SRichard Trieu assert(SumWt >= TrueWt && SumWt >= FalseWt && 61647c2bc58SRichard Trieu "Overflow calculating branch probabilities."); 61747c2bc58SRichard Trieu 61847c2bc58SRichard Trieu TrueProb = BranchProbability::getBranchProbability(TrueWt, SumWt); 61947c2bc58SRichard Trieu FalseProb = BranchProbability::getBranchProbability(FalseWt, SumWt); 6209775a620SHiroshi Yamauchi return true; 6219775a620SHiroshi Yamauchi } 6229775a620SHiroshi Yamauchi 6239775a620SHiroshi Yamauchi static BranchProbability getCHRBiasThreshold() { 6249775a620SHiroshi Yamauchi return BranchProbability::getBranchProbability( 6259775a620SHiroshi Yamauchi static_cast<uint64_t>(CHRBiasThreshold * 1000000), 1000000); 6269775a620SHiroshi Yamauchi } 6279775a620SHiroshi Yamauchi 6289775a620SHiroshi Yamauchi // A helper for CheckBiasedBranch and CheckBiasedSelect. If TrueProb >= 6299775a620SHiroshi Yamauchi // CHRBiasThreshold, put Key into TrueSet and return true. If FalseProb >= 6309775a620SHiroshi Yamauchi // CHRBiasThreshold, put Key into FalseSet and return true. Otherwise, return 6319775a620SHiroshi Yamauchi // false. 6329775a620SHiroshi Yamauchi template <typename K, typename S, typename M> 633c55e9975SBenjamin Kramer static bool checkBias(K *Key, BranchProbability TrueProb, 634c55e9975SBenjamin Kramer BranchProbability FalseProb, S &TrueSet, S &FalseSet, 635c55e9975SBenjamin Kramer M &BiasMap) { 6369775a620SHiroshi Yamauchi BranchProbability Threshold = getCHRBiasThreshold(); 6379775a620SHiroshi Yamauchi if (TrueProb >= Threshold) { 6389775a620SHiroshi Yamauchi TrueSet.insert(Key); 6399775a620SHiroshi Yamauchi BiasMap[Key] = TrueProb; 6409775a620SHiroshi Yamauchi return true; 6419775a620SHiroshi Yamauchi } else if (FalseProb >= Threshold) { 6429775a620SHiroshi Yamauchi FalseSet.insert(Key); 6439775a620SHiroshi Yamauchi BiasMap[Key] = FalseProb; 6449775a620SHiroshi Yamauchi return true; 6459775a620SHiroshi Yamauchi } 6469775a620SHiroshi Yamauchi return false; 6479775a620SHiroshi Yamauchi } 6489775a620SHiroshi Yamauchi 6499775a620SHiroshi Yamauchi // Returns true and insert a region into the right biased set and the map if the 6509775a620SHiroshi Yamauchi // branch of the region is biased. 651b3b61de0SFangrui Song static bool checkBiasedBranch(BranchInst *BI, Region *R, 6529775a620SHiroshi Yamauchi DenseSet<Region *> &TrueBiasedRegionsGlobal, 6539775a620SHiroshi Yamauchi DenseSet<Region *> &FalseBiasedRegionsGlobal, 6549775a620SHiroshi Yamauchi DenseMap<Region *, BranchProbability> &BranchBiasMap) { 6559775a620SHiroshi Yamauchi if (!BI->isConditional()) 6569775a620SHiroshi Yamauchi return false; 6579775a620SHiroshi Yamauchi BranchProbability ThenProb, ElseProb; 658b3b61de0SFangrui Song if (!checkMDProf(BI->getMetadata(LLVMContext::MD_prof), 6599775a620SHiroshi Yamauchi ThenProb, ElseProb)) 6609775a620SHiroshi Yamauchi return false; 6619775a620SHiroshi Yamauchi BasicBlock *IfThen = BI->getSuccessor(0); 6629775a620SHiroshi Yamauchi BasicBlock *IfElse = BI->getSuccessor(1); 6639775a620SHiroshi Yamauchi assert((IfThen == R->getExit() || IfElse == R->getExit()) && 6649775a620SHiroshi Yamauchi IfThen != IfElse && 6659775a620SHiroshi Yamauchi "Invariant from findScopes"); 6669775a620SHiroshi Yamauchi if (IfThen == R->getExit()) { 6679775a620SHiroshi Yamauchi // Swap them so that IfThen/ThenProb means going into the conditional code 6689775a620SHiroshi Yamauchi // and IfElse/ElseProb means skipping it. 6699775a620SHiroshi Yamauchi std::swap(IfThen, IfElse); 6709775a620SHiroshi Yamauchi std::swap(ThenProb, ElseProb); 6719775a620SHiroshi Yamauchi } 6729775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI " << *BI << " "); 6739775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "ThenProb " << ThenProb << " "); 6749775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "ElseProb " << ElseProb << "\n"); 675b3b61de0SFangrui Song return checkBias(R, ThenProb, ElseProb, 6769775a620SHiroshi Yamauchi TrueBiasedRegionsGlobal, FalseBiasedRegionsGlobal, 6779775a620SHiroshi Yamauchi BranchBiasMap); 6789775a620SHiroshi Yamauchi } 6799775a620SHiroshi Yamauchi 6809775a620SHiroshi Yamauchi // Returns true and insert a select into the right biased set and the map if the 6819775a620SHiroshi Yamauchi // select is biased. 682b3b61de0SFangrui Song static bool checkBiasedSelect( 6839775a620SHiroshi Yamauchi SelectInst *SI, Region *R, 6849775a620SHiroshi Yamauchi DenseSet<SelectInst *> &TrueBiasedSelectsGlobal, 6859775a620SHiroshi Yamauchi DenseSet<SelectInst *> &FalseBiasedSelectsGlobal, 6869775a620SHiroshi Yamauchi DenseMap<SelectInst *, BranchProbability> &SelectBiasMap) { 6879775a620SHiroshi Yamauchi BranchProbability TrueProb, FalseProb; 688b3b61de0SFangrui Song if (!checkMDProf(SI->getMetadata(LLVMContext::MD_prof), 6899775a620SHiroshi Yamauchi TrueProb, FalseProb)) 6909775a620SHiroshi Yamauchi return false; 6919775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "SI " << *SI << " "); 6929775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "TrueProb " << TrueProb << " "); 6939775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "FalseProb " << FalseProb << "\n"); 694b3b61de0SFangrui Song return checkBias(SI, TrueProb, FalseProb, 6959775a620SHiroshi Yamauchi TrueBiasedSelectsGlobal, FalseBiasedSelectsGlobal, 6969775a620SHiroshi Yamauchi SelectBiasMap); 6979775a620SHiroshi Yamauchi } 6989775a620SHiroshi Yamauchi 6999775a620SHiroshi Yamauchi // Returns the instruction at which to hoist the dependent condition values and 7009775a620SHiroshi Yamauchi // insert the CHR branch for a region. This is the terminator branch in the 7019775a620SHiroshi Yamauchi // entry block or the first select in the entry block, if any. 7029775a620SHiroshi Yamauchi static Instruction* getBranchInsertPoint(RegInfo &RI) { 7039775a620SHiroshi Yamauchi Region *R = RI.R; 7049775a620SHiroshi Yamauchi BasicBlock *EntryBB = R->getEntry(); 7059775a620SHiroshi Yamauchi // The hoist point is by default the terminator of the entry block, which is 7069775a620SHiroshi Yamauchi // the same as the branch instruction if RI.HasBranch is true. 7079775a620SHiroshi Yamauchi Instruction *HoistPoint = EntryBB->getTerminator(); 7089775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 7099775a620SHiroshi Yamauchi if (SI->getParent() == EntryBB) { 7109775a620SHiroshi Yamauchi // Pick the first select in Selects in the entry block. Note Selects is 7119775a620SHiroshi Yamauchi // sorted in the instruction order within a block (asserted below). 7129775a620SHiroshi Yamauchi HoistPoint = SI; 7139775a620SHiroshi Yamauchi break; 7149775a620SHiroshi Yamauchi } 7159775a620SHiroshi Yamauchi } 7169775a620SHiroshi Yamauchi assert(HoistPoint && "Null HoistPoint"); 7179775a620SHiroshi Yamauchi #ifndef NDEBUG 7189775a620SHiroshi Yamauchi // Check that HoistPoint is the first one in Selects in the entry block, 7199775a620SHiroshi Yamauchi // if any. 7209775a620SHiroshi Yamauchi DenseSet<Instruction *> EntryBlockSelectSet; 7219775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 7229775a620SHiroshi Yamauchi if (SI->getParent() == EntryBB) { 7239775a620SHiroshi Yamauchi EntryBlockSelectSet.insert(SI); 7249775a620SHiroshi Yamauchi } 7259775a620SHiroshi Yamauchi } 7269775a620SHiroshi Yamauchi for (Instruction &I : *EntryBB) { 7279775a620SHiroshi Yamauchi if (EntryBlockSelectSet.count(&I) > 0) { 7289775a620SHiroshi Yamauchi assert(&I == HoistPoint && 7299775a620SHiroshi Yamauchi "HoistPoint must be the first one in Selects"); 7309775a620SHiroshi Yamauchi break; 7319775a620SHiroshi Yamauchi } 7329775a620SHiroshi Yamauchi } 7339775a620SHiroshi Yamauchi #endif 7349775a620SHiroshi Yamauchi return HoistPoint; 7359775a620SHiroshi Yamauchi } 7369775a620SHiroshi Yamauchi 7379775a620SHiroshi Yamauchi // Find a CHR scope in the given region. 7389775a620SHiroshi Yamauchi CHRScope * CHR::findScope(Region *R) { 7399775a620SHiroshi Yamauchi CHRScope *Result = nullptr; 7409775a620SHiroshi Yamauchi BasicBlock *Entry = R->getEntry(); 7419775a620SHiroshi Yamauchi BasicBlock *Exit = R->getExit(); // null if top level. 7429775a620SHiroshi Yamauchi assert(Entry && "Entry must not be null"); 7439775a620SHiroshi Yamauchi assert((Exit == nullptr) == (R->isTopLevelRegion()) && 7449775a620SHiroshi Yamauchi "Only top level region has a null exit"); 7459775a620SHiroshi Yamauchi if (Entry) 7469775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Entry " << Entry->getName() << "\n"); 7479775a620SHiroshi Yamauchi else 7489775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Entry null\n"); 7499775a620SHiroshi Yamauchi if (Exit) 7509775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Exit " << Exit->getName() << "\n"); 7519775a620SHiroshi Yamauchi else 7529775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Exit null\n"); 7539775a620SHiroshi Yamauchi // Exclude cases where Entry is part of a subregion (hence it doesn't belong 7549775a620SHiroshi Yamauchi // to this region). 7559775a620SHiroshi Yamauchi bool EntryInSubregion = RI.getRegionFor(Entry) != R; 7569775a620SHiroshi Yamauchi if (EntryInSubregion) 7579775a620SHiroshi Yamauchi return nullptr; 7589775a620SHiroshi Yamauchi // Exclude loops 7599775a620SHiroshi Yamauchi for (BasicBlock *Pred : predecessors(Entry)) 7609775a620SHiroshi Yamauchi if (R->contains(Pred)) 7619775a620SHiroshi Yamauchi return nullptr; 7629775a620SHiroshi Yamauchi if (Exit) { 7639775a620SHiroshi Yamauchi // Try to find an if-then block (check if R is an if-then). 7649775a620SHiroshi Yamauchi // if (cond) { 7659775a620SHiroshi Yamauchi // ... 7669775a620SHiroshi Yamauchi // } 7679775a620SHiroshi Yamauchi auto *BI = dyn_cast<BranchInst>(Entry->getTerminator()); 7689775a620SHiroshi Yamauchi if (BI) 7699775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI.isConditional " << BI->isConditional() << "\n"); 7709775a620SHiroshi Yamauchi else 7719775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI null\n"); 7729775a620SHiroshi Yamauchi if (BI && BI->isConditional()) { 7739775a620SHiroshi Yamauchi BasicBlock *S0 = BI->getSuccessor(0); 7749775a620SHiroshi Yamauchi BasicBlock *S1 = BI->getSuccessor(1); 7759775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "S0 " << S0->getName() << "\n"); 7769775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "S1 " << S1->getName() << "\n"); 7779775a620SHiroshi Yamauchi if (S0 != S1 && (S0 == Exit || S1 == Exit)) { 7789775a620SHiroshi Yamauchi RegInfo RI(R); 779b3b61de0SFangrui Song RI.HasBranch = checkBiasedBranch( 7809775a620SHiroshi Yamauchi BI, R, TrueBiasedRegionsGlobal, FalseBiasedRegionsGlobal, 7819775a620SHiroshi Yamauchi BranchBiasMap); 7829775a620SHiroshi Yamauchi Result = new CHRScope(RI); 7839775a620SHiroshi Yamauchi Scopes.insert(Result); 7849775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Found a region with a branch\n"); 7859775a620SHiroshi Yamauchi ++Stats.NumBranches; 786fd2c699dSHiroshi Yamauchi if (!RI.HasBranch) { 787fd2c699dSHiroshi Yamauchi ORE.emit([&]() { 788fd2c699dSHiroshi Yamauchi return OptimizationRemarkMissed(DEBUG_TYPE, "BranchNotBiased", BI) 789fd2c699dSHiroshi Yamauchi << "Branch not biased"; 790fd2c699dSHiroshi Yamauchi }); 791fd2c699dSHiroshi Yamauchi } 7929775a620SHiroshi Yamauchi } 7939775a620SHiroshi Yamauchi } 7949775a620SHiroshi Yamauchi } 7959775a620SHiroshi Yamauchi { 7969775a620SHiroshi Yamauchi // Try to look for selects in the direct child blocks (as opposed to in 7979775a620SHiroshi Yamauchi // subregions) of R. 7989775a620SHiroshi Yamauchi // ... 7999775a620SHiroshi Yamauchi // if (..) { // Some subregion 8009775a620SHiroshi Yamauchi // ... 8019775a620SHiroshi Yamauchi // } 8029775a620SHiroshi Yamauchi // if (..) { // Some subregion 8039775a620SHiroshi Yamauchi // ... 8049775a620SHiroshi Yamauchi // } 8059775a620SHiroshi Yamauchi // ... 8069775a620SHiroshi Yamauchi // a = cond ? b : c; 8079775a620SHiroshi Yamauchi // ... 8089775a620SHiroshi Yamauchi SmallVector<SelectInst *, 8> Selects; 8099775a620SHiroshi Yamauchi for (RegionNode *E : R->elements()) { 8109775a620SHiroshi Yamauchi if (E->isSubRegion()) 8119775a620SHiroshi Yamauchi continue; 8129775a620SHiroshi Yamauchi // This returns the basic block of E if E is a direct child of R (not a 8139775a620SHiroshi Yamauchi // subregion.) 8149775a620SHiroshi Yamauchi BasicBlock *BB = E->getEntry(); 8159775a620SHiroshi Yamauchi // Need to push in the order to make it easier to find the first Select 8169775a620SHiroshi Yamauchi // later. 8179775a620SHiroshi Yamauchi for (Instruction &I : *BB) { 8189775a620SHiroshi Yamauchi if (auto *SI = dyn_cast<SelectInst>(&I)) { 8199775a620SHiroshi Yamauchi Selects.push_back(SI); 8209775a620SHiroshi Yamauchi ++Stats.NumBranches; 8219775a620SHiroshi Yamauchi } 8229775a620SHiroshi Yamauchi } 8239775a620SHiroshi Yamauchi } 8249775a620SHiroshi Yamauchi if (Selects.size() > 0) { 8259775a620SHiroshi Yamauchi auto AddSelects = [&](RegInfo &RI) { 8269775a620SHiroshi Yamauchi for (auto *SI : Selects) 827b3b61de0SFangrui Song if (checkBiasedSelect(SI, RI.R, 8289775a620SHiroshi Yamauchi TrueBiasedSelectsGlobal, 8299775a620SHiroshi Yamauchi FalseBiasedSelectsGlobal, 8309775a620SHiroshi Yamauchi SelectBiasMap)) 8319775a620SHiroshi Yamauchi RI.Selects.push_back(SI); 832fd2c699dSHiroshi Yamauchi else 833fd2c699dSHiroshi Yamauchi ORE.emit([&]() { 834fd2c699dSHiroshi Yamauchi return OptimizationRemarkMissed(DEBUG_TYPE, "SelectNotBiased", SI) 835fd2c699dSHiroshi Yamauchi << "Select not biased"; 836fd2c699dSHiroshi Yamauchi }); 8379775a620SHiroshi Yamauchi }; 8389775a620SHiroshi Yamauchi if (!Result) { 8399775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Found a select-only region\n"); 8409775a620SHiroshi Yamauchi RegInfo RI(R); 8419775a620SHiroshi Yamauchi AddSelects(RI); 8429775a620SHiroshi Yamauchi Result = new CHRScope(RI); 8439775a620SHiroshi Yamauchi Scopes.insert(Result); 8449775a620SHiroshi Yamauchi } else { 8459775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Found select(s) in a region with a branch\n"); 8469775a620SHiroshi Yamauchi AddSelects(Result->RegInfos[0]); 8479775a620SHiroshi Yamauchi } 8489775a620SHiroshi Yamauchi } 8499775a620SHiroshi Yamauchi } 8509775a620SHiroshi Yamauchi 8519775a620SHiroshi Yamauchi if (Result) { 8529775a620SHiroshi Yamauchi checkScopeHoistable(Result); 8539775a620SHiroshi Yamauchi } 8549775a620SHiroshi Yamauchi return Result; 8559775a620SHiroshi Yamauchi } 8569775a620SHiroshi Yamauchi 8579775a620SHiroshi Yamauchi // Check that any of the branch and the selects in the region could be 8589775a620SHiroshi Yamauchi // hoisted above the the CHR branch insert point (the most dominating of 8599775a620SHiroshi Yamauchi // them, either the branch (at the end of the first block) or the first 8609775a620SHiroshi Yamauchi // select in the first block). If the branch can't be hoisted, drop the 8619775a620SHiroshi Yamauchi // selects in the first blocks. 8629775a620SHiroshi Yamauchi // 8639775a620SHiroshi Yamauchi // For example, for the following scope/region with selects, we want to insert 8649775a620SHiroshi Yamauchi // the merged branch right before the first select in the first/entry block by 8659775a620SHiroshi Yamauchi // hoisting c1, c2, c3, and c4. 8669775a620SHiroshi Yamauchi // 8679775a620SHiroshi Yamauchi // // Branch insert point here. 8689775a620SHiroshi Yamauchi // a = c1 ? b : c; // Select 1 8699775a620SHiroshi Yamauchi // d = c2 ? e : f; // Select 2 8709775a620SHiroshi Yamauchi // if (c3) { // Branch 8719775a620SHiroshi Yamauchi // ... 8729775a620SHiroshi Yamauchi // c4 = foo() // A call. 8739775a620SHiroshi Yamauchi // g = c4 ? h : i; // Select 3 8749775a620SHiroshi Yamauchi // } 8759775a620SHiroshi Yamauchi // 8769775a620SHiroshi Yamauchi // But suppose we can't hoist c4 because it's dependent on the preceding 8779775a620SHiroshi Yamauchi // call. Then, we drop Select 3. Furthermore, if we can't hoist c2, we also drop 8789775a620SHiroshi Yamauchi // Select 2. If we can't hoist c3, we drop Selects 1 & 2. 8799775a620SHiroshi Yamauchi void CHR::checkScopeHoistable(CHRScope *Scope) { 8809775a620SHiroshi Yamauchi RegInfo &RI = Scope->RegInfos[0]; 8819775a620SHiroshi Yamauchi Region *R = RI.R; 8829775a620SHiroshi Yamauchi BasicBlock *EntryBB = R->getEntry(); 8839775a620SHiroshi Yamauchi auto *Branch = RI.HasBranch ? 8849775a620SHiroshi Yamauchi cast<BranchInst>(EntryBB->getTerminator()) : nullptr; 8859775a620SHiroshi Yamauchi SmallVector<SelectInst *, 8> &Selects = RI.Selects; 8869775a620SHiroshi Yamauchi if (RI.HasBranch || !Selects.empty()) { 8879775a620SHiroshi Yamauchi Instruction *InsertPoint = getBranchInsertPoint(RI); 8889775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "InsertPoint " << *InsertPoint << "\n"); 8899775a620SHiroshi Yamauchi // Avoid a data dependence from a select or a branch to a(nother) 8909775a620SHiroshi Yamauchi // select. Note no instruction can't data-depend on a branch (a branch 8919775a620SHiroshi Yamauchi // instruction doesn't produce a value). 8929775a620SHiroshi Yamauchi DenseSet<Instruction *> Unhoistables; 8939775a620SHiroshi Yamauchi // Initialize Unhoistables with the selects. 8949775a620SHiroshi Yamauchi for (SelectInst *SI : Selects) { 8959775a620SHiroshi Yamauchi Unhoistables.insert(SI); 8969775a620SHiroshi Yamauchi } 8979775a620SHiroshi Yamauchi // Remove Selects that can't be hoisted. 8989775a620SHiroshi Yamauchi for (auto it = Selects.begin(); it != Selects.end(); ) { 8999775a620SHiroshi Yamauchi SelectInst *SI = *it; 9009775a620SHiroshi Yamauchi if (SI == InsertPoint) { 9019775a620SHiroshi Yamauchi ++it; 9029775a620SHiroshi Yamauchi continue; 9039775a620SHiroshi Yamauchi } 904dfeb7974SHiroshi Yamauchi DenseMap<Instruction *, bool> Visited; 9059775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(SI->getCondition(), InsertPoint, 906dfeb7974SHiroshi Yamauchi DT, Unhoistables, nullptr, Visited); 9079775a620SHiroshi Yamauchi if (!IsHoistable) { 9089775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Dropping select " << *SI << "\n"); 909fd2c699dSHiroshi Yamauchi ORE.emit([&]() { 910fd2c699dSHiroshi Yamauchi return OptimizationRemarkMissed(DEBUG_TYPE, 911fd2c699dSHiroshi Yamauchi "DropUnhoistableSelect", SI) 912fd2c699dSHiroshi Yamauchi << "Dropped unhoistable select"; 913fd2c699dSHiroshi Yamauchi }); 9149775a620SHiroshi Yamauchi it = Selects.erase(it); 9159775a620SHiroshi Yamauchi // Since we are dropping the select here, we also drop it from 9169775a620SHiroshi Yamauchi // Unhoistables. 9179775a620SHiroshi Yamauchi Unhoistables.erase(SI); 9189775a620SHiroshi Yamauchi } else 9199775a620SHiroshi Yamauchi ++it; 9209775a620SHiroshi Yamauchi } 9219775a620SHiroshi Yamauchi // Update InsertPoint after potentially removing selects. 9229775a620SHiroshi Yamauchi InsertPoint = getBranchInsertPoint(RI); 9239775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "InsertPoint " << *InsertPoint << "\n"); 9249775a620SHiroshi Yamauchi if (RI.HasBranch && InsertPoint != Branch) { 925dfeb7974SHiroshi Yamauchi DenseMap<Instruction *, bool> Visited; 9269775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(Branch->getCondition(), InsertPoint, 927dfeb7974SHiroshi Yamauchi DT, Unhoistables, nullptr, Visited); 9289775a620SHiroshi Yamauchi if (!IsHoistable) { 9299775a620SHiroshi Yamauchi // If the branch isn't hoistable, drop the selects in the entry 9309775a620SHiroshi Yamauchi // block, preferring the branch, which makes the branch the hoist 9319775a620SHiroshi Yamauchi // point. 9329775a620SHiroshi Yamauchi assert(InsertPoint != Branch && "Branch must not be the hoist point"); 9339775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Dropping selects in entry block \n"); 9349775a620SHiroshi Yamauchi CHR_DEBUG( 9359775a620SHiroshi Yamauchi for (SelectInst *SI : Selects) { 9369775a620SHiroshi Yamauchi dbgs() << "SI " << *SI << "\n"; 9379775a620SHiroshi Yamauchi }); 938fd2c699dSHiroshi Yamauchi for (SelectInst *SI : Selects) { 939fd2c699dSHiroshi Yamauchi ORE.emit([&]() { 940fd2c699dSHiroshi Yamauchi return OptimizationRemarkMissed(DEBUG_TYPE, 941fd2c699dSHiroshi Yamauchi "DropSelectUnhoistableBranch", SI) 942fd2c699dSHiroshi Yamauchi << "Dropped select due to unhoistable branch"; 943fd2c699dSHiroshi Yamauchi }); 944fd2c699dSHiroshi Yamauchi } 9459775a620SHiroshi Yamauchi Selects.erase(std::remove_if(Selects.begin(), Selects.end(), 9469775a620SHiroshi Yamauchi [EntryBB](SelectInst *SI) { 9479775a620SHiroshi Yamauchi return SI->getParent() == EntryBB; 9489775a620SHiroshi Yamauchi }), Selects.end()); 9499775a620SHiroshi Yamauchi Unhoistables.clear(); 9509775a620SHiroshi Yamauchi InsertPoint = Branch; 9519775a620SHiroshi Yamauchi } 9529775a620SHiroshi Yamauchi } 9539775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "InsertPoint " << *InsertPoint << "\n"); 9549775a620SHiroshi Yamauchi #ifndef NDEBUG 9559775a620SHiroshi Yamauchi if (RI.HasBranch) { 9569775a620SHiroshi Yamauchi assert(!DT.dominates(Branch, InsertPoint) && 9579775a620SHiroshi Yamauchi "Branch can't be already above the hoist point"); 958dfeb7974SHiroshi Yamauchi DenseMap<Instruction *, bool> Visited; 9599775a620SHiroshi Yamauchi assert(checkHoistValue(Branch->getCondition(), InsertPoint, 960dfeb7974SHiroshi Yamauchi DT, Unhoistables, nullptr, Visited) && 9619775a620SHiroshi Yamauchi "checkHoistValue for branch"); 9629775a620SHiroshi Yamauchi } 9639775a620SHiroshi Yamauchi for (auto *SI : Selects) { 9649775a620SHiroshi Yamauchi assert(!DT.dominates(SI, InsertPoint) && 9659775a620SHiroshi Yamauchi "SI can't be already above the hoist point"); 966dfeb7974SHiroshi Yamauchi DenseMap<Instruction *, bool> Visited; 9679775a620SHiroshi Yamauchi assert(checkHoistValue(SI->getCondition(), InsertPoint, DT, 968dfeb7974SHiroshi Yamauchi Unhoistables, nullptr, Visited) && 9699775a620SHiroshi Yamauchi "checkHoistValue for selects"); 9709775a620SHiroshi Yamauchi } 9719775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Result\n"); 9729775a620SHiroshi Yamauchi if (RI.HasBranch) { 9739775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BI " << *Branch << "\n"); 9749775a620SHiroshi Yamauchi } 9759775a620SHiroshi Yamauchi for (auto *SI : Selects) { 9769775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "SI " << *SI << "\n"); 9779775a620SHiroshi Yamauchi } 9789775a620SHiroshi Yamauchi #endif 9799775a620SHiroshi Yamauchi } 9809775a620SHiroshi Yamauchi } 9819775a620SHiroshi Yamauchi 9829775a620SHiroshi Yamauchi // Traverse the region tree, find all nested scopes and merge them if possible. 9839775a620SHiroshi Yamauchi CHRScope * CHR::findScopes(Region *R, Region *NextRegion, Region *ParentRegion, 9849775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Scopes) { 9859775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "findScopes " << R->getNameStr() << "\n"); 9869775a620SHiroshi Yamauchi CHRScope *Result = findScope(R); 9879775a620SHiroshi Yamauchi // Visit subscopes. 9889775a620SHiroshi Yamauchi CHRScope *ConsecutiveSubscope = nullptr; 9899775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Subscopes; 9909775a620SHiroshi Yamauchi for (auto It = R->begin(); It != R->end(); ++It) { 9919775a620SHiroshi Yamauchi const std::unique_ptr<Region> &SubR = *It; 992b3b61de0SFangrui Song auto NextIt = std::next(It); 993b3b61de0SFangrui Song Region *NextSubR = NextIt != R->end() ? NextIt->get() : nullptr; 9949775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Looking at subregion " << SubR.get()->getNameStr() 9959775a620SHiroshi Yamauchi << "\n"); 9969775a620SHiroshi Yamauchi CHRScope *SubCHRScope = findScopes(SubR.get(), NextSubR, R, Scopes); 9979775a620SHiroshi Yamauchi if (SubCHRScope) { 9989775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Subregion Scope " << *SubCHRScope << "\n"); 9999775a620SHiroshi Yamauchi } else { 10009775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Subregion Scope null\n"); 10019775a620SHiroshi Yamauchi } 10029775a620SHiroshi Yamauchi if (SubCHRScope) { 10039775a620SHiroshi Yamauchi if (!ConsecutiveSubscope) 10049775a620SHiroshi Yamauchi ConsecutiveSubscope = SubCHRScope; 10059775a620SHiroshi Yamauchi else if (!ConsecutiveSubscope->appendable(SubCHRScope)) { 10069775a620SHiroshi Yamauchi Subscopes.push_back(ConsecutiveSubscope); 10079775a620SHiroshi Yamauchi ConsecutiveSubscope = SubCHRScope; 10089775a620SHiroshi Yamauchi } else 10099775a620SHiroshi Yamauchi ConsecutiveSubscope->append(SubCHRScope); 10109775a620SHiroshi Yamauchi } else { 10119775a620SHiroshi Yamauchi if (ConsecutiveSubscope) { 10129775a620SHiroshi Yamauchi Subscopes.push_back(ConsecutiveSubscope); 10139775a620SHiroshi Yamauchi } 10149775a620SHiroshi Yamauchi ConsecutiveSubscope = nullptr; 10159775a620SHiroshi Yamauchi } 10169775a620SHiroshi Yamauchi } 10179775a620SHiroshi Yamauchi if (ConsecutiveSubscope) { 10189775a620SHiroshi Yamauchi Subscopes.push_back(ConsecutiveSubscope); 10199775a620SHiroshi Yamauchi } 10209775a620SHiroshi Yamauchi for (CHRScope *Sub : Subscopes) { 10219775a620SHiroshi Yamauchi if (Result) { 10229775a620SHiroshi Yamauchi // Combine it with the parent. 10239775a620SHiroshi Yamauchi Result->addSub(Sub); 10249775a620SHiroshi Yamauchi } else { 10259775a620SHiroshi Yamauchi // Push Subscopes as they won't be combined with the parent. 10269775a620SHiroshi Yamauchi Scopes.push_back(Sub); 10279775a620SHiroshi Yamauchi } 10289775a620SHiroshi Yamauchi } 10299775a620SHiroshi Yamauchi return Result; 10309775a620SHiroshi Yamauchi } 10319775a620SHiroshi Yamauchi 10329775a620SHiroshi Yamauchi static DenseSet<Value *> getCHRConditionValuesForRegion(RegInfo &RI) { 10339775a620SHiroshi Yamauchi DenseSet<Value *> ConditionValues; 10349775a620SHiroshi Yamauchi if (RI.HasBranch) { 10359775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(RI.R->getEntry()->getTerminator()); 10369775a620SHiroshi Yamauchi ConditionValues.insert(BI->getCondition()); 10379775a620SHiroshi Yamauchi } 10389775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 10399775a620SHiroshi Yamauchi ConditionValues.insert(SI->getCondition()); 10409775a620SHiroshi Yamauchi } 10419775a620SHiroshi Yamauchi return ConditionValues; 10429775a620SHiroshi Yamauchi } 10439775a620SHiroshi Yamauchi 10449775a620SHiroshi Yamauchi 10459775a620SHiroshi Yamauchi // Determine whether to split a scope depending on the sets of the branch 10469775a620SHiroshi Yamauchi // condition values of the previous region and the current region. We split 10479775a620SHiroshi Yamauchi // (return true) it if 1) the condition values of the inner/lower scope can't be 10489775a620SHiroshi Yamauchi // hoisted up to the outer/upper scope, or 2) the two sets of the condition 10499775a620SHiroshi Yamauchi // values have an empty intersection (because the combined branch conditions 10509775a620SHiroshi Yamauchi // won't probably lead to a simpler combined condition). 10519775a620SHiroshi Yamauchi static bool shouldSplit(Instruction *InsertPoint, 10529775a620SHiroshi Yamauchi DenseSet<Value *> &PrevConditionValues, 10539775a620SHiroshi Yamauchi DenseSet<Value *> &ConditionValues, 10549775a620SHiroshi Yamauchi DominatorTree &DT, 10559775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables) { 10569775a620SHiroshi Yamauchi CHR_DEBUG( 10579775a620SHiroshi Yamauchi dbgs() << "shouldSplit " << *InsertPoint << " PrevConditionValues "; 10589775a620SHiroshi Yamauchi for (Value *V : PrevConditionValues) { 10599775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10609775a620SHiroshi Yamauchi } 10619775a620SHiroshi Yamauchi dbgs() << " ConditionValues "; 10629775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 10639775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10649775a620SHiroshi Yamauchi } 10659775a620SHiroshi Yamauchi dbgs() << "\n"); 10669775a620SHiroshi Yamauchi assert(InsertPoint && "Null InsertPoint"); 10679775a620SHiroshi Yamauchi // If any of Bases isn't hoistable to the hoist point, split. 10689775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 1069dfeb7974SHiroshi Yamauchi DenseMap<Instruction *, bool> Visited; 1070dfeb7974SHiroshi Yamauchi if (!checkHoistValue(V, InsertPoint, DT, Unhoistables, nullptr, Visited)) { 10719775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Split. checkHoistValue false " << *V << "\n"); 10729775a620SHiroshi Yamauchi return true; // Not hoistable, split. 10739775a620SHiroshi Yamauchi } 10749775a620SHiroshi Yamauchi } 10759775a620SHiroshi Yamauchi // If PrevConditionValues or ConditionValues is empty, don't split to avoid 10769775a620SHiroshi Yamauchi // unnecessary splits at scopes with no branch/selects. If 10779775a620SHiroshi Yamauchi // PrevConditionValues and ConditionValues don't intersect at all, split. 10789775a620SHiroshi Yamauchi if (!PrevConditionValues.empty() && !ConditionValues.empty()) { 10799775a620SHiroshi Yamauchi // Use std::set as DenseSet doesn't work with set_intersection. 10809775a620SHiroshi Yamauchi std::set<Value *> PrevBases, Bases; 10819775a620SHiroshi Yamauchi for (Value *V : PrevConditionValues) { 10829775a620SHiroshi Yamauchi std::set<Value *> BaseValues = getBaseValues(V, DT); 10839775a620SHiroshi Yamauchi PrevBases.insert(BaseValues.begin(), BaseValues.end()); 10849775a620SHiroshi Yamauchi } 10859775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 10869775a620SHiroshi Yamauchi std::set<Value *> BaseValues = getBaseValues(V, DT); 10879775a620SHiroshi Yamauchi Bases.insert(BaseValues.begin(), BaseValues.end()); 10889775a620SHiroshi Yamauchi } 10899775a620SHiroshi Yamauchi CHR_DEBUG( 10909775a620SHiroshi Yamauchi dbgs() << "PrevBases "; 10919775a620SHiroshi Yamauchi for (Value *V : PrevBases) { 10929775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10939775a620SHiroshi Yamauchi } 10949775a620SHiroshi Yamauchi dbgs() << " Bases "; 10959775a620SHiroshi Yamauchi for (Value *V : Bases) { 10969775a620SHiroshi Yamauchi dbgs() << *V << ", "; 10979775a620SHiroshi Yamauchi } 10989775a620SHiroshi Yamauchi dbgs() << "\n"); 10999775a620SHiroshi Yamauchi std::set<Value *> Intersection; 11009775a620SHiroshi Yamauchi std::set_intersection(PrevBases.begin(), PrevBases.end(), 11019775a620SHiroshi Yamauchi Bases.begin(), Bases.end(), 11029775a620SHiroshi Yamauchi std::inserter(Intersection, Intersection.begin())); 11039775a620SHiroshi Yamauchi if (Intersection.empty()) { 11049775a620SHiroshi Yamauchi // Empty intersection, split. 11059775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Split. Intersection empty\n"); 11069775a620SHiroshi Yamauchi return true; 11079775a620SHiroshi Yamauchi } 11089775a620SHiroshi Yamauchi } 11099775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "No split\n"); 11109775a620SHiroshi Yamauchi return false; // Don't split. 11119775a620SHiroshi Yamauchi } 11129775a620SHiroshi Yamauchi 1113b3b61de0SFangrui Song static void getSelectsInScope(CHRScope *Scope, 11149775a620SHiroshi Yamauchi DenseSet<Instruction *> &Output) { 1115b3b61de0SFangrui Song for (RegInfo &RI : Scope->RegInfos) 1116b3b61de0SFangrui Song for (SelectInst *SI : RI.Selects) 11179775a620SHiroshi Yamauchi Output.insert(SI); 1118b3b61de0SFangrui Song for (CHRScope *Sub : Scope->Subs) 1119b3b61de0SFangrui Song getSelectsInScope(Sub, Output); 11209775a620SHiroshi Yamauchi } 11219775a620SHiroshi Yamauchi 11229775a620SHiroshi Yamauchi void CHR::splitScopes(SmallVectorImpl<CHRScope *> &Input, 11239775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 11249775a620SHiroshi Yamauchi for (CHRScope *Scope : Input) { 11259775a620SHiroshi Yamauchi assert(!Scope->BranchInsertPoint && 11269775a620SHiroshi Yamauchi "BranchInsertPoint must not be set"); 11279775a620SHiroshi Yamauchi DenseSet<Instruction *> Unhoistables; 1128b3b61de0SFangrui Song getSelectsInScope(Scope, Unhoistables); 11299775a620SHiroshi Yamauchi splitScope(Scope, nullptr, nullptr, nullptr, Output, Unhoistables); 11309775a620SHiroshi Yamauchi } 11319775a620SHiroshi Yamauchi #ifndef NDEBUG 11329775a620SHiroshi Yamauchi for (CHRScope *Scope : Output) { 11339775a620SHiroshi Yamauchi assert(Scope->BranchInsertPoint && "BranchInsertPoint must be set"); 11349775a620SHiroshi Yamauchi } 11359775a620SHiroshi Yamauchi #endif 11369775a620SHiroshi Yamauchi } 11379775a620SHiroshi Yamauchi 11389775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> CHR::splitScope( 11399775a620SHiroshi Yamauchi CHRScope *Scope, 11409775a620SHiroshi Yamauchi CHRScope *Outer, 11419775a620SHiroshi Yamauchi DenseSet<Value *> *OuterConditionValues, 11429775a620SHiroshi Yamauchi Instruction *OuterInsertPoint, 11439775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output, 11449775a620SHiroshi Yamauchi DenseSet<Instruction *> &Unhoistables) { 11459775a620SHiroshi Yamauchi if (Outer) { 11469775a620SHiroshi Yamauchi assert(OuterConditionValues && "Null OuterConditionValues"); 11479775a620SHiroshi Yamauchi assert(OuterInsertPoint && "Null OuterInsertPoint"); 11489775a620SHiroshi Yamauchi } 11499775a620SHiroshi Yamauchi bool PrevSplitFromOuter = true; 11509775a620SHiroshi Yamauchi DenseSet<Value *> PrevConditionValues; 11519775a620SHiroshi Yamauchi Instruction *PrevInsertPoint = nullptr; 11529775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Splits; 11539775a620SHiroshi Yamauchi SmallVector<bool, 8> SplitsSplitFromOuter; 11549775a620SHiroshi Yamauchi SmallVector<DenseSet<Value *>, 8> SplitsConditionValues; 11559775a620SHiroshi Yamauchi SmallVector<Instruction *, 8> SplitsInsertPoints; 11569775a620SHiroshi Yamauchi SmallVector<RegInfo, 8> RegInfos(Scope->RegInfos); // Copy 11579775a620SHiroshi Yamauchi for (RegInfo &RI : RegInfos) { 11589775a620SHiroshi Yamauchi Instruction *InsertPoint = getBranchInsertPoint(RI); 11599775a620SHiroshi Yamauchi DenseSet<Value *> ConditionValues = getCHRConditionValuesForRegion(RI); 11609775a620SHiroshi Yamauchi CHR_DEBUG( 11619775a620SHiroshi Yamauchi dbgs() << "ConditionValues "; 11629775a620SHiroshi Yamauchi for (Value *V : ConditionValues) { 11639775a620SHiroshi Yamauchi dbgs() << *V << ", "; 11649775a620SHiroshi Yamauchi } 11659775a620SHiroshi Yamauchi dbgs() << "\n"); 11669775a620SHiroshi Yamauchi if (RI.R == RegInfos[0].R) { 11679775a620SHiroshi Yamauchi // First iteration. Check to see if we should split from the outer. 11689775a620SHiroshi Yamauchi if (Outer) { 11699775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Outer " << *Outer << "\n"); 11709775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Should split from outer at " 11719775a620SHiroshi Yamauchi << RI.R->getNameStr() << "\n"); 11729775a620SHiroshi Yamauchi if (shouldSplit(OuterInsertPoint, *OuterConditionValues, 11739775a620SHiroshi Yamauchi ConditionValues, DT, Unhoistables)) { 11749775a620SHiroshi Yamauchi PrevConditionValues = ConditionValues; 11759775a620SHiroshi Yamauchi PrevInsertPoint = InsertPoint; 1176fd2c699dSHiroshi Yamauchi ORE.emit([&]() { 1177fd2c699dSHiroshi Yamauchi return OptimizationRemarkMissed(DEBUG_TYPE, 1178fd2c699dSHiroshi Yamauchi "SplitScopeFromOuter", 1179fd2c699dSHiroshi Yamauchi RI.R->getEntry()->getTerminator()) 1180fd2c699dSHiroshi Yamauchi << "Split scope from outer due to unhoistable branch/select " 1181fd2c699dSHiroshi Yamauchi << "and/or lack of common condition values"; 1182fd2c699dSHiroshi Yamauchi }); 11839775a620SHiroshi Yamauchi } else { 11849775a620SHiroshi Yamauchi // Not splitting from the outer. Use the outer bases and insert 11859775a620SHiroshi Yamauchi // point. Union the bases. 11869775a620SHiroshi Yamauchi PrevSplitFromOuter = false; 11879775a620SHiroshi Yamauchi PrevConditionValues = *OuterConditionValues; 11889775a620SHiroshi Yamauchi PrevConditionValues.insert(ConditionValues.begin(), 11899775a620SHiroshi Yamauchi ConditionValues.end()); 11909775a620SHiroshi Yamauchi PrevInsertPoint = OuterInsertPoint; 11919775a620SHiroshi Yamauchi } 11929775a620SHiroshi Yamauchi } else { 11939775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Outer null\n"); 11949775a620SHiroshi Yamauchi PrevConditionValues = ConditionValues; 11959775a620SHiroshi Yamauchi PrevInsertPoint = InsertPoint; 11969775a620SHiroshi Yamauchi } 11979775a620SHiroshi Yamauchi } else { 11989775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Should split from prev at " 11999775a620SHiroshi Yamauchi << RI.R->getNameStr() << "\n"); 12009775a620SHiroshi Yamauchi if (shouldSplit(PrevInsertPoint, PrevConditionValues, ConditionValues, 12019775a620SHiroshi Yamauchi DT, Unhoistables)) { 12029775a620SHiroshi Yamauchi CHRScope *Tail = Scope->split(RI.R); 12039775a620SHiroshi Yamauchi Scopes.insert(Tail); 12049775a620SHiroshi Yamauchi Splits.push_back(Scope); 12059775a620SHiroshi Yamauchi SplitsSplitFromOuter.push_back(PrevSplitFromOuter); 12069775a620SHiroshi Yamauchi SplitsConditionValues.push_back(PrevConditionValues); 12079775a620SHiroshi Yamauchi SplitsInsertPoints.push_back(PrevInsertPoint); 12089775a620SHiroshi Yamauchi Scope = Tail; 12099775a620SHiroshi Yamauchi PrevConditionValues = ConditionValues; 12109775a620SHiroshi Yamauchi PrevInsertPoint = InsertPoint; 12119775a620SHiroshi Yamauchi PrevSplitFromOuter = true; 1212fd2c699dSHiroshi Yamauchi ORE.emit([&]() { 1213fd2c699dSHiroshi Yamauchi return OptimizationRemarkMissed(DEBUG_TYPE, 1214fd2c699dSHiroshi Yamauchi "SplitScopeFromPrev", 1215fd2c699dSHiroshi Yamauchi RI.R->getEntry()->getTerminator()) 1216fd2c699dSHiroshi Yamauchi << "Split scope from previous due to unhoistable branch/select " 1217fd2c699dSHiroshi Yamauchi << "and/or lack of common condition values"; 1218fd2c699dSHiroshi Yamauchi }); 12199775a620SHiroshi Yamauchi } else { 12209775a620SHiroshi Yamauchi // Not splitting. Union the bases. Keep the hoist point. 12219775a620SHiroshi Yamauchi PrevConditionValues.insert(ConditionValues.begin(), ConditionValues.end()); 12229775a620SHiroshi Yamauchi } 12239775a620SHiroshi Yamauchi } 12249775a620SHiroshi Yamauchi } 12259775a620SHiroshi Yamauchi Splits.push_back(Scope); 12269775a620SHiroshi Yamauchi SplitsSplitFromOuter.push_back(PrevSplitFromOuter); 12279775a620SHiroshi Yamauchi SplitsConditionValues.push_back(PrevConditionValues); 12289775a620SHiroshi Yamauchi assert(PrevInsertPoint && "Null PrevInsertPoint"); 12299775a620SHiroshi Yamauchi SplitsInsertPoints.push_back(PrevInsertPoint); 12309775a620SHiroshi Yamauchi assert(Splits.size() == SplitsConditionValues.size() && 12319775a620SHiroshi Yamauchi Splits.size() == SplitsSplitFromOuter.size() && 12329775a620SHiroshi Yamauchi Splits.size() == SplitsInsertPoints.size() && "Mismatching sizes"); 12339775a620SHiroshi Yamauchi for (size_t I = 0; I < Splits.size(); ++I) { 12349775a620SHiroshi Yamauchi CHRScope *Split = Splits[I]; 12359775a620SHiroshi Yamauchi DenseSet<Value *> &SplitConditionValues = SplitsConditionValues[I]; 12369775a620SHiroshi Yamauchi Instruction *SplitInsertPoint = SplitsInsertPoints[I]; 12379775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> NewSubs; 12389775a620SHiroshi Yamauchi DenseSet<Instruction *> SplitUnhoistables; 1239b3b61de0SFangrui Song getSelectsInScope(Split, SplitUnhoistables); 12409775a620SHiroshi Yamauchi for (CHRScope *Sub : Split->Subs) { 12419775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SubSplits = splitScope( 12429775a620SHiroshi Yamauchi Sub, Split, &SplitConditionValues, SplitInsertPoint, Output, 12439775a620SHiroshi Yamauchi SplitUnhoistables); 12449775a620SHiroshi Yamauchi NewSubs.insert(NewSubs.end(), SubSplits.begin(), SubSplits.end()); 12459775a620SHiroshi Yamauchi } 12469775a620SHiroshi Yamauchi Split->Subs = NewSubs; 12479775a620SHiroshi Yamauchi } 12489775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> Result; 12499775a620SHiroshi Yamauchi for (size_t I = 0; I < Splits.size(); ++I) { 12509775a620SHiroshi Yamauchi CHRScope *Split = Splits[I]; 12519775a620SHiroshi Yamauchi if (SplitsSplitFromOuter[I]) { 12529775a620SHiroshi Yamauchi // Split from the outer. 12539775a620SHiroshi Yamauchi Output.push_back(Split); 12549775a620SHiroshi Yamauchi Split->BranchInsertPoint = SplitsInsertPoints[I]; 12559775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "BranchInsertPoint " << *SplitsInsertPoints[I] 12569775a620SHiroshi Yamauchi << "\n"); 12579775a620SHiroshi Yamauchi } else { 12589775a620SHiroshi Yamauchi // Connected to the outer. 12599775a620SHiroshi Yamauchi Result.push_back(Split); 12609775a620SHiroshi Yamauchi } 12619775a620SHiroshi Yamauchi } 12629775a620SHiroshi Yamauchi if (!Outer) 12639775a620SHiroshi Yamauchi assert(Result.empty() && 12649775a620SHiroshi Yamauchi "If no outer (top-level), must return no nested ones"); 12659775a620SHiroshi Yamauchi return Result; 12669775a620SHiroshi Yamauchi } 12679775a620SHiroshi Yamauchi 12689775a620SHiroshi Yamauchi void CHR::classifyBiasedScopes(SmallVectorImpl<CHRScope *> &Scopes) { 12699775a620SHiroshi Yamauchi for (CHRScope *Scope : Scopes) { 12709775a620SHiroshi Yamauchi assert(Scope->TrueBiasedRegions.empty() && Scope->FalseBiasedRegions.empty() && "Empty"); 12719775a620SHiroshi Yamauchi classifyBiasedScopes(Scope, Scope); 12729775a620SHiroshi Yamauchi CHR_DEBUG( 12739775a620SHiroshi Yamauchi dbgs() << "classifyBiasedScopes " << *Scope << "\n"; 12749775a620SHiroshi Yamauchi dbgs() << "TrueBiasedRegions "; 12759775a620SHiroshi Yamauchi for (Region *R : Scope->TrueBiasedRegions) { 12769775a620SHiroshi Yamauchi dbgs() << R->getNameStr() << ", "; 12779775a620SHiroshi Yamauchi } 12789775a620SHiroshi Yamauchi dbgs() << "\n"; 12799775a620SHiroshi Yamauchi dbgs() << "FalseBiasedRegions "; 12809775a620SHiroshi Yamauchi for (Region *R : Scope->FalseBiasedRegions) { 12819775a620SHiroshi Yamauchi dbgs() << R->getNameStr() << ", "; 12829775a620SHiroshi Yamauchi } 12839775a620SHiroshi Yamauchi dbgs() << "\n"; 12849775a620SHiroshi Yamauchi dbgs() << "TrueBiasedSelects "; 12859775a620SHiroshi Yamauchi for (SelectInst *SI : Scope->TrueBiasedSelects) { 12869775a620SHiroshi Yamauchi dbgs() << *SI << ", "; 12879775a620SHiroshi Yamauchi } 12889775a620SHiroshi Yamauchi dbgs() << "\n"; 12899775a620SHiroshi Yamauchi dbgs() << "FalseBiasedSelects "; 12909775a620SHiroshi Yamauchi for (SelectInst *SI : Scope->FalseBiasedSelects) { 12919775a620SHiroshi Yamauchi dbgs() << *SI << ", "; 12929775a620SHiroshi Yamauchi } 12939775a620SHiroshi Yamauchi dbgs() << "\n";); 12949775a620SHiroshi Yamauchi } 12959775a620SHiroshi Yamauchi } 12969775a620SHiroshi Yamauchi 12979775a620SHiroshi Yamauchi void CHR::classifyBiasedScopes(CHRScope *Scope, CHRScope *OutermostScope) { 12989775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 12999775a620SHiroshi Yamauchi if (RI.HasBranch) { 13009775a620SHiroshi Yamauchi Region *R = RI.R; 13019775a620SHiroshi Yamauchi if (TrueBiasedRegionsGlobal.count(R) > 0) 13029775a620SHiroshi Yamauchi OutermostScope->TrueBiasedRegions.insert(R); 13039775a620SHiroshi Yamauchi else if (FalseBiasedRegionsGlobal.count(R) > 0) 13049775a620SHiroshi Yamauchi OutermostScope->FalseBiasedRegions.insert(R); 13059775a620SHiroshi Yamauchi else 13069775a620SHiroshi Yamauchi llvm_unreachable("Must be biased"); 13079775a620SHiroshi Yamauchi } 13089775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 13099775a620SHiroshi Yamauchi if (TrueBiasedSelectsGlobal.count(SI) > 0) 13109775a620SHiroshi Yamauchi OutermostScope->TrueBiasedSelects.insert(SI); 13119775a620SHiroshi Yamauchi else if (FalseBiasedSelectsGlobal.count(SI) > 0) 13129775a620SHiroshi Yamauchi OutermostScope->FalseBiasedSelects.insert(SI); 13139775a620SHiroshi Yamauchi else 13149775a620SHiroshi Yamauchi llvm_unreachable("Must be biased"); 13159775a620SHiroshi Yamauchi } 13169775a620SHiroshi Yamauchi } 13179775a620SHiroshi Yamauchi for (CHRScope *Sub : Scope->Subs) { 13189775a620SHiroshi Yamauchi classifyBiasedScopes(Sub, OutermostScope); 13199775a620SHiroshi Yamauchi } 13209775a620SHiroshi Yamauchi } 13219775a620SHiroshi Yamauchi 13229775a620SHiroshi Yamauchi static bool hasAtLeastTwoBiasedBranches(CHRScope *Scope) { 13239775a620SHiroshi Yamauchi unsigned NumBiased = Scope->TrueBiasedRegions.size() + 13249775a620SHiroshi Yamauchi Scope->FalseBiasedRegions.size() + 13259775a620SHiroshi Yamauchi Scope->TrueBiasedSelects.size() + 13269775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.size(); 13279775a620SHiroshi Yamauchi return NumBiased >= CHRMergeThreshold; 13289775a620SHiroshi Yamauchi } 13299775a620SHiroshi Yamauchi 13309775a620SHiroshi Yamauchi void CHR::filterScopes(SmallVectorImpl<CHRScope *> &Input, 13319775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 13329775a620SHiroshi Yamauchi for (CHRScope *Scope : Input) { 13339775a620SHiroshi Yamauchi // Filter out the ones with only one region and no subs. 13349775a620SHiroshi Yamauchi if (!hasAtLeastTwoBiasedBranches(Scope)) { 13359775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Filtered out by biased branches truthy-regions " 13369775a620SHiroshi Yamauchi << Scope->TrueBiasedRegions.size() 13379775a620SHiroshi Yamauchi << " falsy-regions " << Scope->FalseBiasedRegions.size() 13389775a620SHiroshi Yamauchi << " true-selects " << Scope->TrueBiasedSelects.size() 13399775a620SHiroshi Yamauchi << " false-selects " << Scope->FalseBiasedSelects.size() << "\n"); 1340fd2c699dSHiroshi Yamauchi ORE.emit([&]() { 1341fd2c699dSHiroshi Yamauchi return OptimizationRemarkMissed( 1342fd2c699dSHiroshi Yamauchi DEBUG_TYPE, 1343fd2c699dSHiroshi Yamauchi "DropScopeWithOneBranchOrSelect", 1344fd2c699dSHiroshi Yamauchi Scope->RegInfos[0].R->getEntry()->getTerminator()) 1345fd2c699dSHiroshi Yamauchi << "Drop scope with < " 1346fd2c699dSHiroshi Yamauchi << ore::NV("CHRMergeThreshold", CHRMergeThreshold) 1347fd2c699dSHiroshi Yamauchi << " biased branch(es) or select(s)"; 1348fd2c699dSHiroshi Yamauchi }); 13499775a620SHiroshi Yamauchi continue; 13509775a620SHiroshi Yamauchi } 13519775a620SHiroshi Yamauchi Output.push_back(Scope); 13529775a620SHiroshi Yamauchi } 13539775a620SHiroshi Yamauchi } 13549775a620SHiroshi Yamauchi 13559775a620SHiroshi Yamauchi void CHR::setCHRRegions(SmallVectorImpl<CHRScope *> &Input, 13569775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 13579775a620SHiroshi Yamauchi for (CHRScope *Scope : Input) { 13589775a620SHiroshi Yamauchi assert(Scope->HoistStopMap.empty() && Scope->CHRRegions.empty() && 13599775a620SHiroshi Yamauchi "Empty"); 13609775a620SHiroshi Yamauchi setCHRRegions(Scope, Scope); 13619775a620SHiroshi Yamauchi Output.push_back(Scope); 13629775a620SHiroshi Yamauchi CHR_DEBUG( 13639775a620SHiroshi Yamauchi dbgs() << "setCHRRegions HoistStopMap " << *Scope << "\n"; 13649775a620SHiroshi Yamauchi for (auto pair : Scope->HoistStopMap) { 13659775a620SHiroshi Yamauchi Region *R = pair.first; 13669775a620SHiroshi Yamauchi dbgs() << "Region " << R->getNameStr() << "\n"; 13679775a620SHiroshi Yamauchi for (Instruction *I : pair.second) { 13689775a620SHiroshi Yamauchi dbgs() << "HoistStop " << *I << "\n"; 13699775a620SHiroshi Yamauchi } 13709775a620SHiroshi Yamauchi } 13719775a620SHiroshi Yamauchi dbgs() << "CHRRegions" << "\n"; 13729775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 13739775a620SHiroshi Yamauchi dbgs() << RI.R->getNameStr() << "\n"; 13749775a620SHiroshi Yamauchi }); 13759775a620SHiroshi Yamauchi } 13769775a620SHiroshi Yamauchi } 13779775a620SHiroshi Yamauchi 13789775a620SHiroshi Yamauchi void CHR::setCHRRegions(CHRScope *Scope, CHRScope *OutermostScope) { 13799775a620SHiroshi Yamauchi DenseSet<Instruction *> Unhoistables; 13809775a620SHiroshi Yamauchi // Put the biased selects in Unhoistables because they should stay where they 13819775a620SHiroshi Yamauchi // are and constant-folded after CHR (in case one biased select or a branch 13829775a620SHiroshi Yamauchi // can depend on another biased select.) 13839775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 13849775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 13859775a620SHiroshi Yamauchi Unhoistables.insert(SI); 13869775a620SHiroshi Yamauchi } 13879775a620SHiroshi Yamauchi } 13889775a620SHiroshi Yamauchi Instruction *InsertPoint = OutermostScope->BranchInsertPoint; 13899775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 13909775a620SHiroshi Yamauchi Region *R = RI.R; 13919775a620SHiroshi Yamauchi DenseSet<Instruction *> HoistStops; 13929775a620SHiroshi Yamauchi bool IsHoisted = false; 13939775a620SHiroshi Yamauchi if (RI.HasBranch) { 13949775a620SHiroshi Yamauchi assert((OutermostScope->TrueBiasedRegions.count(R) > 0 || 13959775a620SHiroshi Yamauchi OutermostScope->FalseBiasedRegions.count(R) > 0) && 13969775a620SHiroshi Yamauchi "Must be truthy or falsy"); 13979775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 13989775a620SHiroshi Yamauchi // Note checkHoistValue fills in HoistStops. 1399dfeb7974SHiroshi Yamauchi DenseMap<Instruction *, bool> Visited; 14009775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(BI->getCondition(), InsertPoint, DT, 1401dfeb7974SHiroshi Yamauchi Unhoistables, &HoistStops, Visited); 14029775a620SHiroshi Yamauchi assert(IsHoistable && "Must be hoistable"); 14039775a620SHiroshi Yamauchi (void)(IsHoistable); // Unused in release build 14049775a620SHiroshi Yamauchi IsHoisted = true; 14059775a620SHiroshi Yamauchi } 14069775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 14079775a620SHiroshi Yamauchi assert((OutermostScope->TrueBiasedSelects.count(SI) > 0 || 14089775a620SHiroshi Yamauchi OutermostScope->FalseBiasedSelects.count(SI) > 0) && 14099775a620SHiroshi Yamauchi "Must be true or false biased"); 14109775a620SHiroshi Yamauchi // Note checkHoistValue fills in HoistStops. 1411dfeb7974SHiroshi Yamauchi DenseMap<Instruction *, bool> Visited; 14129775a620SHiroshi Yamauchi bool IsHoistable = checkHoistValue(SI->getCondition(), InsertPoint, DT, 1413dfeb7974SHiroshi Yamauchi Unhoistables, &HoistStops, Visited); 14149775a620SHiroshi Yamauchi assert(IsHoistable && "Must be hoistable"); 14159775a620SHiroshi Yamauchi (void)(IsHoistable); // Unused in release build 14169775a620SHiroshi Yamauchi IsHoisted = true; 14179775a620SHiroshi Yamauchi } 14189775a620SHiroshi Yamauchi if (IsHoisted) { 14199775a620SHiroshi Yamauchi OutermostScope->CHRRegions.push_back(RI); 14209775a620SHiroshi Yamauchi OutermostScope->HoistStopMap[R] = HoistStops; 14219775a620SHiroshi Yamauchi } 14229775a620SHiroshi Yamauchi } 14239775a620SHiroshi Yamauchi for (CHRScope *Sub : Scope->Subs) 14249775a620SHiroshi Yamauchi setCHRRegions(Sub, OutermostScope); 14259775a620SHiroshi Yamauchi } 14269775a620SHiroshi Yamauchi 14279775a620SHiroshi Yamauchi bool CHRScopeSorter(CHRScope *Scope1, CHRScope *Scope2) { 14289775a620SHiroshi Yamauchi return Scope1->RegInfos[0].R->getDepth() < Scope2->RegInfos[0].R->getDepth(); 14299775a620SHiroshi Yamauchi } 14309775a620SHiroshi Yamauchi 14319775a620SHiroshi Yamauchi void CHR::sortScopes(SmallVectorImpl<CHRScope *> &Input, 14329775a620SHiroshi Yamauchi SmallVectorImpl<CHRScope *> &Output) { 14339775a620SHiroshi Yamauchi Output.resize(Input.size()); 143475709329SFangrui Song llvm::copy(Input, Output.begin()); 1435efd94c56SFangrui Song llvm::stable_sort(Output, CHRScopeSorter); 14369775a620SHiroshi Yamauchi } 14379775a620SHiroshi Yamauchi 14389775a620SHiroshi Yamauchi // Return true if V is already hoisted or was hoisted (along with its operands) 14399775a620SHiroshi Yamauchi // to the insert point. 14409775a620SHiroshi Yamauchi static void hoistValue(Value *V, Instruction *HoistPoint, Region *R, 14419775a620SHiroshi Yamauchi HoistStopMapTy &HoistStopMap, 14429775a620SHiroshi Yamauchi DenseSet<Instruction *> &HoistedSet, 144316201040SHiroshi Yamauchi DenseSet<PHINode *> &TrivialPHIs, 144416201040SHiroshi Yamauchi DominatorTree &DT) { 14459775a620SHiroshi Yamauchi auto IT = HoistStopMap.find(R); 14469775a620SHiroshi Yamauchi assert(IT != HoistStopMap.end() && "Region must be in hoist stop map"); 14479775a620SHiroshi Yamauchi DenseSet<Instruction *> &HoistStops = IT->second; 14489775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 14499775a620SHiroshi Yamauchi if (I == HoistPoint) 14509775a620SHiroshi Yamauchi return; 14519775a620SHiroshi Yamauchi if (HoistStops.count(I)) 14529775a620SHiroshi Yamauchi return; 14539775a620SHiroshi Yamauchi if (auto *PN = dyn_cast<PHINode>(I)) 14549775a620SHiroshi Yamauchi if (TrivialPHIs.count(PN)) 14559775a620SHiroshi Yamauchi // The trivial phi inserted by the previous CHR scope could replace a 14569775a620SHiroshi Yamauchi // non-phi in HoistStops. Note that since this phi is at the exit of a 14579775a620SHiroshi Yamauchi // previous CHR scope, which dominates this scope, it's safe to stop 14589775a620SHiroshi Yamauchi // hoisting there. 14599775a620SHiroshi Yamauchi return; 14609775a620SHiroshi Yamauchi if (HoistedSet.count(I)) 14619775a620SHiroshi Yamauchi // Already hoisted, return. 14629775a620SHiroshi Yamauchi return; 14639775a620SHiroshi Yamauchi assert(isHoistableInstructionType(I) && "Unhoistable instruction type"); 146416201040SHiroshi Yamauchi assert(DT.getNode(I->getParent()) && "DT must contain I's block"); 146516201040SHiroshi Yamauchi assert(DT.getNode(HoistPoint->getParent()) && 146616201040SHiroshi Yamauchi "DT must contain HoistPoint block"); 146716201040SHiroshi Yamauchi if (DT.dominates(I, HoistPoint)) 146816201040SHiroshi Yamauchi // We are already above the hoist point. Stop here. This may be necessary 146916201040SHiroshi Yamauchi // when multiple scopes would independently hoist the same 147016201040SHiroshi Yamauchi // instruction. Since an outer (dominating) scope would hoist it to its 147116201040SHiroshi Yamauchi // entry before an inner (dominated) scope would to its entry, the inner 147216201040SHiroshi Yamauchi // scope may see the instruction already hoisted, in which case it 147316201040SHiroshi Yamauchi // potentially wrong for the inner scope to hoist it and could cause bad 147416201040SHiroshi Yamauchi // IR (non-dominating def), but safe to skip hoisting it instead because 147516201040SHiroshi Yamauchi // it's already in a block that dominates the inner scope. 147616201040SHiroshi Yamauchi return; 14779775a620SHiroshi Yamauchi for (Value *Op : I->operands()) { 147816201040SHiroshi Yamauchi hoistValue(Op, HoistPoint, R, HoistStopMap, HoistedSet, TrivialPHIs, DT); 14799775a620SHiroshi Yamauchi } 14809775a620SHiroshi Yamauchi I->moveBefore(HoistPoint); 14819775a620SHiroshi Yamauchi HoistedSet.insert(I); 14829775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "hoistValue " << *I << "\n"); 14839775a620SHiroshi Yamauchi } 14849775a620SHiroshi Yamauchi } 14859775a620SHiroshi Yamauchi 14869775a620SHiroshi Yamauchi // Hoist the dependent condition values of the branches and the selects in the 14879775a620SHiroshi Yamauchi // scope to the insert point. 14889775a620SHiroshi Yamauchi static void hoistScopeConditions(CHRScope *Scope, Instruction *HoistPoint, 148916201040SHiroshi Yamauchi DenseSet<PHINode *> &TrivialPHIs, 149016201040SHiroshi Yamauchi DominatorTree &DT) { 14919775a620SHiroshi Yamauchi DenseSet<Instruction *> HoistedSet; 14929775a620SHiroshi Yamauchi for (const RegInfo &RI : Scope->CHRRegions) { 14939775a620SHiroshi Yamauchi Region *R = RI.R; 14949775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedRegions.count(R); 14959775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedRegions.count(R); 14969775a620SHiroshi Yamauchi if (RI.HasBranch && (IsTrueBiased || IsFalseBiased)) { 14979775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 14989775a620SHiroshi Yamauchi hoistValue(BI->getCondition(), HoistPoint, R, Scope->HoistStopMap, 149916201040SHiroshi Yamauchi HoistedSet, TrivialPHIs, DT); 15009775a620SHiroshi Yamauchi } 15019775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 15029775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedSelects.count(SI); 15039775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedSelects.count(SI); 15049775a620SHiroshi Yamauchi if (!(IsTrueBiased || IsFalseBiased)) 15059775a620SHiroshi Yamauchi continue; 15069775a620SHiroshi Yamauchi hoistValue(SI->getCondition(), HoistPoint, R, Scope->HoistStopMap, 150716201040SHiroshi Yamauchi HoistedSet, TrivialPHIs, DT); 15089775a620SHiroshi Yamauchi } 15099775a620SHiroshi Yamauchi } 15109775a620SHiroshi Yamauchi } 15119775a620SHiroshi Yamauchi 15129775a620SHiroshi Yamauchi // Negate the predicate if an ICmp if it's used only by branches or selects by 15139775a620SHiroshi Yamauchi // swapping the operands of the branches or the selects. Returns true if success. 1514b3b61de0SFangrui Song static bool negateICmpIfUsedByBranchOrSelectOnly(ICmpInst *ICmp, 15159775a620SHiroshi Yamauchi Instruction *ExcludedUser, 15169775a620SHiroshi Yamauchi CHRScope *Scope) { 15179775a620SHiroshi Yamauchi for (User *U : ICmp->users()) { 15189775a620SHiroshi Yamauchi if (U == ExcludedUser) 15199775a620SHiroshi Yamauchi continue; 15209775a620SHiroshi Yamauchi if (isa<BranchInst>(U) && cast<BranchInst>(U)->isConditional()) 15219775a620SHiroshi Yamauchi continue; 15229775a620SHiroshi Yamauchi if (isa<SelectInst>(U) && cast<SelectInst>(U)->getCondition() == ICmp) 15239775a620SHiroshi Yamauchi continue; 15249775a620SHiroshi Yamauchi return false; 15259775a620SHiroshi Yamauchi } 15269775a620SHiroshi Yamauchi for (User *U : ICmp->users()) { 15279775a620SHiroshi Yamauchi if (U == ExcludedUser) 15289775a620SHiroshi Yamauchi continue; 15299775a620SHiroshi Yamauchi if (auto *BI = dyn_cast<BranchInst>(U)) { 15309775a620SHiroshi Yamauchi assert(BI->isConditional() && "Must be conditional"); 15319775a620SHiroshi Yamauchi BI->swapSuccessors(); 15329775a620SHiroshi Yamauchi // Don't need to swap this in terms of 15339775a620SHiroshi Yamauchi // TrueBiasedRegions/FalseBiasedRegions because true-based/false-based 15349775a620SHiroshi Yamauchi // mean whehter the branch is likely go into the if-then rather than 15359775a620SHiroshi Yamauchi // successor0/successor1 and because we can tell which edge is the then or 15369775a620SHiroshi Yamauchi // the else one by comparing the destination to the region exit block. 15379775a620SHiroshi Yamauchi continue; 15389775a620SHiroshi Yamauchi } 15399775a620SHiroshi Yamauchi if (auto *SI = dyn_cast<SelectInst>(U)) { 15409775a620SHiroshi Yamauchi // Swap operands 15410efeaa81SRoman Lebedev SI->swapValues(); 15429775a620SHiroshi Yamauchi SI->swapProfMetadata(); 15439775a620SHiroshi Yamauchi if (Scope->TrueBiasedSelects.count(SI)) { 15449775a620SHiroshi Yamauchi assert(Scope->FalseBiasedSelects.count(SI) == 0 && 15459775a620SHiroshi Yamauchi "Must not be already in"); 15469775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.insert(SI); 15479775a620SHiroshi Yamauchi } else if (Scope->FalseBiasedSelects.count(SI)) { 15489775a620SHiroshi Yamauchi assert(Scope->TrueBiasedSelects.count(SI) == 0 && 15499775a620SHiroshi Yamauchi "Must not be already in"); 15509775a620SHiroshi Yamauchi Scope->TrueBiasedSelects.insert(SI); 15519775a620SHiroshi Yamauchi } 15529775a620SHiroshi Yamauchi continue; 15539775a620SHiroshi Yamauchi } 15549775a620SHiroshi Yamauchi llvm_unreachable("Must be a branch or a select"); 15559775a620SHiroshi Yamauchi } 15569775a620SHiroshi Yamauchi ICmp->setPredicate(CmpInst::getInversePredicate(ICmp->getPredicate())); 15579775a620SHiroshi Yamauchi return true; 15589775a620SHiroshi Yamauchi } 15599775a620SHiroshi Yamauchi 15609775a620SHiroshi Yamauchi // A helper for transformScopes. Insert a trivial phi at the scope exit block 15619775a620SHiroshi Yamauchi // for a value that's defined in the scope but used outside it (meaning it's 15629775a620SHiroshi Yamauchi // alive at the exit block). 15639775a620SHiroshi Yamauchi static void insertTrivialPHIs(CHRScope *Scope, 15649775a620SHiroshi Yamauchi BasicBlock *EntryBlock, BasicBlock *ExitBlock, 15659775a620SHiroshi Yamauchi DenseSet<PHINode *> &TrivialPHIs) { 15669775a620SHiroshi Yamauchi DenseSet<BasicBlock *> BlocksInScopeSet; 15679775a620SHiroshi Yamauchi SmallVector<BasicBlock *, 8> BlocksInScopeVec; 15689775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) { 15699775a620SHiroshi Yamauchi for (BasicBlock *BB : RI.R->blocks()) { // This includes the blocks in the 15709775a620SHiroshi Yamauchi // sub-Scopes. 15719775a620SHiroshi Yamauchi BlocksInScopeSet.insert(BB); 15729775a620SHiroshi Yamauchi BlocksInScopeVec.push_back(BB); 15739775a620SHiroshi Yamauchi } 15749775a620SHiroshi Yamauchi } 15759775a620SHiroshi Yamauchi CHR_DEBUG( 15769775a620SHiroshi Yamauchi dbgs() << "Inserting redudant phis\n"; 15779775a620SHiroshi Yamauchi for (BasicBlock *BB : BlocksInScopeVec) { 15789775a620SHiroshi Yamauchi dbgs() << "BlockInScope " << BB->getName() << "\n"; 15799775a620SHiroshi Yamauchi }); 15809775a620SHiroshi Yamauchi for (BasicBlock *BB : BlocksInScopeVec) { 15819775a620SHiroshi Yamauchi for (Instruction &I : *BB) { 15829775a620SHiroshi Yamauchi SmallVector<Instruction *, 8> Users; 15839775a620SHiroshi Yamauchi for (User *U : I.users()) { 15849775a620SHiroshi Yamauchi if (auto *UI = dyn_cast<Instruction>(U)) { 15859775a620SHiroshi Yamauchi if (BlocksInScopeSet.count(UI->getParent()) == 0 && 15869775a620SHiroshi Yamauchi // Unless there's already a phi for I at the exit block. 15879775a620SHiroshi Yamauchi !(isa<PHINode>(UI) && UI->getParent() == ExitBlock)) { 15889775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "V " << I << "\n"); 15899775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Used outside scope by user " << *UI << "\n"); 15909775a620SHiroshi Yamauchi Users.push_back(UI); 15919775a620SHiroshi Yamauchi } else if (UI->getParent() == EntryBlock && isa<PHINode>(UI)) { 15929775a620SHiroshi Yamauchi // There's a loop backedge from a block that's dominated by this 15939775a620SHiroshi Yamauchi // scope to the entry block. 15949775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "V " << I << "\n"); 15959775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() 15969775a620SHiroshi Yamauchi << "Used at entry block (for a back edge) by a phi user " 15979775a620SHiroshi Yamauchi << *UI << "\n"); 15989775a620SHiroshi Yamauchi Users.push_back(UI); 15999775a620SHiroshi Yamauchi } 16009775a620SHiroshi Yamauchi } 16019775a620SHiroshi Yamauchi } 16029775a620SHiroshi Yamauchi if (Users.size() > 0) { 16039775a620SHiroshi Yamauchi // Insert a trivial phi for I (phi [&I, P0], [&I, P1], ...) at 16049775a620SHiroshi Yamauchi // ExitBlock. Replace I with the new phi in UI unless UI is another 16059775a620SHiroshi Yamauchi // phi at ExitBlock. 16069775a620SHiroshi Yamauchi unsigned PredCount = std::distance(pred_begin(ExitBlock), 16079775a620SHiroshi Yamauchi pred_end(ExitBlock)); 16089775a620SHiroshi Yamauchi PHINode *PN = PHINode::Create(I.getType(), PredCount, "", 16099775a620SHiroshi Yamauchi &ExitBlock->front()); 16109775a620SHiroshi Yamauchi for (BasicBlock *Pred : predecessors(ExitBlock)) { 16119775a620SHiroshi Yamauchi PN->addIncoming(&I, Pred); 16129775a620SHiroshi Yamauchi } 16139775a620SHiroshi Yamauchi TrivialPHIs.insert(PN); 16149775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Insert phi " << *PN << "\n"); 16159775a620SHiroshi Yamauchi for (Instruction *UI : Users) { 16169775a620SHiroshi Yamauchi for (unsigned J = 0, NumOps = UI->getNumOperands(); J < NumOps; ++J) { 16179775a620SHiroshi Yamauchi if (UI->getOperand(J) == &I) { 16189775a620SHiroshi Yamauchi UI->setOperand(J, PN); 16199775a620SHiroshi Yamauchi } 16209775a620SHiroshi Yamauchi } 16219775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Updated user " << *UI << "\n"); 16229775a620SHiroshi Yamauchi } 16239775a620SHiroshi Yamauchi } 16249775a620SHiroshi Yamauchi } 16259775a620SHiroshi Yamauchi } 16269775a620SHiroshi Yamauchi } 16279775a620SHiroshi Yamauchi 16289775a620SHiroshi Yamauchi // Assert that all the CHR regions of the scope have a biased branch or select. 1629c8f348cbSFangrui Song static void LLVM_ATTRIBUTE_UNUSED 1630c8f348cbSFangrui Song assertCHRRegionsHaveBiasedBranchOrSelect(CHRScope *Scope) { 16319775a620SHiroshi Yamauchi #ifndef NDEBUG 16329775a620SHiroshi Yamauchi auto HasBiasedBranchOrSelect = [](RegInfo &RI, CHRScope *Scope) { 16339775a620SHiroshi Yamauchi if (Scope->TrueBiasedRegions.count(RI.R) || 16349775a620SHiroshi Yamauchi Scope->FalseBiasedRegions.count(RI.R)) 16359775a620SHiroshi Yamauchi return true; 16369775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) 16379775a620SHiroshi Yamauchi if (Scope->TrueBiasedSelects.count(SI) || 16389775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.count(SI)) 16399775a620SHiroshi Yamauchi return true; 16409775a620SHiroshi Yamauchi return false; 16419775a620SHiroshi Yamauchi }; 16429775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 16439775a620SHiroshi Yamauchi assert(HasBiasedBranchOrSelect(RI, Scope) && 16449775a620SHiroshi Yamauchi "Must have biased branch or select"); 16459775a620SHiroshi Yamauchi } 16469775a620SHiroshi Yamauchi #endif 16479775a620SHiroshi Yamauchi } 16489775a620SHiroshi Yamauchi 16499775a620SHiroshi Yamauchi // Assert that all the condition values of the biased branches and selects have 16509775a620SHiroshi Yamauchi // been hoisted to the pre-entry block or outside of the scope. 1651c8f348cbSFangrui Song static void LLVM_ATTRIBUTE_UNUSED assertBranchOrSelectConditionHoisted( 1652c8f348cbSFangrui Song CHRScope *Scope, BasicBlock *PreEntryBlock) { 16539775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Biased regions condition values \n"); 16549775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 16559775a620SHiroshi Yamauchi Region *R = RI.R; 16569775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedRegions.count(R); 16579775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedRegions.count(R); 16589775a620SHiroshi Yamauchi if (RI.HasBranch && (IsTrueBiased || IsFalseBiased)) { 16599775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 16609775a620SHiroshi Yamauchi Value *V = BI->getCondition(); 16619775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << *V << "\n"); 16629775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 166372ee6d60SHiroshi Yamauchi (void)(I); // Unused in release build. 16649775a620SHiroshi Yamauchi assert((I->getParent() == PreEntryBlock || 16659775a620SHiroshi Yamauchi !Scope->contains(I)) && 16669775a620SHiroshi Yamauchi "Must have been hoisted to PreEntryBlock or outside the scope"); 16679775a620SHiroshi Yamauchi } 16689775a620SHiroshi Yamauchi } 16699775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 16709775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedSelects.count(SI); 16719775a620SHiroshi Yamauchi bool IsFalseBiased = Scope->FalseBiasedSelects.count(SI); 16729775a620SHiroshi Yamauchi if (!(IsTrueBiased || IsFalseBiased)) 16739775a620SHiroshi Yamauchi continue; 16749775a620SHiroshi Yamauchi Value *V = SI->getCondition(); 16759775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << *V << "\n"); 16769775a620SHiroshi Yamauchi if (auto *I = dyn_cast<Instruction>(V)) { 167772ee6d60SHiroshi Yamauchi (void)(I); // Unused in release build. 16789775a620SHiroshi Yamauchi assert((I->getParent() == PreEntryBlock || 16799775a620SHiroshi Yamauchi !Scope->contains(I)) && 16809775a620SHiroshi Yamauchi "Must have been hoisted to PreEntryBlock or outside the scope"); 16819775a620SHiroshi Yamauchi } 16829775a620SHiroshi Yamauchi } 16839775a620SHiroshi Yamauchi } 16849775a620SHiroshi Yamauchi } 16859775a620SHiroshi Yamauchi 16869775a620SHiroshi Yamauchi void CHR::transformScopes(CHRScope *Scope, DenseSet<PHINode *> &TrivialPHIs) { 16879775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "transformScopes " << *Scope << "\n"); 16889775a620SHiroshi Yamauchi 16899775a620SHiroshi Yamauchi assert(Scope->RegInfos.size() >= 1 && "Should have at least one Region"); 16909775a620SHiroshi Yamauchi Region *FirstRegion = Scope->RegInfos[0].R; 16919775a620SHiroshi Yamauchi BasicBlock *EntryBlock = FirstRegion->getEntry(); 16929775a620SHiroshi Yamauchi Region *LastRegion = Scope->RegInfos[Scope->RegInfos.size() - 1].R; 16939775a620SHiroshi Yamauchi BasicBlock *ExitBlock = LastRegion->getExit(); 16949775a620SHiroshi Yamauchi Optional<uint64_t> ProfileCount = BFI.getBlockProfileCount(EntryBlock); 16959775a620SHiroshi Yamauchi 16969775a620SHiroshi Yamauchi if (ExitBlock) { 16979775a620SHiroshi Yamauchi // Insert a trivial phi at the exit block (where the CHR hot path and the 16989775a620SHiroshi Yamauchi // cold path merges) for a value that's defined in the scope but used 16999775a620SHiroshi Yamauchi // outside it (meaning it's alive at the exit block). We will add the 17009775a620SHiroshi Yamauchi // incoming values for the CHR cold paths to it below. Without this, we'd 17019775a620SHiroshi Yamauchi // miss updating phi's for such values unless there happens to already be a 17029775a620SHiroshi Yamauchi // phi for that value there. 17039775a620SHiroshi Yamauchi insertTrivialPHIs(Scope, EntryBlock, ExitBlock, TrivialPHIs); 17049775a620SHiroshi Yamauchi } 17059775a620SHiroshi Yamauchi 17069775a620SHiroshi Yamauchi // Split the entry block of the first region. The new block becomes the new 17079775a620SHiroshi Yamauchi // entry block of the first region. The old entry block becomes the block to 17089775a620SHiroshi Yamauchi // insert the CHR branch into. Note DT gets updated. Since DT gets updated 17099775a620SHiroshi Yamauchi // through the split, we update the entry of the first region after the split, 17109775a620SHiroshi Yamauchi // and Region only points to the entry and the exit blocks, rather than 17119775a620SHiroshi Yamauchi // keeping everything in a list or set, the blocks membership and the 17129775a620SHiroshi Yamauchi // entry/exit blocks of the region are still valid after the split. 17139775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Splitting entry block " << EntryBlock->getName() 17149775a620SHiroshi Yamauchi << " at " << *Scope->BranchInsertPoint << "\n"); 17159775a620SHiroshi Yamauchi BasicBlock *NewEntryBlock = 17169775a620SHiroshi Yamauchi SplitBlock(EntryBlock, Scope->BranchInsertPoint, &DT); 17179775a620SHiroshi Yamauchi assert(NewEntryBlock->getSinglePredecessor() == EntryBlock && 17189775a620SHiroshi Yamauchi "NewEntryBlock's only pred must be EntryBlock"); 17199775a620SHiroshi Yamauchi FirstRegion->replaceEntryRecursive(NewEntryBlock); 17209775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock = EntryBlock; 17219775a620SHiroshi Yamauchi 17229775a620SHiroshi Yamauchi ValueToValueMapTy VMap; 17239775a620SHiroshi Yamauchi // Clone the blocks in the scope (excluding the PreEntryBlock) to split into a 17249775a620SHiroshi Yamauchi // hot path (originals) and a cold path (clones) and update the PHIs at the 17259775a620SHiroshi Yamauchi // exit block. 17269775a620SHiroshi Yamauchi cloneScopeBlocks(Scope, PreEntryBlock, ExitBlock, LastRegion, VMap); 17279775a620SHiroshi Yamauchi 17289775a620SHiroshi Yamauchi // Replace the old (placeholder) branch with the new (merged) conditional 17299775a620SHiroshi Yamauchi // branch. 17309775a620SHiroshi Yamauchi BranchInst *MergedBr = createMergedBranch(PreEntryBlock, EntryBlock, 17319775a620SHiroshi Yamauchi NewEntryBlock, VMap); 17329775a620SHiroshi Yamauchi 17339775a620SHiroshi Yamauchi #ifndef NDEBUG 17349775a620SHiroshi Yamauchi assertCHRRegionsHaveBiasedBranchOrSelect(Scope); 17359775a620SHiroshi Yamauchi #endif 17369775a620SHiroshi Yamauchi 17379775a620SHiroshi Yamauchi // Hoist the conditional values of the branches/selects. 173816201040SHiroshi Yamauchi hoistScopeConditions(Scope, PreEntryBlock->getTerminator(), TrivialPHIs, DT); 17399775a620SHiroshi Yamauchi 17409775a620SHiroshi Yamauchi #ifndef NDEBUG 17419775a620SHiroshi Yamauchi assertBranchOrSelectConditionHoisted(Scope, PreEntryBlock); 17429775a620SHiroshi Yamauchi #endif 17439775a620SHiroshi Yamauchi 17449775a620SHiroshi Yamauchi // Create the combined branch condition and constant-fold the branches/selects 17459775a620SHiroshi Yamauchi // in the hot path. 17469775a620SHiroshi Yamauchi fixupBranchesAndSelects(Scope, PreEntryBlock, MergedBr, 17479775a620SHiroshi Yamauchi ProfileCount ? ProfileCount.getValue() : 0); 17489775a620SHiroshi Yamauchi } 17499775a620SHiroshi Yamauchi 17509775a620SHiroshi Yamauchi // A helper for transformScopes. Clone the blocks in the scope (excluding the 17519775a620SHiroshi Yamauchi // PreEntryBlock) to split into a hot path and a cold path and update the PHIs 17529775a620SHiroshi Yamauchi // at the exit block. 17539775a620SHiroshi Yamauchi void CHR::cloneScopeBlocks(CHRScope *Scope, 17549775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 17559775a620SHiroshi Yamauchi BasicBlock *ExitBlock, 17569775a620SHiroshi Yamauchi Region *LastRegion, 17579775a620SHiroshi Yamauchi ValueToValueMapTy &VMap) { 17589775a620SHiroshi Yamauchi // Clone all the blocks. The original blocks will be the hot-path 17599775a620SHiroshi Yamauchi // CHR-optimized code and the cloned blocks will be the original unoptimized 17609775a620SHiroshi Yamauchi // code. This is so that the block pointers from the 17619775a620SHiroshi Yamauchi // CHRScope/Region/RegionInfo can stay valid in pointing to the hot-path code 17629775a620SHiroshi Yamauchi // which CHR should apply to. 17639775a620SHiroshi Yamauchi SmallVector<BasicBlock*, 8> NewBlocks; 17649775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->RegInfos) 17659775a620SHiroshi Yamauchi for (BasicBlock *BB : RI.R->blocks()) { // This includes the blocks in the 17669775a620SHiroshi Yamauchi // sub-Scopes. 17679775a620SHiroshi Yamauchi assert(BB != PreEntryBlock && "Don't copy the preetntry block"); 17689775a620SHiroshi Yamauchi BasicBlock *NewBB = CloneBasicBlock(BB, VMap, ".nonchr", &F); 17699775a620SHiroshi Yamauchi NewBlocks.push_back(NewBB); 17709775a620SHiroshi Yamauchi VMap[BB] = NewBB; 17719775a620SHiroshi Yamauchi } 17729775a620SHiroshi Yamauchi 17739775a620SHiroshi Yamauchi // Place the cloned blocks right after the original blocks (right before the 17749775a620SHiroshi Yamauchi // exit block of.) 17759775a620SHiroshi Yamauchi if (ExitBlock) 17769775a620SHiroshi Yamauchi F.getBasicBlockList().splice(ExitBlock->getIterator(), 17779775a620SHiroshi Yamauchi F.getBasicBlockList(), 17789775a620SHiroshi Yamauchi NewBlocks[0]->getIterator(), F.end()); 17799775a620SHiroshi Yamauchi 17809775a620SHiroshi Yamauchi // Update the cloned blocks/instructions to refer to themselves. 17819775a620SHiroshi Yamauchi for (unsigned i = 0, e = NewBlocks.size(); i != e; ++i) 17829775a620SHiroshi Yamauchi for (Instruction &I : *NewBlocks[i]) 17839775a620SHiroshi Yamauchi RemapInstruction(&I, VMap, 17849775a620SHiroshi Yamauchi RF_NoModuleLevelChanges | RF_IgnoreMissingLocals); 17859775a620SHiroshi Yamauchi 17869775a620SHiroshi Yamauchi // Add the cloned blocks to the PHIs of the exit blocks. ExitBlock is null for 17879775a620SHiroshi Yamauchi // the top-level region but we don't need to add PHIs. The trivial PHIs 17889775a620SHiroshi Yamauchi // inserted above will be updated here. 17899775a620SHiroshi Yamauchi if (ExitBlock) 17909775a620SHiroshi Yamauchi for (PHINode &PN : ExitBlock->phis()) 17919775a620SHiroshi Yamauchi for (unsigned I = 0, NumOps = PN.getNumIncomingValues(); I < NumOps; 17929775a620SHiroshi Yamauchi ++I) { 17939775a620SHiroshi Yamauchi BasicBlock *Pred = PN.getIncomingBlock(I); 17949775a620SHiroshi Yamauchi if (LastRegion->contains(Pred)) { 17959775a620SHiroshi Yamauchi Value *V = PN.getIncomingValue(I); 17969775a620SHiroshi Yamauchi auto It = VMap.find(V); 17979775a620SHiroshi Yamauchi if (It != VMap.end()) V = It->second; 17989775a620SHiroshi Yamauchi assert(VMap.find(Pred) != VMap.end() && "Pred must have been cloned"); 17999775a620SHiroshi Yamauchi PN.addIncoming(V, cast<BasicBlock>(VMap[Pred])); 18009775a620SHiroshi Yamauchi } 18019775a620SHiroshi Yamauchi } 18029775a620SHiroshi Yamauchi } 18039775a620SHiroshi Yamauchi 18049775a620SHiroshi Yamauchi // A helper for transformScope. Replace the old (placeholder) branch with the 18059775a620SHiroshi Yamauchi // new (merged) conditional branch. 18069775a620SHiroshi Yamauchi BranchInst *CHR::createMergedBranch(BasicBlock *PreEntryBlock, 18079775a620SHiroshi Yamauchi BasicBlock *EntryBlock, 18089775a620SHiroshi Yamauchi BasicBlock *NewEntryBlock, 18099775a620SHiroshi Yamauchi ValueToValueMapTy &VMap) { 18109775a620SHiroshi Yamauchi BranchInst *OldBR = cast<BranchInst>(PreEntryBlock->getTerminator()); 18119775a620SHiroshi Yamauchi assert(OldBR->isUnconditional() && OldBR->getSuccessor(0) == NewEntryBlock && 18129775a620SHiroshi Yamauchi "SplitBlock did not work correctly!"); 18139775a620SHiroshi Yamauchi assert(NewEntryBlock->getSinglePredecessor() == EntryBlock && 18149775a620SHiroshi Yamauchi "NewEntryBlock's only pred must be EntryBlock"); 18159775a620SHiroshi Yamauchi assert(VMap.find(NewEntryBlock) != VMap.end() && 18169775a620SHiroshi Yamauchi "NewEntryBlock must have been copied"); 18179775a620SHiroshi Yamauchi OldBR->dropAllReferences(); 1818bd897a02SHiroshi Yamauchi OldBR->eraseFromParent(); 18199775a620SHiroshi Yamauchi // The true predicate is a placeholder. It will be replaced later in 18209775a620SHiroshi Yamauchi // fixupBranchesAndSelects(). 18219775a620SHiroshi Yamauchi BranchInst *NewBR = BranchInst::Create(NewEntryBlock, 18229775a620SHiroshi Yamauchi cast<BasicBlock>(VMap[NewEntryBlock]), 18239775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext())); 18249775a620SHiroshi Yamauchi PreEntryBlock->getInstList().push_back(NewBR); 18259775a620SHiroshi Yamauchi assert(NewEntryBlock->getSinglePredecessor() == EntryBlock && 18269775a620SHiroshi Yamauchi "NewEntryBlock's only pred must be EntryBlock"); 18279775a620SHiroshi Yamauchi return NewBR; 18289775a620SHiroshi Yamauchi } 18299775a620SHiroshi Yamauchi 18309775a620SHiroshi Yamauchi // A helper for transformScopes. Create the combined branch condition and 18319775a620SHiroshi Yamauchi // constant-fold the branches/selects in the hot path. 18329775a620SHiroshi Yamauchi void CHR::fixupBranchesAndSelects(CHRScope *Scope, 18339775a620SHiroshi Yamauchi BasicBlock *PreEntryBlock, 18349775a620SHiroshi Yamauchi BranchInst *MergedBR, 18359775a620SHiroshi Yamauchi uint64_t ProfileCount) { 18369775a620SHiroshi Yamauchi Value *MergedCondition = ConstantInt::getTrue(F.getContext()); 18379775a620SHiroshi Yamauchi BranchProbability CHRBranchBias(1, 1); 18389775a620SHiroshi Yamauchi uint64_t NumCHRedBranches = 0; 18399775a620SHiroshi Yamauchi IRBuilder<> IRB(PreEntryBlock->getTerminator()); 18409775a620SHiroshi Yamauchi for (RegInfo &RI : Scope->CHRRegions) { 18419775a620SHiroshi Yamauchi Region *R = RI.R; 18429775a620SHiroshi Yamauchi if (RI.HasBranch) { 18439775a620SHiroshi Yamauchi fixupBranch(R, Scope, IRB, MergedCondition, CHRBranchBias); 18449775a620SHiroshi Yamauchi ++NumCHRedBranches; 18459775a620SHiroshi Yamauchi } 18469775a620SHiroshi Yamauchi for (SelectInst *SI : RI.Selects) { 18479775a620SHiroshi Yamauchi fixupSelect(SI, Scope, IRB, MergedCondition, CHRBranchBias); 18489775a620SHiroshi Yamauchi ++NumCHRedBranches; 18499775a620SHiroshi Yamauchi } 18509775a620SHiroshi Yamauchi } 18519775a620SHiroshi Yamauchi Stats.NumBranchesDelta += NumCHRedBranches - 1; 18529775a620SHiroshi Yamauchi Stats.WeightedNumBranchesDelta += (NumCHRedBranches - 1) * ProfileCount; 1853fd2c699dSHiroshi Yamauchi ORE.emit([&]() { 1854fd2c699dSHiroshi Yamauchi return OptimizationRemark(DEBUG_TYPE, 1855fd2c699dSHiroshi Yamauchi "CHR", 1856fd2c699dSHiroshi Yamauchi // Refer to the hot (original) path 1857fd2c699dSHiroshi Yamauchi MergedBR->getSuccessor(0)->getTerminator()) 1858fd2c699dSHiroshi Yamauchi << "Merged " << ore::NV("NumCHRedBranches", NumCHRedBranches) 1859fd2c699dSHiroshi Yamauchi << " branches or selects"; 1860fd2c699dSHiroshi Yamauchi }); 18619775a620SHiroshi Yamauchi MergedBR->setCondition(MergedCondition); 18629775a620SHiroshi Yamauchi SmallVector<uint32_t, 2> Weights; 18639775a620SHiroshi Yamauchi Weights.push_back(static_cast<uint32_t>(CHRBranchBias.scale(1000))); 18649775a620SHiroshi Yamauchi Weights.push_back(static_cast<uint32_t>(CHRBranchBias.getCompl().scale(1000))); 18659775a620SHiroshi Yamauchi MDBuilder MDB(F.getContext()); 18669775a620SHiroshi Yamauchi MergedBR->setMetadata(LLVMContext::MD_prof, MDB.createBranchWeights(Weights)); 18679775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "CHR branch bias " << Weights[0] << ":" << Weights[1] 18689775a620SHiroshi Yamauchi << "\n"); 18699775a620SHiroshi Yamauchi } 18709775a620SHiroshi Yamauchi 18719775a620SHiroshi Yamauchi // A helper for fixupBranchesAndSelects. Add to the combined branch condition 18729775a620SHiroshi Yamauchi // and constant-fold a branch in the hot path. 18739775a620SHiroshi Yamauchi void CHR::fixupBranch(Region *R, CHRScope *Scope, 18749775a620SHiroshi Yamauchi IRBuilder<> &IRB, 18759775a620SHiroshi Yamauchi Value *&MergedCondition, 18769775a620SHiroshi Yamauchi BranchProbability &CHRBranchBias) { 18779775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedRegions.count(R); 18789775a620SHiroshi Yamauchi assert((IsTrueBiased || Scope->FalseBiasedRegions.count(R)) && 18799775a620SHiroshi Yamauchi "Must be truthy or falsy"); 18809775a620SHiroshi Yamauchi auto *BI = cast<BranchInst>(R->getEntry()->getTerminator()); 18819775a620SHiroshi Yamauchi assert(BranchBiasMap.find(R) != BranchBiasMap.end() && 18829775a620SHiroshi Yamauchi "Must be in the bias map"); 18839775a620SHiroshi Yamauchi BranchProbability Bias = BranchBiasMap[R]; 18849775a620SHiroshi Yamauchi assert(Bias >= getCHRBiasThreshold() && "Must be highly biased"); 18859775a620SHiroshi Yamauchi // Take the min. 18869775a620SHiroshi Yamauchi if (CHRBranchBias > Bias) 18879775a620SHiroshi Yamauchi CHRBranchBias = Bias; 18889775a620SHiroshi Yamauchi BasicBlock *IfThen = BI->getSuccessor(1); 18899775a620SHiroshi Yamauchi BasicBlock *IfElse = BI->getSuccessor(0); 18909775a620SHiroshi Yamauchi BasicBlock *RegionExitBlock = R->getExit(); 18919775a620SHiroshi Yamauchi assert(RegionExitBlock && "Null ExitBlock"); 18929775a620SHiroshi Yamauchi assert((IfThen == RegionExitBlock || IfElse == RegionExitBlock) && 18939775a620SHiroshi Yamauchi IfThen != IfElse && "Invariant from findScopes"); 18949775a620SHiroshi Yamauchi if (IfThen == RegionExitBlock) { 18959775a620SHiroshi Yamauchi // Swap them so that IfThen means going into it and IfElse means skipping 18969775a620SHiroshi Yamauchi // it. 18979775a620SHiroshi Yamauchi std::swap(IfThen, IfElse); 18989775a620SHiroshi Yamauchi } 18999775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "IfThen " << IfThen->getName() 19009775a620SHiroshi Yamauchi << " IfElse " << IfElse->getName() << "\n"); 19019775a620SHiroshi Yamauchi Value *Cond = BI->getCondition(); 19029775a620SHiroshi Yamauchi BasicBlock *HotTarget = IsTrueBiased ? IfThen : IfElse; 19039775a620SHiroshi Yamauchi bool ConditionTrue = HotTarget == BI->getSuccessor(0); 19049775a620SHiroshi Yamauchi addToMergedCondition(ConditionTrue, Cond, BI, Scope, IRB, 19059775a620SHiroshi Yamauchi MergedCondition); 19069775a620SHiroshi Yamauchi // Constant-fold the branch at ClonedEntryBlock. 19079775a620SHiroshi Yamauchi assert(ConditionTrue == (HotTarget == BI->getSuccessor(0)) && 19089775a620SHiroshi Yamauchi "The successor shouldn't change"); 19099775a620SHiroshi Yamauchi Value *NewCondition = ConditionTrue ? 19109775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext()) : 19119775a620SHiroshi Yamauchi ConstantInt::getFalse(F.getContext()); 19129775a620SHiroshi Yamauchi BI->setCondition(NewCondition); 19139775a620SHiroshi Yamauchi } 19149775a620SHiroshi Yamauchi 19159775a620SHiroshi Yamauchi // A helper for fixupBranchesAndSelects. Add to the combined branch condition 19169775a620SHiroshi Yamauchi // and constant-fold a select in the hot path. 19179775a620SHiroshi Yamauchi void CHR::fixupSelect(SelectInst *SI, CHRScope *Scope, 19189775a620SHiroshi Yamauchi IRBuilder<> &IRB, 19199775a620SHiroshi Yamauchi Value *&MergedCondition, 19209775a620SHiroshi Yamauchi BranchProbability &CHRBranchBias) { 19219775a620SHiroshi Yamauchi bool IsTrueBiased = Scope->TrueBiasedSelects.count(SI); 19229775a620SHiroshi Yamauchi assert((IsTrueBiased || 19239775a620SHiroshi Yamauchi Scope->FalseBiasedSelects.count(SI)) && "Must be biased"); 19249775a620SHiroshi Yamauchi assert(SelectBiasMap.find(SI) != SelectBiasMap.end() && 19259775a620SHiroshi Yamauchi "Must be in the bias map"); 19269775a620SHiroshi Yamauchi BranchProbability Bias = SelectBiasMap[SI]; 19279775a620SHiroshi Yamauchi assert(Bias >= getCHRBiasThreshold() && "Must be highly biased"); 19289775a620SHiroshi Yamauchi // Take the min. 19299775a620SHiroshi Yamauchi if (CHRBranchBias > Bias) 19309775a620SHiroshi Yamauchi CHRBranchBias = Bias; 19319775a620SHiroshi Yamauchi Value *Cond = SI->getCondition(); 19329775a620SHiroshi Yamauchi addToMergedCondition(IsTrueBiased, Cond, SI, Scope, IRB, 19339775a620SHiroshi Yamauchi MergedCondition); 19349775a620SHiroshi Yamauchi Value *NewCondition = IsTrueBiased ? 19359775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext()) : 19369775a620SHiroshi Yamauchi ConstantInt::getFalse(F.getContext()); 19379775a620SHiroshi Yamauchi SI->setCondition(NewCondition); 19389775a620SHiroshi Yamauchi } 19399775a620SHiroshi Yamauchi 19409775a620SHiroshi Yamauchi // A helper for fixupBranch/fixupSelect. Add a branch condition to the merged 19419775a620SHiroshi Yamauchi // condition. 19429775a620SHiroshi Yamauchi void CHR::addToMergedCondition(bool IsTrueBiased, Value *Cond, 19439775a620SHiroshi Yamauchi Instruction *BranchOrSelect, 19449775a620SHiroshi Yamauchi CHRScope *Scope, 19459775a620SHiroshi Yamauchi IRBuilder<> &IRB, 19469775a620SHiroshi Yamauchi Value *&MergedCondition) { 19479775a620SHiroshi Yamauchi if (IsTrueBiased) { 19489775a620SHiroshi Yamauchi MergedCondition = IRB.CreateAnd(MergedCondition, Cond); 19499775a620SHiroshi Yamauchi } else { 19509775a620SHiroshi Yamauchi // If Cond is an icmp and all users of V except for BranchOrSelect is a 19519775a620SHiroshi Yamauchi // branch, negate the icmp predicate and swap the branch targets and avoid 19529775a620SHiroshi Yamauchi // inserting an Xor to negate Cond. 19539775a620SHiroshi Yamauchi bool Done = false; 19549775a620SHiroshi Yamauchi if (auto *ICmp = dyn_cast<ICmpInst>(Cond)) 1955b3b61de0SFangrui Song if (negateICmpIfUsedByBranchOrSelectOnly(ICmp, BranchOrSelect, Scope)) { 19569775a620SHiroshi Yamauchi MergedCondition = IRB.CreateAnd(MergedCondition, Cond); 19579775a620SHiroshi Yamauchi Done = true; 19589775a620SHiroshi Yamauchi } 19599775a620SHiroshi Yamauchi if (!Done) { 19609775a620SHiroshi Yamauchi Value *Negate = IRB.CreateXor( 19619775a620SHiroshi Yamauchi ConstantInt::getTrue(F.getContext()), Cond); 19629775a620SHiroshi Yamauchi MergedCondition = IRB.CreateAnd(MergedCondition, Negate); 19639775a620SHiroshi Yamauchi } 19649775a620SHiroshi Yamauchi } 19659775a620SHiroshi Yamauchi } 19669775a620SHiroshi Yamauchi 19679775a620SHiroshi Yamauchi void CHR::transformScopes(SmallVectorImpl<CHRScope *> &CHRScopes) { 1968b3b61de0SFangrui Song unsigned I = 0; 19699775a620SHiroshi Yamauchi DenseSet<PHINode *> TrivialPHIs; 19709775a620SHiroshi Yamauchi for (CHRScope *Scope : CHRScopes) { 19719775a620SHiroshi Yamauchi transformScopes(Scope, TrivialPHIs); 19729775a620SHiroshi Yamauchi CHR_DEBUG( 19739775a620SHiroshi Yamauchi std::ostringstream oss; 1974b3b61de0SFangrui Song oss << " after transformScopes " << I++; 19759775a620SHiroshi Yamauchi dumpIR(F, oss.str().c_str(), nullptr)); 1976b3b61de0SFangrui Song (void)I; 19779775a620SHiroshi Yamauchi } 19789775a620SHiroshi Yamauchi } 19799775a620SHiroshi Yamauchi 1980c8f348cbSFangrui Song static void LLVM_ATTRIBUTE_UNUSED 1981c8f348cbSFangrui Song dumpScopes(SmallVectorImpl<CHRScope *> &Scopes, const char *Label) { 19829775a620SHiroshi Yamauchi dbgs() << Label << " " << Scopes.size() << "\n"; 19839775a620SHiroshi Yamauchi for (CHRScope *Scope : Scopes) { 19849775a620SHiroshi Yamauchi dbgs() << *Scope << "\n"; 19859775a620SHiroshi Yamauchi } 19869775a620SHiroshi Yamauchi } 19879775a620SHiroshi Yamauchi 19889775a620SHiroshi Yamauchi bool CHR::run() { 19899775a620SHiroshi Yamauchi if (!shouldApply(F, PSI)) 19909775a620SHiroshi Yamauchi return false; 19919775a620SHiroshi Yamauchi 19929775a620SHiroshi Yamauchi CHR_DEBUG(dumpIR(F, "before", nullptr)); 19939775a620SHiroshi Yamauchi 19949775a620SHiroshi Yamauchi bool Changed = false; 19959775a620SHiroshi Yamauchi { 19969775a620SHiroshi Yamauchi CHR_DEBUG( 19979775a620SHiroshi Yamauchi dbgs() << "RegionInfo:\n"; 19989775a620SHiroshi Yamauchi RI.print(dbgs())); 19999775a620SHiroshi Yamauchi 20009775a620SHiroshi Yamauchi // Recursively traverse the region tree and find regions that have biased 20019775a620SHiroshi Yamauchi // branches and/or selects and create scopes. 20029775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> AllScopes; 20039775a620SHiroshi Yamauchi findScopes(AllScopes); 20049775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(AllScopes, "All scopes")); 20059775a620SHiroshi Yamauchi 20069775a620SHiroshi Yamauchi // Split the scopes if 1) the conditiona values of the biased 20079775a620SHiroshi Yamauchi // branches/selects of the inner/lower scope can't be hoisted up to the 20089775a620SHiroshi Yamauchi // outermost/uppermost scope entry, or 2) the condition values of the biased 20099775a620SHiroshi Yamauchi // branches/selects in a scope (including subscopes) don't share at least 20109775a620SHiroshi Yamauchi // one common value. 20119775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SplitScopes; 20129775a620SHiroshi Yamauchi splitScopes(AllScopes, SplitScopes); 20139775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(SplitScopes, "Split scopes")); 20149775a620SHiroshi Yamauchi 20159775a620SHiroshi Yamauchi // After splitting, set the biased regions and selects of a scope (a tree 20169775a620SHiroshi Yamauchi // root) that include those of the subscopes. 20179775a620SHiroshi Yamauchi classifyBiasedScopes(SplitScopes); 20189775a620SHiroshi Yamauchi CHR_DEBUG(dbgs() << "Set per-scope bias " << SplitScopes.size() << "\n"); 20199775a620SHiroshi Yamauchi 20209775a620SHiroshi Yamauchi // Filter out the scopes that has only one biased region or select (CHR 20219775a620SHiroshi Yamauchi // isn't useful in such a case). 20229775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> FilteredScopes; 20239775a620SHiroshi Yamauchi filterScopes(SplitScopes, FilteredScopes); 20249775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(FilteredScopes, "Filtered scopes")); 20259775a620SHiroshi Yamauchi 20269775a620SHiroshi Yamauchi // Set the regions to be CHR'ed and their hoist stops for each scope. 20279775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SetScopes; 20289775a620SHiroshi Yamauchi setCHRRegions(FilteredScopes, SetScopes); 20299775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(SetScopes, "Set CHR regions")); 20309775a620SHiroshi Yamauchi 20319775a620SHiroshi Yamauchi // Sort CHRScopes by the depth so that outer CHRScopes comes before inner 20329775a620SHiroshi Yamauchi // ones. We need to apply CHR from outer to inner so that we apply CHR only 20339775a620SHiroshi Yamauchi // to the hot path, rather than both hot and cold paths. 20349775a620SHiroshi Yamauchi SmallVector<CHRScope *, 8> SortedScopes; 20359775a620SHiroshi Yamauchi sortScopes(SetScopes, SortedScopes); 20369775a620SHiroshi Yamauchi CHR_DEBUG(dumpScopes(SortedScopes, "Sorted scopes")); 20379775a620SHiroshi Yamauchi 20389775a620SHiroshi Yamauchi CHR_DEBUG( 20399775a620SHiroshi Yamauchi dbgs() << "RegionInfo:\n"; 20409775a620SHiroshi Yamauchi RI.print(dbgs())); 20419775a620SHiroshi Yamauchi 20429775a620SHiroshi Yamauchi // Apply the CHR transformation. 20439775a620SHiroshi Yamauchi if (!SortedScopes.empty()) { 20449775a620SHiroshi Yamauchi transformScopes(SortedScopes); 20459775a620SHiroshi Yamauchi Changed = true; 20469775a620SHiroshi Yamauchi } 20479775a620SHiroshi Yamauchi } 20489775a620SHiroshi Yamauchi 2049fd2c699dSHiroshi Yamauchi if (Changed) { 20509775a620SHiroshi Yamauchi CHR_DEBUG(dumpIR(F, "after", &Stats)); 2051fd2c699dSHiroshi Yamauchi ORE.emit([&]() { 2052fd2c699dSHiroshi Yamauchi return OptimizationRemark(DEBUG_TYPE, "Stats", &F) 2053fd2c699dSHiroshi Yamauchi << ore::NV("Function", &F) << " " 2054fd2c699dSHiroshi Yamauchi << "Reduced the number of branches in hot paths by " 2055fd2c699dSHiroshi Yamauchi << ore::NV("NumBranchesDelta", Stats.NumBranchesDelta) 2056fd2c699dSHiroshi Yamauchi << " (static) and " 2057fd2c699dSHiroshi Yamauchi << ore::NV("WeightedNumBranchesDelta", Stats.WeightedNumBranchesDelta) 2058fd2c699dSHiroshi Yamauchi << " (weighted by PGO count)"; 2059fd2c699dSHiroshi Yamauchi }); 2060fd2c699dSHiroshi Yamauchi } 20619775a620SHiroshi Yamauchi 20629775a620SHiroshi Yamauchi return Changed; 20639775a620SHiroshi Yamauchi } 20649775a620SHiroshi Yamauchi 20659775a620SHiroshi Yamauchi bool ControlHeightReductionLegacyPass::runOnFunction(Function &F) { 20669775a620SHiroshi Yamauchi BlockFrequencyInfo &BFI = 20679775a620SHiroshi Yamauchi getAnalysis<BlockFrequencyInfoWrapperPass>().getBFI(); 20689775a620SHiroshi Yamauchi DominatorTree &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree(); 20699775a620SHiroshi Yamauchi ProfileSummaryInfo &PSI = 2070e7b789b5SVedant Kumar getAnalysis<ProfileSummaryInfoWrapperPass>().getPSI(); 20719775a620SHiroshi Yamauchi RegionInfo &RI = getAnalysis<RegionInfoPass>().getRegionInfo(); 2072fd2c699dSHiroshi Yamauchi std::unique_ptr<OptimizationRemarkEmitter> OwnedORE = 2073*0eaee545SJonas Devlieghere std::make_unique<OptimizationRemarkEmitter>(&F); 2074fd2c699dSHiroshi Yamauchi return CHR(F, BFI, DT, PSI, RI, *OwnedORE.get()).run(); 20759775a620SHiroshi Yamauchi } 20769775a620SHiroshi Yamauchi 20779775a620SHiroshi Yamauchi namespace llvm { 20789775a620SHiroshi Yamauchi 20799775a620SHiroshi Yamauchi ControlHeightReductionPass::ControlHeightReductionPass() { 2080b3b61de0SFangrui Song parseCHRFilterFiles(); 20819775a620SHiroshi Yamauchi } 20829775a620SHiroshi Yamauchi 20839775a620SHiroshi Yamauchi PreservedAnalyses ControlHeightReductionPass::run( 20849775a620SHiroshi Yamauchi Function &F, 20859775a620SHiroshi Yamauchi FunctionAnalysisManager &FAM) { 20869775a620SHiroshi Yamauchi auto &BFI = FAM.getResult<BlockFrequencyAnalysis>(F); 20879775a620SHiroshi Yamauchi auto &DT = FAM.getResult<DominatorTreeAnalysis>(F); 20889775a620SHiroshi Yamauchi auto &MAMProxy = FAM.getResult<ModuleAnalysisManagerFunctionProxy>(F); 20899775a620SHiroshi Yamauchi auto &MAM = MAMProxy.getManager(); 20909775a620SHiroshi Yamauchi auto &PSI = *MAM.getCachedResult<ProfileSummaryAnalysis>(*F.getParent()); 20919775a620SHiroshi Yamauchi auto &RI = FAM.getResult<RegionInfoAnalysis>(F); 2092fd2c699dSHiroshi Yamauchi auto &ORE = FAM.getResult<OptimizationRemarkEmitterAnalysis>(F); 2093fd2c699dSHiroshi Yamauchi bool Changed = CHR(F, BFI, DT, PSI, RI, ORE).run(); 20949775a620SHiroshi Yamauchi if (!Changed) 20959775a620SHiroshi Yamauchi return PreservedAnalyses::all(); 20969775a620SHiroshi Yamauchi auto PA = PreservedAnalyses(); 20979775a620SHiroshi Yamauchi PA.preserve<GlobalsAA>(); 20989775a620SHiroshi Yamauchi return PA; 20999775a620SHiroshi Yamauchi } 21009775a620SHiroshi Yamauchi 21019775a620SHiroshi Yamauchi } // namespace llvm 2102