1ef512b99SJustin Bogner //===--- CodeGenPGO.cpp - PGO Instrumentation for LLVM CodeGen --*- C++ -*-===// 2ef512b99SJustin Bogner // 3ef512b99SJustin Bogner // The LLVM Compiler Infrastructure 4ef512b99SJustin Bogner // 5ef512b99SJustin Bogner // This file is distributed under the University of Illinois Open Source 6ef512b99SJustin Bogner // License. See LICENSE.TXT for details. 7ef512b99SJustin Bogner // 8ef512b99SJustin Bogner //===----------------------------------------------------------------------===// 9ef512b99SJustin Bogner // 10ef512b99SJustin Bogner // Instrumentation-based profile-guided optimization 11ef512b99SJustin Bogner // 12ef512b99SJustin Bogner //===----------------------------------------------------------------------===// 13ef512b99SJustin Bogner 14ef512b99SJustin Bogner #include "CodeGenPGO.h" 15ef512b99SJustin Bogner #include "CodeGenFunction.h" 16ef512b99SJustin Bogner #include "clang/AST/RecursiveASTVisitor.h" 17ef512b99SJustin Bogner #include "clang/AST/StmtVisitor.h" 18529f6dd8SJustin Bogner #include "llvm/Config/config.h" // for strtoull()/strtoll() define 19ef512b99SJustin Bogner #include "llvm/IR/MDBuilder.h" 20ef512b99SJustin Bogner #include "llvm/Support/FileSystem.h" 21ef512b99SJustin Bogner 22ef512b99SJustin Bogner using namespace clang; 23ef512b99SJustin Bogner using namespace CodeGen; 24ef512b99SJustin Bogner 25d66a17d0SJustin Bogner static void ReportBadPGOData(CodeGenModule &CGM, const char *Message) { 26d66a17d0SJustin Bogner DiagnosticsEngine &Diags = CGM.getDiags(); 27d66a17d0SJustin Bogner unsigned diagID = Diags.getCustomDiagID(DiagnosticsEngine::Error, "%0"); 28d66a17d0SJustin Bogner Diags.Report(diagID) << Message; 29d66a17d0SJustin Bogner } 30d66a17d0SJustin Bogner 31d66a17d0SJustin Bogner PGOProfileData::PGOProfileData(CodeGenModule &CGM, std::string Path) 32d66a17d0SJustin Bogner : CGM(CGM) { 33d66a17d0SJustin Bogner if (llvm::MemoryBuffer::getFile(Path, DataBuffer)) { 34d66a17d0SJustin Bogner ReportBadPGOData(CGM, "failed to open pgo data file"); 35d66a17d0SJustin Bogner return; 36d66a17d0SJustin Bogner } 37d66a17d0SJustin Bogner 38d66a17d0SJustin Bogner if (DataBuffer->getBufferSize() > std::numeric_limits<unsigned>::max()) { 39d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo data file too big"); 40d66a17d0SJustin Bogner return; 41d66a17d0SJustin Bogner } 42d66a17d0SJustin Bogner 43d66a17d0SJustin Bogner // Scan through the data file and map each function to the corresponding 44d66a17d0SJustin Bogner // file offset where its counts are stored. 45d66a17d0SJustin Bogner const char *BufferStart = DataBuffer->getBufferStart(); 46d66a17d0SJustin Bogner const char *BufferEnd = DataBuffer->getBufferEnd(); 47d66a17d0SJustin Bogner const char *CurPtr = BufferStart; 48d66a17d0SJustin Bogner uint64_t MaxCount = 0; 49d66a17d0SJustin Bogner while (CurPtr < BufferEnd) { 50d66a17d0SJustin Bogner // Read the function name. 51d66a17d0SJustin Bogner const char *FuncStart = CurPtr; 52d66a17d0SJustin Bogner // For Objective-C methods, the name may include whitespace, so search 53d66a17d0SJustin Bogner // backward from the end of the line to find the space that separates the 54d66a17d0SJustin Bogner // name from the number of counters. (This is a temporary hack since we are 55d66a17d0SJustin Bogner // going to completely replace this file format in the near future.) 56d66a17d0SJustin Bogner CurPtr = strchr(CurPtr, '\n'); 57d66a17d0SJustin Bogner if (!CurPtr) { 58d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo data file has malformed function entry"); 59d66a17d0SJustin Bogner return; 60d66a17d0SJustin Bogner } 61d66a17d0SJustin Bogner StringRef FuncName(FuncStart, CurPtr - FuncStart); 62d66a17d0SJustin Bogner 63b4416f58SJustin Bogner // Skip over the function hash. 64b4416f58SJustin Bogner CurPtr = strchr(++CurPtr, '\n'); 65b4416f58SJustin Bogner if (!CurPtr) { 66b4416f58SJustin Bogner ReportBadPGOData(CGM, "pgo data file is missing the function hash"); 67b4416f58SJustin Bogner return; 68b4416f58SJustin Bogner } 69b4416f58SJustin Bogner 70d66a17d0SJustin Bogner // Read the number of counters. 71d66a17d0SJustin Bogner char *EndPtr; 72d66a17d0SJustin Bogner unsigned NumCounters = strtol(++CurPtr, &EndPtr, 10); 73d66a17d0SJustin Bogner if (EndPtr == CurPtr || *EndPtr != '\n' || NumCounters <= 0) { 74d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo data file has unexpected number of counters"); 75d66a17d0SJustin Bogner return; 76d66a17d0SJustin Bogner } 77d66a17d0SJustin Bogner CurPtr = EndPtr; 78d66a17d0SJustin Bogner 79d66a17d0SJustin Bogner // Read function count. 80d66a17d0SJustin Bogner uint64_t Count = strtoll(CurPtr, &EndPtr, 10); 81d66a17d0SJustin Bogner if (EndPtr == CurPtr || *EndPtr != '\n') { 82d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo-data file has bad count value"); 83d66a17d0SJustin Bogner return; 84d66a17d0SJustin Bogner } 85d66a17d0SJustin Bogner CurPtr = EndPtr; // Point to '\n'. 86d66a17d0SJustin Bogner FunctionCounts[FuncName] = Count; 87d66a17d0SJustin Bogner MaxCount = Count > MaxCount ? Count : MaxCount; 88d66a17d0SJustin Bogner 89d66a17d0SJustin Bogner // There is one line for each counter; skip over those lines. 90d66a17d0SJustin Bogner // Since function count is already read, we start the loop from 1. 91d66a17d0SJustin Bogner for (unsigned N = 1; N < NumCounters; ++N) { 92d66a17d0SJustin Bogner CurPtr = strchr(++CurPtr, '\n'); 93d66a17d0SJustin Bogner if (!CurPtr) { 94d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo data file is missing some counter info"); 95d66a17d0SJustin Bogner return; 96d66a17d0SJustin Bogner } 97d66a17d0SJustin Bogner } 98d66a17d0SJustin Bogner 99d66a17d0SJustin Bogner // Skip over the blank line separating functions. 100d66a17d0SJustin Bogner CurPtr += 2; 101d66a17d0SJustin Bogner 102d66a17d0SJustin Bogner DataOffsets[FuncName] = FuncStart - BufferStart; 103d66a17d0SJustin Bogner } 104d66a17d0SJustin Bogner MaxFunctionCount = MaxCount; 105d66a17d0SJustin Bogner } 106d66a17d0SJustin Bogner 107b4416f58SJustin Bogner bool PGOProfileData::getFunctionCounts(StringRef FuncName, uint64_t &FuncHash, 108d66a17d0SJustin Bogner std::vector<uint64_t> &Counts) { 109d66a17d0SJustin Bogner // Find the relevant section of the pgo-data file. 110d66a17d0SJustin Bogner llvm::StringMap<unsigned>::const_iterator OffsetIter = 111d66a17d0SJustin Bogner DataOffsets.find(FuncName); 112d66a17d0SJustin Bogner if (OffsetIter == DataOffsets.end()) 113d66a17d0SJustin Bogner return true; 114d66a17d0SJustin Bogner const char *CurPtr = DataBuffer->getBufferStart() + OffsetIter->getValue(); 115d66a17d0SJustin Bogner 116d66a17d0SJustin Bogner // Skip over the function name. 117d66a17d0SJustin Bogner CurPtr = strchr(CurPtr, '\n'); 118d66a17d0SJustin Bogner assert(CurPtr && "pgo-data has corrupted function entry"); 119b4416f58SJustin Bogner 120b4416f58SJustin Bogner char *EndPtr; 121b4416f58SJustin Bogner // Read the function hash. 122b4416f58SJustin Bogner FuncHash = strtoll(++CurPtr, &EndPtr, 10); 123b4416f58SJustin Bogner assert(EndPtr != CurPtr && *EndPtr == '\n' && 124b4416f58SJustin Bogner "pgo-data file has corrupted function hash"); 125b4416f58SJustin Bogner CurPtr = EndPtr; 126d66a17d0SJustin Bogner 127d66a17d0SJustin Bogner // Read the number of counters. 128d66a17d0SJustin Bogner unsigned NumCounters = strtol(++CurPtr, &EndPtr, 10); 129d66a17d0SJustin Bogner assert(EndPtr != CurPtr && *EndPtr == '\n' && NumCounters > 0 && 130d66a17d0SJustin Bogner "pgo-data file has corrupted number of counters"); 131d66a17d0SJustin Bogner CurPtr = EndPtr; 132d66a17d0SJustin Bogner 133d66a17d0SJustin Bogner Counts.reserve(NumCounters); 134d66a17d0SJustin Bogner 135d66a17d0SJustin Bogner for (unsigned N = 0; N < NumCounters; ++N) { 136d66a17d0SJustin Bogner // Read the count value. 137d66a17d0SJustin Bogner uint64_t Count = strtoll(CurPtr, &EndPtr, 10); 138d66a17d0SJustin Bogner if (EndPtr == CurPtr || *EndPtr != '\n') { 139d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo-data file has bad count value"); 140d66a17d0SJustin Bogner return true; 141d66a17d0SJustin Bogner } 142d66a17d0SJustin Bogner Counts.push_back(Count); 143d66a17d0SJustin Bogner CurPtr = EndPtr + 1; 144d66a17d0SJustin Bogner } 145d66a17d0SJustin Bogner 146d66a17d0SJustin Bogner // Make sure the number of counters matches up. 147d66a17d0SJustin Bogner if (Counts.size() != NumCounters) { 148d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo-data file has inconsistent counters"); 149d66a17d0SJustin Bogner return true; 150d66a17d0SJustin Bogner } 151d66a17d0SJustin Bogner 152d66a17d0SJustin Bogner return false; 153d66a17d0SJustin Bogner } 154d66a17d0SJustin Bogner 155da1ebedeSBob Wilson void CodeGenPGO::setFuncName(llvm::Function *Fn) { 1562fe531cbSDuncan P. N. Exon Smith RawFuncName = Fn->getName(); 157da1ebedeSBob Wilson 158da1ebedeSBob Wilson // Function names may be prefixed with a binary '1' to indicate 159da1ebedeSBob Wilson // that the backend should not modify the symbols due to any platform 160da1ebedeSBob Wilson // naming convention. Do not include that '1' in the PGO profile name. 1612fe531cbSDuncan P. N. Exon Smith if (RawFuncName[0] == '\1') 1622fe531cbSDuncan P. N. Exon Smith RawFuncName = RawFuncName.substr(1); 163da1ebedeSBob Wilson 164da1ebedeSBob Wilson if (!Fn->hasLocalLinkage()) { 1652fe531cbSDuncan P. N. Exon Smith PrefixedFuncName = new std::string(RawFuncName); 166da1ebedeSBob Wilson return; 167da1ebedeSBob Wilson } 168da1ebedeSBob Wilson 169da1ebedeSBob Wilson // For local symbols, prepend the main file name to distinguish them. 170da1ebedeSBob Wilson // Do not include the full path in the file name since there's no guarantee 171da1ebedeSBob Wilson // that it will stay the same, e.g., if the files are checked out from 172da1ebedeSBob Wilson // version control in different locations. 1732fe531cbSDuncan P. N. Exon Smith PrefixedFuncName = new std::string(CGM.getCodeGenOpts().MainFileName); 1742fe531cbSDuncan P. N. Exon Smith if (PrefixedFuncName->empty()) 1752fe531cbSDuncan P. N. Exon Smith PrefixedFuncName->assign("<unknown>"); 1762fe531cbSDuncan P. N. Exon Smith PrefixedFuncName->append(":"); 1772fe531cbSDuncan P. N. Exon Smith PrefixedFuncName->append(RawFuncName); 178da1ebedeSBob Wilson } 179da1ebedeSBob Wilson 1802fe531cbSDuncan P. N. Exon Smith static llvm::Function *getRegisterFunc(CodeGenModule &CGM) { 1812fe531cbSDuncan P. N. Exon Smith return CGM.getModule().getFunction("__llvm_pgo_register_functions"); 1822fe531cbSDuncan P. N. Exon Smith } 1832fe531cbSDuncan P. N. Exon Smith 1842fe531cbSDuncan P. N. Exon Smith static llvm::BasicBlock *getOrInsertRegisterBB(CodeGenModule &CGM) { 185780443e8SDuncan P. N. Exon Smith // Don't do this for Darwin. compiler-rt uses linker magic. 186780443e8SDuncan P. N. Exon Smith if (CGM.getTarget().getTriple().isOSDarwin()) 187780443e8SDuncan P. N. Exon Smith return nullptr; 188780443e8SDuncan P. N. Exon Smith 1892fe531cbSDuncan P. N. Exon Smith // Only need to insert this once per module. 1902fe531cbSDuncan P. N. Exon Smith if (llvm::Function *RegisterF = getRegisterFunc(CGM)) 1912fe531cbSDuncan P. N. Exon Smith return &RegisterF->getEntryBlock(); 1922fe531cbSDuncan P. N. Exon Smith 1932fe531cbSDuncan P. N. Exon Smith // Construct the function. 1942fe531cbSDuncan P. N. Exon Smith auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext()); 1952fe531cbSDuncan P. N. Exon Smith auto *RegisterFTy = llvm::FunctionType::get(VoidTy, false); 1962fe531cbSDuncan P. N. Exon Smith auto *RegisterF = llvm::Function::Create(RegisterFTy, 1972fe531cbSDuncan P. N. Exon Smith llvm::GlobalValue::InternalLinkage, 1982fe531cbSDuncan P. N. Exon Smith "__llvm_pgo_register_functions", 1992fe531cbSDuncan P. N. Exon Smith &CGM.getModule()); 2002fe531cbSDuncan P. N. Exon Smith RegisterF->setUnnamedAddr(true); 2012fe531cbSDuncan P. N. Exon Smith if (CGM.getCodeGenOpts().DisableRedZone) 2022fe531cbSDuncan P. N. Exon Smith RegisterF->addFnAttr(llvm::Attribute::NoRedZone); 2032fe531cbSDuncan P. N. Exon Smith 2042fe531cbSDuncan P. N. Exon Smith // Construct and return the entry block. 2052fe531cbSDuncan P. N. Exon Smith auto *BB = llvm::BasicBlock::Create(CGM.getLLVMContext(), "", RegisterF); 2062fe531cbSDuncan P. N. Exon Smith CGBuilderTy Builder(BB); 2072fe531cbSDuncan P. N. Exon Smith Builder.CreateRetVoid(); 2082fe531cbSDuncan P. N. Exon Smith return BB; 2092fe531cbSDuncan P. N. Exon Smith } 2102fe531cbSDuncan P. N. Exon Smith 2112fe531cbSDuncan P. N. Exon Smith static llvm::Constant *getOrInsertRuntimeRegister(CodeGenModule &CGM) { 2122fe531cbSDuncan P. N. Exon Smith auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext()); 2132fe531cbSDuncan P. N. Exon Smith auto *VoidPtrTy = llvm::Type::getInt8PtrTy(CGM.getLLVMContext()); 2142fe531cbSDuncan P. N. Exon Smith auto *RuntimeRegisterTy = llvm::FunctionType::get(VoidTy, VoidPtrTy, false); 2152fe531cbSDuncan P. N. Exon Smith return CGM.getModule().getOrInsertFunction("__llvm_pgo_register_function", 2162fe531cbSDuncan P. N. Exon Smith RuntimeRegisterTy); 2172fe531cbSDuncan P. N. Exon Smith } 2182fe531cbSDuncan P. N. Exon Smith 2197134d47dSDuncan P. N. Exon Smith static bool isMachO(const CodeGenModule &CGM) { 2207134d47dSDuncan P. N. Exon Smith return CGM.getTarget().getTriple().isOSBinFormatMachO(); 2217134d47dSDuncan P. N. Exon Smith } 2227134d47dSDuncan P. N. Exon Smith 2232fe531cbSDuncan P. N. Exon Smith static StringRef getCountersSection(const CodeGenModule &CGM) { 2247134d47dSDuncan P. N. Exon Smith return isMachO(CGM) ? "__DATA,__llvm_pgo_cnts" : "__llvm_pgo_cnts"; 2252fe531cbSDuncan P. N. Exon Smith } 2262fe531cbSDuncan P. N. Exon Smith 2272fe531cbSDuncan P. N. Exon Smith static StringRef getNameSection(const CodeGenModule &CGM) { 2287134d47dSDuncan P. N. Exon Smith return isMachO(CGM) ? "__DATA,__llvm_pgo_names" : "__llvm_pgo_names"; 2292fe531cbSDuncan P. N. Exon Smith } 2302fe531cbSDuncan P. N. Exon Smith 2312fe531cbSDuncan P. N. Exon Smith static StringRef getDataSection(const CodeGenModule &CGM) { 2327134d47dSDuncan P. N. Exon Smith return isMachO(CGM) ? "__DATA,__llvm_pgo_data" : "__llvm_pgo_data"; 2332fe531cbSDuncan P. N. Exon Smith } 2342fe531cbSDuncan P. N. Exon Smith 2352fe531cbSDuncan P. N. Exon Smith llvm::GlobalVariable *CodeGenPGO::buildDataVar() { 2362fe531cbSDuncan P. N. Exon Smith // Create name variable. 2372fe531cbSDuncan P. N. Exon Smith llvm::LLVMContext &Ctx = CGM.getLLVMContext(); 2382fe531cbSDuncan P. N. Exon Smith auto *VarName = llvm::ConstantDataArray::getString(Ctx, getFuncName(), 2392fe531cbSDuncan P. N. Exon Smith false); 2402fe531cbSDuncan P. N. Exon Smith auto *Name = new llvm::GlobalVariable(CGM.getModule(), VarName->getType(), 2412fe531cbSDuncan P. N. Exon Smith true, FuncLinkage, VarName, 2422fe531cbSDuncan P. N. Exon Smith getFuncVarName("name")); 2432fe531cbSDuncan P. N. Exon Smith Name->setSection(getNameSection(CGM)); 2442fe531cbSDuncan P. N. Exon Smith Name->setAlignment(1); 2452fe531cbSDuncan P. N. Exon Smith 2462fe531cbSDuncan P. N. Exon Smith // Create data variable. 2472fe531cbSDuncan P. N. Exon Smith auto *Int32Ty = llvm::Type::getInt32Ty(Ctx); 248b4416f58SJustin Bogner auto *Int64Ty = llvm::Type::getInt64Ty(Ctx); 2492fe531cbSDuncan P. N. Exon Smith auto *Int8PtrTy = llvm::Type::getInt8PtrTy(Ctx); 2502fe531cbSDuncan P. N. Exon Smith auto *Int64PtrTy = llvm::Type::getInt64PtrTy(Ctx); 2512fe531cbSDuncan P. N. Exon Smith llvm::Type *DataTypes[] = { 252b4416f58SJustin Bogner Int32Ty, Int32Ty, Int64Ty, Int8PtrTy, Int64PtrTy 2532fe531cbSDuncan P. N. Exon Smith }; 2542fe531cbSDuncan P. N. Exon Smith auto *DataTy = llvm::StructType::get(Ctx, makeArrayRef(DataTypes)); 2552fe531cbSDuncan P. N. Exon Smith llvm::Constant *DataVals[] = { 2562fe531cbSDuncan P. N. Exon Smith llvm::ConstantInt::get(Int32Ty, getFuncName().size()), 2572fe531cbSDuncan P. N. Exon Smith llvm::ConstantInt::get(Int32Ty, NumRegionCounters), 258b4416f58SJustin Bogner llvm::ConstantInt::get(Int64Ty, FunctionHash), 2592fe531cbSDuncan P. N. Exon Smith llvm::ConstantExpr::getBitCast(Name, Int8PtrTy), 2602fe531cbSDuncan P. N. Exon Smith llvm::ConstantExpr::getBitCast(RegionCounters, Int64PtrTy) 2612fe531cbSDuncan P. N. Exon Smith }; 2622fe531cbSDuncan P. N. Exon Smith auto *Data = 2632fe531cbSDuncan P. N. Exon Smith new llvm::GlobalVariable(CGM.getModule(), DataTy, true, FuncLinkage, 2642fe531cbSDuncan P. N. Exon Smith llvm::ConstantStruct::get(DataTy, DataVals), 2652fe531cbSDuncan P. N. Exon Smith getFuncVarName("data")); 2662fe531cbSDuncan P. N. Exon Smith 2672fe531cbSDuncan P. N. Exon Smith // All the data should be packed into an array in its own section. 2682fe531cbSDuncan P. N. Exon Smith Data->setSection(getDataSection(CGM)); 2692fe531cbSDuncan P. N. Exon Smith Data->setAlignment(8); 2702fe531cbSDuncan P. N. Exon Smith 2712fe531cbSDuncan P. N. Exon Smith // Make sure the data doesn't get deleted. 2722fe531cbSDuncan P. N. Exon Smith CGM.addUsedGlobal(Data); 2732fe531cbSDuncan P. N. Exon Smith return Data; 2742fe531cbSDuncan P. N. Exon Smith } 2752fe531cbSDuncan P. N. Exon Smith 2762fe531cbSDuncan P. N. Exon Smith void CodeGenPGO::emitInstrumentationData() { 277ef512b99SJustin Bogner if (!CGM.getCodeGenOpts().ProfileInstrGenerate) 278ef512b99SJustin Bogner return; 279ef512b99SJustin Bogner 2802fe531cbSDuncan P. N. Exon Smith // Build the data. 2812fe531cbSDuncan P. N. Exon Smith auto *Data = buildDataVar(); 282ef512b99SJustin Bogner 2832fe531cbSDuncan P. N. Exon Smith // Register the data. 284780443e8SDuncan P. N. Exon Smith auto *RegisterBB = getOrInsertRegisterBB(CGM); 285780443e8SDuncan P. N. Exon Smith if (!RegisterBB) 286780443e8SDuncan P. N. Exon Smith return; 287780443e8SDuncan P. N. Exon Smith CGBuilderTy Builder(RegisterBB->getTerminator()); 2882fe531cbSDuncan P. N. Exon Smith auto *VoidPtrTy = llvm::Type::getInt8PtrTy(CGM.getLLVMContext()); 2892fe531cbSDuncan P. N. Exon Smith Builder.CreateCall(getOrInsertRuntimeRegister(CGM), 2902fe531cbSDuncan P. N. Exon Smith Builder.CreateBitCast(Data, VoidPtrTy)); 291ef512b99SJustin Bogner } 292ef512b99SJustin Bogner 293ef512b99SJustin Bogner llvm::Function *CodeGenPGO::emitInitialization(CodeGenModule &CGM) { 2942fe531cbSDuncan P. N. Exon Smith if (!CGM.getCodeGenOpts().ProfileInstrGenerate) 295a5f804a7SDuncan P. N. Exon Smith return nullptr; 296ef512b99SJustin Bogner 2972fe531cbSDuncan P. N. Exon Smith // Only need to create this once per module. 2982fe531cbSDuncan P. N. Exon Smith if (CGM.getModule().getFunction("__llvm_pgo_init")) 299a5f804a7SDuncan P. N. Exon Smith return nullptr; 300ef512b99SJustin Bogner 301*5188e91cSDuncan P. N. Exon Smith // Get the function to call at initialization. 3022fe531cbSDuncan P. N. Exon Smith llvm::Constant *RegisterF = getRegisterFunc(CGM); 303*5188e91cSDuncan P. N. Exon Smith if (!RegisterF) 304a5f804a7SDuncan P. N. Exon Smith return nullptr; 3052fe531cbSDuncan P. N. Exon Smith 3062fe531cbSDuncan P. N. Exon Smith // Create the initialization function. 3072fe531cbSDuncan P. N. Exon Smith auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext()); 3082fe531cbSDuncan P. N. Exon Smith auto *F = llvm::Function::Create(llvm::FunctionType::get(VoidTy, false), 3092fe531cbSDuncan P. N. Exon Smith llvm::GlobalValue::InternalLinkage, 310ef512b99SJustin Bogner "__llvm_pgo_init", &CGM.getModule()); 311ef512b99SJustin Bogner F->setUnnamedAddr(true); 312ef512b99SJustin Bogner F->addFnAttr(llvm::Attribute::NoInline); 313ef512b99SJustin Bogner if (CGM.getCodeGenOpts().DisableRedZone) 314ef512b99SJustin Bogner F->addFnAttr(llvm::Attribute::NoRedZone); 315ef512b99SJustin Bogner 3162fe531cbSDuncan P. N. Exon Smith // Add the basic block and the necessary calls. 3172fe531cbSDuncan P. N. Exon Smith CGBuilderTy Builder(llvm::BasicBlock::Create(CGM.getLLVMContext(), "", F)); 3182fe531cbSDuncan P. N. Exon Smith Builder.CreateCall(RegisterF); 3192fe531cbSDuncan P. N. Exon Smith Builder.CreateRetVoid(); 320ef512b99SJustin Bogner 321ef512b99SJustin Bogner return F; 322ef512b99SJustin Bogner } 323ef512b99SJustin Bogner 324ef512b99SJustin Bogner namespace { 325ef512b99SJustin Bogner /// A StmtVisitor that fills a map of statements to PGO counters. 326ef512b99SJustin Bogner struct MapRegionCounters : public ConstStmtVisitor<MapRegionCounters> { 327ef512b99SJustin Bogner /// The next counter value to assign. 328ef512b99SJustin Bogner unsigned NextCounter; 329ef512b99SJustin Bogner /// The map of statements to counters. 330ef512b99SJustin Bogner llvm::DenseMap<const Stmt*, unsigned> *CounterMap; 331ef512b99SJustin Bogner 332ef512b99SJustin Bogner MapRegionCounters(llvm::DenseMap<const Stmt*, unsigned> *CounterMap) : 333ef512b99SJustin Bogner NextCounter(0), CounterMap(CounterMap) { 334ef512b99SJustin Bogner } 335ef512b99SJustin Bogner 336ef512b99SJustin Bogner void VisitChildren(const Stmt *S) { 337ef512b99SJustin Bogner for (Stmt::const_child_range I = S->children(); I; ++I) 338ef512b99SJustin Bogner if (*I) 339ef512b99SJustin Bogner this->Visit(*I); 340ef512b99SJustin Bogner } 341ef512b99SJustin Bogner void VisitStmt(const Stmt *S) { VisitChildren(S); } 342ef512b99SJustin Bogner 343ea278c32SJustin Bogner /// Assign a counter to track entry to the function body. 344ef512b99SJustin Bogner void VisitFunctionDecl(const FunctionDecl *S) { 345ef512b99SJustin Bogner (*CounterMap)[S->getBody()] = NextCounter++; 346ef512b99SJustin Bogner Visit(S->getBody()); 347ef512b99SJustin Bogner } 3485ec8fe19SBob Wilson void VisitObjCMethodDecl(const ObjCMethodDecl *S) { 3495ec8fe19SBob Wilson (*CounterMap)[S->getBody()] = NextCounter++; 3505ec8fe19SBob Wilson Visit(S->getBody()); 3515ec8fe19SBob Wilson } 352c845c00aSBob Wilson void VisitBlockDecl(const BlockDecl *S) { 353c845c00aSBob Wilson (*CounterMap)[S->getBody()] = NextCounter++; 354c845c00aSBob Wilson Visit(S->getBody()); 355c845c00aSBob Wilson } 356ea278c32SJustin Bogner /// Assign a counter to track the block following a label. 357ef512b99SJustin Bogner void VisitLabelStmt(const LabelStmt *S) { 358ef512b99SJustin Bogner (*CounterMap)[S] = NextCounter++; 359ef512b99SJustin Bogner Visit(S->getSubStmt()); 360ef512b99SJustin Bogner } 361bf854f0fSBob Wilson /// Assign a counter for the body of a while loop. 362ef512b99SJustin Bogner void VisitWhileStmt(const WhileStmt *S) { 363bf854f0fSBob Wilson (*CounterMap)[S] = NextCounter++; 364ef512b99SJustin Bogner Visit(S->getCond()); 365ef512b99SJustin Bogner Visit(S->getBody()); 366ef512b99SJustin Bogner } 367bf854f0fSBob Wilson /// Assign a counter for the body of a do-while loop. 368ef512b99SJustin Bogner void VisitDoStmt(const DoStmt *S) { 369bf854f0fSBob Wilson (*CounterMap)[S] = NextCounter++; 370ef512b99SJustin Bogner Visit(S->getBody()); 371ef512b99SJustin Bogner Visit(S->getCond()); 372ef512b99SJustin Bogner } 373bf854f0fSBob Wilson /// Assign a counter for the body of a for loop. 374ef512b99SJustin Bogner void VisitForStmt(const ForStmt *S) { 375bf854f0fSBob Wilson (*CounterMap)[S] = NextCounter++; 376bf854f0fSBob Wilson if (S->getInit()) 377bf854f0fSBob Wilson Visit(S->getInit()); 378ef512b99SJustin Bogner const Expr *E; 379ef512b99SJustin Bogner if ((E = S->getCond())) 380ef512b99SJustin Bogner Visit(E); 381ef512b99SJustin Bogner if ((E = S->getInc())) 382ef512b99SJustin Bogner Visit(E); 383bf854f0fSBob Wilson Visit(S->getBody()); 384ef512b99SJustin Bogner } 385bf854f0fSBob Wilson /// Assign a counter for the body of a for-range loop. 386ef512b99SJustin Bogner void VisitCXXForRangeStmt(const CXXForRangeStmt *S) { 387bf854f0fSBob Wilson (*CounterMap)[S] = NextCounter++; 388bf854f0fSBob Wilson Visit(S->getRangeStmt()); 389bf854f0fSBob Wilson Visit(S->getBeginEndStmt()); 390bf854f0fSBob Wilson Visit(S->getCond()); 391bf854f0fSBob Wilson Visit(S->getLoopVarStmt()); 392ef512b99SJustin Bogner Visit(S->getBody()); 393bf854f0fSBob Wilson Visit(S->getInc()); 394ef512b99SJustin Bogner } 395bf854f0fSBob Wilson /// Assign a counter for the body of a for-collection loop. 396ef512b99SJustin Bogner void VisitObjCForCollectionStmt(const ObjCForCollectionStmt *S) { 397bf854f0fSBob Wilson (*CounterMap)[S] = NextCounter++; 398ef512b99SJustin Bogner Visit(S->getElement()); 399ef512b99SJustin Bogner Visit(S->getBody()); 400ef512b99SJustin Bogner } 401ef512b99SJustin Bogner /// Assign a counter for the exit block of the switch statement. 402ef512b99SJustin Bogner void VisitSwitchStmt(const SwitchStmt *S) { 403ef512b99SJustin Bogner (*CounterMap)[S] = NextCounter++; 404ef512b99SJustin Bogner Visit(S->getCond()); 405ef512b99SJustin Bogner Visit(S->getBody()); 406ef512b99SJustin Bogner } 407ef512b99SJustin Bogner /// Assign a counter for a particular case in a switch. This counts jumps 408ef512b99SJustin Bogner /// from the switch header as well as fallthrough from the case before this 409ef512b99SJustin Bogner /// one. 410ef512b99SJustin Bogner void VisitCaseStmt(const CaseStmt *S) { 411ef512b99SJustin Bogner (*CounterMap)[S] = NextCounter++; 412ef512b99SJustin Bogner Visit(S->getSubStmt()); 413ef512b99SJustin Bogner } 414ef512b99SJustin Bogner /// Assign a counter for the default case of a switch statement. The count 415ef512b99SJustin Bogner /// is the number of branches from the loop header to the default, and does 416ef512b99SJustin Bogner /// not include fallthrough from previous cases. If we have multiple 417ef512b99SJustin Bogner /// conditional branch blocks from the switch instruction to the default 418ef512b99SJustin Bogner /// block, as with large GNU case ranges, this is the counter for the last 419ef512b99SJustin Bogner /// edge in that series, rather than the first. 420ef512b99SJustin Bogner void VisitDefaultStmt(const DefaultStmt *S) { 421ef512b99SJustin Bogner (*CounterMap)[S] = NextCounter++; 422ef512b99SJustin Bogner Visit(S->getSubStmt()); 423ef512b99SJustin Bogner } 424ef512b99SJustin Bogner /// Assign a counter for the "then" part of an if statement. The count for 425ef512b99SJustin Bogner /// the "else" part, if it exists, will be calculated from this counter. 426ef512b99SJustin Bogner void VisitIfStmt(const IfStmt *S) { 427ef512b99SJustin Bogner (*CounterMap)[S] = NextCounter++; 428ef512b99SJustin Bogner Visit(S->getCond()); 429ef512b99SJustin Bogner Visit(S->getThen()); 430ef512b99SJustin Bogner if (S->getElse()) 431ef512b99SJustin Bogner Visit(S->getElse()); 432ef512b99SJustin Bogner } 433ef512b99SJustin Bogner /// Assign a counter for the continuation block of a C++ try statement. 434ef512b99SJustin Bogner void VisitCXXTryStmt(const CXXTryStmt *S) { 435ef512b99SJustin Bogner (*CounterMap)[S] = NextCounter++; 436ef512b99SJustin Bogner Visit(S->getTryBlock()); 437ef512b99SJustin Bogner for (unsigned I = 0, E = S->getNumHandlers(); I < E; ++I) 438ef512b99SJustin Bogner Visit(S->getHandler(I)); 439ef512b99SJustin Bogner } 440ef512b99SJustin Bogner /// Assign a counter for a catch statement's handler block. 441ef512b99SJustin Bogner void VisitCXXCatchStmt(const CXXCatchStmt *S) { 442ef512b99SJustin Bogner (*CounterMap)[S] = NextCounter++; 443ef512b99SJustin Bogner Visit(S->getHandlerBlock()); 444ef512b99SJustin Bogner } 445ef512b99SJustin Bogner /// Assign a counter for the "true" part of a conditional operator. The 446ef512b99SJustin Bogner /// count in the "false" part will be calculated from this counter. 447ef512b99SJustin Bogner void VisitConditionalOperator(const ConditionalOperator *E) { 448ef512b99SJustin Bogner (*CounterMap)[E] = NextCounter++; 449ef512b99SJustin Bogner Visit(E->getCond()); 450ef512b99SJustin Bogner Visit(E->getTrueExpr()); 451ef512b99SJustin Bogner Visit(E->getFalseExpr()); 452ef512b99SJustin Bogner } 453ef512b99SJustin Bogner /// Assign a counter for the right hand side of a logical and operator. 454ef512b99SJustin Bogner void VisitBinLAnd(const BinaryOperator *E) { 455ef512b99SJustin Bogner (*CounterMap)[E] = NextCounter++; 456ef512b99SJustin Bogner Visit(E->getLHS()); 457ef512b99SJustin Bogner Visit(E->getRHS()); 458ef512b99SJustin Bogner } 459ef512b99SJustin Bogner /// Assign a counter for the right hand side of a logical or operator. 460ef512b99SJustin Bogner void VisitBinLOr(const BinaryOperator *E) { 461ef512b99SJustin Bogner (*CounterMap)[E] = NextCounter++; 462ef512b99SJustin Bogner Visit(E->getLHS()); 463ef512b99SJustin Bogner Visit(E->getRHS()); 464ef512b99SJustin Bogner } 465ef512b99SJustin Bogner }; 466bf854f0fSBob Wilson 467bf854f0fSBob Wilson /// A StmtVisitor that propagates the raw counts through the AST and 468bf854f0fSBob Wilson /// records the count at statements where the value may change. 469bf854f0fSBob Wilson struct ComputeRegionCounts : public ConstStmtVisitor<ComputeRegionCounts> { 470bf854f0fSBob Wilson /// PGO state. 471bf854f0fSBob Wilson CodeGenPGO &PGO; 472bf854f0fSBob Wilson 473bf854f0fSBob Wilson /// A flag that is set when the current count should be recorded on the 474bf854f0fSBob Wilson /// next statement, such as at the exit of a loop. 475bf854f0fSBob Wilson bool RecordNextStmtCount; 476bf854f0fSBob Wilson 477bf854f0fSBob Wilson /// The map of statements to count values. 478bf854f0fSBob Wilson llvm::DenseMap<const Stmt*, uint64_t> *CountMap; 479bf854f0fSBob Wilson 480bf854f0fSBob Wilson /// BreakContinueStack - Keep counts of breaks and continues inside loops. 481bf854f0fSBob Wilson struct BreakContinue { 482bf854f0fSBob Wilson uint64_t BreakCount; 483bf854f0fSBob Wilson uint64_t ContinueCount; 484bf854f0fSBob Wilson BreakContinue() : BreakCount(0), ContinueCount(0) {} 485bf854f0fSBob Wilson }; 486bf854f0fSBob Wilson SmallVector<BreakContinue, 8> BreakContinueStack; 487bf854f0fSBob Wilson 488bf854f0fSBob Wilson ComputeRegionCounts(llvm::DenseMap<const Stmt*, uint64_t> *CountMap, 489bf854f0fSBob Wilson CodeGenPGO &PGO) : 490bf854f0fSBob Wilson PGO(PGO), RecordNextStmtCount(false), CountMap(CountMap) { 491bf854f0fSBob Wilson } 492bf854f0fSBob Wilson 493bf854f0fSBob Wilson void RecordStmtCount(const Stmt *S) { 494bf854f0fSBob Wilson if (RecordNextStmtCount) { 495bf854f0fSBob Wilson (*CountMap)[S] = PGO.getCurrentRegionCount(); 496bf854f0fSBob Wilson RecordNextStmtCount = false; 497bf854f0fSBob Wilson } 498bf854f0fSBob Wilson } 499bf854f0fSBob Wilson 500bf854f0fSBob Wilson void VisitStmt(const Stmt *S) { 501bf854f0fSBob Wilson RecordStmtCount(S); 502bf854f0fSBob Wilson for (Stmt::const_child_range I = S->children(); I; ++I) { 503bf854f0fSBob Wilson if (*I) 504bf854f0fSBob Wilson this->Visit(*I); 505bf854f0fSBob Wilson } 506bf854f0fSBob Wilson } 507bf854f0fSBob Wilson 508bf854f0fSBob Wilson void VisitFunctionDecl(const FunctionDecl *S) { 509bf854f0fSBob Wilson RegionCounter Cnt(PGO, S->getBody()); 510bf854f0fSBob Wilson Cnt.beginRegion(); 511bf854f0fSBob Wilson (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount(); 512bf854f0fSBob Wilson Visit(S->getBody()); 513bf854f0fSBob Wilson } 514bf854f0fSBob Wilson 5155ec8fe19SBob Wilson void VisitObjCMethodDecl(const ObjCMethodDecl *S) { 5165ec8fe19SBob Wilson RegionCounter Cnt(PGO, S->getBody()); 5175ec8fe19SBob Wilson Cnt.beginRegion(); 5185ec8fe19SBob Wilson (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount(); 5195ec8fe19SBob Wilson Visit(S->getBody()); 5205ec8fe19SBob Wilson } 5215ec8fe19SBob Wilson 522c845c00aSBob Wilson void VisitBlockDecl(const BlockDecl *S) { 523c845c00aSBob Wilson RegionCounter Cnt(PGO, S->getBody()); 524c845c00aSBob Wilson Cnt.beginRegion(); 525c845c00aSBob Wilson (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount(); 526c845c00aSBob Wilson Visit(S->getBody()); 527c845c00aSBob Wilson } 528c845c00aSBob Wilson 529bf854f0fSBob Wilson void VisitReturnStmt(const ReturnStmt *S) { 530bf854f0fSBob Wilson RecordStmtCount(S); 531bf854f0fSBob Wilson if (S->getRetValue()) 532bf854f0fSBob Wilson Visit(S->getRetValue()); 533bf854f0fSBob Wilson PGO.setCurrentRegionUnreachable(); 534bf854f0fSBob Wilson RecordNextStmtCount = true; 535bf854f0fSBob Wilson } 536bf854f0fSBob Wilson 537bf854f0fSBob Wilson void VisitGotoStmt(const GotoStmt *S) { 538bf854f0fSBob Wilson RecordStmtCount(S); 539bf854f0fSBob Wilson PGO.setCurrentRegionUnreachable(); 540bf854f0fSBob Wilson RecordNextStmtCount = true; 541bf854f0fSBob Wilson } 542bf854f0fSBob Wilson 543bf854f0fSBob Wilson void VisitLabelStmt(const LabelStmt *S) { 544bf854f0fSBob Wilson RecordNextStmtCount = false; 545bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 546bf854f0fSBob Wilson Cnt.beginRegion(); 547bf854f0fSBob Wilson (*CountMap)[S] = PGO.getCurrentRegionCount(); 548bf854f0fSBob Wilson Visit(S->getSubStmt()); 549bf854f0fSBob Wilson } 550bf854f0fSBob Wilson 551bf854f0fSBob Wilson void VisitBreakStmt(const BreakStmt *S) { 552bf854f0fSBob Wilson RecordStmtCount(S); 553bf854f0fSBob Wilson assert(!BreakContinueStack.empty() && "break not in a loop or switch!"); 554bf854f0fSBob Wilson BreakContinueStack.back().BreakCount += PGO.getCurrentRegionCount(); 555bf854f0fSBob Wilson PGO.setCurrentRegionUnreachable(); 556bf854f0fSBob Wilson RecordNextStmtCount = true; 557bf854f0fSBob Wilson } 558bf854f0fSBob Wilson 559bf854f0fSBob Wilson void VisitContinueStmt(const ContinueStmt *S) { 560bf854f0fSBob Wilson RecordStmtCount(S); 561bf854f0fSBob Wilson assert(!BreakContinueStack.empty() && "continue stmt not in a loop!"); 562bf854f0fSBob Wilson BreakContinueStack.back().ContinueCount += PGO.getCurrentRegionCount(); 563bf854f0fSBob Wilson PGO.setCurrentRegionUnreachable(); 564bf854f0fSBob Wilson RecordNextStmtCount = true; 565bf854f0fSBob Wilson } 566bf854f0fSBob Wilson 567bf854f0fSBob Wilson void VisitWhileStmt(const WhileStmt *S) { 568bf854f0fSBob Wilson RecordStmtCount(S); 569bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 570bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 571bf854f0fSBob Wilson // Visit the body region first so the break/continue adjustments can be 572bf854f0fSBob Wilson // included when visiting the condition. 573bf854f0fSBob Wilson Cnt.beginRegion(); 574bf854f0fSBob Wilson (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount(); 575bf854f0fSBob Wilson Visit(S->getBody()); 576bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 577bf854f0fSBob Wilson 578bf854f0fSBob Wilson // ...then go back and propagate counts through the condition. The count 579bf854f0fSBob Wilson // at the start of the condition is the sum of the incoming edges, 580bf854f0fSBob Wilson // the backedge from the end of the loop body, and the edges from 581bf854f0fSBob Wilson // continue statements. 582bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 583bf854f0fSBob Wilson Cnt.setCurrentRegionCount(Cnt.getParentCount() + 584bf854f0fSBob Wilson Cnt.getAdjustedCount() + BC.ContinueCount); 585bf854f0fSBob Wilson (*CountMap)[S->getCond()] = PGO.getCurrentRegionCount(); 586bf854f0fSBob Wilson Visit(S->getCond()); 587bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 588bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount); 589bf854f0fSBob Wilson RecordNextStmtCount = true; 590bf854f0fSBob Wilson } 591bf854f0fSBob Wilson 592bf854f0fSBob Wilson void VisitDoStmt(const DoStmt *S) { 593bf854f0fSBob Wilson RecordStmtCount(S); 594bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 595bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 596bf854f0fSBob Wilson Cnt.beginRegion(/*AddIncomingFallThrough=*/true); 597bf854f0fSBob Wilson (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount(); 598bf854f0fSBob Wilson Visit(S->getBody()); 599bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 600bf854f0fSBob Wilson 601bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 602bf854f0fSBob Wilson // The count at the start of the condition is equal to the count at the 603bf854f0fSBob Wilson // end of the body. The adjusted count does not include either the 604bf854f0fSBob Wilson // fall-through count coming into the loop or the continue count, so add 605bf854f0fSBob Wilson // both of those separately. This is coincidentally the same equation as 606bf854f0fSBob Wilson // with while loops but for different reasons. 607bf854f0fSBob Wilson Cnt.setCurrentRegionCount(Cnt.getParentCount() + 608bf854f0fSBob Wilson Cnt.getAdjustedCount() + BC.ContinueCount); 609bf854f0fSBob Wilson (*CountMap)[S->getCond()] = PGO.getCurrentRegionCount(); 610bf854f0fSBob Wilson Visit(S->getCond()); 611bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 612bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount); 613bf854f0fSBob Wilson RecordNextStmtCount = true; 614bf854f0fSBob Wilson } 615bf854f0fSBob Wilson 616bf854f0fSBob Wilson void VisitForStmt(const ForStmt *S) { 617bf854f0fSBob Wilson RecordStmtCount(S); 618bf854f0fSBob Wilson if (S->getInit()) 619bf854f0fSBob Wilson Visit(S->getInit()); 620bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 621bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 622bf854f0fSBob Wilson // Visit the body region first. (This is basically the same as a while 623bf854f0fSBob Wilson // loop; see further comments in VisitWhileStmt.) 624bf854f0fSBob Wilson Cnt.beginRegion(); 625bf854f0fSBob Wilson (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount(); 626bf854f0fSBob Wilson Visit(S->getBody()); 627bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 628bf854f0fSBob Wilson 629bf854f0fSBob Wilson // The increment is essentially part of the body but it needs to include 630bf854f0fSBob Wilson // the count for all the continue statements. 631bf854f0fSBob Wilson if (S->getInc()) { 632bf854f0fSBob Wilson Cnt.setCurrentRegionCount(PGO.getCurrentRegionCount() + 633bf854f0fSBob Wilson BreakContinueStack.back().ContinueCount); 634bf854f0fSBob Wilson (*CountMap)[S->getInc()] = PGO.getCurrentRegionCount(); 635bf854f0fSBob Wilson Visit(S->getInc()); 636bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 637bf854f0fSBob Wilson } 638bf854f0fSBob Wilson 639bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 640bf854f0fSBob Wilson 641bf854f0fSBob Wilson // ...then go back and propagate counts through the condition. 642bf854f0fSBob Wilson if (S->getCond()) { 643bf854f0fSBob Wilson Cnt.setCurrentRegionCount(Cnt.getParentCount() + 644bf854f0fSBob Wilson Cnt.getAdjustedCount() + 645bf854f0fSBob Wilson BC.ContinueCount); 646bf854f0fSBob Wilson (*CountMap)[S->getCond()] = PGO.getCurrentRegionCount(); 647bf854f0fSBob Wilson Visit(S->getCond()); 648bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 649bf854f0fSBob Wilson } 650bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount); 651bf854f0fSBob Wilson RecordNextStmtCount = true; 652bf854f0fSBob Wilson } 653bf854f0fSBob Wilson 654bf854f0fSBob Wilson void VisitCXXForRangeStmt(const CXXForRangeStmt *S) { 655bf854f0fSBob Wilson RecordStmtCount(S); 656bf854f0fSBob Wilson Visit(S->getRangeStmt()); 657bf854f0fSBob Wilson Visit(S->getBeginEndStmt()); 658bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 659bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 660bf854f0fSBob Wilson // Visit the body region first. (This is basically the same as a while 661bf854f0fSBob Wilson // loop; see further comments in VisitWhileStmt.) 662bf854f0fSBob Wilson Cnt.beginRegion(); 663bf854f0fSBob Wilson (*CountMap)[S->getLoopVarStmt()] = PGO.getCurrentRegionCount(); 664bf854f0fSBob Wilson Visit(S->getLoopVarStmt()); 665bf854f0fSBob Wilson Visit(S->getBody()); 666bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 667bf854f0fSBob Wilson 668bf854f0fSBob Wilson // The increment is essentially part of the body but it needs to include 669bf854f0fSBob Wilson // the count for all the continue statements. 670bf854f0fSBob Wilson Cnt.setCurrentRegionCount(PGO.getCurrentRegionCount() + 671bf854f0fSBob Wilson BreakContinueStack.back().ContinueCount); 672bf854f0fSBob Wilson (*CountMap)[S->getInc()] = PGO.getCurrentRegionCount(); 673bf854f0fSBob Wilson Visit(S->getInc()); 674bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 675bf854f0fSBob Wilson 676bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 677bf854f0fSBob Wilson 678bf854f0fSBob Wilson // ...then go back and propagate counts through the condition. 679bf854f0fSBob Wilson Cnt.setCurrentRegionCount(Cnt.getParentCount() + 680bf854f0fSBob Wilson Cnt.getAdjustedCount() + 681bf854f0fSBob Wilson BC.ContinueCount); 682bf854f0fSBob Wilson (*CountMap)[S->getCond()] = PGO.getCurrentRegionCount(); 683bf854f0fSBob Wilson Visit(S->getCond()); 684bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 685bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount); 686bf854f0fSBob Wilson RecordNextStmtCount = true; 687bf854f0fSBob Wilson } 688bf854f0fSBob Wilson 689bf854f0fSBob Wilson void VisitObjCForCollectionStmt(const ObjCForCollectionStmt *S) { 690bf854f0fSBob Wilson RecordStmtCount(S); 691bf854f0fSBob Wilson Visit(S->getElement()); 692bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 693bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 694bf854f0fSBob Wilson Cnt.beginRegion(); 695bf854f0fSBob Wilson (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount(); 696bf854f0fSBob Wilson Visit(S->getBody()); 697bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 698bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 699bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount); 700bf854f0fSBob Wilson RecordNextStmtCount = true; 701bf854f0fSBob Wilson } 702bf854f0fSBob Wilson 703bf854f0fSBob Wilson void VisitSwitchStmt(const SwitchStmt *S) { 704bf854f0fSBob Wilson RecordStmtCount(S); 705bf854f0fSBob Wilson Visit(S->getCond()); 706bf854f0fSBob Wilson PGO.setCurrentRegionUnreachable(); 707bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 708bf854f0fSBob Wilson Visit(S->getBody()); 709bf854f0fSBob Wilson // If the switch is inside a loop, add the continue counts. 710bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 711bf854f0fSBob Wilson if (!BreakContinueStack.empty()) 712bf854f0fSBob Wilson BreakContinueStack.back().ContinueCount += BC.ContinueCount; 713bf854f0fSBob Wilson RegionCounter ExitCnt(PGO, S); 714bf854f0fSBob Wilson ExitCnt.beginRegion(); 715bf854f0fSBob Wilson RecordNextStmtCount = true; 716bf854f0fSBob Wilson } 717bf854f0fSBob Wilson 718bf854f0fSBob Wilson void VisitCaseStmt(const CaseStmt *S) { 719bf854f0fSBob Wilson RecordNextStmtCount = false; 720bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 721bf854f0fSBob Wilson Cnt.beginRegion(/*AddIncomingFallThrough=*/true); 722bf854f0fSBob Wilson (*CountMap)[S] = Cnt.getCount(); 723bf854f0fSBob Wilson RecordNextStmtCount = true; 724bf854f0fSBob Wilson Visit(S->getSubStmt()); 725bf854f0fSBob Wilson } 726bf854f0fSBob Wilson 727bf854f0fSBob Wilson void VisitDefaultStmt(const DefaultStmt *S) { 728bf854f0fSBob Wilson RecordNextStmtCount = false; 729bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 730bf854f0fSBob Wilson Cnt.beginRegion(/*AddIncomingFallThrough=*/true); 731bf854f0fSBob Wilson (*CountMap)[S] = Cnt.getCount(); 732bf854f0fSBob Wilson RecordNextStmtCount = true; 733bf854f0fSBob Wilson Visit(S->getSubStmt()); 734bf854f0fSBob Wilson } 735bf854f0fSBob Wilson 736bf854f0fSBob Wilson void VisitIfStmt(const IfStmt *S) { 737bf854f0fSBob Wilson RecordStmtCount(S); 738bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 739bf854f0fSBob Wilson Visit(S->getCond()); 740bf854f0fSBob Wilson 741bf854f0fSBob Wilson Cnt.beginRegion(); 742bf854f0fSBob Wilson (*CountMap)[S->getThen()] = PGO.getCurrentRegionCount(); 743bf854f0fSBob Wilson Visit(S->getThen()); 744bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 745bf854f0fSBob Wilson 746bf854f0fSBob Wilson if (S->getElse()) { 747bf854f0fSBob Wilson Cnt.beginElseRegion(); 748bf854f0fSBob Wilson (*CountMap)[S->getElse()] = PGO.getCurrentRegionCount(); 749bf854f0fSBob Wilson Visit(S->getElse()); 750bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 751bf854f0fSBob Wilson } 752bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(0); 753bf854f0fSBob Wilson RecordNextStmtCount = true; 754bf854f0fSBob Wilson } 755bf854f0fSBob Wilson 756bf854f0fSBob Wilson void VisitCXXTryStmt(const CXXTryStmt *S) { 757bf854f0fSBob Wilson RecordStmtCount(S); 758bf854f0fSBob Wilson Visit(S->getTryBlock()); 759bf854f0fSBob Wilson for (unsigned I = 0, E = S->getNumHandlers(); I < E; ++I) 760bf854f0fSBob Wilson Visit(S->getHandler(I)); 761bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 762bf854f0fSBob Wilson Cnt.beginRegion(); 763bf854f0fSBob Wilson RecordNextStmtCount = true; 764bf854f0fSBob Wilson } 765bf854f0fSBob Wilson 766bf854f0fSBob Wilson void VisitCXXCatchStmt(const CXXCatchStmt *S) { 767bf854f0fSBob Wilson RecordNextStmtCount = false; 768bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 769bf854f0fSBob Wilson Cnt.beginRegion(); 770bf854f0fSBob Wilson (*CountMap)[S] = PGO.getCurrentRegionCount(); 771bf854f0fSBob Wilson Visit(S->getHandlerBlock()); 772bf854f0fSBob Wilson } 773bf854f0fSBob Wilson 774bf854f0fSBob Wilson void VisitConditionalOperator(const ConditionalOperator *E) { 775bf854f0fSBob Wilson RecordStmtCount(E); 776bf854f0fSBob Wilson RegionCounter Cnt(PGO, E); 777bf854f0fSBob Wilson Visit(E->getCond()); 778bf854f0fSBob Wilson 779bf854f0fSBob Wilson Cnt.beginRegion(); 780bf854f0fSBob Wilson (*CountMap)[E->getTrueExpr()] = PGO.getCurrentRegionCount(); 781bf854f0fSBob Wilson Visit(E->getTrueExpr()); 782bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 783bf854f0fSBob Wilson 784bf854f0fSBob Wilson Cnt.beginElseRegion(); 785bf854f0fSBob Wilson (*CountMap)[E->getFalseExpr()] = PGO.getCurrentRegionCount(); 786bf854f0fSBob Wilson Visit(E->getFalseExpr()); 787bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 788bf854f0fSBob Wilson 789bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(0); 790bf854f0fSBob Wilson RecordNextStmtCount = true; 791bf854f0fSBob Wilson } 792bf854f0fSBob Wilson 793bf854f0fSBob Wilson void VisitBinLAnd(const BinaryOperator *E) { 794bf854f0fSBob Wilson RecordStmtCount(E); 795bf854f0fSBob Wilson RegionCounter Cnt(PGO, E); 796bf854f0fSBob Wilson Visit(E->getLHS()); 797bf854f0fSBob Wilson Cnt.beginRegion(); 798bf854f0fSBob Wilson (*CountMap)[E->getRHS()] = PGO.getCurrentRegionCount(); 799bf854f0fSBob Wilson Visit(E->getRHS()); 800bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 801bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(0); 802bf854f0fSBob Wilson RecordNextStmtCount = true; 803bf854f0fSBob Wilson } 804bf854f0fSBob Wilson 805bf854f0fSBob Wilson void VisitBinLOr(const BinaryOperator *E) { 806bf854f0fSBob Wilson RecordStmtCount(E); 807bf854f0fSBob Wilson RegionCounter Cnt(PGO, E); 808bf854f0fSBob Wilson Visit(E->getLHS()); 809bf854f0fSBob Wilson Cnt.beginRegion(); 810bf854f0fSBob Wilson (*CountMap)[E->getRHS()] = PGO.getCurrentRegionCount(); 811bf854f0fSBob Wilson Visit(E->getRHS()); 812bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 813bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(0); 814bf854f0fSBob Wilson RecordNextStmtCount = true; 815bf854f0fSBob Wilson } 816bf854f0fSBob Wilson }; 817ef512b99SJustin Bogner } 818ef512b99SJustin Bogner 819da1ebedeSBob Wilson void CodeGenPGO::assignRegionCounters(const Decl *D, llvm::Function *Fn) { 820ef512b99SJustin Bogner bool InstrumentRegions = CGM.getCodeGenOpts().ProfileInstrGenerate; 821d66a17d0SJustin Bogner PGOProfileData *PGOData = CGM.getPGOData(); 822d66a17d0SJustin Bogner if (!InstrumentRegions && !PGOData) 823ef512b99SJustin Bogner return; 824ef512b99SJustin Bogner if (!D) 825ef512b99SJustin Bogner return; 826da1ebedeSBob Wilson setFuncName(Fn); 8272fe531cbSDuncan P. N. Exon Smith FuncLinkage = Fn->getLinkage(); 828ef512b99SJustin Bogner mapRegionCounters(D); 829ef512b99SJustin Bogner if (InstrumentRegions) 830ef512b99SJustin Bogner emitCounterVariables(); 831d66a17d0SJustin Bogner if (PGOData) { 832d66a17d0SJustin Bogner loadRegionCounts(PGOData); 833bf854f0fSBob Wilson computeRegionCounts(D); 834d66a17d0SJustin Bogner applyFunctionAttributes(PGOData, Fn); 835bf854f0fSBob Wilson } 836ef512b99SJustin Bogner } 837ef512b99SJustin Bogner 838ef512b99SJustin Bogner void CodeGenPGO::mapRegionCounters(const Decl *D) { 839ef512b99SJustin Bogner RegionCounterMap = new llvm::DenseMap<const Stmt*, unsigned>(); 840ef512b99SJustin Bogner MapRegionCounters Walker(RegionCounterMap); 841ef512b99SJustin Bogner if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(D)) 842ef512b99SJustin Bogner Walker.VisitFunctionDecl(FD); 8435ec8fe19SBob Wilson else if (const ObjCMethodDecl *MD = dyn_cast_or_null<ObjCMethodDecl>(D)) 8445ec8fe19SBob Wilson Walker.VisitObjCMethodDecl(MD); 845c845c00aSBob Wilson else if (const BlockDecl *BD = dyn_cast_or_null<BlockDecl>(D)) 846c845c00aSBob Wilson Walker.VisitBlockDecl(BD); 847ef512b99SJustin Bogner NumRegionCounters = Walker.NextCounter; 848b4416f58SJustin Bogner // FIXME: The number of counters isn't sufficient for the hash 849b4416f58SJustin Bogner FunctionHash = NumRegionCounters; 850ef512b99SJustin Bogner } 851ef512b99SJustin Bogner 852bf854f0fSBob Wilson void CodeGenPGO::computeRegionCounts(const Decl *D) { 853bf854f0fSBob Wilson StmtCountMap = new llvm::DenseMap<const Stmt*, uint64_t>(); 854bf854f0fSBob Wilson ComputeRegionCounts Walker(StmtCountMap, *this); 855bf854f0fSBob Wilson if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(D)) 856bf854f0fSBob Wilson Walker.VisitFunctionDecl(FD); 8575ec8fe19SBob Wilson else if (const ObjCMethodDecl *MD = dyn_cast_or_null<ObjCMethodDecl>(D)) 8585ec8fe19SBob Wilson Walker.VisitObjCMethodDecl(MD); 859c845c00aSBob Wilson else if (const BlockDecl *BD = dyn_cast_or_null<BlockDecl>(D)) 860c845c00aSBob Wilson Walker.VisitBlockDecl(BD); 861bf854f0fSBob Wilson } 862bf854f0fSBob Wilson 863d66a17d0SJustin Bogner void CodeGenPGO::applyFunctionAttributes(PGOProfileData *PGOData, 8644c9c45c0SJustin Bogner llvm::Function *Fn) { 8654c9c45c0SJustin Bogner if (!haveRegionCounts()) 8664c9c45c0SJustin Bogner return; 8674c9c45c0SJustin Bogner 868d66a17d0SJustin Bogner uint64_t MaxFunctionCount = PGOData->getMaximumFunctionCount(); 8694c9c45c0SJustin Bogner uint64_t FunctionCount = getRegionCount(0); 8704c9c45c0SJustin Bogner if (FunctionCount >= (uint64_t)(0.3 * (double)MaxFunctionCount)) 8714c9c45c0SJustin Bogner // Turn on InlineHint attribute for hot functions. 8724c9c45c0SJustin Bogner // FIXME: 30% is from preliminary tuning on SPEC, it may not be optimal. 8734c9c45c0SJustin Bogner Fn->addFnAttr(llvm::Attribute::InlineHint); 8744c9c45c0SJustin Bogner else if (FunctionCount <= (uint64_t)(0.01 * (double)MaxFunctionCount)) 8754c9c45c0SJustin Bogner // Turn on Cold attribute for cold functions. 8764c9c45c0SJustin Bogner // FIXME: 1% is from preliminary tuning on SPEC, it may not be optimal. 8774c9c45c0SJustin Bogner Fn->addFnAttr(llvm::Attribute::Cold); 8784c9c45c0SJustin Bogner } 8794c9c45c0SJustin Bogner 880ef512b99SJustin Bogner void CodeGenPGO::emitCounterVariables() { 881ef512b99SJustin Bogner llvm::LLVMContext &Ctx = CGM.getLLVMContext(); 882ef512b99SJustin Bogner llvm::ArrayType *CounterTy = llvm::ArrayType::get(llvm::Type::getInt64Ty(Ctx), 883ef512b99SJustin Bogner NumRegionCounters); 884ef512b99SJustin Bogner RegionCounters = 8852fe531cbSDuncan P. N. Exon Smith new llvm::GlobalVariable(CGM.getModule(), CounterTy, false, FuncLinkage, 886ef512b99SJustin Bogner llvm::Constant::getNullValue(CounterTy), 8872fe531cbSDuncan P. N. Exon Smith getFuncVarName("counters")); 8882fe531cbSDuncan P. N. Exon Smith RegionCounters->setAlignment(8); 8892fe531cbSDuncan P. N. Exon Smith RegionCounters->setSection(getCountersSection(CGM)); 890ef512b99SJustin Bogner } 891ef512b99SJustin Bogner 892ef512b99SJustin Bogner void CodeGenPGO::emitCounterIncrement(CGBuilderTy &Builder, unsigned Counter) { 893749ebc7fSBob Wilson if (!RegionCounters) 894ef512b99SJustin Bogner return; 895ef512b99SJustin Bogner llvm::Value *Addr = 896ef512b99SJustin Bogner Builder.CreateConstInBoundsGEP2_64(RegionCounters, 0, Counter); 897ef512b99SJustin Bogner llvm::Value *Count = Builder.CreateLoad(Addr, "pgocount"); 898ef512b99SJustin Bogner Count = Builder.CreateAdd(Count, Builder.getInt64(1)); 899ef512b99SJustin Bogner Builder.CreateStore(Count, Addr); 900ef512b99SJustin Bogner } 901ef512b99SJustin Bogner 902d66a17d0SJustin Bogner void CodeGenPGO::loadRegionCounts(PGOProfileData *PGOData) { 903ef512b99SJustin Bogner // For now, ignore the counts from the PGO data file only if the number of 904ef512b99SJustin Bogner // counters does not match. This could be tightened down in the future to 905ef512b99SJustin Bogner // ignore counts when the input changes in various ways, e.g., by comparing a 906ef512b99SJustin Bogner // hash value based on some characteristics of the input. 907ef512b99SJustin Bogner RegionCounts = new std::vector<uint64_t>(); 908b4416f58SJustin Bogner uint64_t Hash; 909b4416f58SJustin Bogner if (PGOData->getFunctionCounts(getFuncName(), Hash, *RegionCounts) || 910b4416f58SJustin Bogner Hash != FunctionHash || RegionCounts->size() != NumRegionCounters) { 911ef512b99SJustin Bogner delete RegionCounts; 912ef512b99SJustin Bogner RegionCounts = 0; 913ef512b99SJustin Bogner } 914ef512b99SJustin Bogner } 915ef512b99SJustin Bogner 916ef512b99SJustin Bogner void CodeGenPGO::destroyRegionCounters() { 917ef512b99SJustin Bogner if (RegionCounterMap != 0) 918ef512b99SJustin Bogner delete RegionCounterMap; 919bf854f0fSBob Wilson if (StmtCountMap != 0) 920bf854f0fSBob Wilson delete StmtCountMap; 921ef512b99SJustin Bogner if (RegionCounts != 0) 922ef512b99SJustin Bogner delete RegionCounts; 923ef512b99SJustin Bogner } 924ef512b99SJustin Bogner 92538402dc9SDuncan P. N. Exon Smith /// \brief Calculate what to divide by to scale weights. 92638402dc9SDuncan P. N. Exon Smith /// 92738402dc9SDuncan P. N. Exon Smith /// Given the maximum weight, calculate a divisor that will scale all the 92838402dc9SDuncan P. N. Exon Smith /// weights to strictly less than UINT32_MAX. 92938402dc9SDuncan P. N. Exon Smith static uint64_t calculateWeightScale(uint64_t MaxWeight) { 93038402dc9SDuncan P. N. Exon Smith return MaxWeight < UINT32_MAX ? 1 : MaxWeight / UINT32_MAX + 1; 93138402dc9SDuncan P. N. Exon Smith } 93238402dc9SDuncan P. N. Exon Smith 93338402dc9SDuncan P. N. Exon Smith /// \brief Scale an individual branch weight (and add 1). 93438402dc9SDuncan P. N. Exon Smith /// 93538402dc9SDuncan P. N. Exon Smith /// Scale a 64-bit weight down to 32-bits using \c Scale. 93638402dc9SDuncan P. N. Exon Smith /// 93738402dc9SDuncan P. N. Exon Smith /// According to Laplace's Rule of Succession, it is better to compute the 93838402dc9SDuncan P. N. Exon Smith /// weight based on the count plus 1, so universally add 1 to the value. 93938402dc9SDuncan P. N. Exon Smith /// 94038402dc9SDuncan P. N. Exon Smith /// \pre \c Scale was calculated by \a calculateWeightScale() with a weight no 94138402dc9SDuncan P. N. Exon Smith /// greater than \c Weight. 94238402dc9SDuncan P. N. Exon Smith static uint32_t scaleBranchWeight(uint64_t Weight, uint64_t Scale) { 94338402dc9SDuncan P. N. Exon Smith assert(Scale && "scale by 0?"); 94438402dc9SDuncan P. N. Exon Smith uint64_t Scaled = Weight / Scale + 1; 94538402dc9SDuncan P. N. Exon Smith assert(Scaled <= UINT32_MAX && "overflow 32-bits"); 94638402dc9SDuncan P. N. Exon Smith return Scaled; 94738402dc9SDuncan P. N. Exon Smith } 94838402dc9SDuncan P. N. Exon Smith 949ef512b99SJustin Bogner llvm::MDNode *CodeGenPGO::createBranchWeights(uint64_t TrueCount, 950ef512b99SJustin Bogner uint64_t FalseCount) { 95138402dc9SDuncan P. N. Exon Smith // Check for empty weights. 952ef512b99SJustin Bogner if (!TrueCount && !FalseCount) 953a5f804a7SDuncan P. N. Exon Smith return nullptr; 954ef512b99SJustin Bogner 95538402dc9SDuncan P. N. Exon Smith // Calculate how to scale down to 32-bits. 95638402dc9SDuncan P. N. Exon Smith uint64_t Scale = calculateWeightScale(std::max(TrueCount, FalseCount)); 95738402dc9SDuncan P. N. Exon Smith 958ef512b99SJustin Bogner llvm::MDBuilder MDHelper(CGM.getLLVMContext()); 95938402dc9SDuncan P. N. Exon Smith return MDHelper.createBranchWeights(scaleBranchWeight(TrueCount, Scale), 96038402dc9SDuncan P. N. Exon Smith scaleBranchWeight(FalseCount, Scale)); 961ef512b99SJustin Bogner } 962ef512b99SJustin Bogner 96395a27b0eSBob Wilson llvm::MDNode *CodeGenPGO::createBranchWeights(ArrayRef<uint64_t> Weights) { 96438402dc9SDuncan P. N. Exon Smith // We need at least two elements to create meaningful weights. 96538402dc9SDuncan P. N. Exon Smith if (Weights.size() < 2) 966a5f804a7SDuncan P. N. Exon Smith return nullptr; 96738402dc9SDuncan P. N. Exon Smith 96838402dc9SDuncan P. N. Exon Smith // Calculate how to scale down to 32-bits. 96938402dc9SDuncan P. N. Exon Smith uint64_t Scale = calculateWeightScale(*std::max_element(Weights.begin(), 97038402dc9SDuncan P. N. Exon Smith Weights.end())); 97138402dc9SDuncan P. N. Exon Smith 972ef512b99SJustin Bogner SmallVector<uint32_t, 16> ScaledWeights; 973ef512b99SJustin Bogner ScaledWeights.reserve(Weights.size()); 97438402dc9SDuncan P. N. Exon Smith for (uint64_t W : Weights) 97538402dc9SDuncan P. N. Exon Smith ScaledWeights.push_back(scaleBranchWeight(W, Scale)); 97638402dc9SDuncan P. N. Exon Smith 97738402dc9SDuncan P. N. Exon Smith llvm::MDBuilder MDHelper(CGM.getLLVMContext()); 978ef512b99SJustin Bogner return MDHelper.createBranchWeights(ScaledWeights); 979ef512b99SJustin Bogner } 980bf854f0fSBob Wilson 981bf854f0fSBob Wilson llvm::MDNode *CodeGenPGO::createLoopWeights(const Stmt *Cond, 982bf854f0fSBob Wilson RegionCounter &Cnt) { 983bf854f0fSBob Wilson if (!haveRegionCounts()) 984a5f804a7SDuncan P. N. Exon Smith return nullptr; 985bf854f0fSBob Wilson uint64_t LoopCount = Cnt.getCount(); 986bf854f0fSBob Wilson uint64_t CondCount = 0; 987bf854f0fSBob Wilson bool Found = getStmtCount(Cond, CondCount); 988bf854f0fSBob Wilson assert(Found && "missing expected loop condition count"); 989bf854f0fSBob Wilson (void)Found; 990bf854f0fSBob Wilson if (CondCount == 0) 991a5f804a7SDuncan P. N. Exon Smith return nullptr; 992bf854f0fSBob Wilson return createBranchWeights(LoopCount, 993bf854f0fSBob Wilson std::max(CondCount, LoopCount) - LoopCount); 994bf854f0fSBob Wilson } 995