1ef512b99SJustin Bogner //===--- CodeGenPGO.cpp - PGO Instrumentation for LLVM CodeGen --*- C++ -*-===// 2ef512b99SJustin Bogner // 3ef512b99SJustin Bogner // The LLVM Compiler Infrastructure 4ef512b99SJustin Bogner // 5ef512b99SJustin Bogner // This file is distributed under the University of Illinois Open Source 6ef512b99SJustin Bogner // License. See LICENSE.TXT for details. 7ef512b99SJustin Bogner // 8ef512b99SJustin Bogner //===----------------------------------------------------------------------===// 9ef512b99SJustin Bogner // 10ef512b99SJustin Bogner // Instrumentation-based profile-guided optimization 11ef512b99SJustin Bogner // 12ef512b99SJustin Bogner //===----------------------------------------------------------------------===// 13ef512b99SJustin Bogner 14ef512b99SJustin Bogner #include "CodeGenPGO.h" 15ef512b99SJustin Bogner #include "CodeGenFunction.h" 16ef512b99SJustin Bogner #include "clang/AST/RecursiveASTVisitor.h" 17ef512b99SJustin Bogner #include "clang/AST/StmtVisitor.h" 18529f6dd8SJustin Bogner #include "llvm/Config/config.h" // for strtoull()/strtoll() define 19ef512b99SJustin Bogner #include "llvm/IR/MDBuilder.h" 20ef512b99SJustin Bogner #include "llvm/Support/FileSystem.h" 21ef512b99SJustin Bogner 22ef512b99SJustin Bogner using namespace clang; 23ef512b99SJustin Bogner using namespace CodeGen; 24ef512b99SJustin Bogner 25d66a17d0SJustin Bogner static void ReportBadPGOData(CodeGenModule &CGM, const char *Message) { 26d66a17d0SJustin Bogner DiagnosticsEngine &Diags = CGM.getDiags(); 27d66a17d0SJustin Bogner unsigned diagID = Diags.getCustomDiagID(DiagnosticsEngine::Error, "%0"); 28d66a17d0SJustin Bogner Diags.Report(diagID) << Message; 29d66a17d0SJustin Bogner } 30d66a17d0SJustin Bogner 31d66a17d0SJustin Bogner PGOProfileData::PGOProfileData(CodeGenModule &CGM, std::string Path) 32d66a17d0SJustin Bogner : CGM(CGM) { 33d66a17d0SJustin Bogner if (llvm::MemoryBuffer::getFile(Path, DataBuffer)) { 34d66a17d0SJustin Bogner ReportBadPGOData(CGM, "failed to open pgo data file"); 35d66a17d0SJustin Bogner return; 36d66a17d0SJustin Bogner } 37d66a17d0SJustin Bogner 38d66a17d0SJustin Bogner if (DataBuffer->getBufferSize() > std::numeric_limits<unsigned>::max()) { 39d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo data file too big"); 40d66a17d0SJustin Bogner return; 41d66a17d0SJustin Bogner } 42d66a17d0SJustin Bogner 43d66a17d0SJustin Bogner // Scan through the data file and map each function to the corresponding 44d66a17d0SJustin Bogner // file offset where its counts are stored. 45d66a17d0SJustin Bogner const char *BufferStart = DataBuffer->getBufferStart(); 46d66a17d0SJustin Bogner const char *BufferEnd = DataBuffer->getBufferEnd(); 47d66a17d0SJustin Bogner const char *CurPtr = BufferStart; 48d66a17d0SJustin Bogner uint64_t MaxCount = 0; 49d66a17d0SJustin Bogner while (CurPtr < BufferEnd) { 50d66a17d0SJustin Bogner // Read the function name. 51d66a17d0SJustin Bogner const char *FuncStart = CurPtr; 52d66a17d0SJustin Bogner // For Objective-C methods, the name may include whitespace, so search 53d66a17d0SJustin Bogner // backward from the end of the line to find the space that separates the 54d66a17d0SJustin Bogner // name from the number of counters. (This is a temporary hack since we are 55d66a17d0SJustin Bogner // going to completely replace this file format in the near future.) 56d66a17d0SJustin Bogner CurPtr = strchr(CurPtr, '\n'); 57d66a17d0SJustin Bogner if (!CurPtr) { 58d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo data file has malformed function entry"); 59d66a17d0SJustin Bogner return; 60d66a17d0SJustin Bogner } 61d66a17d0SJustin Bogner StringRef FuncName(FuncStart, CurPtr - FuncStart); 62d66a17d0SJustin Bogner 63b4416f58SJustin Bogner // Skip over the function hash. 64b4416f58SJustin Bogner CurPtr = strchr(++CurPtr, '\n'); 65b4416f58SJustin Bogner if (!CurPtr) { 66b4416f58SJustin Bogner ReportBadPGOData(CGM, "pgo data file is missing the function hash"); 67b4416f58SJustin Bogner return; 68b4416f58SJustin Bogner } 69b4416f58SJustin Bogner 70d66a17d0SJustin Bogner // Read the number of counters. 71d66a17d0SJustin Bogner char *EndPtr; 72d66a17d0SJustin Bogner unsigned NumCounters = strtol(++CurPtr, &EndPtr, 10); 73d66a17d0SJustin Bogner if (EndPtr == CurPtr || *EndPtr != '\n' || NumCounters <= 0) { 74d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo data file has unexpected number of counters"); 75d66a17d0SJustin Bogner return; 76d66a17d0SJustin Bogner } 77d66a17d0SJustin Bogner CurPtr = EndPtr; 78d66a17d0SJustin Bogner 79d66a17d0SJustin Bogner // Read function count. 80d66a17d0SJustin Bogner uint64_t Count = strtoll(CurPtr, &EndPtr, 10); 81d66a17d0SJustin Bogner if (EndPtr == CurPtr || *EndPtr != '\n') { 82d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo-data file has bad count value"); 83d66a17d0SJustin Bogner return; 84d66a17d0SJustin Bogner } 85d66a17d0SJustin Bogner CurPtr = EndPtr; // Point to '\n'. 86d66a17d0SJustin Bogner FunctionCounts[FuncName] = Count; 87d66a17d0SJustin Bogner MaxCount = Count > MaxCount ? Count : MaxCount; 88d66a17d0SJustin Bogner 89d66a17d0SJustin Bogner // There is one line for each counter; skip over those lines. 90d66a17d0SJustin Bogner // Since function count is already read, we start the loop from 1. 91d66a17d0SJustin Bogner for (unsigned N = 1; N < NumCounters; ++N) { 92d66a17d0SJustin Bogner CurPtr = strchr(++CurPtr, '\n'); 93d66a17d0SJustin Bogner if (!CurPtr) { 94d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo data file is missing some counter info"); 95d66a17d0SJustin Bogner return; 96d66a17d0SJustin Bogner } 97d66a17d0SJustin Bogner } 98d66a17d0SJustin Bogner 99d66a17d0SJustin Bogner // Skip over the blank line separating functions. 100d66a17d0SJustin Bogner CurPtr += 2; 101d66a17d0SJustin Bogner 102d66a17d0SJustin Bogner DataOffsets[FuncName] = FuncStart - BufferStart; 103d66a17d0SJustin Bogner } 104d66a17d0SJustin Bogner MaxFunctionCount = MaxCount; 105d66a17d0SJustin Bogner } 106d66a17d0SJustin Bogner 107b4416f58SJustin Bogner bool PGOProfileData::getFunctionCounts(StringRef FuncName, uint64_t &FuncHash, 108d66a17d0SJustin Bogner std::vector<uint64_t> &Counts) { 109d66a17d0SJustin Bogner // Find the relevant section of the pgo-data file. 110d66a17d0SJustin Bogner llvm::StringMap<unsigned>::const_iterator OffsetIter = 111d66a17d0SJustin Bogner DataOffsets.find(FuncName); 112d66a17d0SJustin Bogner if (OffsetIter == DataOffsets.end()) 113d66a17d0SJustin Bogner return true; 114d66a17d0SJustin Bogner const char *CurPtr = DataBuffer->getBufferStart() + OffsetIter->getValue(); 115d66a17d0SJustin Bogner 116d66a17d0SJustin Bogner // Skip over the function name. 117d66a17d0SJustin Bogner CurPtr = strchr(CurPtr, '\n'); 118d66a17d0SJustin Bogner assert(CurPtr && "pgo-data has corrupted function entry"); 119b4416f58SJustin Bogner 120b4416f58SJustin Bogner char *EndPtr; 121b4416f58SJustin Bogner // Read the function hash. 122b4416f58SJustin Bogner FuncHash = strtoll(++CurPtr, &EndPtr, 10); 123b4416f58SJustin Bogner assert(EndPtr != CurPtr && *EndPtr == '\n' && 124b4416f58SJustin Bogner "pgo-data file has corrupted function hash"); 125b4416f58SJustin Bogner CurPtr = EndPtr; 126d66a17d0SJustin Bogner 127d66a17d0SJustin Bogner // Read the number of counters. 128d66a17d0SJustin Bogner unsigned NumCounters = strtol(++CurPtr, &EndPtr, 10); 129d66a17d0SJustin Bogner assert(EndPtr != CurPtr && *EndPtr == '\n' && NumCounters > 0 && 130d66a17d0SJustin Bogner "pgo-data file has corrupted number of counters"); 131d66a17d0SJustin Bogner CurPtr = EndPtr; 132d66a17d0SJustin Bogner 133d66a17d0SJustin Bogner Counts.reserve(NumCounters); 134d66a17d0SJustin Bogner 135d66a17d0SJustin Bogner for (unsigned N = 0; N < NumCounters; ++N) { 136d66a17d0SJustin Bogner // Read the count value. 137d66a17d0SJustin Bogner uint64_t Count = strtoll(CurPtr, &EndPtr, 10); 138d66a17d0SJustin Bogner if (EndPtr == CurPtr || *EndPtr != '\n') { 139d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo-data file has bad count value"); 140d66a17d0SJustin Bogner return true; 141d66a17d0SJustin Bogner } 142d66a17d0SJustin Bogner Counts.push_back(Count); 143d66a17d0SJustin Bogner CurPtr = EndPtr + 1; 144d66a17d0SJustin Bogner } 145d66a17d0SJustin Bogner 146d66a17d0SJustin Bogner // Make sure the number of counters matches up. 147d66a17d0SJustin Bogner if (Counts.size() != NumCounters) { 148d66a17d0SJustin Bogner ReportBadPGOData(CGM, "pgo-data file has inconsistent counters"); 149d66a17d0SJustin Bogner return true; 150d66a17d0SJustin Bogner } 151d66a17d0SJustin Bogner 152d66a17d0SJustin Bogner return false; 153d66a17d0SJustin Bogner } 154d66a17d0SJustin Bogner 155da1ebedeSBob Wilson void CodeGenPGO::setFuncName(llvm::Function *Fn) { 1562fe531cbSDuncan P. N. Exon Smith RawFuncName = Fn->getName(); 157da1ebedeSBob Wilson 158da1ebedeSBob Wilson // Function names may be prefixed with a binary '1' to indicate 159da1ebedeSBob Wilson // that the backend should not modify the symbols due to any platform 160da1ebedeSBob Wilson // naming convention. Do not include that '1' in the PGO profile name. 1612fe531cbSDuncan P. N. Exon Smith if (RawFuncName[0] == '\1') 1622fe531cbSDuncan P. N. Exon Smith RawFuncName = RawFuncName.substr(1); 163da1ebedeSBob Wilson 164da1ebedeSBob Wilson if (!Fn->hasLocalLinkage()) { 1651b67cfd4SDuncan P. N. Exon Smith PrefixedFuncName.reset(new std::string(RawFuncName)); 166da1ebedeSBob Wilson return; 167da1ebedeSBob Wilson } 168da1ebedeSBob Wilson 169da1ebedeSBob Wilson // For local symbols, prepend the main file name to distinguish them. 170da1ebedeSBob Wilson // Do not include the full path in the file name since there's no guarantee 171da1ebedeSBob Wilson // that it will stay the same, e.g., if the files are checked out from 172da1ebedeSBob Wilson // version control in different locations. 1731b67cfd4SDuncan P. N. Exon Smith PrefixedFuncName.reset(new std::string(CGM.getCodeGenOpts().MainFileName)); 1742fe531cbSDuncan P. N. Exon Smith if (PrefixedFuncName->empty()) 1752fe531cbSDuncan P. N. Exon Smith PrefixedFuncName->assign("<unknown>"); 1762fe531cbSDuncan P. N. Exon Smith PrefixedFuncName->append(":"); 1772fe531cbSDuncan P. N. Exon Smith PrefixedFuncName->append(RawFuncName); 178da1ebedeSBob Wilson } 179da1ebedeSBob Wilson 1802fe531cbSDuncan P. N. Exon Smith static llvm::Function *getRegisterFunc(CodeGenModule &CGM) { 181a7807637SDuncan P. N. Exon Smith return CGM.getModule().getFunction("__llvm_profile_register_functions"); 1822fe531cbSDuncan P. N. Exon Smith } 1832fe531cbSDuncan P. N. Exon Smith 1842fe531cbSDuncan P. N. Exon Smith static llvm::BasicBlock *getOrInsertRegisterBB(CodeGenModule &CGM) { 185780443e8SDuncan P. N. Exon Smith // Don't do this for Darwin. compiler-rt uses linker magic. 186780443e8SDuncan P. N. Exon Smith if (CGM.getTarget().getTriple().isOSDarwin()) 187780443e8SDuncan P. N. Exon Smith return nullptr; 188780443e8SDuncan P. N. Exon Smith 1892fe531cbSDuncan P. N. Exon Smith // Only need to insert this once per module. 1902fe531cbSDuncan P. N. Exon Smith if (llvm::Function *RegisterF = getRegisterFunc(CGM)) 1912fe531cbSDuncan P. N. Exon Smith return &RegisterF->getEntryBlock(); 1922fe531cbSDuncan P. N. Exon Smith 1932fe531cbSDuncan P. N. Exon Smith // Construct the function. 1942fe531cbSDuncan P. N. Exon Smith auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext()); 1952fe531cbSDuncan P. N. Exon Smith auto *RegisterFTy = llvm::FunctionType::get(VoidTy, false); 1962fe531cbSDuncan P. N. Exon Smith auto *RegisterF = llvm::Function::Create(RegisterFTy, 1972fe531cbSDuncan P. N. Exon Smith llvm::GlobalValue::InternalLinkage, 198a7807637SDuncan P. N. Exon Smith "__llvm_profile_register_functions", 1992fe531cbSDuncan P. N. Exon Smith &CGM.getModule()); 2002fe531cbSDuncan P. N. Exon Smith RegisterF->setUnnamedAddr(true); 2012fe531cbSDuncan P. N. Exon Smith if (CGM.getCodeGenOpts().DisableRedZone) 2022fe531cbSDuncan P. N. Exon Smith RegisterF->addFnAttr(llvm::Attribute::NoRedZone); 2032fe531cbSDuncan P. N. Exon Smith 2042fe531cbSDuncan P. N. Exon Smith // Construct and return the entry block. 2052fe531cbSDuncan P. N. Exon Smith auto *BB = llvm::BasicBlock::Create(CGM.getLLVMContext(), "", RegisterF); 2062fe531cbSDuncan P. N. Exon Smith CGBuilderTy Builder(BB); 2072fe531cbSDuncan P. N. Exon Smith Builder.CreateRetVoid(); 2082fe531cbSDuncan P. N. Exon Smith return BB; 2092fe531cbSDuncan P. N. Exon Smith } 2102fe531cbSDuncan P. N. Exon Smith 2112fe531cbSDuncan P. N. Exon Smith static llvm::Constant *getOrInsertRuntimeRegister(CodeGenModule &CGM) { 2122fe531cbSDuncan P. N. Exon Smith auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext()); 2132fe531cbSDuncan P. N. Exon Smith auto *VoidPtrTy = llvm::Type::getInt8PtrTy(CGM.getLLVMContext()); 2142fe531cbSDuncan P. N. Exon Smith auto *RuntimeRegisterTy = llvm::FunctionType::get(VoidTy, VoidPtrTy, false); 215a7807637SDuncan P. N. Exon Smith return CGM.getModule().getOrInsertFunction("__llvm_profile_register_function", 2162fe531cbSDuncan P. N. Exon Smith RuntimeRegisterTy); 2172fe531cbSDuncan P. N. Exon Smith } 2182fe531cbSDuncan P. N. Exon Smith 2197134d47dSDuncan P. N. Exon Smith static bool isMachO(const CodeGenModule &CGM) { 2207134d47dSDuncan P. N. Exon Smith return CGM.getTarget().getTriple().isOSBinFormatMachO(); 2217134d47dSDuncan P. N. Exon Smith } 2227134d47dSDuncan P. N. Exon Smith 2232fe531cbSDuncan P. N. Exon Smith static StringRef getCountersSection(const CodeGenModule &CGM) { 224a7807637SDuncan P. N. Exon Smith return isMachO(CGM) ? "__DATA,__llvm_prf_cnts" : "__llvm_prf_cnts"; 2252fe531cbSDuncan P. N. Exon Smith } 2262fe531cbSDuncan P. N. Exon Smith 2272fe531cbSDuncan P. N. Exon Smith static StringRef getNameSection(const CodeGenModule &CGM) { 228a7807637SDuncan P. N. Exon Smith return isMachO(CGM) ? "__DATA,__llvm_prf_names" : "__llvm_prf_names"; 2292fe531cbSDuncan P. N. Exon Smith } 2302fe531cbSDuncan P. N. Exon Smith 2312fe531cbSDuncan P. N. Exon Smith static StringRef getDataSection(const CodeGenModule &CGM) { 232a7807637SDuncan P. N. Exon Smith return isMachO(CGM) ? "__DATA,__llvm_prf_data" : "__llvm_prf_data"; 2332fe531cbSDuncan P. N. Exon Smith } 2342fe531cbSDuncan P. N. Exon Smith 2352fe531cbSDuncan P. N. Exon Smith llvm::GlobalVariable *CodeGenPGO::buildDataVar() { 2362fe531cbSDuncan P. N. Exon Smith // Create name variable. 2372fe531cbSDuncan P. N. Exon Smith llvm::LLVMContext &Ctx = CGM.getLLVMContext(); 2382fe531cbSDuncan P. N. Exon Smith auto *VarName = llvm::ConstantDataArray::getString(Ctx, getFuncName(), 2392fe531cbSDuncan P. N. Exon Smith false); 2402fe531cbSDuncan P. N. Exon Smith auto *Name = new llvm::GlobalVariable(CGM.getModule(), VarName->getType(), 24173f78627SDuncan P. N. Exon Smith true, VarLinkage, VarName, 2422fe531cbSDuncan P. N. Exon Smith getFuncVarName("name")); 2432fe531cbSDuncan P. N. Exon Smith Name->setSection(getNameSection(CGM)); 2442fe531cbSDuncan P. N. Exon Smith Name->setAlignment(1); 2452fe531cbSDuncan P. N. Exon Smith 2462fe531cbSDuncan P. N. Exon Smith // Create data variable. 2472fe531cbSDuncan P. N. Exon Smith auto *Int32Ty = llvm::Type::getInt32Ty(Ctx); 248b4416f58SJustin Bogner auto *Int64Ty = llvm::Type::getInt64Ty(Ctx); 2492fe531cbSDuncan P. N. Exon Smith auto *Int8PtrTy = llvm::Type::getInt8PtrTy(Ctx); 2502fe531cbSDuncan P. N. Exon Smith auto *Int64PtrTy = llvm::Type::getInt64PtrTy(Ctx); 2512fe531cbSDuncan P. N. Exon Smith llvm::Type *DataTypes[] = { 252b4416f58SJustin Bogner Int32Ty, Int32Ty, Int64Ty, Int8PtrTy, Int64PtrTy 2532fe531cbSDuncan P. N. Exon Smith }; 2542fe531cbSDuncan P. N. Exon Smith auto *DataTy = llvm::StructType::get(Ctx, makeArrayRef(DataTypes)); 2552fe531cbSDuncan P. N. Exon Smith llvm::Constant *DataVals[] = { 2562fe531cbSDuncan P. N. Exon Smith llvm::ConstantInt::get(Int32Ty, getFuncName().size()), 2572fe531cbSDuncan P. N. Exon Smith llvm::ConstantInt::get(Int32Ty, NumRegionCounters), 258b4416f58SJustin Bogner llvm::ConstantInt::get(Int64Ty, FunctionHash), 2592fe531cbSDuncan P. N. Exon Smith llvm::ConstantExpr::getBitCast(Name, Int8PtrTy), 2602fe531cbSDuncan P. N. Exon Smith llvm::ConstantExpr::getBitCast(RegionCounters, Int64PtrTy) 2612fe531cbSDuncan P. N. Exon Smith }; 2622fe531cbSDuncan P. N. Exon Smith auto *Data = 26373f78627SDuncan P. N. Exon Smith new llvm::GlobalVariable(CGM.getModule(), DataTy, true, VarLinkage, 2642fe531cbSDuncan P. N. Exon Smith llvm::ConstantStruct::get(DataTy, DataVals), 2652fe531cbSDuncan P. N. Exon Smith getFuncVarName("data")); 2662fe531cbSDuncan P. N. Exon Smith 2672fe531cbSDuncan P. N. Exon Smith // All the data should be packed into an array in its own section. 2682fe531cbSDuncan P. N. Exon Smith Data->setSection(getDataSection(CGM)); 2692fe531cbSDuncan P. N. Exon Smith Data->setAlignment(8); 2702fe531cbSDuncan P. N. Exon Smith 2712fe531cbSDuncan P. N. Exon Smith // Make sure the data doesn't get deleted. 2722fe531cbSDuncan P. N. Exon Smith CGM.addUsedGlobal(Data); 2732fe531cbSDuncan P. N. Exon Smith return Data; 2742fe531cbSDuncan P. N. Exon Smith } 2752fe531cbSDuncan P. N. Exon Smith 2762fe531cbSDuncan P. N. Exon Smith void CodeGenPGO::emitInstrumentationData() { 277ef512b99SJustin Bogner if (!CGM.getCodeGenOpts().ProfileInstrGenerate) 278ef512b99SJustin Bogner return; 279ef512b99SJustin Bogner 2802fe531cbSDuncan P. N. Exon Smith // Build the data. 2812fe531cbSDuncan P. N. Exon Smith auto *Data = buildDataVar(); 282ef512b99SJustin Bogner 2832fe531cbSDuncan P. N. Exon Smith // Register the data. 284780443e8SDuncan P. N. Exon Smith auto *RegisterBB = getOrInsertRegisterBB(CGM); 285780443e8SDuncan P. N. Exon Smith if (!RegisterBB) 286780443e8SDuncan P. N. Exon Smith return; 287780443e8SDuncan P. N. Exon Smith CGBuilderTy Builder(RegisterBB->getTerminator()); 2882fe531cbSDuncan P. N. Exon Smith auto *VoidPtrTy = llvm::Type::getInt8PtrTy(CGM.getLLVMContext()); 2892fe531cbSDuncan P. N. Exon Smith Builder.CreateCall(getOrInsertRuntimeRegister(CGM), 2902fe531cbSDuncan P. N. Exon Smith Builder.CreateBitCast(Data, VoidPtrTy)); 291ef512b99SJustin Bogner } 292ef512b99SJustin Bogner 293ef512b99SJustin Bogner llvm::Function *CodeGenPGO::emitInitialization(CodeGenModule &CGM) { 2942fe531cbSDuncan P. N. Exon Smith if (!CGM.getCodeGenOpts().ProfileInstrGenerate) 295a5f804a7SDuncan P. N. Exon Smith return nullptr; 296ef512b99SJustin Bogner 2972fe531cbSDuncan P. N. Exon Smith // Only need to create this once per module. 298a7807637SDuncan P. N. Exon Smith if (CGM.getModule().getFunction("__llvm_profile_init")) 299a5f804a7SDuncan P. N. Exon Smith return nullptr; 300ef512b99SJustin Bogner 3015188e91cSDuncan P. N. Exon Smith // Get the function to call at initialization. 3022fe531cbSDuncan P. N. Exon Smith llvm::Constant *RegisterF = getRegisterFunc(CGM); 3035188e91cSDuncan P. N. Exon Smith if (!RegisterF) 304a5f804a7SDuncan P. N. Exon Smith return nullptr; 3052fe531cbSDuncan P. N. Exon Smith 3062fe531cbSDuncan P. N. Exon Smith // Create the initialization function. 3072fe531cbSDuncan P. N. Exon Smith auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext()); 3082fe531cbSDuncan P. N. Exon Smith auto *F = llvm::Function::Create(llvm::FunctionType::get(VoidTy, false), 3092fe531cbSDuncan P. N. Exon Smith llvm::GlobalValue::InternalLinkage, 310a7807637SDuncan P. N. Exon Smith "__llvm_profile_init", &CGM.getModule()); 311ef512b99SJustin Bogner F->setUnnamedAddr(true); 312ef512b99SJustin Bogner F->addFnAttr(llvm::Attribute::NoInline); 313ef512b99SJustin Bogner if (CGM.getCodeGenOpts().DisableRedZone) 314ef512b99SJustin Bogner F->addFnAttr(llvm::Attribute::NoRedZone); 315ef512b99SJustin Bogner 3162fe531cbSDuncan P. N. Exon Smith // Add the basic block and the necessary calls. 3172fe531cbSDuncan P. N. Exon Smith CGBuilderTy Builder(llvm::BasicBlock::Create(CGM.getLLVMContext(), "", F)); 3182fe531cbSDuncan P. N. Exon Smith Builder.CreateCall(RegisterF); 3192fe531cbSDuncan P. N. Exon Smith Builder.CreateRetVoid(); 320ef512b99SJustin Bogner 321ef512b99SJustin Bogner return F; 322ef512b99SJustin Bogner } 323ef512b99SJustin Bogner 324ef512b99SJustin Bogner namespace { 325ef512b99SJustin Bogner /// A StmtVisitor that fills a map of statements to PGO counters. 326ef512b99SJustin Bogner struct MapRegionCounters : public ConstStmtVisitor<MapRegionCounters> { 327ef512b99SJustin Bogner /// The next counter value to assign. 328ef512b99SJustin Bogner unsigned NextCounter; 329ef512b99SJustin Bogner /// The map of statements to counters. 3303586be72SDuncan P. N. Exon Smith llvm::DenseMap<const Stmt *, unsigned> &CounterMap; 331ef512b99SJustin Bogner 3323586be72SDuncan P. N. Exon Smith MapRegionCounters(llvm::DenseMap<const Stmt *, unsigned> &CounterMap) 3333586be72SDuncan P. N. Exon Smith : NextCounter(0), CounterMap(CounterMap) {} 334ef512b99SJustin Bogner 335ef512b99SJustin Bogner void VisitChildren(const Stmt *S) { 336ef512b99SJustin Bogner for (Stmt::const_child_range I = S->children(); I; ++I) 337ef512b99SJustin Bogner if (*I) 338ef512b99SJustin Bogner this->Visit(*I); 339ef512b99SJustin Bogner } 340ef512b99SJustin Bogner void VisitStmt(const Stmt *S) { VisitChildren(S); } 341ef512b99SJustin Bogner 342ea278c32SJustin Bogner /// Assign a counter to track entry to the function body. 343ef512b99SJustin Bogner void VisitFunctionDecl(const FunctionDecl *S) { 3443586be72SDuncan P. N. Exon Smith CounterMap[S->getBody()] = NextCounter++; 345ef512b99SJustin Bogner Visit(S->getBody()); 346ef512b99SJustin Bogner } 3475ec8fe19SBob Wilson void VisitObjCMethodDecl(const ObjCMethodDecl *S) { 3483586be72SDuncan P. N. Exon Smith CounterMap[S->getBody()] = NextCounter++; 3495ec8fe19SBob Wilson Visit(S->getBody()); 3505ec8fe19SBob Wilson } 351c845c00aSBob Wilson void VisitBlockDecl(const BlockDecl *S) { 3523586be72SDuncan P. N. Exon Smith CounterMap[S->getBody()] = NextCounter++; 353c845c00aSBob Wilson Visit(S->getBody()); 354c845c00aSBob Wilson } 355ea278c32SJustin Bogner /// Assign a counter to track the block following a label. 356ef512b99SJustin Bogner void VisitLabelStmt(const LabelStmt *S) { 3573586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 358ef512b99SJustin Bogner Visit(S->getSubStmt()); 359ef512b99SJustin Bogner } 360bf854f0fSBob Wilson /// Assign a counter for the body of a while loop. 361ef512b99SJustin Bogner void VisitWhileStmt(const WhileStmt *S) { 3623586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 363ef512b99SJustin Bogner Visit(S->getCond()); 364ef512b99SJustin Bogner Visit(S->getBody()); 365ef512b99SJustin Bogner } 366bf854f0fSBob Wilson /// Assign a counter for the body of a do-while loop. 367ef512b99SJustin Bogner void VisitDoStmt(const DoStmt *S) { 3683586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 369ef512b99SJustin Bogner Visit(S->getBody()); 370ef512b99SJustin Bogner Visit(S->getCond()); 371ef512b99SJustin Bogner } 372bf854f0fSBob Wilson /// Assign a counter for the body of a for loop. 373ef512b99SJustin Bogner void VisitForStmt(const ForStmt *S) { 3743586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 375bf854f0fSBob Wilson if (S->getInit()) 376bf854f0fSBob Wilson Visit(S->getInit()); 377ef512b99SJustin Bogner const Expr *E; 378ef512b99SJustin Bogner if ((E = S->getCond())) 379ef512b99SJustin Bogner Visit(E); 380ef512b99SJustin Bogner if ((E = S->getInc())) 381ef512b99SJustin Bogner Visit(E); 382bf854f0fSBob Wilson Visit(S->getBody()); 383ef512b99SJustin Bogner } 384bf854f0fSBob Wilson /// Assign a counter for the body of a for-range loop. 385ef512b99SJustin Bogner void VisitCXXForRangeStmt(const CXXForRangeStmt *S) { 3863586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 387bf854f0fSBob Wilson Visit(S->getRangeStmt()); 388bf854f0fSBob Wilson Visit(S->getBeginEndStmt()); 389bf854f0fSBob Wilson Visit(S->getCond()); 390bf854f0fSBob Wilson Visit(S->getLoopVarStmt()); 391ef512b99SJustin Bogner Visit(S->getBody()); 392bf854f0fSBob Wilson Visit(S->getInc()); 393ef512b99SJustin Bogner } 394bf854f0fSBob Wilson /// Assign a counter for the body of a for-collection loop. 395ef512b99SJustin Bogner void VisitObjCForCollectionStmt(const ObjCForCollectionStmt *S) { 3963586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 397ef512b99SJustin Bogner Visit(S->getElement()); 398ef512b99SJustin Bogner Visit(S->getBody()); 399ef512b99SJustin Bogner } 400ef512b99SJustin Bogner /// Assign a counter for the exit block of the switch statement. 401ef512b99SJustin Bogner void VisitSwitchStmt(const SwitchStmt *S) { 4023586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 403ef512b99SJustin Bogner Visit(S->getCond()); 404ef512b99SJustin Bogner Visit(S->getBody()); 405ef512b99SJustin Bogner } 406ef512b99SJustin Bogner /// Assign a counter for a particular case in a switch. This counts jumps 407ef512b99SJustin Bogner /// from the switch header as well as fallthrough from the case before this 408ef512b99SJustin Bogner /// one. 409ef512b99SJustin Bogner void VisitCaseStmt(const CaseStmt *S) { 4103586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 411ef512b99SJustin Bogner Visit(S->getSubStmt()); 412ef512b99SJustin Bogner } 413ef512b99SJustin Bogner /// Assign a counter for the default case of a switch statement. The count 414ef512b99SJustin Bogner /// is the number of branches from the loop header to the default, and does 415ef512b99SJustin Bogner /// not include fallthrough from previous cases. If we have multiple 416ef512b99SJustin Bogner /// conditional branch blocks from the switch instruction to the default 417ef512b99SJustin Bogner /// block, as with large GNU case ranges, this is the counter for the last 418ef512b99SJustin Bogner /// edge in that series, rather than the first. 419ef512b99SJustin Bogner void VisitDefaultStmt(const DefaultStmt *S) { 4203586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 421ef512b99SJustin Bogner Visit(S->getSubStmt()); 422ef512b99SJustin Bogner } 423ef512b99SJustin Bogner /// Assign a counter for the "then" part of an if statement. The count for 424ef512b99SJustin Bogner /// the "else" part, if it exists, will be calculated from this counter. 425ef512b99SJustin Bogner void VisitIfStmt(const IfStmt *S) { 4263586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 427ef512b99SJustin Bogner Visit(S->getCond()); 428ef512b99SJustin Bogner Visit(S->getThen()); 429ef512b99SJustin Bogner if (S->getElse()) 430ef512b99SJustin Bogner Visit(S->getElse()); 431ef512b99SJustin Bogner } 432ef512b99SJustin Bogner /// Assign a counter for the continuation block of a C++ try statement. 433ef512b99SJustin Bogner void VisitCXXTryStmt(const CXXTryStmt *S) { 4343586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 435ef512b99SJustin Bogner Visit(S->getTryBlock()); 436ef512b99SJustin Bogner for (unsigned I = 0, E = S->getNumHandlers(); I < E; ++I) 437ef512b99SJustin Bogner Visit(S->getHandler(I)); 438ef512b99SJustin Bogner } 439ef512b99SJustin Bogner /// Assign a counter for a catch statement's handler block. 440ef512b99SJustin Bogner void VisitCXXCatchStmt(const CXXCatchStmt *S) { 4413586be72SDuncan P. N. Exon Smith CounterMap[S] = NextCounter++; 442ef512b99SJustin Bogner Visit(S->getHandlerBlock()); 443ef512b99SJustin Bogner } 444ef512b99SJustin Bogner /// Assign a counter for the "true" part of a conditional operator. The 445ef512b99SJustin Bogner /// count in the "false" part will be calculated from this counter. 446ef512b99SJustin Bogner void VisitConditionalOperator(const ConditionalOperator *E) { 4473586be72SDuncan P. N. Exon Smith CounterMap[E] = NextCounter++; 448ef512b99SJustin Bogner Visit(E->getCond()); 449ef512b99SJustin Bogner Visit(E->getTrueExpr()); 450ef512b99SJustin Bogner Visit(E->getFalseExpr()); 451ef512b99SJustin Bogner } 452ef512b99SJustin Bogner /// Assign a counter for the right hand side of a logical and operator. 453ef512b99SJustin Bogner void VisitBinLAnd(const BinaryOperator *E) { 4543586be72SDuncan P. N. Exon Smith CounterMap[E] = NextCounter++; 455ef512b99SJustin Bogner Visit(E->getLHS()); 456ef512b99SJustin Bogner Visit(E->getRHS()); 457ef512b99SJustin Bogner } 458ef512b99SJustin Bogner /// Assign a counter for the right hand side of a logical or operator. 459ef512b99SJustin Bogner void VisitBinLOr(const BinaryOperator *E) { 4603586be72SDuncan P. N. Exon Smith CounterMap[E] = NextCounter++; 461ef512b99SJustin Bogner Visit(E->getLHS()); 462ef512b99SJustin Bogner Visit(E->getRHS()); 463ef512b99SJustin Bogner } 464ef512b99SJustin Bogner }; 465bf854f0fSBob Wilson 466bf854f0fSBob Wilson /// A StmtVisitor that propagates the raw counts through the AST and 467bf854f0fSBob Wilson /// records the count at statements where the value may change. 468bf854f0fSBob Wilson struct ComputeRegionCounts : public ConstStmtVisitor<ComputeRegionCounts> { 469bf854f0fSBob Wilson /// PGO state. 470bf854f0fSBob Wilson CodeGenPGO &PGO; 471bf854f0fSBob Wilson 472bf854f0fSBob Wilson /// A flag that is set when the current count should be recorded on the 473bf854f0fSBob Wilson /// next statement, such as at the exit of a loop. 474bf854f0fSBob Wilson bool RecordNextStmtCount; 475bf854f0fSBob Wilson 476bf854f0fSBob Wilson /// The map of statements to count values. 4773586be72SDuncan P. N. Exon Smith llvm::DenseMap<const Stmt *, uint64_t> &CountMap; 478bf854f0fSBob Wilson 479bf854f0fSBob Wilson /// BreakContinueStack - Keep counts of breaks and continues inside loops. 480bf854f0fSBob Wilson struct BreakContinue { 481bf854f0fSBob Wilson uint64_t BreakCount; 482bf854f0fSBob Wilson uint64_t ContinueCount; 483bf854f0fSBob Wilson BreakContinue() : BreakCount(0), ContinueCount(0) {} 484bf854f0fSBob Wilson }; 485bf854f0fSBob Wilson SmallVector<BreakContinue, 8> BreakContinueStack; 486bf854f0fSBob Wilson 4873586be72SDuncan P. N. Exon Smith ComputeRegionCounts(llvm::DenseMap<const Stmt *, uint64_t> &CountMap, 4883586be72SDuncan P. N. Exon Smith CodeGenPGO &PGO) 4893586be72SDuncan P. N. Exon Smith : PGO(PGO), RecordNextStmtCount(false), CountMap(CountMap) {} 490bf854f0fSBob Wilson 491bf854f0fSBob Wilson void RecordStmtCount(const Stmt *S) { 492bf854f0fSBob Wilson if (RecordNextStmtCount) { 4933586be72SDuncan P. N. Exon Smith CountMap[S] = PGO.getCurrentRegionCount(); 494bf854f0fSBob Wilson RecordNextStmtCount = false; 495bf854f0fSBob Wilson } 496bf854f0fSBob Wilson } 497bf854f0fSBob Wilson 498bf854f0fSBob Wilson void VisitStmt(const Stmt *S) { 499bf854f0fSBob Wilson RecordStmtCount(S); 500bf854f0fSBob Wilson for (Stmt::const_child_range I = S->children(); I; ++I) { 501bf854f0fSBob Wilson if (*I) 502bf854f0fSBob Wilson this->Visit(*I); 503bf854f0fSBob Wilson } 504bf854f0fSBob Wilson } 505bf854f0fSBob Wilson 506bf854f0fSBob Wilson void VisitFunctionDecl(const FunctionDecl *S) { 507bf854f0fSBob Wilson RegionCounter Cnt(PGO, S->getBody()); 508bf854f0fSBob Wilson Cnt.beginRegion(); 5093586be72SDuncan P. N. Exon Smith CountMap[S->getBody()] = PGO.getCurrentRegionCount(); 510bf854f0fSBob Wilson Visit(S->getBody()); 511bf854f0fSBob Wilson } 512bf854f0fSBob Wilson 5135ec8fe19SBob Wilson void VisitObjCMethodDecl(const ObjCMethodDecl *S) { 5145ec8fe19SBob Wilson RegionCounter Cnt(PGO, S->getBody()); 5155ec8fe19SBob Wilson Cnt.beginRegion(); 5163586be72SDuncan P. N. Exon Smith CountMap[S->getBody()] = PGO.getCurrentRegionCount(); 5175ec8fe19SBob Wilson Visit(S->getBody()); 5185ec8fe19SBob Wilson } 5195ec8fe19SBob Wilson 520c845c00aSBob Wilson void VisitBlockDecl(const BlockDecl *S) { 521c845c00aSBob Wilson RegionCounter Cnt(PGO, S->getBody()); 522c845c00aSBob Wilson Cnt.beginRegion(); 5233586be72SDuncan P. N. Exon Smith CountMap[S->getBody()] = PGO.getCurrentRegionCount(); 524c845c00aSBob Wilson Visit(S->getBody()); 525c845c00aSBob Wilson } 526c845c00aSBob Wilson 527bf854f0fSBob Wilson void VisitReturnStmt(const ReturnStmt *S) { 528bf854f0fSBob Wilson RecordStmtCount(S); 529bf854f0fSBob Wilson if (S->getRetValue()) 530bf854f0fSBob Wilson Visit(S->getRetValue()); 531bf854f0fSBob Wilson PGO.setCurrentRegionUnreachable(); 532bf854f0fSBob Wilson RecordNextStmtCount = true; 533bf854f0fSBob Wilson } 534bf854f0fSBob Wilson 535bf854f0fSBob Wilson void VisitGotoStmt(const GotoStmt *S) { 536bf854f0fSBob Wilson RecordStmtCount(S); 537bf854f0fSBob Wilson PGO.setCurrentRegionUnreachable(); 538bf854f0fSBob Wilson RecordNextStmtCount = true; 539bf854f0fSBob Wilson } 540bf854f0fSBob Wilson 541bf854f0fSBob Wilson void VisitLabelStmt(const LabelStmt *S) { 542bf854f0fSBob Wilson RecordNextStmtCount = false; 543bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 544bf854f0fSBob Wilson Cnt.beginRegion(); 5453586be72SDuncan P. N. Exon Smith CountMap[S] = PGO.getCurrentRegionCount(); 546bf854f0fSBob Wilson Visit(S->getSubStmt()); 547bf854f0fSBob Wilson } 548bf854f0fSBob Wilson 549bf854f0fSBob Wilson void VisitBreakStmt(const BreakStmt *S) { 550bf854f0fSBob Wilson RecordStmtCount(S); 551bf854f0fSBob Wilson assert(!BreakContinueStack.empty() && "break not in a loop or switch!"); 552bf854f0fSBob Wilson BreakContinueStack.back().BreakCount += PGO.getCurrentRegionCount(); 553bf854f0fSBob Wilson PGO.setCurrentRegionUnreachable(); 554bf854f0fSBob Wilson RecordNextStmtCount = true; 555bf854f0fSBob Wilson } 556bf854f0fSBob Wilson 557bf854f0fSBob Wilson void VisitContinueStmt(const ContinueStmt *S) { 558bf854f0fSBob Wilson RecordStmtCount(S); 559bf854f0fSBob Wilson assert(!BreakContinueStack.empty() && "continue stmt not in a loop!"); 560bf854f0fSBob Wilson BreakContinueStack.back().ContinueCount += PGO.getCurrentRegionCount(); 561bf854f0fSBob Wilson PGO.setCurrentRegionUnreachable(); 562bf854f0fSBob Wilson RecordNextStmtCount = true; 563bf854f0fSBob Wilson } 564bf854f0fSBob Wilson 565bf854f0fSBob Wilson void VisitWhileStmt(const WhileStmt *S) { 566bf854f0fSBob Wilson RecordStmtCount(S); 567bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 568bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 569bf854f0fSBob Wilson // Visit the body region first so the break/continue adjustments can be 570bf854f0fSBob Wilson // included when visiting the condition. 571bf854f0fSBob Wilson Cnt.beginRegion(); 5723586be72SDuncan P. N. Exon Smith CountMap[S->getBody()] = PGO.getCurrentRegionCount(); 573bf854f0fSBob Wilson Visit(S->getBody()); 574bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 575bf854f0fSBob Wilson 576bf854f0fSBob Wilson // ...then go back and propagate counts through the condition. The count 577bf854f0fSBob Wilson // at the start of the condition is the sum of the incoming edges, 578bf854f0fSBob Wilson // the backedge from the end of the loop body, and the edges from 579bf854f0fSBob Wilson // continue statements. 580bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 581bf854f0fSBob Wilson Cnt.setCurrentRegionCount(Cnt.getParentCount() + 582bf854f0fSBob Wilson Cnt.getAdjustedCount() + BC.ContinueCount); 5833586be72SDuncan P. N. Exon Smith CountMap[S->getCond()] = PGO.getCurrentRegionCount(); 584bf854f0fSBob Wilson Visit(S->getCond()); 585bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 586bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount); 587bf854f0fSBob Wilson RecordNextStmtCount = true; 588bf854f0fSBob Wilson } 589bf854f0fSBob Wilson 590bf854f0fSBob Wilson void VisitDoStmt(const DoStmt *S) { 591bf854f0fSBob Wilson RecordStmtCount(S); 592bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 593bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 594bf854f0fSBob Wilson Cnt.beginRegion(/*AddIncomingFallThrough=*/true); 5953586be72SDuncan P. N. Exon Smith CountMap[S->getBody()] = PGO.getCurrentRegionCount(); 596bf854f0fSBob Wilson Visit(S->getBody()); 597bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 598bf854f0fSBob Wilson 599bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 600bf854f0fSBob Wilson // The count at the start of the condition is equal to the count at the 601bf854f0fSBob Wilson // end of the body. The adjusted count does not include either the 602bf854f0fSBob Wilson // fall-through count coming into the loop or the continue count, so add 603bf854f0fSBob Wilson // both of those separately. This is coincidentally the same equation as 604bf854f0fSBob Wilson // with while loops but for different reasons. 605bf854f0fSBob Wilson Cnt.setCurrentRegionCount(Cnt.getParentCount() + 606bf854f0fSBob Wilson Cnt.getAdjustedCount() + BC.ContinueCount); 6073586be72SDuncan P. N. Exon Smith CountMap[S->getCond()] = PGO.getCurrentRegionCount(); 608bf854f0fSBob Wilson Visit(S->getCond()); 609bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 610bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount); 611bf854f0fSBob Wilson RecordNextStmtCount = true; 612bf854f0fSBob Wilson } 613bf854f0fSBob Wilson 614bf854f0fSBob Wilson void VisitForStmt(const ForStmt *S) { 615bf854f0fSBob Wilson RecordStmtCount(S); 616bf854f0fSBob Wilson if (S->getInit()) 617bf854f0fSBob Wilson Visit(S->getInit()); 618bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 619bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 620bf854f0fSBob Wilson // Visit the body region first. (This is basically the same as a while 621bf854f0fSBob Wilson // loop; see further comments in VisitWhileStmt.) 622bf854f0fSBob Wilson Cnt.beginRegion(); 6233586be72SDuncan P. N. Exon Smith CountMap[S->getBody()] = PGO.getCurrentRegionCount(); 624bf854f0fSBob Wilson Visit(S->getBody()); 625bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 626bf854f0fSBob Wilson 627bf854f0fSBob Wilson // The increment is essentially part of the body but it needs to include 628bf854f0fSBob Wilson // the count for all the continue statements. 629bf854f0fSBob Wilson if (S->getInc()) { 630bf854f0fSBob Wilson Cnt.setCurrentRegionCount(PGO.getCurrentRegionCount() + 631bf854f0fSBob Wilson BreakContinueStack.back().ContinueCount); 6323586be72SDuncan P. N. Exon Smith CountMap[S->getInc()] = PGO.getCurrentRegionCount(); 633bf854f0fSBob Wilson Visit(S->getInc()); 634bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 635bf854f0fSBob Wilson } 636bf854f0fSBob Wilson 637bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 638bf854f0fSBob Wilson 639bf854f0fSBob Wilson // ...then go back and propagate counts through the condition. 640bf854f0fSBob Wilson if (S->getCond()) { 641bf854f0fSBob Wilson Cnt.setCurrentRegionCount(Cnt.getParentCount() + 642bf854f0fSBob Wilson Cnt.getAdjustedCount() + 643bf854f0fSBob Wilson BC.ContinueCount); 6443586be72SDuncan P. N. Exon Smith CountMap[S->getCond()] = PGO.getCurrentRegionCount(); 645bf854f0fSBob Wilson Visit(S->getCond()); 646bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 647bf854f0fSBob Wilson } 648bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount); 649bf854f0fSBob Wilson RecordNextStmtCount = true; 650bf854f0fSBob Wilson } 651bf854f0fSBob Wilson 652bf854f0fSBob Wilson void VisitCXXForRangeStmt(const CXXForRangeStmt *S) { 653bf854f0fSBob Wilson RecordStmtCount(S); 654bf854f0fSBob Wilson Visit(S->getRangeStmt()); 655bf854f0fSBob Wilson Visit(S->getBeginEndStmt()); 656bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 657bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 658bf854f0fSBob Wilson // Visit the body region first. (This is basically the same as a while 659bf854f0fSBob Wilson // loop; see further comments in VisitWhileStmt.) 660bf854f0fSBob Wilson Cnt.beginRegion(); 6613586be72SDuncan P. N. Exon Smith CountMap[S->getLoopVarStmt()] = PGO.getCurrentRegionCount(); 662bf854f0fSBob Wilson Visit(S->getLoopVarStmt()); 663bf854f0fSBob Wilson Visit(S->getBody()); 664bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 665bf854f0fSBob Wilson 666bf854f0fSBob Wilson // The increment is essentially part of the body but it needs to include 667bf854f0fSBob Wilson // the count for all the continue statements. 668bf854f0fSBob Wilson Cnt.setCurrentRegionCount(PGO.getCurrentRegionCount() + 669bf854f0fSBob Wilson BreakContinueStack.back().ContinueCount); 6703586be72SDuncan P. N. Exon Smith CountMap[S->getInc()] = PGO.getCurrentRegionCount(); 671bf854f0fSBob Wilson Visit(S->getInc()); 672bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 673bf854f0fSBob Wilson 674bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 675bf854f0fSBob Wilson 676bf854f0fSBob Wilson // ...then go back and propagate counts through the condition. 677bf854f0fSBob Wilson Cnt.setCurrentRegionCount(Cnt.getParentCount() + 678bf854f0fSBob Wilson Cnt.getAdjustedCount() + 679bf854f0fSBob Wilson BC.ContinueCount); 6803586be72SDuncan P. N. Exon Smith CountMap[S->getCond()] = PGO.getCurrentRegionCount(); 681bf854f0fSBob Wilson Visit(S->getCond()); 682bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 683bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount); 684bf854f0fSBob Wilson RecordNextStmtCount = true; 685bf854f0fSBob Wilson } 686bf854f0fSBob Wilson 687bf854f0fSBob Wilson void VisitObjCForCollectionStmt(const ObjCForCollectionStmt *S) { 688bf854f0fSBob Wilson RecordStmtCount(S); 689bf854f0fSBob Wilson Visit(S->getElement()); 690bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 691bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 692bf854f0fSBob Wilson Cnt.beginRegion(); 6933586be72SDuncan P. N. Exon Smith CountMap[S->getBody()] = PGO.getCurrentRegionCount(); 694bf854f0fSBob Wilson Visit(S->getBody()); 695bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 696bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 697bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount); 698bf854f0fSBob Wilson RecordNextStmtCount = true; 699bf854f0fSBob Wilson } 700bf854f0fSBob Wilson 701bf854f0fSBob Wilson void VisitSwitchStmt(const SwitchStmt *S) { 702bf854f0fSBob Wilson RecordStmtCount(S); 703bf854f0fSBob Wilson Visit(S->getCond()); 704bf854f0fSBob Wilson PGO.setCurrentRegionUnreachable(); 705bf854f0fSBob Wilson BreakContinueStack.push_back(BreakContinue()); 706bf854f0fSBob Wilson Visit(S->getBody()); 707bf854f0fSBob Wilson // If the switch is inside a loop, add the continue counts. 708bf854f0fSBob Wilson BreakContinue BC = BreakContinueStack.pop_back_val(); 709bf854f0fSBob Wilson if (!BreakContinueStack.empty()) 710bf854f0fSBob Wilson BreakContinueStack.back().ContinueCount += BC.ContinueCount; 711bf854f0fSBob Wilson RegionCounter ExitCnt(PGO, S); 712bf854f0fSBob Wilson ExitCnt.beginRegion(); 713bf854f0fSBob Wilson RecordNextStmtCount = true; 714bf854f0fSBob Wilson } 715bf854f0fSBob Wilson 716bf854f0fSBob Wilson void VisitCaseStmt(const CaseStmt *S) { 717bf854f0fSBob Wilson RecordNextStmtCount = false; 718bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 719bf854f0fSBob Wilson Cnt.beginRegion(/*AddIncomingFallThrough=*/true); 7203586be72SDuncan P. N. Exon Smith CountMap[S] = Cnt.getCount(); 721bf854f0fSBob Wilson RecordNextStmtCount = true; 722bf854f0fSBob Wilson Visit(S->getSubStmt()); 723bf854f0fSBob Wilson } 724bf854f0fSBob Wilson 725bf854f0fSBob Wilson void VisitDefaultStmt(const DefaultStmt *S) { 726bf854f0fSBob Wilson RecordNextStmtCount = false; 727bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 728bf854f0fSBob Wilson Cnt.beginRegion(/*AddIncomingFallThrough=*/true); 7293586be72SDuncan P. N. Exon Smith CountMap[S] = Cnt.getCount(); 730bf854f0fSBob Wilson RecordNextStmtCount = true; 731bf854f0fSBob Wilson Visit(S->getSubStmt()); 732bf854f0fSBob Wilson } 733bf854f0fSBob Wilson 734bf854f0fSBob Wilson void VisitIfStmt(const IfStmt *S) { 735bf854f0fSBob Wilson RecordStmtCount(S); 736bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 737bf854f0fSBob Wilson Visit(S->getCond()); 738bf854f0fSBob Wilson 739bf854f0fSBob Wilson Cnt.beginRegion(); 7403586be72SDuncan P. N. Exon Smith CountMap[S->getThen()] = PGO.getCurrentRegionCount(); 741bf854f0fSBob Wilson Visit(S->getThen()); 742bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 743bf854f0fSBob Wilson 744bf854f0fSBob Wilson if (S->getElse()) { 745bf854f0fSBob Wilson Cnt.beginElseRegion(); 7463586be72SDuncan P. N. Exon Smith CountMap[S->getElse()] = PGO.getCurrentRegionCount(); 747bf854f0fSBob Wilson Visit(S->getElse()); 748bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 749bf854f0fSBob Wilson } 750bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(0); 751bf854f0fSBob Wilson RecordNextStmtCount = true; 752bf854f0fSBob Wilson } 753bf854f0fSBob Wilson 754bf854f0fSBob Wilson void VisitCXXTryStmt(const CXXTryStmt *S) { 755bf854f0fSBob Wilson RecordStmtCount(S); 756bf854f0fSBob Wilson Visit(S->getTryBlock()); 757bf854f0fSBob Wilson for (unsigned I = 0, E = S->getNumHandlers(); I < E; ++I) 758bf854f0fSBob Wilson Visit(S->getHandler(I)); 759bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 760bf854f0fSBob Wilson Cnt.beginRegion(); 761bf854f0fSBob Wilson RecordNextStmtCount = true; 762bf854f0fSBob Wilson } 763bf854f0fSBob Wilson 764bf854f0fSBob Wilson void VisitCXXCatchStmt(const CXXCatchStmt *S) { 765bf854f0fSBob Wilson RecordNextStmtCount = false; 766bf854f0fSBob Wilson RegionCounter Cnt(PGO, S); 767bf854f0fSBob Wilson Cnt.beginRegion(); 7683586be72SDuncan P. N. Exon Smith CountMap[S] = PGO.getCurrentRegionCount(); 769bf854f0fSBob Wilson Visit(S->getHandlerBlock()); 770bf854f0fSBob Wilson } 771bf854f0fSBob Wilson 772bf854f0fSBob Wilson void VisitConditionalOperator(const ConditionalOperator *E) { 773bf854f0fSBob Wilson RecordStmtCount(E); 774bf854f0fSBob Wilson RegionCounter Cnt(PGO, E); 775bf854f0fSBob Wilson Visit(E->getCond()); 776bf854f0fSBob Wilson 777bf854f0fSBob Wilson Cnt.beginRegion(); 7783586be72SDuncan P. N. Exon Smith CountMap[E->getTrueExpr()] = PGO.getCurrentRegionCount(); 779bf854f0fSBob Wilson Visit(E->getTrueExpr()); 780bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 781bf854f0fSBob Wilson 782bf854f0fSBob Wilson Cnt.beginElseRegion(); 7833586be72SDuncan P. N. Exon Smith CountMap[E->getFalseExpr()] = PGO.getCurrentRegionCount(); 784bf854f0fSBob Wilson Visit(E->getFalseExpr()); 785bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 786bf854f0fSBob Wilson 787bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(0); 788bf854f0fSBob Wilson RecordNextStmtCount = true; 789bf854f0fSBob Wilson } 790bf854f0fSBob Wilson 791bf854f0fSBob Wilson void VisitBinLAnd(const BinaryOperator *E) { 792bf854f0fSBob Wilson RecordStmtCount(E); 793bf854f0fSBob Wilson RegionCounter Cnt(PGO, E); 794bf854f0fSBob Wilson Visit(E->getLHS()); 795bf854f0fSBob Wilson Cnt.beginRegion(); 7963586be72SDuncan P. N. Exon Smith CountMap[E->getRHS()] = PGO.getCurrentRegionCount(); 797bf854f0fSBob Wilson Visit(E->getRHS()); 798bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 799bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(0); 800bf854f0fSBob Wilson RecordNextStmtCount = true; 801bf854f0fSBob Wilson } 802bf854f0fSBob Wilson 803bf854f0fSBob Wilson void VisitBinLOr(const BinaryOperator *E) { 804bf854f0fSBob Wilson RecordStmtCount(E); 805bf854f0fSBob Wilson RegionCounter Cnt(PGO, E); 806bf854f0fSBob Wilson Visit(E->getLHS()); 807bf854f0fSBob Wilson Cnt.beginRegion(); 8083586be72SDuncan P. N. Exon Smith CountMap[E->getRHS()] = PGO.getCurrentRegionCount(); 809bf854f0fSBob Wilson Visit(E->getRHS()); 810bf854f0fSBob Wilson Cnt.adjustForControlFlow(); 811bf854f0fSBob Wilson Cnt.applyAdjustmentsToRegion(0); 812bf854f0fSBob Wilson RecordNextStmtCount = true; 813bf854f0fSBob Wilson } 814bf854f0fSBob Wilson }; 815ef512b99SJustin Bogner } 816ef512b99SJustin Bogner 817*d971cd1bSDuncan P. N. Exon Smith static void emitRuntimeHook(CodeGenModule &CGM) { 818*d971cd1bSDuncan P. N. Exon Smith constexpr const char *RuntimeVarName = "__llvm_profile_runtime"; 819*d971cd1bSDuncan P. N. Exon Smith constexpr const char *RuntimeUserName = "__llvm_profile_runtime_user"; 820*d971cd1bSDuncan P. N. Exon Smith if (CGM.getModule().getGlobalVariable(RuntimeVarName)) 821*d971cd1bSDuncan P. N. Exon Smith return; 822*d971cd1bSDuncan P. N. Exon Smith 823*d971cd1bSDuncan P. N. Exon Smith // Declare the runtime hook. 824*d971cd1bSDuncan P. N. Exon Smith llvm::LLVMContext &Ctx = CGM.getLLVMContext(); 825*d971cd1bSDuncan P. N. Exon Smith auto *Int32Ty = llvm::Type::getInt32Ty(Ctx); 826*d971cd1bSDuncan P. N. Exon Smith auto *Var = new llvm::GlobalVariable(CGM.getModule(), Int32Ty, false, 827*d971cd1bSDuncan P. N. Exon Smith llvm::GlobalValue::ExternalLinkage, 828*d971cd1bSDuncan P. N. Exon Smith nullptr, RuntimeVarName); 829*d971cd1bSDuncan P. N. Exon Smith 830*d971cd1bSDuncan P. N. Exon Smith // Make a function that uses it. 831*d971cd1bSDuncan P. N. Exon Smith auto *User = llvm::Function::Create(llvm::FunctionType::get(Int32Ty, false), 832*d971cd1bSDuncan P. N. Exon Smith llvm::GlobalValue::LinkOnceODRLinkage, 833*d971cd1bSDuncan P. N. Exon Smith RuntimeUserName, &CGM.getModule()); 834*d971cd1bSDuncan P. N. Exon Smith User->addFnAttr(llvm::Attribute::NoInline); 835*d971cd1bSDuncan P. N. Exon Smith if (CGM.getCodeGenOpts().DisableRedZone) 836*d971cd1bSDuncan P. N. Exon Smith User->addFnAttr(llvm::Attribute::NoRedZone); 837*d971cd1bSDuncan P. N. Exon Smith CGBuilderTy Builder(llvm::BasicBlock::Create(CGM.getLLVMContext(), "", User)); 838*d971cd1bSDuncan P. N. Exon Smith auto *Load = Builder.CreateLoad(Var); 839*d971cd1bSDuncan P. N. Exon Smith Builder.CreateRet(Load); 840*d971cd1bSDuncan P. N. Exon Smith 841*d971cd1bSDuncan P. N. Exon Smith // Create a use of the function. Now the definition of the runtime variable 842*d971cd1bSDuncan P. N. Exon Smith // should get pulled in, along with any static initializears. 843*d971cd1bSDuncan P. N. Exon Smith CGM.addUsedGlobal(User); 844*d971cd1bSDuncan P. N. Exon Smith } 845*d971cd1bSDuncan P. N. Exon Smith 846da1ebedeSBob Wilson void CodeGenPGO::assignRegionCounters(const Decl *D, llvm::Function *Fn) { 847ef512b99SJustin Bogner bool InstrumentRegions = CGM.getCodeGenOpts().ProfileInstrGenerate; 848d66a17d0SJustin Bogner PGOProfileData *PGOData = CGM.getPGOData(); 849d66a17d0SJustin Bogner if (!InstrumentRegions && !PGOData) 850ef512b99SJustin Bogner return; 851ef512b99SJustin Bogner if (!D) 852ef512b99SJustin Bogner return; 853da1ebedeSBob Wilson setFuncName(Fn); 8547c41451bSDuncan P. N. Exon Smith 8557c41451bSDuncan P. N. Exon Smith // Set the linkage for variables based on the function linkage. Usually, we 8567c41451bSDuncan P. N. Exon Smith // want to match it, but available_externally and extern_weak both have the 8577c41451bSDuncan P. N. Exon Smith // wrong semantics. 85873f78627SDuncan P. N. Exon Smith VarLinkage = Fn->getLinkage(); 8597c41451bSDuncan P. N. Exon Smith switch (VarLinkage) { 8607c41451bSDuncan P. N. Exon Smith case llvm::GlobalValue::ExternalWeakLinkage: 8617c41451bSDuncan P. N. Exon Smith VarLinkage = llvm::GlobalValue::LinkOnceAnyLinkage; 8627c41451bSDuncan P. N. Exon Smith break; 8637c41451bSDuncan P. N. Exon Smith case llvm::GlobalValue::AvailableExternallyLinkage: 8647c41451bSDuncan P. N. Exon Smith VarLinkage = llvm::GlobalValue::LinkOnceODRLinkage; 8657c41451bSDuncan P. N. Exon Smith break; 8667c41451bSDuncan P. N. Exon Smith default: 8677c41451bSDuncan P. N. Exon Smith break; 8687c41451bSDuncan P. N. Exon Smith } 8697c41451bSDuncan P. N. Exon Smith 870ef512b99SJustin Bogner mapRegionCounters(D); 871*d971cd1bSDuncan P. N. Exon Smith if (InstrumentRegions) { 872*d971cd1bSDuncan P. N. Exon Smith emitRuntimeHook(CGM); 873ef512b99SJustin Bogner emitCounterVariables(); 874*d971cd1bSDuncan P. N. Exon Smith } 875d66a17d0SJustin Bogner if (PGOData) { 876d66a17d0SJustin Bogner loadRegionCounts(PGOData); 877bf854f0fSBob Wilson computeRegionCounts(D); 878d66a17d0SJustin Bogner applyFunctionAttributes(PGOData, Fn); 879bf854f0fSBob Wilson } 880ef512b99SJustin Bogner } 881ef512b99SJustin Bogner 882ef512b99SJustin Bogner void CodeGenPGO::mapRegionCounters(const Decl *D) { 8831b67cfd4SDuncan P. N. Exon Smith RegionCounterMap.reset(new llvm::DenseMap<const Stmt *, unsigned>); 8843586be72SDuncan P. N. Exon Smith MapRegionCounters Walker(*RegionCounterMap); 885ef512b99SJustin Bogner if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(D)) 886ef512b99SJustin Bogner Walker.VisitFunctionDecl(FD); 8875ec8fe19SBob Wilson else if (const ObjCMethodDecl *MD = dyn_cast_or_null<ObjCMethodDecl>(D)) 8885ec8fe19SBob Wilson Walker.VisitObjCMethodDecl(MD); 889c845c00aSBob Wilson else if (const BlockDecl *BD = dyn_cast_or_null<BlockDecl>(D)) 890c845c00aSBob Wilson Walker.VisitBlockDecl(BD); 891ef512b99SJustin Bogner NumRegionCounters = Walker.NextCounter; 892b4416f58SJustin Bogner // FIXME: The number of counters isn't sufficient for the hash 893b4416f58SJustin Bogner FunctionHash = NumRegionCounters; 894ef512b99SJustin Bogner } 895ef512b99SJustin Bogner 896bf854f0fSBob Wilson void CodeGenPGO::computeRegionCounts(const Decl *D) { 8971b67cfd4SDuncan P. N. Exon Smith StmtCountMap.reset(new llvm::DenseMap<const Stmt *, uint64_t>); 8983586be72SDuncan P. N. Exon Smith ComputeRegionCounts Walker(*StmtCountMap, *this); 899bf854f0fSBob Wilson if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(D)) 900bf854f0fSBob Wilson Walker.VisitFunctionDecl(FD); 9015ec8fe19SBob Wilson else if (const ObjCMethodDecl *MD = dyn_cast_or_null<ObjCMethodDecl>(D)) 9025ec8fe19SBob Wilson Walker.VisitObjCMethodDecl(MD); 903c845c00aSBob Wilson else if (const BlockDecl *BD = dyn_cast_or_null<BlockDecl>(D)) 904c845c00aSBob Wilson Walker.VisitBlockDecl(BD); 905bf854f0fSBob Wilson } 906bf854f0fSBob Wilson 907d66a17d0SJustin Bogner void CodeGenPGO::applyFunctionAttributes(PGOProfileData *PGOData, 9084c9c45c0SJustin Bogner llvm::Function *Fn) { 9094c9c45c0SJustin Bogner if (!haveRegionCounts()) 9104c9c45c0SJustin Bogner return; 9114c9c45c0SJustin Bogner 912d66a17d0SJustin Bogner uint64_t MaxFunctionCount = PGOData->getMaximumFunctionCount(); 9134c9c45c0SJustin Bogner uint64_t FunctionCount = getRegionCount(0); 9144c9c45c0SJustin Bogner if (FunctionCount >= (uint64_t)(0.3 * (double)MaxFunctionCount)) 9154c9c45c0SJustin Bogner // Turn on InlineHint attribute for hot functions. 9164c9c45c0SJustin Bogner // FIXME: 30% is from preliminary tuning on SPEC, it may not be optimal. 9174c9c45c0SJustin Bogner Fn->addFnAttr(llvm::Attribute::InlineHint); 9184c9c45c0SJustin Bogner else if (FunctionCount <= (uint64_t)(0.01 * (double)MaxFunctionCount)) 9194c9c45c0SJustin Bogner // Turn on Cold attribute for cold functions. 9204c9c45c0SJustin Bogner // FIXME: 1% is from preliminary tuning on SPEC, it may not be optimal. 9214c9c45c0SJustin Bogner Fn->addFnAttr(llvm::Attribute::Cold); 9224c9c45c0SJustin Bogner } 9234c9c45c0SJustin Bogner 924ef512b99SJustin Bogner void CodeGenPGO::emitCounterVariables() { 925ef512b99SJustin Bogner llvm::LLVMContext &Ctx = CGM.getLLVMContext(); 926ef512b99SJustin Bogner llvm::ArrayType *CounterTy = llvm::ArrayType::get(llvm::Type::getInt64Ty(Ctx), 927ef512b99SJustin Bogner NumRegionCounters); 928ef512b99SJustin Bogner RegionCounters = 92973f78627SDuncan P. N. Exon Smith new llvm::GlobalVariable(CGM.getModule(), CounterTy, false, VarLinkage, 930ef512b99SJustin Bogner llvm::Constant::getNullValue(CounterTy), 9312fe531cbSDuncan P. N. Exon Smith getFuncVarName("counters")); 9322fe531cbSDuncan P. N. Exon Smith RegionCounters->setAlignment(8); 9332fe531cbSDuncan P. N. Exon Smith RegionCounters->setSection(getCountersSection(CGM)); 934ef512b99SJustin Bogner } 935ef512b99SJustin Bogner 936ef512b99SJustin Bogner void CodeGenPGO::emitCounterIncrement(CGBuilderTy &Builder, unsigned Counter) { 937749ebc7fSBob Wilson if (!RegionCounters) 938ef512b99SJustin Bogner return; 939ef512b99SJustin Bogner llvm::Value *Addr = 940ef512b99SJustin Bogner Builder.CreateConstInBoundsGEP2_64(RegionCounters, 0, Counter); 941ef512b99SJustin Bogner llvm::Value *Count = Builder.CreateLoad(Addr, "pgocount"); 942ef512b99SJustin Bogner Count = Builder.CreateAdd(Count, Builder.getInt64(1)); 943ef512b99SJustin Bogner Builder.CreateStore(Count, Addr); 944ef512b99SJustin Bogner } 945ef512b99SJustin Bogner 946d66a17d0SJustin Bogner void CodeGenPGO::loadRegionCounts(PGOProfileData *PGOData) { 947ef512b99SJustin Bogner // For now, ignore the counts from the PGO data file only if the number of 948ef512b99SJustin Bogner // counters does not match. This could be tightened down in the future to 949ef512b99SJustin Bogner // ignore counts when the input changes in various ways, e.g., by comparing a 950ef512b99SJustin Bogner // hash value based on some characteristics of the input. 9511b67cfd4SDuncan P. N. Exon Smith RegionCounts.reset(new std::vector<uint64_t>); 952b4416f58SJustin Bogner uint64_t Hash; 953b4416f58SJustin Bogner if (PGOData->getFunctionCounts(getFuncName(), Hash, *RegionCounts) || 9541b67cfd4SDuncan P. N. Exon Smith Hash != FunctionHash || RegionCounts->size() != NumRegionCounters) 9551b67cfd4SDuncan P. N. Exon Smith RegionCounts.reset(); 956ef512b99SJustin Bogner } 957ef512b99SJustin Bogner 958ef512b99SJustin Bogner void CodeGenPGO::destroyRegionCounters() { 9591b67cfd4SDuncan P. N. Exon Smith RegionCounterMap.reset(); 9601b67cfd4SDuncan P. N. Exon Smith StmtCountMap.reset(); 9611b67cfd4SDuncan P. N. Exon Smith RegionCounts.reset(); 962ef512b99SJustin Bogner } 963ef512b99SJustin Bogner 96438402dc9SDuncan P. N. Exon Smith /// \brief Calculate what to divide by to scale weights. 96538402dc9SDuncan P. N. Exon Smith /// 96638402dc9SDuncan P. N. Exon Smith /// Given the maximum weight, calculate a divisor that will scale all the 96738402dc9SDuncan P. N. Exon Smith /// weights to strictly less than UINT32_MAX. 96838402dc9SDuncan P. N. Exon Smith static uint64_t calculateWeightScale(uint64_t MaxWeight) { 96938402dc9SDuncan P. N. Exon Smith return MaxWeight < UINT32_MAX ? 1 : MaxWeight / UINT32_MAX + 1; 97038402dc9SDuncan P. N. Exon Smith } 97138402dc9SDuncan P. N. Exon Smith 97238402dc9SDuncan P. N. Exon Smith /// \brief Scale an individual branch weight (and add 1). 97338402dc9SDuncan P. N. Exon Smith /// 97438402dc9SDuncan P. N. Exon Smith /// Scale a 64-bit weight down to 32-bits using \c Scale. 97538402dc9SDuncan P. N. Exon Smith /// 97638402dc9SDuncan P. N. Exon Smith /// According to Laplace's Rule of Succession, it is better to compute the 97738402dc9SDuncan P. N. Exon Smith /// weight based on the count plus 1, so universally add 1 to the value. 97838402dc9SDuncan P. N. Exon Smith /// 97938402dc9SDuncan P. N. Exon Smith /// \pre \c Scale was calculated by \a calculateWeightScale() with a weight no 98038402dc9SDuncan P. N. Exon Smith /// greater than \c Weight. 98138402dc9SDuncan P. N. Exon Smith static uint32_t scaleBranchWeight(uint64_t Weight, uint64_t Scale) { 98238402dc9SDuncan P. N. Exon Smith assert(Scale && "scale by 0?"); 98338402dc9SDuncan P. N. Exon Smith uint64_t Scaled = Weight / Scale + 1; 98438402dc9SDuncan P. N. Exon Smith assert(Scaled <= UINT32_MAX && "overflow 32-bits"); 98538402dc9SDuncan P. N. Exon Smith return Scaled; 98638402dc9SDuncan P. N. Exon Smith } 98738402dc9SDuncan P. N. Exon Smith 988ef512b99SJustin Bogner llvm::MDNode *CodeGenPGO::createBranchWeights(uint64_t TrueCount, 989ef512b99SJustin Bogner uint64_t FalseCount) { 99038402dc9SDuncan P. N. Exon Smith // Check for empty weights. 991ef512b99SJustin Bogner if (!TrueCount && !FalseCount) 992a5f804a7SDuncan P. N. Exon Smith return nullptr; 993ef512b99SJustin Bogner 99438402dc9SDuncan P. N. Exon Smith // Calculate how to scale down to 32-bits. 99538402dc9SDuncan P. N. Exon Smith uint64_t Scale = calculateWeightScale(std::max(TrueCount, FalseCount)); 99638402dc9SDuncan P. N. Exon Smith 997ef512b99SJustin Bogner llvm::MDBuilder MDHelper(CGM.getLLVMContext()); 99838402dc9SDuncan P. N. Exon Smith return MDHelper.createBranchWeights(scaleBranchWeight(TrueCount, Scale), 99938402dc9SDuncan P. N. Exon Smith scaleBranchWeight(FalseCount, Scale)); 1000ef512b99SJustin Bogner } 1001ef512b99SJustin Bogner 100295a27b0eSBob Wilson llvm::MDNode *CodeGenPGO::createBranchWeights(ArrayRef<uint64_t> Weights) { 100338402dc9SDuncan P. N. Exon Smith // We need at least two elements to create meaningful weights. 100438402dc9SDuncan P. N. Exon Smith if (Weights.size() < 2) 1005a5f804a7SDuncan P. N. Exon Smith return nullptr; 100638402dc9SDuncan P. N. Exon Smith 100738402dc9SDuncan P. N. Exon Smith // Calculate how to scale down to 32-bits. 100838402dc9SDuncan P. N. Exon Smith uint64_t Scale = calculateWeightScale(*std::max_element(Weights.begin(), 100938402dc9SDuncan P. N. Exon Smith Weights.end())); 101038402dc9SDuncan P. N. Exon Smith 1011ef512b99SJustin Bogner SmallVector<uint32_t, 16> ScaledWeights; 1012ef512b99SJustin Bogner ScaledWeights.reserve(Weights.size()); 101338402dc9SDuncan P. N. Exon Smith for (uint64_t W : Weights) 101438402dc9SDuncan P. N. Exon Smith ScaledWeights.push_back(scaleBranchWeight(W, Scale)); 101538402dc9SDuncan P. N. Exon Smith 101638402dc9SDuncan P. N. Exon Smith llvm::MDBuilder MDHelper(CGM.getLLVMContext()); 1017ef512b99SJustin Bogner return MDHelper.createBranchWeights(ScaledWeights); 1018ef512b99SJustin Bogner } 1019bf854f0fSBob Wilson 1020bf854f0fSBob Wilson llvm::MDNode *CodeGenPGO::createLoopWeights(const Stmt *Cond, 1021bf854f0fSBob Wilson RegionCounter &Cnt) { 1022bf854f0fSBob Wilson if (!haveRegionCounts()) 1023a5f804a7SDuncan P. N. Exon Smith return nullptr; 1024bf854f0fSBob Wilson uint64_t LoopCount = Cnt.getCount(); 1025bf854f0fSBob Wilson uint64_t CondCount = 0; 1026bf854f0fSBob Wilson bool Found = getStmtCount(Cond, CondCount); 1027bf854f0fSBob Wilson assert(Found && "missing expected loop condition count"); 1028bf854f0fSBob Wilson (void)Found; 1029bf854f0fSBob Wilson if (CondCount == 0) 1030a5f804a7SDuncan P. N. Exon Smith return nullptr; 1031bf854f0fSBob Wilson return createBranchWeights(LoopCount, 1032bf854f0fSBob Wilson std::max(CondCount, LoopCount) - LoopCount); 1033bf854f0fSBob Wilson } 1034