1ef512b99SJustin Bogner //===--- CodeGenPGO.cpp - PGO Instrumentation for LLVM CodeGen --*- C++ -*-===//
2ef512b99SJustin Bogner //
3ef512b99SJustin Bogner //                     The LLVM Compiler Infrastructure
4ef512b99SJustin Bogner //
5ef512b99SJustin Bogner // This file is distributed under the University of Illinois Open Source
6ef512b99SJustin Bogner // License. See LICENSE.TXT for details.
7ef512b99SJustin Bogner //
8ef512b99SJustin Bogner //===----------------------------------------------------------------------===//
9ef512b99SJustin Bogner //
10ef512b99SJustin Bogner // Instrumentation-based profile-guided optimization
11ef512b99SJustin Bogner //
12ef512b99SJustin Bogner //===----------------------------------------------------------------------===//
13ef512b99SJustin Bogner 
14ef512b99SJustin Bogner #include "CodeGenPGO.h"
15ef512b99SJustin Bogner #include "CodeGenFunction.h"
16ef512b99SJustin Bogner #include "clang/AST/RecursiveASTVisitor.h"
17ef512b99SJustin Bogner #include "clang/AST/StmtVisitor.h"
18529f6dd8SJustin Bogner #include "llvm/Config/config.h" // for strtoull()/strtoll() define
19ef512b99SJustin Bogner #include "llvm/IR/MDBuilder.h"
20ef512b99SJustin Bogner #include "llvm/Support/FileSystem.h"
21ef512b99SJustin Bogner 
22ef512b99SJustin Bogner using namespace clang;
23ef512b99SJustin Bogner using namespace CodeGen;
24ef512b99SJustin Bogner 
25d66a17d0SJustin Bogner static void ReportBadPGOData(CodeGenModule &CGM, const char *Message) {
26d66a17d0SJustin Bogner   DiagnosticsEngine &Diags = CGM.getDiags();
27d66a17d0SJustin Bogner   unsigned diagID = Diags.getCustomDiagID(DiagnosticsEngine::Error, "%0");
28d66a17d0SJustin Bogner   Diags.Report(diagID) << Message;
29d66a17d0SJustin Bogner }
30d66a17d0SJustin Bogner 
31d66a17d0SJustin Bogner PGOProfileData::PGOProfileData(CodeGenModule &CGM, std::string Path)
32d66a17d0SJustin Bogner   : CGM(CGM) {
33d66a17d0SJustin Bogner   if (llvm::MemoryBuffer::getFile(Path, DataBuffer)) {
34d66a17d0SJustin Bogner     ReportBadPGOData(CGM, "failed to open pgo data file");
35d66a17d0SJustin Bogner     return;
36d66a17d0SJustin Bogner   }
37d66a17d0SJustin Bogner 
38d66a17d0SJustin Bogner   if (DataBuffer->getBufferSize() > std::numeric_limits<unsigned>::max()) {
39d66a17d0SJustin Bogner     ReportBadPGOData(CGM, "pgo data file too big");
40d66a17d0SJustin Bogner     return;
41d66a17d0SJustin Bogner   }
42d66a17d0SJustin Bogner 
43d66a17d0SJustin Bogner   // Scan through the data file and map each function to the corresponding
44d66a17d0SJustin Bogner   // file offset where its counts are stored.
45d66a17d0SJustin Bogner   const char *BufferStart = DataBuffer->getBufferStart();
46d66a17d0SJustin Bogner   const char *BufferEnd = DataBuffer->getBufferEnd();
47d66a17d0SJustin Bogner   const char *CurPtr = BufferStart;
48d66a17d0SJustin Bogner   uint64_t MaxCount = 0;
49d66a17d0SJustin Bogner   while (CurPtr < BufferEnd) {
50d66a17d0SJustin Bogner     // Read the function name.
51d66a17d0SJustin Bogner     const char *FuncStart = CurPtr;
52d66a17d0SJustin Bogner     // For Objective-C methods, the name may include whitespace, so search
53d66a17d0SJustin Bogner     // backward from the end of the line to find the space that separates the
54d66a17d0SJustin Bogner     // name from the number of counters. (This is a temporary hack since we are
55d66a17d0SJustin Bogner     // going to completely replace this file format in the near future.)
56d66a17d0SJustin Bogner     CurPtr = strchr(CurPtr, '\n');
57d66a17d0SJustin Bogner     if (!CurPtr) {
58d66a17d0SJustin Bogner       ReportBadPGOData(CGM, "pgo data file has malformed function entry");
59d66a17d0SJustin Bogner       return;
60d66a17d0SJustin Bogner     }
61d66a17d0SJustin Bogner     StringRef FuncName(FuncStart, CurPtr - FuncStart);
62d66a17d0SJustin Bogner 
63b4416f58SJustin Bogner     // Skip over the function hash.
64b4416f58SJustin Bogner     CurPtr = strchr(++CurPtr, '\n');
65b4416f58SJustin Bogner     if (!CurPtr) {
66b4416f58SJustin Bogner       ReportBadPGOData(CGM, "pgo data file is missing the function hash");
67b4416f58SJustin Bogner       return;
68b4416f58SJustin Bogner     }
69b4416f58SJustin Bogner 
70d66a17d0SJustin Bogner     // Read the number of counters.
71d66a17d0SJustin Bogner     char *EndPtr;
72d66a17d0SJustin Bogner     unsigned NumCounters = strtol(++CurPtr, &EndPtr, 10);
73d66a17d0SJustin Bogner     if (EndPtr == CurPtr || *EndPtr != '\n' || NumCounters <= 0) {
74d66a17d0SJustin Bogner       ReportBadPGOData(CGM, "pgo data file has unexpected number of counters");
75d66a17d0SJustin Bogner       return;
76d66a17d0SJustin Bogner     }
77d66a17d0SJustin Bogner     CurPtr = EndPtr;
78d66a17d0SJustin Bogner 
79d66a17d0SJustin Bogner     // Read function count.
80d66a17d0SJustin Bogner     uint64_t Count = strtoll(CurPtr, &EndPtr, 10);
81d66a17d0SJustin Bogner     if (EndPtr == CurPtr || *EndPtr != '\n') {
82d66a17d0SJustin Bogner       ReportBadPGOData(CGM, "pgo-data file has bad count value");
83d66a17d0SJustin Bogner       return;
84d66a17d0SJustin Bogner     }
85d66a17d0SJustin Bogner     CurPtr = EndPtr; // Point to '\n'.
86d66a17d0SJustin Bogner     FunctionCounts[FuncName] = Count;
87d66a17d0SJustin Bogner     MaxCount = Count > MaxCount ? Count : MaxCount;
88d66a17d0SJustin Bogner 
89d66a17d0SJustin Bogner     // There is one line for each counter; skip over those lines.
90d66a17d0SJustin Bogner     // Since function count is already read, we start the loop from 1.
91d66a17d0SJustin Bogner     for (unsigned N = 1; N < NumCounters; ++N) {
92d66a17d0SJustin Bogner       CurPtr = strchr(++CurPtr, '\n');
93d66a17d0SJustin Bogner       if (!CurPtr) {
94d66a17d0SJustin Bogner         ReportBadPGOData(CGM, "pgo data file is missing some counter info");
95d66a17d0SJustin Bogner         return;
96d66a17d0SJustin Bogner       }
97d66a17d0SJustin Bogner     }
98d66a17d0SJustin Bogner 
99d66a17d0SJustin Bogner     // Skip over the blank line separating functions.
100d66a17d0SJustin Bogner     CurPtr += 2;
101d66a17d0SJustin Bogner 
102d66a17d0SJustin Bogner     DataOffsets[FuncName] = FuncStart - BufferStart;
103d66a17d0SJustin Bogner   }
104d66a17d0SJustin Bogner   MaxFunctionCount = MaxCount;
105d66a17d0SJustin Bogner }
106d66a17d0SJustin Bogner 
107b4416f58SJustin Bogner bool PGOProfileData::getFunctionCounts(StringRef FuncName, uint64_t &FuncHash,
108d66a17d0SJustin Bogner                                        std::vector<uint64_t> &Counts) {
109d66a17d0SJustin Bogner   // Find the relevant section of the pgo-data file.
110d66a17d0SJustin Bogner   llvm::StringMap<unsigned>::const_iterator OffsetIter =
111d66a17d0SJustin Bogner     DataOffsets.find(FuncName);
112d66a17d0SJustin Bogner   if (OffsetIter == DataOffsets.end())
113d66a17d0SJustin Bogner     return true;
114d66a17d0SJustin Bogner   const char *CurPtr = DataBuffer->getBufferStart() + OffsetIter->getValue();
115d66a17d0SJustin Bogner 
116d66a17d0SJustin Bogner   // Skip over the function name.
117d66a17d0SJustin Bogner   CurPtr = strchr(CurPtr, '\n');
118d66a17d0SJustin Bogner   assert(CurPtr && "pgo-data has corrupted function entry");
119b4416f58SJustin Bogner 
120b4416f58SJustin Bogner   char *EndPtr;
121b4416f58SJustin Bogner   // Read the function hash.
122b4416f58SJustin Bogner   FuncHash = strtoll(++CurPtr, &EndPtr, 10);
123b4416f58SJustin Bogner   assert(EndPtr != CurPtr && *EndPtr == '\n' &&
124b4416f58SJustin Bogner          "pgo-data file has corrupted function hash");
125b4416f58SJustin Bogner   CurPtr = EndPtr;
126d66a17d0SJustin Bogner 
127d66a17d0SJustin Bogner   // Read the number of counters.
128d66a17d0SJustin Bogner   unsigned NumCounters = strtol(++CurPtr, &EndPtr, 10);
129d66a17d0SJustin Bogner   assert(EndPtr != CurPtr && *EndPtr == '\n' && NumCounters > 0 &&
130d66a17d0SJustin Bogner          "pgo-data file has corrupted number of counters");
131d66a17d0SJustin Bogner   CurPtr = EndPtr;
132d66a17d0SJustin Bogner 
133d66a17d0SJustin Bogner   Counts.reserve(NumCounters);
134d66a17d0SJustin Bogner 
135d66a17d0SJustin Bogner   for (unsigned N = 0; N < NumCounters; ++N) {
136d66a17d0SJustin Bogner     // Read the count value.
137d66a17d0SJustin Bogner     uint64_t Count = strtoll(CurPtr, &EndPtr, 10);
138d66a17d0SJustin Bogner     if (EndPtr == CurPtr || *EndPtr != '\n') {
139d66a17d0SJustin Bogner       ReportBadPGOData(CGM, "pgo-data file has bad count value");
140d66a17d0SJustin Bogner       return true;
141d66a17d0SJustin Bogner     }
142d66a17d0SJustin Bogner     Counts.push_back(Count);
143d66a17d0SJustin Bogner     CurPtr = EndPtr + 1;
144d66a17d0SJustin Bogner   }
145d66a17d0SJustin Bogner 
146d66a17d0SJustin Bogner   // Make sure the number of counters matches up.
147d66a17d0SJustin Bogner   if (Counts.size() != NumCounters) {
148d66a17d0SJustin Bogner     ReportBadPGOData(CGM, "pgo-data file has inconsistent counters");
149d66a17d0SJustin Bogner     return true;
150d66a17d0SJustin Bogner   }
151d66a17d0SJustin Bogner 
152d66a17d0SJustin Bogner   return false;
153d66a17d0SJustin Bogner }
154d66a17d0SJustin Bogner 
155da1ebedeSBob Wilson void CodeGenPGO::setFuncName(llvm::Function *Fn) {
1562fe531cbSDuncan P. N. Exon Smith   RawFuncName = Fn->getName();
157da1ebedeSBob Wilson 
158da1ebedeSBob Wilson   // Function names may be prefixed with a binary '1' to indicate
159da1ebedeSBob Wilson   // that the backend should not modify the symbols due to any platform
160da1ebedeSBob Wilson   // naming convention. Do not include that '1' in the PGO profile name.
1612fe531cbSDuncan P. N. Exon Smith   if (RawFuncName[0] == '\1')
1622fe531cbSDuncan P. N. Exon Smith     RawFuncName = RawFuncName.substr(1);
163da1ebedeSBob Wilson 
164da1ebedeSBob Wilson   if (!Fn->hasLocalLinkage()) {
1652fe531cbSDuncan P. N. Exon Smith     PrefixedFuncName = new std::string(RawFuncName);
166da1ebedeSBob Wilson     return;
167da1ebedeSBob Wilson   }
168da1ebedeSBob Wilson 
169da1ebedeSBob Wilson   // For local symbols, prepend the main file name to distinguish them.
170da1ebedeSBob Wilson   // Do not include the full path in the file name since there's no guarantee
171da1ebedeSBob Wilson   // that it will stay the same, e.g., if the files are checked out from
172da1ebedeSBob Wilson   // version control in different locations.
1732fe531cbSDuncan P. N. Exon Smith   PrefixedFuncName = new std::string(CGM.getCodeGenOpts().MainFileName);
1742fe531cbSDuncan P. N. Exon Smith   if (PrefixedFuncName->empty())
1752fe531cbSDuncan P. N. Exon Smith     PrefixedFuncName->assign("<unknown>");
1762fe531cbSDuncan P. N. Exon Smith   PrefixedFuncName->append(":");
1772fe531cbSDuncan P. N. Exon Smith   PrefixedFuncName->append(RawFuncName);
178da1ebedeSBob Wilson }
179da1ebedeSBob Wilson 
1802fe531cbSDuncan P. N. Exon Smith static llvm::Function *getRegisterFunc(CodeGenModule &CGM) {
1812fe531cbSDuncan P. N. Exon Smith   return CGM.getModule().getFunction("__llvm_pgo_register_functions");
1822fe531cbSDuncan P. N. Exon Smith }
1832fe531cbSDuncan P. N. Exon Smith 
1842fe531cbSDuncan P. N. Exon Smith static llvm::BasicBlock *getOrInsertRegisterBB(CodeGenModule &CGM) {
185780443e8SDuncan P. N. Exon Smith   // Don't do this for Darwin.  compiler-rt uses linker magic.
186780443e8SDuncan P. N. Exon Smith   if (CGM.getTarget().getTriple().isOSDarwin())
187780443e8SDuncan P. N. Exon Smith     return nullptr;
188780443e8SDuncan P. N. Exon Smith 
1892fe531cbSDuncan P. N. Exon Smith   // Only need to insert this once per module.
1902fe531cbSDuncan P. N. Exon Smith   if (llvm::Function *RegisterF = getRegisterFunc(CGM))
1912fe531cbSDuncan P. N. Exon Smith     return &RegisterF->getEntryBlock();
1922fe531cbSDuncan P. N. Exon Smith 
1932fe531cbSDuncan P. N. Exon Smith   // Construct the function.
1942fe531cbSDuncan P. N. Exon Smith   auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext());
1952fe531cbSDuncan P. N. Exon Smith   auto *RegisterFTy = llvm::FunctionType::get(VoidTy, false);
1962fe531cbSDuncan P. N. Exon Smith   auto *RegisterF = llvm::Function::Create(RegisterFTy,
1972fe531cbSDuncan P. N. Exon Smith                                            llvm::GlobalValue::InternalLinkage,
1982fe531cbSDuncan P. N. Exon Smith                                            "__llvm_pgo_register_functions",
1992fe531cbSDuncan P. N. Exon Smith                                            &CGM.getModule());
2002fe531cbSDuncan P. N. Exon Smith   RegisterF->setUnnamedAddr(true);
2012fe531cbSDuncan P. N. Exon Smith   if (CGM.getCodeGenOpts().DisableRedZone)
2022fe531cbSDuncan P. N. Exon Smith     RegisterF->addFnAttr(llvm::Attribute::NoRedZone);
2032fe531cbSDuncan P. N. Exon Smith 
2042fe531cbSDuncan P. N. Exon Smith   // Construct and return the entry block.
2052fe531cbSDuncan P. N. Exon Smith   auto *BB = llvm::BasicBlock::Create(CGM.getLLVMContext(), "", RegisterF);
2062fe531cbSDuncan P. N. Exon Smith   CGBuilderTy Builder(BB);
2072fe531cbSDuncan P. N. Exon Smith   Builder.CreateRetVoid();
2082fe531cbSDuncan P. N. Exon Smith   return BB;
2092fe531cbSDuncan P. N. Exon Smith }
2102fe531cbSDuncan P. N. Exon Smith 
2112fe531cbSDuncan P. N. Exon Smith static llvm::Constant *getOrInsertRuntimeRegister(CodeGenModule &CGM) {
2122fe531cbSDuncan P. N. Exon Smith   auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext());
2132fe531cbSDuncan P. N. Exon Smith   auto *VoidPtrTy = llvm::Type::getInt8PtrTy(CGM.getLLVMContext());
2142fe531cbSDuncan P. N. Exon Smith   auto *RuntimeRegisterTy = llvm::FunctionType::get(VoidTy, VoidPtrTy, false);
2152fe531cbSDuncan P. N. Exon Smith   return CGM.getModule().getOrInsertFunction("__llvm_pgo_register_function",
2162fe531cbSDuncan P. N. Exon Smith                                              RuntimeRegisterTy);
2172fe531cbSDuncan P. N. Exon Smith }
2182fe531cbSDuncan P. N. Exon Smith 
2197134d47dSDuncan P. N. Exon Smith static bool isMachO(const CodeGenModule &CGM) {
2207134d47dSDuncan P. N. Exon Smith   return CGM.getTarget().getTriple().isOSBinFormatMachO();
2217134d47dSDuncan P. N. Exon Smith }
2227134d47dSDuncan P. N. Exon Smith 
2232fe531cbSDuncan P. N. Exon Smith static StringRef getCountersSection(const CodeGenModule &CGM) {
2247134d47dSDuncan P. N. Exon Smith   return isMachO(CGM) ? "__DATA,__llvm_pgo_cnts" : "__llvm_pgo_cnts";
2252fe531cbSDuncan P. N. Exon Smith }
2262fe531cbSDuncan P. N. Exon Smith 
2272fe531cbSDuncan P. N. Exon Smith static StringRef getNameSection(const CodeGenModule &CGM) {
2287134d47dSDuncan P. N. Exon Smith   return isMachO(CGM) ? "__DATA,__llvm_pgo_names" : "__llvm_pgo_names";
2292fe531cbSDuncan P. N. Exon Smith }
2302fe531cbSDuncan P. N. Exon Smith 
2312fe531cbSDuncan P. N. Exon Smith static StringRef getDataSection(const CodeGenModule &CGM) {
2327134d47dSDuncan P. N. Exon Smith   return isMachO(CGM) ? "__DATA,__llvm_pgo_data" : "__llvm_pgo_data";
2332fe531cbSDuncan P. N. Exon Smith }
2342fe531cbSDuncan P. N. Exon Smith 
2352fe531cbSDuncan P. N. Exon Smith llvm::GlobalVariable *CodeGenPGO::buildDataVar() {
2362fe531cbSDuncan P. N. Exon Smith   // Create name variable.
2372fe531cbSDuncan P. N. Exon Smith   llvm::LLVMContext &Ctx = CGM.getLLVMContext();
2382fe531cbSDuncan P. N. Exon Smith   auto *VarName = llvm::ConstantDataArray::getString(Ctx, getFuncName(),
2392fe531cbSDuncan P. N. Exon Smith                                                      false);
2402fe531cbSDuncan P. N. Exon Smith   auto *Name = new llvm::GlobalVariable(CGM.getModule(), VarName->getType(),
2412fe531cbSDuncan P. N. Exon Smith                                         true, FuncLinkage, VarName,
2422fe531cbSDuncan P. N. Exon Smith                                         getFuncVarName("name"));
2432fe531cbSDuncan P. N. Exon Smith   Name->setSection(getNameSection(CGM));
2442fe531cbSDuncan P. N. Exon Smith   Name->setAlignment(1);
2452fe531cbSDuncan P. N. Exon Smith 
2462fe531cbSDuncan P. N. Exon Smith   // Create data variable.
2472fe531cbSDuncan P. N. Exon Smith   auto *Int32Ty = llvm::Type::getInt32Ty(Ctx);
248b4416f58SJustin Bogner   auto *Int64Ty = llvm::Type::getInt64Ty(Ctx);
2492fe531cbSDuncan P. N. Exon Smith   auto *Int8PtrTy = llvm::Type::getInt8PtrTy(Ctx);
2502fe531cbSDuncan P. N. Exon Smith   auto *Int64PtrTy = llvm::Type::getInt64PtrTy(Ctx);
2512fe531cbSDuncan P. N. Exon Smith   llvm::Type *DataTypes[] = {
252b4416f58SJustin Bogner     Int32Ty, Int32Ty, Int64Ty, Int8PtrTy, Int64PtrTy
2532fe531cbSDuncan P. N. Exon Smith   };
2542fe531cbSDuncan P. N. Exon Smith   auto *DataTy = llvm::StructType::get(Ctx, makeArrayRef(DataTypes));
2552fe531cbSDuncan P. N. Exon Smith   llvm::Constant *DataVals[] = {
2562fe531cbSDuncan P. N. Exon Smith     llvm::ConstantInt::get(Int32Ty, getFuncName().size()),
2572fe531cbSDuncan P. N. Exon Smith     llvm::ConstantInt::get(Int32Ty, NumRegionCounters),
258b4416f58SJustin Bogner     llvm::ConstantInt::get(Int64Ty, FunctionHash),
2592fe531cbSDuncan P. N. Exon Smith     llvm::ConstantExpr::getBitCast(Name, Int8PtrTy),
2602fe531cbSDuncan P. N. Exon Smith     llvm::ConstantExpr::getBitCast(RegionCounters, Int64PtrTy)
2612fe531cbSDuncan P. N. Exon Smith   };
2622fe531cbSDuncan P. N. Exon Smith   auto *Data =
2632fe531cbSDuncan P. N. Exon Smith     new llvm::GlobalVariable(CGM.getModule(), DataTy, true, FuncLinkage,
2642fe531cbSDuncan P. N. Exon Smith                              llvm::ConstantStruct::get(DataTy, DataVals),
2652fe531cbSDuncan P. N. Exon Smith                              getFuncVarName("data"));
2662fe531cbSDuncan P. N. Exon Smith 
2672fe531cbSDuncan P. N. Exon Smith   // All the data should be packed into an array in its own section.
2682fe531cbSDuncan P. N. Exon Smith   Data->setSection(getDataSection(CGM));
2692fe531cbSDuncan P. N. Exon Smith   Data->setAlignment(8);
2702fe531cbSDuncan P. N. Exon Smith 
2712fe531cbSDuncan P. N. Exon Smith   // Make sure the data doesn't get deleted.
2722fe531cbSDuncan P. N. Exon Smith   CGM.addUsedGlobal(Data);
2732fe531cbSDuncan P. N. Exon Smith   return Data;
2742fe531cbSDuncan P. N. Exon Smith }
2752fe531cbSDuncan P. N. Exon Smith 
2762fe531cbSDuncan P. N. Exon Smith void CodeGenPGO::emitInstrumentationData() {
277ef512b99SJustin Bogner   if (!CGM.getCodeGenOpts().ProfileInstrGenerate)
278ef512b99SJustin Bogner     return;
279ef512b99SJustin Bogner 
2802fe531cbSDuncan P. N. Exon Smith   // Build the data.
2812fe531cbSDuncan P. N. Exon Smith   auto *Data = buildDataVar();
282ef512b99SJustin Bogner 
2832fe531cbSDuncan P. N. Exon Smith   // Register the data.
284780443e8SDuncan P. N. Exon Smith   auto *RegisterBB = getOrInsertRegisterBB(CGM);
285780443e8SDuncan P. N. Exon Smith   if (!RegisterBB)
286780443e8SDuncan P. N. Exon Smith     return;
287780443e8SDuncan P. N. Exon Smith   CGBuilderTy Builder(RegisterBB->getTerminator());
2882fe531cbSDuncan P. N. Exon Smith   auto *VoidPtrTy = llvm::Type::getInt8PtrTy(CGM.getLLVMContext());
2892fe531cbSDuncan P. N. Exon Smith   Builder.CreateCall(getOrInsertRuntimeRegister(CGM),
2902fe531cbSDuncan P. N. Exon Smith                      Builder.CreateBitCast(Data, VoidPtrTy));
291ef512b99SJustin Bogner }
292ef512b99SJustin Bogner 
293ef512b99SJustin Bogner llvm::Function *CodeGenPGO::emitInitialization(CodeGenModule &CGM) {
2942fe531cbSDuncan P. N. Exon Smith   if (!CGM.getCodeGenOpts().ProfileInstrGenerate)
295a5f804a7SDuncan P. N. Exon Smith     return nullptr;
296ef512b99SJustin Bogner 
2972fe531cbSDuncan P. N. Exon Smith   // Only need to create this once per module.
2982fe531cbSDuncan P. N. Exon Smith   if (CGM.getModule().getFunction("__llvm_pgo_init"))
299a5f804a7SDuncan P. N. Exon Smith     return nullptr;
300ef512b99SJustin Bogner 
301*5188e91cSDuncan P. N. Exon Smith   // Get the function to call at initialization.
3022fe531cbSDuncan P. N. Exon Smith   llvm::Constant *RegisterF = getRegisterFunc(CGM);
303*5188e91cSDuncan P. N. Exon Smith   if (!RegisterF)
304a5f804a7SDuncan P. N. Exon Smith     return nullptr;
3052fe531cbSDuncan P. N. Exon Smith 
3062fe531cbSDuncan P. N. Exon Smith   // Create the initialization function.
3072fe531cbSDuncan P. N. Exon Smith   auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext());
3082fe531cbSDuncan P. N. Exon Smith   auto *F = llvm::Function::Create(llvm::FunctionType::get(VoidTy, false),
3092fe531cbSDuncan P. N. Exon Smith                                    llvm::GlobalValue::InternalLinkage,
310ef512b99SJustin Bogner                                    "__llvm_pgo_init", &CGM.getModule());
311ef512b99SJustin Bogner   F->setUnnamedAddr(true);
312ef512b99SJustin Bogner   F->addFnAttr(llvm::Attribute::NoInline);
313ef512b99SJustin Bogner   if (CGM.getCodeGenOpts().DisableRedZone)
314ef512b99SJustin Bogner     F->addFnAttr(llvm::Attribute::NoRedZone);
315ef512b99SJustin Bogner 
3162fe531cbSDuncan P. N. Exon Smith   // Add the basic block and the necessary calls.
3172fe531cbSDuncan P. N. Exon Smith   CGBuilderTy Builder(llvm::BasicBlock::Create(CGM.getLLVMContext(), "", F));
3182fe531cbSDuncan P. N. Exon Smith   Builder.CreateCall(RegisterF);
3192fe531cbSDuncan P. N. Exon Smith   Builder.CreateRetVoid();
320ef512b99SJustin Bogner 
321ef512b99SJustin Bogner   return F;
322ef512b99SJustin Bogner }
323ef512b99SJustin Bogner 
324ef512b99SJustin Bogner namespace {
325ef512b99SJustin Bogner   /// A StmtVisitor that fills a map of statements to PGO counters.
326ef512b99SJustin Bogner   struct MapRegionCounters : public ConstStmtVisitor<MapRegionCounters> {
327ef512b99SJustin Bogner     /// The next counter value to assign.
328ef512b99SJustin Bogner     unsigned NextCounter;
329ef512b99SJustin Bogner     /// The map of statements to counters.
330ef512b99SJustin Bogner     llvm::DenseMap<const Stmt*, unsigned> *CounterMap;
331ef512b99SJustin Bogner 
332ef512b99SJustin Bogner     MapRegionCounters(llvm::DenseMap<const Stmt*, unsigned> *CounterMap) :
333ef512b99SJustin Bogner       NextCounter(0), CounterMap(CounterMap) {
334ef512b99SJustin Bogner     }
335ef512b99SJustin Bogner 
336ef512b99SJustin Bogner     void VisitChildren(const Stmt *S) {
337ef512b99SJustin Bogner       for (Stmt::const_child_range I = S->children(); I; ++I)
338ef512b99SJustin Bogner         if (*I)
339ef512b99SJustin Bogner          this->Visit(*I);
340ef512b99SJustin Bogner     }
341ef512b99SJustin Bogner     void VisitStmt(const Stmt *S) { VisitChildren(S); }
342ef512b99SJustin Bogner 
343ea278c32SJustin Bogner     /// Assign a counter to track entry to the function body.
344ef512b99SJustin Bogner     void VisitFunctionDecl(const FunctionDecl *S) {
345ef512b99SJustin Bogner       (*CounterMap)[S->getBody()] = NextCounter++;
346ef512b99SJustin Bogner       Visit(S->getBody());
347ef512b99SJustin Bogner     }
3485ec8fe19SBob Wilson     void VisitObjCMethodDecl(const ObjCMethodDecl *S) {
3495ec8fe19SBob Wilson       (*CounterMap)[S->getBody()] = NextCounter++;
3505ec8fe19SBob Wilson       Visit(S->getBody());
3515ec8fe19SBob Wilson     }
352c845c00aSBob Wilson     void VisitBlockDecl(const BlockDecl *S) {
353c845c00aSBob Wilson       (*CounterMap)[S->getBody()] = NextCounter++;
354c845c00aSBob Wilson       Visit(S->getBody());
355c845c00aSBob Wilson     }
356ea278c32SJustin Bogner     /// Assign a counter to track the block following a label.
357ef512b99SJustin Bogner     void VisitLabelStmt(const LabelStmt *S) {
358ef512b99SJustin Bogner       (*CounterMap)[S] = NextCounter++;
359ef512b99SJustin Bogner       Visit(S->getSubStmt());
360ef512b99SJustin Bogner     }
361bf854f0fSBob Wilson     /// Assign a counter for the body of a while loop.
362ef512b99SJustin Bogner     void VisitWhileStmt(const WhileStmt *S) {
363bf854f0fSBob Wilson       (*CounterMap)[S] = NextCounter++;
364ef512b99SJustin Bogner       Visit(S->getCond());
365ef512b99SJustin Bogner       Visit(S->getBody());
366ef512b99SJustin Bogner     }
367bf854f0fSBob Wilson     /// Assign a counter for the body of a do-while loop.
368ef512b99SJustin Bogner     void VisitDoStmt(const DoStmt *S) {
369bf854f0fSBob Wilson       (*CounterMap)[S] = NextCounter++;
370ef512b99SJustin Bogner       Visit(S->getBody());
371ef512b99SJustin Bogner       Visit(S->getCond());
372ef512b99SJustin Bogner     }
373bf854f0fSBob Wilson     /// Assign a counter for the body of a for loop.
374ef512b99SJustin Bogner     void VisitForStmt(const ForStmt *S) {
375bf854f0fSBob Wilson       (*CounterMap)[S] = NextCounter++;
376bf854f0fSBob Wilson       if (S->getInit())
377bf854f0fSBob Wilson         Visit(S->getInit());
378ef512b99SJustin Bogner       const Expr *E;
379ef512b99SJustin Bogner       if ((E = S->getCond()))
380ef512b99SJustin Bogner         Visit(E);
381ef512b99SJustin Bogner       if ((E = S->getInc()))
382ef512b99SJustin Bogner         Visit(E);
383bf854f0fSBob Wilson       Visit(S->getBody());
384ef512b99SJustin Bogner     }
385bf854f0fSBob Wilson     /// Assign a counter for the body of a for-range loop.
386ef512b99SJustin Bogner     void VisitCXXForRangeStmt(const CXXForRangeStmt *S) {
387bf854f0fSBob Wilson       (*CounterMap)[S] = NextCounter++;
388bf854f0fSBob Wilson       Visit(S->getRangeStmt());
389bf854f0fSBob Wilson       Visit(S->getBeginEndStmt());
390bf854f0fSBob Wilson       Visit(S->getCond());
391bf854f0fSBob Wilson       Visit(S->getLoopVarStmt());
392ef512b99SJustin Bogner       Visit(S->getBody());
393bf854f0fSBob Wilson       Visit(S->getInc());
394ef512b99SJustin Bogner     }
395bf854f0fSBob Wilson     /// Assign a counter for the body of a for-collection loop.
396ef512b99SJustin Bogner     void VisitObjCForCollectionStmt(const ObjCForCollectionStmt *S) {
397bf854f0fSBob Wilson       (*CounterMap)[S] = NextCounter++;
398ef512b99SJustin Bogner       Visit(S->getElement());
399ef512b99SJustin Bogner       Visit(S->getBody());
400ef512b99SJustin Bogner     }
401ef512b99SJustin Bogner     /// Assign a counter for the exit block of the switch statement.
402ef512b99SJustin Bogner     void VisitSwitchStmt(const SwitchStmt *S) {
403ef512b99SJustin Bogner       (*CounterMap)[S] = NextCounter++;
404ef512b99SJustin Bogner       Visit(S->getCond());
405ef512b99SJustin Bogner       Visit(S->getBody());
406ef512b99SJustin Bogner     }
407ef512b99SJustin Bogner     /// Assign a counter for a particular case in a switch. This counts jumps
408ef512b99SJustin Bogner     /// from the switch header as well as fallthrough from the case before this
409ef512b99SJustin Bogner     /// one.
410ef512b99SJustin Bogner     void VisitCaseStmt(const CaseStmt *S) {
411ef512b99SJustin Bogner       (*CounterMap)[S] = NextCounter++;
412ef512b99SJustin Bogner       Visit(S->getSubStmt());
413ef512b99SJustin Bogner     }
414ef512b99SJustin Bogner     /// Assign a counter for the default case of a switch statement. The count
415ef512b99SJustin Bogner     /// is the number of branches from the loop header to the default, and does
416ef512b99SJustin Bogner     /// not include fallthrough from previous cases. If we have multiple
417ef512b99SJustin Bogner     /// conditional branch blocks from the switch instruction to the default
418ef512b99SJustin Bogner     /// block, as with large GNU case ranges, this is the counter for the last
419ef512b99SJustin Bogner     /// edge in that series, rather than the first.
420ef512b99SJustin Bogner     void VisitDefaultStmt(const DefaultStmt *S) {
421ef512b99SJustin Bogner       (*CounterMap)[S] = NextCounter++;
422ef512b99SJustin Bogner       Visit(S->getSubStmt());
423ef512b99SJustin Bogner     }
424ef512b99SJustin Bogner     /// Assign a counter for the "then" part of an if statement. The count for
425ef512b99SJustin Bogner     /// the "else" part, if it exists, will be calculated from this counter.
426ef512b99SJustin Bogner     void VisitIfStmt(const IfStmt *S) {
427ef512b99SJustin Bogner       (*CounterMap)[S] = NextCounter++;
428ef512b99SJustin Bogner       Visit(S->getCond());
429ef512b99SJustin Bogner       Visit(S->getThen());
430ef512b99SJustin Bogner       if (S->getElse())
431ef512b99SJustin Bogner         Visit(S->getElse());
432ef512b99SJustin Bogner     }
433ef512b99SJustin Bogner     /// Assign a counter for the continuation block of a C++ try statement.
434ef512b99SJustin Bogner     void VisitCXXTryStmt(const CXXTryStmt *S) {
435ef512b99SJustin Bogner       (*CounterMap)[S] = NextCounter++;
436ef512b99SJustin Bogner       Visit(S->getTryBlock());
437ef512b99SJustin Bogner       for (unsigned I = 0, E = S->getNumHandlers(); I < E; ++I)
438ef512b99SJustin Bogner         Visit(S->getHandler(I));
439ef512b99SJustin Bogner     }
440ef512b99SJustin Bogner     /// Assign a counter for a catch statement's handler block.
441ef512b99SJustin Bogner     void VisitCXXCatchStmt(const CXXCatchStmt *S) {
442ef512b99SJustin Bogner       (*CounterMap)[S] = NextCounter++;
443ef512b99SJustin Bogner       Visit(S->getHandlerBlock());
444ef512b99SJustin Bogner     }
445ef512b99SJustin Bogner     /// Assign a counter for the "true" part of a conditional operator. The
446ef512b99SJustin Bogner     /// count in the "false" part will be calculated from this counter.
447ef512b99SJustin Bogner     void VisitConditionalOperator(const ConditionalOperator *E) {
448ef512b99SJustin Bogner       (*CounterMap)[E] = NextCounter++;
449ef512b99SJustin Bogner       Visit(E->getCond());
450ef512b99SJustin Bogner       Visit(E->getTrueExpr());
451ef512b99SJustin Bogner       Visit(E->getFalseExpr());
452ef512b99SJustin Bogner     }
453ef512b99SJustin Bogner     /// Assign a counter for the right hand side of a logical and operator.
454ef512b99SJustin Bogner     void VisitBinLAnd(const BinaryOperator *E) {
455ef512b99SJustin Bogner       (*CounterMap)[E] = NextCounter++;
456ef512b99SJustin Bogner       Visit(E->getLHS());
457ef512b99SJustin Bogner       Visit(E->getRHS());
458ef512b99SJustin Bogner     }
459ef512b99SJustin Bogner     /// Assign a counter for the right hand side of a logical or operator.
460ef512b99SJustin Bogner     void VisitBinLOr(const BinaryOperator *E) {
461ef512b99SJustin Bogner       (*CounterMap)[E] = NextCounter++;
462ef512b99SJustin Bogner       Visit(E->getLHS());
463ef512b99SJustin Bogner       Visit(E->getRHS());
464ef512b99SJustin Bogner     }
465ef512b99SJustin Bogner   };
466bf854f0fSBob Wilson 
467bf854f0fSBob Wilson   /// A StmtVisitor that propagates the raw counts through the AST and
468bf854f0fSBob Wilson   /// records the count at statements where the value may change.
469bf854f0fSBob Wilson   struct ComputeRegionCounts : public ConstStmtVisitor<ComputeRegionCounts> {
470bf854f0fSBob Wilson     /// PGO state.
471bf854f0fSBob Wilson     CodeGenPGO &PGO;
472bf854f0fSBob Wilson 
473bf854f0fSBob Wilson     /// A flag that is set when the current count should be recorded on the
474bf854f0fSBob Wilson     /// next statement, such as at the exit of a loop.
475bf854f0fSBob Wilson     bool RecordNextStmtCount;
476bf854f0fSBob Wilson 
477bf854f0fSBob Wilson     /// The map of statements to count values.
478bf854f0fSBob Wilson     llvm::DenseMap<const Stmt*, uint64_t> *CountMap;
479bf854f0fSBob Wilson 
480bf854f0fSBob Wilson     /// BreakContinueStack - Keep counts of breaks and continues inside loops.
481bf854f0fSBob Wilson     struct BreakContinue {
482bf854f0fSBob Wilson       uint64_t BreakCount;
483bf854f0fSBob Wilson       uint64_t ContinueCount;
484bf854f0fSBob Wilson       BreakContinue() : BreakCount(0), ContinueCount(0) {}
485bf854f0fSBob Wilson     };
486bf854f0fSBob Wilson     SmallVector<BreakContinue, 8> BreakContinueStack;
487bf854f0fSBob Wilson 
488bf854f0fSBob Wilson     ComputeRegionCounts(llvm::DenseMap<const Stmt*, uint64_t> *CountMap,
489bf854f0fSBob Wilson                         CodeGenPGO &PGO) :
490bf854f0fSBob Wilson       PGO(PGO), RecordNextStmtCount(false), CountMap(CountMap) {
491bf854f0fSBob Wilson     }
492bf854f0fSBob Wilson 
493bf854f0fSBob Wilson     void RecordStmtCount(const Stmt *S) {
494bf854f0fSBob Wilson       if (RecordNextStmtCount) {
495bf854f0fSBob Wilson         (*CountMap)[S] = PGO.getCurrentRegionCount();
496bf854f0fSBob Wilson         RecordNextStmtCount = false;
497bf854f0fSBob Wilson       }
498bf854f0fSBob Wilson     }
499bf854f0fSBob Wilson 
500bf854f0fSBob Wilson     void VisitStmt(const Stmt *S) {
501bf854f0fSBob Wilson       RecordStmtCount(S);
502bf854f0fSBob Wilson       for (Stmt::const_child_range I = S->children(); I; ++I) {
503bf854f0fSBob Wilson         if (*I)
504bf854f0fSBob Wilson          this->Visit(*I);
505bf854f0fSBob Wilson       }
506bf854f0fSBob Wilson     }
507bf854f0fSBob Wilson 
508bf854f0fSBob Wilson     void VisitFunctionDecl(const FunctionDecl *S) {
509bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S->getBody());
510bf854f0fSBob Wilson       Cnt.beginRegion();
511bf854f0fSBob Wilson       (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount();
512bf854f0fSBob Wilson       Visit(S->getBody());
513bf854f0fSBob Wilson     }
514bf854f0fSBob Wilson 
5155ec8fe19SBob Wilson     void VisitObjCMethodDecl(const ObjCMethodDecl *S) {
5165ec8fe19SBob Wilson       RegionCounter Cnt(PGO, S->getBody());
5175ec8fe19SBob Wilson       Cnt.beginRegion();
5185ec8fe19SBob Wilson       (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount();
5195ec8fe19SBob Wilson       Visit(S->getBody());
5205ec8fe19SBob Wilson     }
5215ec8fe19SBob Wilson 
522c845c00aSBob Wilson     void VisitBlockDecl(const BlockDecl *S) {
523c845c00aSBob Wilson       RegionCounter Cnt(PGO, S->getBody());
524c845c00aSBob Wilson       Cnt.beginRegion();
525c845c00aSBob Wilson       (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount();
526c845c00aSBob Wilson       Visit(S->getBody());
527c845c00aSBob Wilson     }
528c845c00aSBob Wilson 
529bf854f0fSBob Wilson     void VisitReturnStmt(const ReturnStmt *S) {
530bf854f0fSBob Wilson       RecordStmtCount(S);
531bf854f0fSBob Wilson       if (S->getRetValue())
532bf854f0fSBob Wilson         Visit(S->getRetValue());
533bf854f0fSBob Wilson       PGO.setCurrentRegionUnreachable();
534bf854f0fSBob Wilson       RecordNextStmtCount = true;
535bf854f0fSBob Wilson     }
536bf854f0fSBob Wilson 
537bf854f0fSBob Wilson     void VisitGotoStmt(const GotoStmt *S) {
538bf854f0fSBob Wilson       RecordStmtCount(S);
539bf854f0fSBob Wilson       PGO.setCurrentRegionUnreachable();
540bf854f0fSBob Wilson       RecordNextStmtCount = true;
541bf854f0fSBob Wilson     }
542bf854f0fSBob Wilson 
543bf854f0fSBob Wilson     void VisitLabelStmt(const LabelStmt *S) {
544bf854f0fSBob Wilson       RecordNextStmtCount = false;
545bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
546bf854f0fSBob Wilson       Cnt.beginRegion();
547bf854f0fSBob Wilson       (*CountMap)[S] = PGO.getCurrentRegionCount();
548bf854f0fSBob Wilson       Visit(S->getSubStmt());
549bf854f0fSBob Wilson     }
550bf854f0fSBob Wilson 
551bf854f0fSBob Wilson     void VisitBreakStmt(const BreakStmt *S) {
552bf854f0fSBob Wilson       RecordStmtCount(S);
553bf854f0fSBob Wilson       assert(!BreakContinueStack.empty() && "break not in a loop or switch!");
554bf854f0fSBob Wilson       BreakContinueStack.back().BreakCount += PGO.getCurrentRegionCount();
555bf854f0fSBob Wilson       PGO.setCurrentRegionUnreachable();
556bf854f0fSBob Wilson       RecordNextStmtCount = true;
557bf854f0fSBob Wilson     }
558bf854f0fSBob Wilson 
559bf854f0fSBob Wilson     void VisitContinueStmt(const ContinueStmt *S) {
560bf854f0fSBob Wilson       RecordStmtCount(S);
561bf854f0fSBob Wilson       assert(!BreakContinueStack.empty() && "continue stmt not in a loop!");
562bf854f0fSBob Wilson       BreakContinueStack.back().ContinueCount += PGO.getCurrentRegionCount();
563bf854f0fSBob Wilson       PGO.setCurrentRegionUnreachable();
564bf854f0fSBob Wilson       RecordNextStmtCount = true;
565bf854f0fSBob Wilson     }
566bf854f0fSBob Wilson 
567bf854f0fSBob Wilson     void VisitWhileStmt(const WhileStmt *S) {
568bf854f0fSBob Wilson       RecordStmtCount(S);
569bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
570bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
571bf854f0fSBob Wilson       // Visit the body region first so the break/continue adjustments can be
572bf854f0fSBob Wilson       // included when visiting the condition.
573bf854f0fSBob Wilson       Cnt.beginRegion();
574bf854f0fSBob Wilson       (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount();
575bf854f0fSBob Wilson       Visit(S->getBody());
576bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
577bf854f0fSBob Wilson 
578bf854f0fSBob Wilson       // ...then go back and propagate counts through the condition. The count
579bf854f0fSBob Wilson       // at the start of the condition is the sum of the incoming edges,
580bf854f0fSBob Wilson       // the backedge from the end of the loop body, and the edges from
581bf854f0fSBob Wilson       // continue statements.
582bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
583bf854f0fSBob Wilson       Cnt.setCurrentRegionCount(Cnt.getParentCount() +
584bf854f0fSBob Wilson                                 Cnt.getAdjustedCount() + BC.ContinueCount);
585bf854f0fSBob Wilson       (*CountMap)[S->getCond()] = PGO.getCurrentRegionCount();
586bf854f0fSBob Wilson       Visit(S->getCond());
587bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
588bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount);
589bf854f0fSBob Wilson       RecordNextStmtCount = true;
590bf854f0fSBob Wilson     }
591bf854f0fSBob Wilson 
592bf854f0fSBob Wilson     void VisitDoStmt(const DoStmt *S) {
593bf854f0fSBob Wilson       RecordStmtCount(S);
594bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
595bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
596bf854f0fSBob Wilson       Cnt.beginRegion(/*AddIncomingFallThrough=*/true);
597bf854f0fSBob Wilson       (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount();
598bf854f0fSBob Wilson       Visit(S->getBody());
599bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
600bf854f0fSBob Wilson 
601bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
602bf854f0fSBob Wilson       // The count at the start of the condition is equal to the count at the
603bf854f0fSBob Wilson       // end of the body. The adjusted count does not include either the
604bf854f0fSBob Wilson       // fall-through count coming into the loop or the continue count, so add
605bf854f0fSBob Wilson       // both of those separately. This is coincidentally the same equation as
606bf854f0fSBob Wilson       // with while loops but for different reasons.
607bf854f0fSBob Wilson       Cnt.setCurrentRegionCount(Cnt.getParentCount() +
608bf854f0fSBob Wilson                                 Cnt.getAdjustedCount() + BC.ContinueCount);
609bf854f0fSBob Wilson       (*CountMap)[S->getCond()] = PGO.getCurrentRegionCount();
610bf854f0fSBob Wilson       Visit(S->getCond());
611bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
612bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount);
613bf854f0fSBob Wilson       RecordNextStmtCount = true;
614bf854f0fSBob Wilson     }
615bf854f0fSBob Wilson 
616bf854f0fSBob Wilson     void VisitForStmt(const ForStmt *S) {
617bf854f0fSBob Wilson       RecordStmtCount(S);
618bf854f0fSBob Wilson       if (S->getInit())
619bf854f0fSBob Wilson         Visit(S->getInit());
620bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
621bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
622bf854f0fSBob Wilson       // Visit the body region first. (This is basically the same as a while
623bf854f0fSBob Wilson       // loop; see further comments in VisitWhileStmt.)
624bf854f0fSBob Wilson       Cnt.beginRegion();
625bf854f0fSBob Wilson       (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount();
626bf854f0fSBob Wilson       Visit(S->getBody());
627bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
628bf854f0fSBob Wilson 
629bf854f0fSBob Wilson       // The increment is essentially part of the body but it needs to include
630bf854f0fSBob Wilson       // the count for all the continue statements.
631bf854f0fSBob Wilson       if (S->getInc()) {
632bf854f0fSBob Wilson         Cnt.setCurrentRegionCount(PGO.getCurrentRegionCount() +
633bf854f0fSBob Wilson                                   BreakContinueStack.back().ContinueCount);
634bf854f0fSBob Wilson         (*CountMap)[S->getInc()] = PGO.getCurrentRegionCount();
635bf854f0fSBob Wilson         Visit(S->getInc());
636bf854f0fSBob Wilson         Cnt.adjustForControlFlow();
637bf854f0fSBob Wilson       }
638bf854f0fSBob Wilson 
639bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
640bf854f0fSBob Wilson 
641bf854f0fSBob Wilson       // ...then go back and propagate counts through the condition.
642bf854f0fSBob Wilson       if (S->getCond()) {
643bf854f0fSBob Wilson         Cnt.setCurrentRegionCount(Cnt.getParentCount() +
644bf854f0fSBob Wilson                                   Cnt.getAdjustedCount() +
645bf854f0fSBob Wilson                                   BC.ContinueCount);
646bf854f0fSBob Wilson         (*CountMap)[S->getCond()] = PGO.getCurrentRegionCount();
647bf854f0fSBob Wilson         Visit(S->getCond());
648bf854f0fSBob Wilson         Cnt.adjustForControlFlow();
649bf854f0fSBob Wilson       }
650bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount);
651bf854f0fSBob Wilson       RecordNextStmtCount = true;
652bf854f0fSBob Wilson     }
653bf854f0fSBob Wilson 
654bf854f0fSBob Wilson     void VisitCXXForRangeStmt(const CXXForRangeStmt *S) {
655bf854f0fSBob Wilson       RecordStmtCount(S);
656bf854f0fSBob Wilson       Visit(S->getRangeStmt());
657bf854f0fSBob Wilson       Visit(S->getBeginEndStmt());
658bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
659bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
660bf854f0fSBob Wilson       // Visit the body region first. (This is basically the same as a while
661bf854f0fSBob Wilson       // loop; see further comments in VisitWhileStmt.)
662bf854f0fSBob Wilson       Cnt.beginRegion();
663bf854f0fSBob Wilson       (*CountMap)[S->getLoopVarStmt()] = PGO.getCurrentRegionCount();
664bf854f0fSBob Wilson       Visit(S->getLoopVarStmt());
665bf854f0fSBob Wilson       Visit(S->getBody());
666bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
667bf854f0fSBob Wilson 
668bf854f0fSBob Wilson       // The increment is essentially part of the body but it needs to include
669bf854f0fSBob Wilson       // the count for all the continue statements.
670bf854f0fSBob Wilson       Cnt.setCurrentRegionCount(PGO.getCurrentRegionCount() +
671bf854f0fSBob Wilson                                 BreakContinueStack.back().ContinueCount);
672bf854f0fSBob Wilson       (*CountMap)[S->getInc()] = PGO.getCurrentRegionCount();
673bf854f0fSBob Wilson       Visit(S->getInc());
674bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
675bf854f0fSBob Wilson 
676bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
677bf854f0fSBob Wilson 
678bf854f0fSBob Wilson       // ...then go back and propagate counts through the condition.
679bf854f0fSBob Wilson       Cnt.setCurrentRegionCount(Cnt.getParentCount() +
680bf854f0fSBob Wilson                                 Cnt.getAdjustedCount() +
681bf854f0fSBob Wilson                                 BC.ContinueCount);
682bf854f0fSBob Wilson       (*CountMap)[S->getCond()] = PGO.getCurrentRegionCount();
683bf854f0fSBob Wilson       Visit(S->getCond());
684bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
685bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount);
686bf854f0fSBob Wilson       RecordNextStmtCount = true;
687bf854f0fSBob Wilson     }
688bf854f0fSBob Wilson 
689bf854f0fSBob Wilson     void VisitObjCForCollectionStmt(const ObjCForCollectionStmt *S) {
690bf854f0fSBob Wilson       RecordStmtCount(S);
691bf854f0fSBob Wilson       Visit(S->getElement());
692bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
693bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
694bf854f0fSBob Wilson       Cnt.beginRegion();
695bf854f0fSBob Wilson       (*CountMap)[S->getBody()] = PGO.getCurrentRegionCount();
696bf854f0fSBob Wilson       Visit(S->getBody());
697bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
698bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
699bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount);
700bf854f0fSBob Wilson       RecordNextStmtCount = true;
701bf854f0fSBob Wilson     }
702bf854f0fSBob Wilson 
703bf854f0fSBob Wilson     void VisitSwitchStmt(const SwitchStmt *S) {
704bf854f0fSBob Wilson       RecordStmtCount(S);
705bf854f0fSBob Wilson       Visit(S->getCond());
706bf854f0fSBob Wilson       PGO.setCurrentRegionUnreachable();
707bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
708bf854f0fSBob Wilson       Visit(S->getBody());
709bf854f0fSBob Wilson       // If the switch is inside a loop, add the continue counts.
710bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
711bf854f0fSBob Wilson       if (!BreakContinueStack.empty())
712bf854f0fSBob Wilson         BreakContinueStack.back().ContinueCount += BC.ContinueCount;
713bf854f0fSBob Wilson       RegionCounter ExitCnt(PGO, S);
714bf854f0fSBob Wilson       ExitCnt.beginRegion();
715bf854f0fSBob Wilson       RecordNextStmtCount = true;
716bf854f0fSBob Wilson     }
717bf854f0fSBob Wilson 
718bf854f0fSBob Wilson     void VisitCaseStmt(const CaseStmt *S) {
719bf854f0fSBob Wilson       RecordNextStmtCount = false;
720bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
721bf854f0fSBob Wilson       Cnt.beginRegion(/*AddIncomingFallThrough=*/true);
722bf854f0fSBob Wilson       (*CountMap)[S] = Cnt.getCount();
723bf854f0fSBob Wilson       RecordNextStmtCount = true;
724bf854f0fSBob Wilson       Visit(S->getSubStmt());
725bf854f0fSBob Wilson     }
726bf854f0fSBob Wilson 
727bf854f0fSBob Wilson     void VisitDefaultStmt(const DefaultStmt *S) {
728bf854f0fSBob Wilson       RecordNextStmtCount = false;
729bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
730bf854f0fSBob Wilson       Cnt.beginRegion(/*AddIncomingFallThrough=*/true);
731bf854f0fSBob Wilson       (*CountMap)[S] = Cnt.getCount();
732bf854f0fSBob Wilson       RecordNextStmtCount = true;
733bf854f0fSBob Wilson       Visit(S->getSubStmt());
734bf854f0fSBob Wilson     }
735bf854f0fSBob Wilson 
736bf854f0fSBob Wilson     void VisitIfStmt(const IfStmt *S) {
737bf854f0fSBob Wilson       RecordStmtCount(S);
738bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
739bf854f0fSBob Wilson       Visit(S->getCond());
740bf854f0fSBob Wilson 
741bf854f0fSBob Wilson       Cnt.beginRegion();
742bf854f0fSBob Wilson       (*CountMap)[S->getThen()] = PGO.getCurrentRegionCount();
743bf854f0fSBob Wilson       Visit(S->getThen());
744bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
745bf854f0fSBob Wilson 
746bf854f0fSBob Wilson       if (S->getElse()) {
747bf854f0fSBob Wilson         Cnt.beginElseRegion();
748bf854f0fSBob Wilson         (*CountMap)[S->getElse()] = PGO.getCurrentRegionCount();
749bf854f0fSBob Wilson         Visit(S->getElse());
750bf854f0fSBob Wilson         Cnt.adjustForControlFlow();
751bf854f0fSBob Wilson       }
752bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(0);
753bf854f0fSBob Wilson       RecordNextStmtCount = true;
754bf854f0fSBob Wilson     }
755bf854f0fSBob Wilson 
756bf854f0fSBob Wilson     void VisitCXXTryStmt(const CXXTryStmt *S) {
757bf854f0fSBob Wilson       RecordStmtCount(S);
758bf854f0fSBob Wilson       Visit(S->getTryBlock());
759bf854f0fSBob Wilson       for (unsigned I = 0, E = S->getNumHandlers(); I < E; ++I)
760bf854f0fSBob Wilson         Visit(S->getHandler(I));
761bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
762bf854f0fSBob Wilson       Cnt.beginRegion();
763bf854f0fSBob Wilson       RecordNextStmtCount = true;
764bf854f0fSBob Wilson     }
765bf854f0fSBob Wilson 
766bf854f0fSBob Wilson     void VisitCXXCatchStmt(const CXXCatchStmt *S) {
767bf854f0fSBob Wilson       RecordNextStmtCount = false;
768bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
769bf854f0fSBob Wilson       Cnt.beginRegion();
770bf854f0fSBob Wilson       (*CountMap)[S] = PGO.getCurrentRegionCount();
771bf854f0fSBob Wilson       Visit(S->getHandlerBlock());
772bf854f0fSBob Wilson     }
773bf854f0fSBob Wilson 
774bf854f0fSBob Wilson     void VisitConditionalOperator(const ConditionalOperator *E) {
775bf854f0fSBob Wilson       RecordStmtCount(E);
776bf854f0fSBob Wilson       RegionCounter Cnt(PGO, E);
777bf854f0fSBob Wilson       Visit(E->getCond());
778bf854f0fSBob Wilson 
779bf854f0fSBob Wilson       Cnt.beginRegion();
780bf854f0fSBob Wilson       (*CountMap)[E->getTrueExpr()] = PGO.getCurrentRegionCount();
781bf854f0fSBob Wilson       Visit(E->getTrueExpr());
782bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
783bf854f0fSBob Wilson 
784bf854f0fSBob Wilson       Cnt.beginElseRegion();
785bf854f0fSBob Wilson       (*CountMap)[E->getFalseExpr()] = PGO.getCurrentRegionCount();
786bf854f0fSBob Wilson       Visit(E->getFalseExpr());
787bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
788bf854f0fSBob Wilson 
789bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(0);
790bf854f0fSBob Wilson       RecordNextStmtCount = true;
791bf854f0fSBob Wilson     }
792bf854f0fSBob Wilson 
793bf854f0fSBob Wilson     void VisitBinLAnd(const BinaryOperator *E) {
794bf854f0fSBob Wilson       RecordStmtCount(E);
795bf854f0fSBob Wilson       RegionCounter Cnt(PGO, E);
796bf854f0fSBob Wilson       Visit(E->getLHS());
797bf854f0fSBob Wilson       Cnt.beginRegion();
798bf854f0fSBob Wilson       (*CountMap)[E->getRHS()] = PGO.getCurrentRegionCount();
799bf854f0fSBob Wilson       Visit(E->getRHS());
800bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
801bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(0);
802bf854f0fSBob Wilson       RecordNextStmtCount = true;
803bf854f0fSBob Wilson     }
804bf854f0fSBob Wilson 
805bf854f0fSBob Wilson     void VisitBinLOr(const BinaryOperator *E) {
806bf854f0fSBob Wilson       RecordStmtCount(E);
807bf854f0fSBob Wilson       RegionCounter Cnt(PGO, E);
808bf854f0fSBob Wilson       Visit(E->getLHS());
809bf854f0fSBob Wilson       Cnt.beginRegion();
810bf854f0fSBob Wilson       (*CountMap)[E->getRHS()] = PGO.getCurrentRegionCount();
811bf854f0fSBob Wilson       Visit(E->getRHS());
812bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
813bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(0);
814bf854f0fSBob Wilson       RecordNextStmtCount = true;
815bf854f0fSBob Wilson     }
816bf854f0fSBob Wilson   };
817ef512b99SJustin Bogner }
818ef512b99SJustin Bogner 
819da1ebedeSBob Wilson void CodeGenPGO::assignRegionCounters(const Decl *D, llvm::Function *Fn) {
820ef512b99SJustin Bogner   bool InstrumentRegions = CGM.getCodeGenOpts().ProfileInstrGenerate;
821d66a17d0SJustin Bogner   PGOProfileData *PGOData = CGM.getPGOData();
822d66a17d0SJustin Bogner   if (!InstrumentRegions && !PGOData)
823ef512b99SJustin Bogner     return;
824ef512b99SJustin Bogner   if (!D)
825ef512b99SJustin Bogner     return;
826da1ebedeSBob Wilson   setFuncName(Fn);
8272fe531cbSDuncan P. N. Exon Smith   FuncLinkage = Fn->getLinkage();
828ef512b99SJustin Bogner   mapRegionCounters(D);
829ef512b99SJustin Bogner   if (InstrumentRegions)
830ef512b99SJustin Bogner     emitCounterVariables();
831d66a17d0SJustin Bogner   if (PGOData) {
832d66a17d0SJustin Bogner     loadRegionCounts(PGOData);
833bf854f0fSBob Wilson     computeRegionCounts(D);
834d66a17d0SJustin Bogner     applyFunctionAttributes(PGOData, Fn);
835bf854f0fSBob Wilson   }
836ef512b99SJustin Bogner }
837ef512b99SJustin Bogner 
838ef512b99SJustin Bogner void CodeGenPGO::mapRegionCounters(const Decl *D) {
839ef512b99SJustin Bogner   RegionCounterMap = new llvm::DenseMap<const Stmt*, unsigned>();
840ef512b99SJustin Bogner   MapRegionCounters Walker(RegionCounterMap);
841ef512b99SJustin Bogner   if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(D))
842ef512b99SJustin Bogner     Walker.VisitFunctionDecl(FD);
8435ec8fe19SBob Wilson   else if (const ObjCMethodDecl *MD = dyn_cast_or_null<ObjCMethodDecl>(D))
8445ec8fe19SBob Wilson     Walker.VisitObjCMethodDecl(MD);
845c845c00aSBob Wilson   else if (const BlockDecl *BD = dyn_cast_or_null<BlockDecl>(D))
846c845c00aSBob Wilson     Walker.VisitBlockDecl(BD);
847ef512b99SJustin Bogner   NumRegionCounters = Walker.NextCounter;
848b4416f58SJustin Bogner   // FIXME: The number of counters isn't sufficient for the hash
849b4416f58SJustin Bogner   FunctionHash = NumRegionCounters;
850ef512b99SJustin Bogner }
851ef512b99SJustin Bogner 
852bf854f0fSBob Wilson void CodeGenPGO::computeRegionCounts(const Decl *D) {
853bf854f0fSBob Wilson   StmtCountMap = new llvm::DenseMap<const Stmt*, uint64_t>();
854bf854f0fSBob Wilson   ComputeRegionCounts Walker(StmtCountMap, *this);
855bf854f0fSBob Wilson   if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(D))
856bf854f0fSBob Wilson     Walker.VisitFunctionDecl(FD);
8575ec8fe19SBob Wilson   else if (const ObjCMethodDecl *MD = dyn_cast_or_null<ObjCMethodDecl>(D))
8585ec8fe19SBob Wilson     Walker.VisitObjCMethodDecl(MD);
859c845c00aSBob Wilson   else if (const BlockDecl *BD = dyn_cast_or_null<BlockDecl>(D))
860c845c00aSBob Wilson     Walker.VisitBlockDecl(BD);
861bf854f0fSBob Wilson }
862bf854f0fSBob Wilson 
863d66a17d0SJustin Bogner void CodeGenPGO::applyFunctionAttributes(PGOProfileData *PGOData,
8644c9c45c0SJustin Bogner                                          llvm::Function *Fn) {
8654c9c45c0SJustin Bogner   if (!haveRegionCounts())
8664c9c45c0SJustin Bogner     return;
8674c9c45c0SJustin Bogner 
868d66a17d0SJustin Bogner   uint64_t MaxFunctionCount = PGOData->getMaximumFunctionCount();
8694c9c45c0SJustin Bogner   uint64_t FunctionCount = getRegionCount(0);
8704c9c45c0SJustin Bogner   if (FunctionCount >= (uint64_t)(0.3 * (double)MaxFunctionCount))
8714c9c45c0SJustin Bogner     // Turn on InlineHint attribute for hot functions.
8724c9c45c0SJustin Bogner     // FIXME: 30% is from preliminary tuning on SPEC, it may not be optimal.
8734c9c45c0SJustin Bogner     Fn->addFnAttr(llvm::Attribute::InlineHint);
8744c9c45c0SJustin Bogner   else if (FunctionCount <= (uint64_t)(0.01 * (double)MaxFunctionCount))
8754c9c45c0SJustin Bogner     // Turn on Cold attribute for cold functions.
8764c9c45c0SJustin Bogner     // FIXME: 1% is from preliminary tuning on SPEC, it may not be optimal.
8774c9c45c0SJustin Bogner     Fn->addFnAttr(llvm::Attribute::Cold);
8784c9c45c0SJustin Bogner }
8794c9c45c0SJustin Bogner 
880ef512b99SJustin Bogner void CodeGenPGO::emitCounterVariables() {
881ef512b99SJustin Bogner   llvm::LLVMContext &Ctx = CGM.getLLVMContext();
882ef512b99SJustin Bogner   llvm::ArrayType *CounterTy = llvm::ArrayType::get(llvm::Type::getInt64Ty(Ctx),
883ef512b99SJustin Bogner                                                     NumRegionCounters);
884ef512b99SJustin Bogner   RegionCounters =
8852fe531cbSDuncan P. N. Exon Smith     new llvm::GlobalVariable(CGM.getModule(), CounterTy, false, FuncLinkage,
886ef512b99SJustin Bogner                              llvm::Constant::getNullValue(CounterTy),
8872fe531cbSDuncan P. N. Exon Smith                              getFuncVarName("counters"));
8882fe531cbSDuncan P. N. Exon Smith   RegionCounters->setAlignment(8);
8892fe531cbSDuncan P. N. Exon Smith   RegionCounters->setSection(getCountersSection(CGM));
890ef512b99SJustin Bogner }
891ef512b99SJustin Bogner 
892ef512b99SJustin Bogner void CodeGenPGO::emitCounterIncrement(CGBuilderTy &Builder, unsigned Counter) {
893749ebc7fSBob Wilson   if (!RegionCounters)
894ef512b99SJustin Bogner     return;
895ef512b99SJustin Bogner   llvm::Value *Addr =
896ef512b99SJustin Bogner     Builder.CreateConstInBoundsGEP2_64(RegionCounters, 0, Counter);
897ef512b99SJustin Bogner   llvm::Value *Count = Builder.CreateLoad(Addr, "pgocount");
898ef512b99SJustin Bogner   Count = Builder.CreateAdd(Count, Builder.getInt64(1));
899ef512b99SJustin Bogner   Builder.CreateStore(Count, Addr);
900ef512b99SJustin Bogner }
901ef512b99SJustin Bogner 
902d66a17d0SJustin Bogner void CodeGenPGO::loadRegionCounts(PGOProfileData *PGOData) {
903ef512b99SJustin Bogner   // For now, ignore the counts from the PGO data file only if the number of
904ef512b99SJustin Bogner   // counters does not match. This could be tightened down in the future to
905ef512b99SJustin Bogner   // ignore counts when the input changes in various ways, e.g., by comparing a
906ef512b99SJustin Bogner   // hash value based on some characteristics of the input.
907ef512b99SJustin Bogner   RegionCounts = new std::vector<uint64_t>();
908b4416f58SJustin Bogner   uint64_t Hash;
909b4416f58SJustin Bogner   if (PGOData->getFunctionCounts(getFuncName(), Hash, *RegionCounts) ||
910b4416f58SJustin Bogner       Hash != FunctionHash || RegionCounts->size() != NumRegionCounters) {
911ef512b99SJustin Bogner     delete RegionCounts;
912ef512b99SJustin Bogner     RegionCounts = 0;
913ef512b99SJustin Bogner   }
914ef512b99SJustin Bogner }
915ef512b99SJustin Bogner 
916ef512b99SJustin Bogner void CodeGenPGO::destroyRegionCounters() {
917ef512b99SJustin Bogner   if (RegionCounterMap != 0)
918ef512b99SJustin Bogner     delete RegionCounterMap;
919bf854f0fSBob Wilson   if (StmtCountMap != 0)
920bf854f0fSBob Wilson     delete StmtCountMap;
921ef512b99SJustin Bogner   if (RegionCounts != 0)
922ef512b99SJustin Bogner     delete RegionCounts;
923ef512b99SJustin Bogner }
924ef512b99SJustin Bogner 
92538402dc9SDuncan P. N. Exon Smith /// \brief Calculate what to divide by to scale weights.
92638402dc9SDuncan P. N. Exon Smith ///
92738402dc9SDuncan P. N. Exon Smith /// Given the maximum weight, calculate a divisor that will scale all the
92838402dc9SDuncan P. N. Exon Smith /// weights to strictly less than UINT32_MAX.
92938402dc9SDuncan P. N. Exon Smith static uint64_t calculateWeightScale(uint64_t MaxWeight) {
93038402dc9SDuncan P. N. Exon Smith   return MaxWeight < UINT32_MAX ? 1 : MaxWeight / UINT32_MAX + 1;
93138402dc9SDuncan P. N. Exon Smith }
93238402dc9SDuncan P. N. Exon Smith 
93338402dc9SDuncan P. N. Exon Smith /// \brief Scale an individual branch weight (and add 1).
93438402dc9SDuncan P. N. Exon Smith ///
93538402dc9SDuncan P. N. Exon Smith /// Scale a 64-bit weight down to 32-bits using \c Scale.
93638402dc9SDuncan P. N. Exon Smith ///
93738402dc9SDuncan P. N. Exon Smith /// According to Laplace's Rule of Succession, it is better to compute the
93838402dc9SDuncan P. N. Exon Smith /// weight based on the count plus 1, so universally add 1 to the value.
93938402dc9SDuncan P. N. Exon Smith ///
94038402dc9SDuncan P. N. Exon Smith /// \pre \c Scale was calculated by \a calculateWeightScale() with a weight no
94138402dc9SDuncan P. N. Exon Smith /// greater than \c Weight.
94238402dc9SDuncan P. N. Exon Smith static uint32_t scaleBranchWeight(uint64_t Weight, uint64_t Scale) {
94338402dc9SDuncan P. N. Exon Smith   assert(Scale && "scale by 0?");
94438402dc9SDuncan P. N. Exon Smith   uint64_t Scaled = Weight / Scale + 1;
94538402dc9SDuncan P. N. Exon Smith   assert(Scaled <= UINT32_MAX && "overflow 32-bits");
94638402dc9SDuncan P. N. Exon Smith   return Scaled;
94738402dc9SDuncan P. N. Exon Smith }
94838402dc9SDuncan P. N. Exon Smith 
949ef512b99SJustin Bogner llvm::MDNode *CodeGenPGO::createBranchWeights(uint64_t TrueCount,
950ef512b99SJustin Bogner                                               uint64_t FalseCount) {
95138402dc9SDuncan P. N. Exon Smith   // Check for empty weights.
952ef512b99SJustin Bogner   if (!TrueCount && !FalseCount)
953a5f804a7SDuncan P. N. Exon Smith     return nullptr;
954ef512b99SJustin Bogner 
95538402dc9SDuncan P. N. Exon Smith   // Calculate how to scale down to 32-bits.
95638402dc9SDuncan P. N. Exon Smith   uint64_t Scale = calculateWeightScale(std::max(TrueCount, FalseCount));
95738402dc9SDuncan P. N. Exon Smith 
958ef512b99SJustin Bogner   llvm::MDBuilder MDHelper(CGM.getLLVMContext());
95938402dc9SDuncan P. N. Exon Smith   return MDHelper.createBranchWeights(scaleBranchWeight(TrueCount, Scale),
96038402dc9SDuncan P. N. Exon Smith                                       scaleBranchWeight(FalseCount, Scale));
961ef512b99SJustin Bogner }
962ef512b99SJustin Bogner 
96395a27b0eSBob Wilson llvm::MDNode *CodeGenPGO::createBranchWeights(ArrayRef<uint64_t> Weights) {
96438402dc9SDuncan P. N. Exon Smith   // We need at least two elements to create meaningful weights.
96538402dc9SDuncan P. N. Exon Smith   if (Weights.size() < 2)
966a5f804a7SDuncan P. N. Exon Smith     return nullptr;
96738402dc9SDuncan P. N. Exon Smith 
96838402dc9SDuncan P. N. Exon Smith   // Calculate how to scale down to 32-bits.
96938402dc9SDuncan P. N. Exon Smith   uint64_t Scale = calculateWeightScale(*std::max_element(Weights.begin(),
97038402dc9SDuncan P. N. Exon Smith                                                           Weights.end()));
97138402dc9SDuncan P. N. Exon Smith 
972ef512b99SJustin Bogner   SmallVector<uint32_t, 16> ScaledWeights;
973ef512b99SJustin Bogner   ScaledWeights.reserve(Weights.size());
97438402dc9SDuncan P. N. Exon Smith   for (uint64_t W : Weights)
97538402dc9SDuncan P. N. Exon Smith     ScaledWeights.push_back(scaleBranchWeight(W, Scale));
97638402dc9SDuncan P. N. Exon Smith 
97738402dc9SDuncan P. N. Exon Smith   llvm::MDBuilder MDHelper(CGM.getLLVMContext());
978ef512b99SJustin Bogner   return MDHelper.createBranchWeights(ScaledWeights);
979ef512b99SJustin Bogner }
980bf854f0fSBob Wilson 
981bf854f0fSBob Wilson llvm::MDNode *CodeGenPGO::createLoopWeights(const Stmt *Cond,
982bf854f0fSBob Wilson                                             RegionCounter &Cnt) {
983bf854f0fSBob Wilson   if (!haveRegionCounts())
984a5f804a7SDuncan P. N. Exon Smith     return nullptr;
985bf854f0fSBob Wilson   uint64_t LoopCount = Cnt.getCount();
986bf854f0fSBob Wilson   uint64_t CondCount = 0;
987bf854f0fSBob Wilson   bool Found = getStmtCount(Cond, CondCount);
988bf854f0fSBob Wilson   assert(Found && "missing expected loop condition count");
989bf854f0fSBob Wilson   (void)Found;
990bf854f0fSBob Wilson   if (CondCount == 0)
991a5f804a7SDuncan P. N. Exon Smith     return nullptr;
992bf854f0fSBob Wilson   return createBranchWeights(LoopCount,
993bf854f0fSBob Wilson                              std::max(CondCount, LoopCount) - LoopCount);
994bf854f0fSBob Wilson }
995