1ef512b99SJustin Bogner //===--- CodeGenPGO.cpp - PGO Instrumentation for LLVM CodeGen --*- C++ -*-===//
2ef512b99SJustin Bogner //
3ef512b99SJustin Bogner //                     The LLVM Compiler Infrastructure
4ef512b99SJustin Bogner //
5ef512b99SJustin Bogner // This file is distributed under the University of Illinois Open Source
6ef512b99SJustin Bogner // License. See LICENSE.TXT for details.
7ef512b99SJustin Bogner //
8ef512b99SJustin Bogner //===----------------------------------------------------------------------===//
9ef512b99SJustin Bogner //
10ef512b99SJustin Bogner // Instrumentation-based profile-guided optimization
11ef512b99SJustin Bogner //
12ef512b99SJustin Bogner //===----------------------------------------------------------------------===//
13ef512b99SJustin Bogner 
14ef512b99SJustin Bogner #include "CodeGenPGO.h"
15ef512b99SJustin Bogner #include "CodeGenFunction.h"
16ef512b99SJustin Bogner #include "clang/AST/RecursiveASTVisitor.h"
17ef512b99SJustin Bogner #include "clang/AST/StmtVisitor.h"
18529f6dd8SJustin Bogner #include "llvm/Config/config.h" // for strtoull()/strtoll() define
19ef512b99SJustin Bogner #include "llvm/IR/MDBuilder.h"
20ef512b99SJustin Bogner #include "llvm/Support/FileSystem.h"
21ef512b99SJustin Bogner 
22ef512b99SJustin Bogner using namespace clang;
23ef512b99SJustin Bogner using namespace CodeGen;
24ef512b99SJustin Bogner 
25d66a17d0SJustin Bogner static void ReportBadPGOData(CodeGenModule &CGM, const char *Message) {
26d66a17d0SJustin Bogner   DiagnosticsEngine &Diags = CGM.getDiags();
27d66a17d0SJustin Bogner   unsigned diagID = Diags.getCustomDiagID(DiagnosticsEngine::Error, "%0");
28d66a17d0SJustin Bogner   Diags.Report(diagID) << Message;
29d66a17d0SJustin Bogner }
30d66a17d0SJustin Bogner 
31d66a17d0SJustin Bogner PGOProfileData::PGOProfileData(CodeGenModule &CGM, std::string Path)
32d66a17d0SJustin Bogner   : CGM(CGM) {
33d66a17d0SJustin Bogner   if (llvm::MemoryBuffer::getFile(Path, DataBuffer)) {
34d66a17d0SJustin Bogner     ReportBadPGOData(CGM, "failed to open pgo data file");
35d66a17d0SJustin Bogner     return;
36d66a17d0SJustin Bogner   }
37d66a17d0SJustin Bogner 
38d66a17d0SJustin Bogner   if (DataBuffer->getBufferSize() > std::numeric_limits<unsigned>::max()) {
39d66a17d0SJustin Bogner     ReportBadPGOData(CGM, "pgo data file too big");
40d66a17d0SJustin Bogner     return;
41d66a17d0SJustin Bogner   }
42d66a17d0SJustin Bogner 
43d66a17d0SJustin Bogner   // Scan through the data file and map each function to the corresponding
44d66a17d0SJustin Bogner   // file offset where its counts are stored.
45d66a17d0SJustin Bogner   const char *BufferStart = DataBuffer->getBufferStart();
46d66a17d0SJustin Bogner   const char *BufferEnd = DataBuffer->getBufferEnd();
47d66a17d0SJustin Bogner   const char *CurPtr = BufferStart;
48d66a17d0SJustin Bogner   uint64_t MaxCount = 0;
49d66a17d0SJustin Bogner   while (CurPtr < BufferEnd) {
50d66a17d0SJustin Bogner     // Read the function name.
51d66a17d0SJustin Bogner     const char *FuncStart = CurPtr;
52d66a17d0SJustin Bogner     // For Objective-C methods, the name may include whitespace, so search
53d66a17d0SJustin Bogner     // backward from the end of the line to find the space that separates the
54d66a17d0SJustin Bogner     // name from the number of counters. (This is a temporary hack since we are
55d66a17d0SJustin Bogner     // going to completely replace this file format in the near future.)
56d66a17d0SJustin Bogner     CurPtr = strchr(CurPtr, '\n');
57d66a17d0SJustin Bogner     if (!CurPtr) {
58d66a17d0SJustin Bogner       ReportBadPGOData(CGM, "pgo data file has malformed function entry");
59d66a17d0SJustin Bogner       return;
60d66a17d0SJustin Bogner     }
61d66a17d0SJustin Bogner     StringRef FuncName(FuncStart, CurPtr - FuncStart);
62d66a17d0SJustin Bogner 
63b4416f58SJustin Bogner     // Skip over the function hash.
64b4416f58SJustin Bogner     CurPtr = strchr(++CurPtr, '\n');
65b4416f58SJustin Bogner     if (!CurPtr) {
66b4416f58SJustin Bogner       ReportBadPGOData(CGM, "pgo data file is missing the function hash");
67b4416f58SJustin Bogner       return;
68b4416f58SJustin Bogner     }
69b4416f58SJustin Bogner 
70d66a17d0SJustin Bogner     // Read the number of counters.
71d66a17d0SJustin Bogner     char *EndPtr;
72d66a17d0SJustin Bogner     unsigned NumCounters = strtol(++CurPtr, &EndPtr, 10);
73d66a17d0SJustin Bogner     if (EndPtr == CurPtr || *EndPtr != '\n' || NumCounters <= 0) {
74d66a17d0SJustin Bogner       ReportBadPGOData(CGM, "pgo data file has unexpected number of counters");
75d66a17d0SJustin Bogner       return;
76d66a17d0SJustin Bogner     }
77d66a17d0SJustin Bogner     CurPtr = EndPtr;
78d66a17d0SJustin Bogner 
79d66a17d0SJustin Bogner     // Read function count.
80d66a17d0SJustin Bogner     uint64_t Count = strtoll(CurPtr, &EndPtr, 10);
81d66a17d0SJustin Bogner     if (EndPtr == CurPtr || *EndPtr != '\n') {
82d66a17d0SJustin Bogner       ReportBadPGOData(CGM, "pgo-data file has bad count value");
83d66a17d0SJustin Bogner       return;
84d66a17d0SJustin Bogner     }
85d66a17d0SJustin Bogner     CurPtr = EndPtr; // Point to '\n'.
86d66a17d0SJustin Bogner     FunctionCounts[FuncName] = Count;
87d66a17d0SJustin Bogner     MaxCount = Count > MaxCount ? Count : MaxCount;
88d66a17d0SJustin Bogner 
89d66a17d0SJustin Bogner     // There is one line for each counter; skip over those lines.
90d66a17d0SJustin Bogner     // Since function count is already read, we start the loop from 1.
91d66a17d0SJustin Bogner     for (unsigned N = 1; N < NumCounters; ++N) {
92d66a17d0SJustin Bogner       CurPtr = strchr(++CurPtr, '\n');
93d66a17d0SJustin Bogner       if (!CurPtr) {
94d66a17d0SJustin Bogner         ReportBadPGOData(CGM, "pgo data file is missing some counter info");
95d66a17d0SJustin Bogner         return;
96d66a17d0SJustin Bogner       }
97d66a17d0SJustin Bogner     }
98d66a17d0SJustin Bogner 
99d66a17d0SJustin Bogner     // Skip over the blank line separating functions.
100d66a17d0SJustin Bogner     CurPtr += 2;
101d66a17d0SJustin Bogner 
102d66a17d0SJustin Bogner     DataOffsets[FuncName] = FuncStart - BufferStart;
103d66a17d0SJustin Bogner   }
104d66a17d0SJustin Bogner   MaxFunctionCount = MaxCount;
105d66a17d0SJustin Bogner }
106d66a17d0SJustin Bogner 
107b4416f58SJustin Bogner bool PGOProfileData::getFunctionCounts(StringRef FuncName, uint64_t &FuncHash,
108d66a17d0SJustin Bogner                                        std::vector<uint64_t> &Counts) {
109d66a17d0SJustin Bogner   // Find the relevant section of the pgo-data file.
110d66a17d0SJustin Bogner   llvm::StringMap<unsigned>::const_iterator OffsetIter =
111d66a17d0SJustin Bogner     DataOffsets.find(FuncName);
112d66a17d0SJustin Bogner   if (OffsetIter == DataOffsets.end())
113d66a17d0SJustin Bogner     return true;
114d66a17d0SJustin Bogner   const char *CurPtr = DataBuffer->getBufferStart() + OffsetIter->getValue();
115d66a17d0SJustin Bogner 
116d66a17d0SJustin Bogner   // Skip over the function name.
117d66a17d0SJustin Bogner   CurPtr = strchr(CurPtr, '\n');
118d66a17d0SJustin Bogner   assert(CurPtr && "pgo-data has corrupted function entry");
119b4416f58SJustin Bogner 
120b4416f58SJustin Bogner   char *EndPtr;
121b4416f58SJustin Bogner   // Read the function hash.
122b4416f58SJustin Bogner   FuncHash = strtoll(++CurPtr, &EndPtr, 10);
123b4416f58SJustin Bogner   assert(EndPtr != CurPtr && *EndPtr == '\n' &&
124b4416f58SJustin Bogner          "pgo-data file has corrupted function hash");
125b4416f58SJustin Bogner   CurPtr = EndPtr;
126d66a17d0SJustin Bogner 
127d66a17d0SJustin Bogner   // Read the number of counters.
128d66a17d0SJustin Bogner   unsigned NumCounters = strtol(++CurPtr, &EndPtr, 10);
129d66a17d0SJustin Bogner   assert(EndPtr != CurPtr && *EndPtr == '\n' && NumCounters > 0 &&
130d66a17d0SJustin Bogner          "pgo-data file has corrupted number of counters");
131d66a17d0SJustin Bogner   CurPtr = EndPtr;
132d66a17d0SJustin Bogner 
133d66a17d0SJustin Bogner   Counts.reserve(NumCounters);
134d66a17d0SJustin Bogner 
135d66a17d0SJustin Bogner   for (unsigned N = 0; N < NumCounters; ++N) {
136d66a17d0SJustin Bogner     // Read the count value.
137d66a17d0SJustin Bogner     uint64_t Count = strtoll(CurPtr, &EndPtr, 10);
138d66a17d0SJustin Bogner     if (EndPtr == CurPtr || *EndPtr != '\n') {
139d66a17d0SJustin Bogner       ReportBadPGOData(CGM, "pgo-data file has bad count value");
140d66a17d0SJustin Bogner       return true;
141d66a17d0SJustin Bogner     }
142d66a17d0SJustin Bogner     Counts.push_back(Count);
143d66a17d0SJustin Bogner     CurPtr = EndPtr + 1;
144d66a17d0SJustin Bogner   }
145d66a17d0SJustin Bogner 
146d66a17d0SJustin Bogner   // Make sure the number of counters matches up.
147d66a17d0SJustin Bogner   if (Counts.size() != NumCounters) {
148d66a17d0SJustin Bogner     ReportBadPGOData(CGM, "pgo-data file has inconsistent counters");
149d66a17d0SJustin Bogner     return true;
150d66a17d0SJustin Bogner   }
151d66a17d0SJustin Bogner 
152d66a17d0SJustin Bogner   return false;
153d66a17d0SJustin Bogner }
154d66a17d0SJustin Bogner 
155da1ebedeSBob Wilson void CodeGenPGO::setFuncName(llvm::Function *Fn) {
1562fe531cbSDuncan P. N. Exon Smith   RawFuncName = Fn->getName();
157da1ebedeSBob Wilson 
158da1ebedeSBob Wilson   // Function names may be prefixed with a binary '1' to indicate
159da1ebedeSBob Wilson   // that the backend should not modify the symbols due to any platform
160da1ebedeSBob Wilson   // naming convention. Do not include that '1' in the PGO profile name.
1612fe531cbSDuncan P. N. Exon Smith   if (RawFuncName[0] == '\1')
1622fe531cbSDuncan P. N. Exon Smith     RawFuncName = RawFuncName.substr(1);
163da1ebedeSBob Wilson 
164da1ebedeSBob Wilson   if (!Fn->hasLocalLinkage()) {
1651b67cfd4SDuncan P. N. Exon Smith     PrefixedFuncName.reset(new std::string(RawFuncName));
166da1ebedeSBob Wilson     return;
167da1ebedeSBob Wilson   }
168da1ebedeSBob Wilson 
169da1ebedeSBob Wilson   // For local symbols, prepend the main file name to distinguish them.
170da1ebedeSBob Wilson   // Do not include the full path in the file name since there's no guarantee
171da1ebedeSBob Wilson   // that it will stay the same, e.g., if the files are checked out from
172da1ebedeSBob Wilson   // version control in different locations.
1731b67cfd4SDuncan P. N. Exon Smith   PrefixedFuncName.reset(new std::string(CGM.getCodeGenOpts().MainFileName));
1742fe531cbSDuncan P. N. Exon Smith   if (PrefixedFuncName->empty())
1752fe531cbSDuncan P. N. Exon Smith     PrefixedFuncName->assign("<unknown>");
1762fe531cbSDuncan P. N. Exon Smith   PrefixedFuncName->append(":");
1772fe531cbSDuncan P. N. Exon Smith   PrefixedFuncName->append(RawFuncName);
178da1ebedeSBob Wilson }
179da1ebedeSBob Wilson 
1802fe531cbSDuncan P. N. Exon Smith static llvm::Function *getRegisterFunc(CodeGenModule &CGM) {
181a7807637SDuncan P. N. Exon Smith   return CGM.getModule().getFunction("__llvm_profile_register_functions");
1822fe531cbSDuncan P. N. Exon Smith }
1832fe531cbSDuncan P. N. Exon Smith 
1842fe531cbSDuncan P. N. Exon Smith static llvm::BasicBlock *getOrInsertRegisterBB(CodeGenModule &CGM) {
185780443e8SDuncan P. N. Exon Smith   // Don't do this for Darwin.  compiler-rt uses linker magic.
186780443e8SDuncan P. N. Exon Smith   if (CGM.getTarget().getTriple().isOSDarwin())
187780443e8SDuncan P. N. Exon Smith     return nullptr;
188780443e8SDuncan P. N. Exon Smith 
1892fe531cbSDuncan P. N. Exon Smith   // Only need to insert this once per module.
1902fe531cbSDuncan P. N. Exon Smith   if (llvm::Function *RegisterF = getRegisterFunc(CGM))
1912fe531cbSDuncan P. N. Exon Smith     return &RegisterF->getEntryBlock();
1922fe531cbSDuncan P. N. Exon Smith 
1932fe531cbSDuncan P. N. Exon Smith   // Construct the function.
1942fe531cbSDuncan P. N. Exon Smith   auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext());
1952fe531cbSDuncan P. N. Exon Smith   auto *RegisterFTy = llvm::FunctionType::get(VoidTy, false);
1962fe531cbSDuncan P. N. Exon Smith   auto *RegisterF = llvm::Function::Create(RegisterFTy,
1972fe531cbSDuncan P. N. Exon Smith                                            llvm::GlobalValue::InternalLinkage,
198a7807637SDuncan P. N. Exon Smith                                            "__llvm_profile_register_functions",
1992fe531cbSDuncan P. N. Exon Smith                                            &CGM.getModule());
2002fe531cbSDuncan P. N. Exon Smith   RegisterF->setUnnamedAddr(true);
2012fe531cbSDuncan P. N. Exon Smith   if (CGM.getCodeGenOpts().DisableRedZone)
2022fe531cbSDuncan P. N. Exon Smith     RegisterF->addFnAttr(llvm::Attribute::NoRedZone);
2032fe531cbSDuncan P. N. Exon Smith 
2042fe531cbSDuncan P. N. Exon Smith   // Construct and return the entry block.
2052fe531cbSDuncan P. N. Exon Smith   auto *BB = llvm::BasicBlock::Create(CGM.getLLVMContext(), "", RegisterF);
2062fe531cbSDuncan P. N. Exon Smith   CGBuilderTy Builder(BB);
2072fe531cbSDuncan P. N. Exon Smith   Builder.CreateRetVoid();
2082fe531cbSDuncan P. N. Exon Smith   return BB;
2092fe531cbSDuncan P. N. Exon Smith }
2102fe531cbSDuncan P. N. Exon Smith 
2112fe531cbSDuncan P. N. Exon Smith static llvm::Constant *getOrInsertRuntimeRegister(CodeGenModule &CGM) {
2122fe531cbSDuncan P. N. Exon Smith   auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext());
2132fe531cbSDuncan P. N. Exon Smith   auto *VoidPtrTy = llvm::Type::getInt8PtrTy(CGM.getLLVMContext());
2142fe531cbSDuncan P. N. Exon Smith   auto *RuntimeRegisterTy = llvm::FunctionType::get(VoidTy, VoidPtrTy, false);
215a7807637SDuncan P. N. Exon Smith   return CGM.getModule().getOrInsertFunction("__llvm_profile_register_function",
2162fe531cbSDuncan P. N. Exon Smith                                              RuntimeRegisterTy);
2172fe531cbSDuncan P. N. Exon Smith }
2182fe531cbSDuncan P. N. Exon Smith 
2197134d47dSDuncan P. N. Exon Smith static bool isMachO(const CodeGenModule &CGM) {
2207134d47dSDuncan P. N. Exon Smith   return CGM.getTarget().getTriple().isOSBinFormatMachO();
2217134d47dSDuncan P. N. Exon Smith }
2227134d47dSDuncan P. N. Exon Smith 
2232fe531cbSDuncan P. N. Exon Smith static StringRef getCountersSection(const CodeGenModule &CGM) {
224a7807637SDuncan P. N. Exon Smith   return isMachO(CGM) ? "__DATA,__llvm_prf_cnts" : "__llvm_prf_cnts";
2252fe531cbSDuncan P. N. Exon Smith }
2262fe531cbSDuncan P. N. Exon Smith 
2272fe531cbSDuncan P. N. Exon Smith static StringRef getNameSection(const CodeGenModule &CGM) {
228a7807637SDuncan P. N. Exon Smith   return isMachO(CGM) ? "__DATA,__llvm_prf_names" : "__llvm_prf_names";
2292fe531cbSDuncan P. N. Exon Smith }
2302fe531cbSDuncan P. N. Exon Smith 
2312fe531cbSDuncan P. N. Exon Smith static StringRef getDataSection(const CodeGenModule &CGM) {
232a7807637SDuncan P. N. Exon Smith   return isMachO(CGM) ? "__DATA,__llvm_prf_data" : "__llvm_prf_data";
2332fe531cbSDuncan P. N. Exon Smith }
2342fe531cbSDuncan P. N. Exon Smith 
2352fe531cbSDuncan P. N. Exon Smith llvm::GlobalVariable *CodeGenPGO::buildDataVar() {
2362fe531cbSDuncan P. N. Exon Smith   // Create name variable.
2372fe531cbSDuncan P. N. Exon Smith   llvm::LLVMContext &Ctx = CGM.getLLVMContext();
2382fe531cbSDuncan P. N. Exon Smith   auto *VarName = llvm::ConstantDataArray::getString(Ctx, getFuncName(),
2392fe531cbSDuncan P. N. Exon Smith                                                      false);
2402fe531cbSDuncan P. N. Exon Smith   auto *Name = new llvm::GlobalVariable(CGM.getModule(), VarName->getType(),
24173f78627SDuncan P. N. Exon Smith                                         true, VarLinkage, VarName,
2422fe531cbSDuncan P. N. Exon Smith                                         getFuncVarName("name"));
2432fe531cbSDuncan P. N. Exon Smith   Name->setSection(getNameSection(CGM));
2442fe531cbSDuncan P. N. Exon Smith   Name->setAlignment(1);
2452fe531cbSDuncan P. N. Exon Smith 
2462fe531cbSDuncan P. N. Exon Smith   // Create data variable.
2472fe531cbSDuncan P. N. Exon Smith   auto *Int32Ty = llvm::Type::getInt32Ty(Ctx);
248b4416f58SJustin Bogner   auto *Int64Ty = llvm::Type::getInt64Ty(Ctx);
2492fe531cbSDuncan P. N. Exon Smith   auto *Int8PtrTy = llvm::Type::getInt8PtrTy(Ctx);
2502fe531cbSDuncan P. N. Exon Smith   auto *Int64PtrTy = llvm::Type::getInt64PtrTy(Ctx);
2512fe531cbSDuncan P. N. Exon Smith   llvm::Type *DataTypes[] = {
252b4416f58SJustin Bogner     Int32Ty, Int32Ty, Int64Ty, Int8PtrTy, Int64PtrTy
2532fe531cbSDuncan P. N. Exon Smith   };
2542fe531cbSDuncan P. N. Exon Smith   auto *DataTy = llvm::StructType::get(Ctx, makeArrayRef(DataTypes));
2552fe531cbSDuncan P. N. Exon Smith   llvm::Constant *DataVals[] = {
2562fe531cbSDuncan P. N. Exon Smith     llvm::ConstantInt::get(Int32Ty, getFuncName().size()),
2572fe531cbSDuncan P. N. Exon Smith     llvm::ConstantInt::get(Int32Ty, NumRegionCounters),
258b4416f58SJustin Bogner     llvm::ConstantInt::get(Int64Ty, FunctionHash),
2592fe531cbSDuncan P. N. Exon Smith     llvm::ConstantExpr::getBitCast(Name, Int8PtrTy),
2602fe531cbSDuncan P. N. Exon Smith     llvm::ConstantExpr::getBitCast(RegionCounters, Int64PtrTy)
2612fe531cbSDuncan P. N. Exon Smith   };
2622fe531cbSDuncan P. N. Exon Smith   auto *Data =
26373f78627SDuncan P. N. Exon Smith     new llvm::GlobalVariable(CGM.getModule(), DataTy, true, VarLinkage,
2642fe531cbSDuncan P. N. Exon Smith                              llvm::ConstantStruct::get(DataTy, DataVals),
2652fe531cbSDuncan P. N. Exon Smith                              getFuncVarName("data"));
2662fe531cbSDuncan P. N. Exon Smith 
2672fe531cbSDuncan P. N. Exon Smith   // All the data should be packed into an array in its own section.
2682fe531cbSDuncan P. N. Exon Smith   Data->setSection(getDataSection(CGM));
2692fe531cbSDuncan P. N. Exon Smith   Data->setAlignment(8);
2702fe531cbSDuncan P. N. Exon Smith 
2712fe531cbSDuncan P. N. Exon Smith   // Make sure the data doesn't get deleted.
2722fe531cbSDuncan P. N. Exon Smith   CGM.addUsedGlobal(Data);
2732fe531cbSDuncan P. N. Exon Smith   return Data;
2742fe531cbSDuncan P. N. Exon Smith }
2752fe531cbSDuncan P. N. Exon Smith 
2762fe531cbSDuncan P. N. Exon Smith void CodeGenPGO::emitInstrumentationData() {
277ef512b99SJustin Bogner   if (!CGM.getCodeGenOpts().ProfileInstrGenerate)
278ef512b99SJustin Bogner     return;
279ef512b99SJustin Bogner 
2802fe531cbSDuncan P. N. Exon Smith   // Build the data.
2812fe531cbSDuncan P. N. Exon Smith   auto *Data = buildDataVar();
282ef512b99SJustin Bogner 
2832fe531cbSDuncan P. N. Exon Smith   // Register the data.
284780443e8SDuncan P. N. Exon Smith   auto *RegisterBB = getOrInsertRegisterBB(CGM);
285780443e8SDuncan P. N. Exon Smith   if (!RegisterBB)
286780443e8SDuncan P. N. Exon Smith     return;
287780443e8SDuncan P. N. Exon Smith   CGBuilderTy Builder(RegisterBB->getTerminator());
2882fe531cbSDuncan P. N. Exon Smith   auto *VoidPtrTy = llvm::Type::getInt8PtrTy(CGM.getLLVMContext());
2892fe531cbSDuncan P. N. Exon Smith   Builder.CreateCall(getOrInsertRuntimeRegister(CGM),
2902fe531cbSDuncan P. N. Exon Smith                      Builder.CreateBitCast(Data, VoidPtrTy));
291ef512b99SJustin Bogner }
292ef512b99SJustin Bogner 
293ef512b99SJustin Bogner llvm::Function *CodeGenPGO::emitInitialization(CodeGenModule &CGM) {
2942fe531cbSDuncan P. N. Exon Smith   if (!CGM.getCodeGenOpts().ProfileInstrGenerate)
295a5f804a7SDuncan P. N. Exon Smith     return nullptr;
296ef512b99SJustin Bogner 
2972fe531cbSDuncan P. N. Exon Smith   // Only need to create this once per module.
298a7807637SDuncan P. N. Exon Smith   if (CGM.getModule().getFunction("__llvm_profile_init"))
299a5f804a7SDuncan P. N. Exon Smith     return nullptr;
300ef512b99SJustin Bogner 
3015188e91cSDuncan P. N. Exon Smith   // Get the function to call at initialization.
3022fe531cbSDuncan P. N. Exon Smith   llvm::Constant *RegisterF = getRegisterFunc(CGM);
3035188e91cSDuncan P. N. Exon Smith   if (!RegisterF)
304a5f804a7SDuncan P. N. Exon Smith     return nullptr;
3052fe531cbSDuncan P. N. Exon Smith 
3062fe531cbSDuncan P. N. Exon Smith   // Create the initialization function.
3072fe531cbSDuncan P. N. Exon Smith   auto *VoidTy = llvm::Type::getVoidTy(CGM.getLLVMContext());
3082fe531cbSDuncan P. N. Exon Smith   auto *F = llvm::Function::Create(llvm::FunctionType::get(VoidTy, false),
3092fe531cbSDuncan P. N. Exon Smith                                    llvm::GlobalValue::InternalLinkage,
310a7807637SDuncan P. N. Exon Smith                                    "__llvm_profile_init", &CGM.getModule());
311ef512b99SJustin Bogner   F->setUnnamedAddr(true);
312ef512b99SJustin Bogner   F->addFnAttr(llvm::Attribute::NoInline);
313ef512b99SJustin Bogner   if (CGM.getCodeGenOpts().DisableRedZone)
314ef512b99SJustin Bogner     F->addFnAttr(llvm::Attribute::NoRedZone);
315ef512b99SJustin Bogner 
3162fe531cbSDuncan P. N. Exon Smith   // Add the basic block and the necessary calls.
3172fe531cbSDuncan P. N. Exon Smith   CGBuilderTy Builder(llvm::BasicBlock::Create(CGM.getLLVMContext(), "", F));
3182fe531cbSDuncan P. N. Exon Smith   Builder.CreateCall(RegisterF);
3192fe531cbSDuncan P. N. Exon Smith   Builder.CreateRetVoid();
320ef512b99SJustin Bogner 
321ef512b99SJustin Bogner   return F;
322ef512b99SJustin Bogner }
323ef512b99SJustin Bogner 
324ef512b99SJustin Bogner namespace {
325ef512b99SJustin Bogner   /// A StmtVisitor that fills a map of statements to PGO counters.
326ef512b99SJustin Bogner   struct MapRegionCounters : public ConstStmtVisitor<MapRegionCounters> {
327ef512b99SJustin Bogner     /// The next counter value to assign.
328ef512b99SJustin Bogner     unsigned NextCounter;
329ef512b99SJustin Bogner     /// The map of statements to counters.
3303586be72SDuncan P. N. Exon Smith     llvm::DenseMap<const Stmt *, unsigned> &CounterMap;
331ef512b99SJustin Bogner 
3323586be72SDuncan P. N. Exon Smith     MapRegionCounters(llvm::DenseMap<const Stmt *, unsigned> &CounterMap)
3333586be72SDuncan P. N. Exon Smith         : NextCounter(0), CounterMap(CounterMap) {}
334ef512b99SJustin Bogner 
335ef512b99SJustin Bogner     void VisitChildren(const Stmt *S) {
336ef512b99SJustin Bogner       for (Stmt::const_child_range I = S->children(); I; ++I)
337ef512b99SJustin Bogner         if (*I)
338ef512b99SJustin Bogner          this->Visit(*I);
339ef512b99SJustin Bogner     }
340ef512b99SJustin Bogner     void VisitStmt(const Stmt *S) { VisitChildren(S); }
341ef512b99SJustin Bogner 
342ea278c32SJustin Bogner     /// Assign a counter to track entry to the function body.
343ef512b99SJustin Bogner     void VisitFunctionDecl(const FunctionDecl *S) {
3443586be72SDuncan P. N. Exon Smith       CounterMap[S->getBody()] = NextCounter++;
345ef512b99SJustin Bogner       Visit(S->getBody());
346ef512b99SJustin Bogner     }
3475ec8fe19SBob Wilson     void VisitObjCMethodDecl(const ObjCMethodDecl *S) {
3483586be72SDuncan P. N. Exon Smith       CounterMap[S->getBody()] = NextCounter++;
3495ec8fe19SBob Wilson       Visit(S->getBody());
3505ec8fe19SBob Wilson     }
351c845c00aSBob Wilson     void VisitBlockDecl(const BlockDecl *S) {
3523586be72SDuncan P. N. Exon Smith       CounterMap[S->getBody()] = NextCounter++;
353c845c00aSBob Wilson       Visit(S->getBody());
354c845c00aSBob Wilson     }
355ea278c32SJustin Bogner     /// Assign a counter to track the block following a label.
356ef512b99SJustin Bogner     void VisitLabelStmt(const LabelStmt *S) {
3573586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
358ef512b99SJustin Bogner       Visit(S->getSubStmt());
359ef512b99SJustin Bogner     }
360bf854f0fSBob Wilson     /// Assign a counter for the body of a while loop.
361ef512b99SJustin Bogner     void VisitWhileStmt(const WhileStmt *S) {
3623586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
363ef512b99SJustin Bogner       Visit(S->getCond());
364ef512b99SJustin Bogner       Visit(S->getBody());
365ef512b99SJustin Bogner     }
366bf854f0fSBob Wilson     /// Assign a counter for the body of a do-while loop.
367ef512b99SJustin Bogner     void VisitDoStmt(const DoStmt *S) {
3683586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
369ef512b99SJustin Bogner       Visit(S->getBody());
370ef512b99SJustin Bogner       Visit(S->getCond());
371ef512b99SJustin Bogner     }
372bf854f0fSBob Wilson     /// Assign a counter for the body of a for loop.
373ef512b99SJustin Bogner     void VisitForStmt(const ForStmt *S) {
3743586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
375bf854f0fSBob Wilson       if (S->getInit())
376bf854f0fSBob Wilson         Visit(S->getInit());
377ef512b99SJustin Bogner       const Expr *E;
378ef512b99SJustin Bogner       if ((E = S->getCond()))
379ef512b99SJustin Bogner         Visit(E);
380ef512b99SJustin Bogner       if ((E = S->getInc()))
381ef512b99SJustin Bogner         Visit(E);
382bf854f0fSBob Wilson       Visit(S->getBody());
383ef512b99SJustin Bogner     }
384bf854f0fSBob Wilson     /// Assign a counter for the body of a for-range loop.
385ef512b99SJustin Bogner     void VisitCXXForRangeStmt(const CXXForRangeStmt *S) {
3863586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
387bf854f0fSBob Wilson       Visit(S->getRangeStmt());
388bf854f0fSBob Wilson       Visit(S->getBeginEndStmt());
389bf854f0fSBob Wilson       Visit(S->getCond());
390bf854f0fSBob Wilson       Visit(S->getLoopVarStmt());
391ef512b99SJustin Bogner       Visit(S->getBody());
392bf854f0fSBob Wilson       Visit(S->getInc());
393ef512b99SJustin Bogner     }
394bf854f0fSBob Wilson     /// Assign a counter for the body of a for-collection loop.
395ef512b99SJustin Bogner     void VisitObjCForCollectionStmt(const ObjCForCollectionStmt *S) {
3963586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
397ef512b99SJustin Bogner       Visit(S->getElement());
398ef512b99SJustin Bogner       Visit(S->getBody());
399ef512b99SJustin Bogner     }
400ef512b99SJustin Bogner     /// Assign a counter for the exit block of the switch statement.
401ef512b99SJustin Bogner     void VisitSwitchStmt(const SwitchStmt *S) {
4023586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
403ef512b99SJustin Bogner       Visit(S->getCond());
404ef512b99SJustin Bogner       Visit(S->getBody());
405ef512b99SJustin Bogner     }
406ef512b99SJustin Bogner     /// Assign a counter for a particular case in a switch. This counts jumps
407ef512b99SJustin Bogner     /// from the switch header as well as fallthrough from the case before this
408ef512b99SJustin Bogner     /// one.
409ef512b99SJustin Bogner     void VisitCaseStmt(const CaseStmt *S) {
4103586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
411ef512b99SJustin Bogner       Visit(S->getSubStmt());
412ef512b99SJustin Bogner     }
413ef512b99SJustin Bogner     /// Assign a counter for the default case of a switch statement. The count
414ef512b99SJustin Bogner     /// is the number of branches from the loop header to the default, and does
415ef512b99SJustin Bogner     /// not include fallthrough from previous cases. If we have multiple
416ef512b99SJustin Bogner     /// conditional branch blocks from the switch instruction to the default
417ef512b99SJustin Bogner     /// block, as with large GNU case ranges, this is the counter for the last
418ef512b99SJustin Bogner     /// edge in that series, rather than the first.
419ef512b99SJustin Bogner     void VisitDefaultStmt(const DefaultStmt *S) {
4203586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
421ef512b99SJustin Bogner       Visit(S->getSubStmt());
422ef512b99SJustin Bogner     }
423ef512b99SJustin Bogner     /// Assign a counter for the "then" part of an if statement. The count for
424ef512b99SJustin Bogner     /// the "else" part, if it exists, will be calculated from this counter.
425ef512b99SJustin Bogner     void VisitIfStmt(const IfStmt *S) {
4263586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
427ef512b99SJustin Bogner       Visit(S->getCond());
428ef512b99SJustin Bogner       Visit(S->getThen());
429ef512b99SJustin Bogner       if (S->getElse())
430ef512b99SJustin Bogner         Visit(S->getElse());
431ef512b99SJustin Bogner     }
432ef512b99SJustin Bogner     /// Assign a counter for the continuation block of a C++ try statement.
433ef512b99SJustin Bogner     void VisitCXXTryStmt(const CXXTryStmt *S) {
4343586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
435ef512b99SJustin Bogner       Visit(S->getTryBlock());
436ef512b99SJustin Bogner       for (unsigned I = 0, E = S->getNumHandlers(); I < E; ++I)
437ef512b99SJustin Bogner         Visit(S->getHandler(I));
438ef512b99SJustin Bogner     }
439ef512b99SJustin Bogner     /// Assign a counter for a catch statement's handler block.
440ef512b99SJustin Bogner     void VisitCXXCatchStmt(const CXXCatchStmt *S) {
4413586be72SDuncan P. N. Exon Smith       CounterMap[S] = NextCounter++;
442ef512b99SJustin Bogner       Visit(S->getHandlerBlock());
443ef512b99SJustin Bogner     }
444ef512b99SJustin Bogner     /// Assign a counter for the "true" part of a conditional operator. The
445ef512b99SJustin Bogner     /// count in the "false" part will be calculated from this counter.
446ef512b99SJustin Bogner     void VisitConditionalOperator(const ConditionalOperator *E) {
4473586be72SDuncan P. N. Exon Smith       CounterMap[E] = NextCounter++;
448ef512b99SJustin Bogner       Visit(E->getCond());
449ef512b99SJustin Bogner       Visit(E->getTrueExpr());
450ef512b99SJustin Bogner       Visit(E->getFalseExpr());
451ef512b99SJustin Bogner     }
452ef512b99SJustin Bogner     /// Assign a counter for the right hand side of a logical and operator.
453ef512b99SJustin Bogner     void VisitBinLAnd(const BinaryOperator *E) {
4543586be72SDuncan P. N. Exon Smith       CounterMap[E] = NextCounter++;
455ef512b99SJustin Bogner       Visit(E->getLHS());
456ef512b99SJustin Bogner       Visit(E->getRHS());
457ef512b99SJustin Bogner     }
458ef512b99SJustin Bogner     /// Assign a counter for the right hand side of a logical or operator.
459ef512b99SJustin Bogner     void VisitBinLOr(const BinaryOperator *E) {
4603586be72SDuncan P. N. Exon Smith       CounterMap[E] = NextCounter++;
461ef512b99SJustin Bogner       Visit(E->getLHS());
462ef512b99SJustin Bogner       Visit(E->getRHS());
463ef512b99SJustin Bogner     }
464ef512b99SJustin Bogner   };
465bf854f0fSBob Wilson 
466bf854f0fSBob Wilson   /// A StmtVisitor that propagates the raw counts through the AST and
467bf854f0fSBob Wilson   /// records the count at statements where the value may change.
468bf854f0fSBob Wilson   struct ComputeRegionCounts : public ConstStmtVisitor<ComputeRegionCounts> {
469bf854f0fSBob Wilson     /// PGO state.
470bf854f0fSBob Wilson     CodeGenPGO &PGO;
471bf854f0fSBob Wilson 
472bf854f0fSBob Wilson     /// A flag that is set when the current count should be recorded on the
473bf854f0fSBob Wilson     /// next statement, such as at the exit of a loop.
474bf854f0fSBob Wilson     bool RecordNextStmtCount;
475bf854f0fSBob Wilson 
476bf854f0fSBob Wilson     /// The map of statements to count values.
4773586be72SDuncan P. N. Exon Smith     llvm::DenseMap<const Stmt *, uint64_t> &CountMap;
478bf854f0fSBob Wilson 
479bf854f0fSBob Wilson     /// BreakContinueStack - Keep counts of breaks and continues inside loops.
480bf854f0fSBob Wilson     struct BreakContinue {
481bf854f0fSBob Wilson       uint64_t BreakCount;
482bf854f0fSBob Wilson       uint64_t ContinueCount;
483bf854f0fSBob Wilson       BreakContinue() : BreakCount(0), ContinueCount(0) {}
484bf854f0fSBob Wilson     };
485bf854f0fSBob Wilson     SmallVector<BreakContinue, 8> BreakContinueStack;
486bf854f0fSBob Wilson 
4873586be72SDuncan P. N. Exon Smith     ComputeRegionCounts(llvm::DenseMap<const Stmt *, uint64_t> &CountMap,
4883586be72SDuncan P. N. Exon Smith                         CodeGenPGO &PGO)
4893586be72SDuncan P. N. Exon Smith         : PGO(PGO), RecordNextStmtCount(false), CountMap(CountMap) {}
490bf854f0fSBob Wilson 
491bf854f0fSBob Wilson     void RecordStmtCount(const Stmt *S) {
492bf854f0fSBob Wilson       if (RecordNextStmtCount) {
4933586be72SDuncan P. N. Exon Smith         CountMap[S] = PGO.getCurrentRegionCount();
494bf854f0fSBob Wilson         RecordNextStmtCount = false;
495bf854f0fSBob Wilson       }
496bf854f0fSBob Wilson     }
497bf854f0fSBob Wilson 
498bf854f0fSBob Wilson     void VisitStmt(const Stmt *S) {
499bf854f0fSBob Wilson       RecordStmtCount(S);
500bf854f0fSBob Wilson       for (Stmt::const_child_range I = S->children(); I; ++I) {
501bf854f0fSBob Wilson         if (*I)
502bf854f0fSBob Wilson          this->Visit(*I);
503bf854f0fSBob Wilson       }
504bf854f0fSBob Wilson     }
505bf854f0fSBob Wilson 
506bf854f0fSBob Wilson     void VisitFunctionDecl(const FunctionDecl *S) {
507bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S->getBody());
508bf854f0fSBob Wilson       Cnt.beginRegion();
5093586be72SDuncan P. N. Exon Smith       CountMap[S->getBody()] = PGO.getCurrentRegionCount();
510bf854f0fSBob Wilson       Visit(S->getBody());
511bf854f0fSBob Wilson     }
512bf854f0fSBob Wilson 
5135ec8fe19SBob Wilson     void VisitObjCMethodDecl(const ObjCMethodDecl *S) {
5145ec8fe19SBob Wilson       RegionCounter Cnt(PGO, S->getBody());
5155ec8fe19SBob Wilson       Cnt.beginRegion();
5163586be72SDuncan P. N. Exon Smith       CountMap[S->getBody()] = PGO.getCurrentRegionCount();
5175ec8fe19SBob Wilson       Visit(S->getBody());
5185ec8fe19SBob Wilson     }
5195ec8fe19SBob Wilson 
520c845c00aSBob Wilson     void VisitBlockDecl(const BlockDecl *S) {
521c845c00aSBob Wilson       RegionCounter Cnt(PGO, S->getBody());
522c845c00aSBob Wilson       Cnt.beginRegion();
5233586be72SDuncan P. N. Exon Smith       CountMap[S->getBody()] = PGO.getCurrentRegionCount();
524c845c00aSBob Wilson       Visit(S->getBody());
525c845c00aSBob Wilson     }
526c845c00aSBob Wilson 
527bf854f0fSBob Wilson     void VisitReturnStmt(const ReturnStmt *S) {
528bf854f0fSBob Wilson       RecordStmtCount(S);
529bf854f0fSBob Wilson       if (S->getRetValue())
530bf854f0fSBob Wilson         Visit(S->getRetValue());
531bf854f0fSBob Wilson       PGO.setCurrentRegionUnreachable();
532bf854f0fSBob Wilson       RecordNextStmtCount = true;
533bf854f0fSBob Wilson     }
534bf854f0fSBob Wilson 
535bf854f0fSBob Wilson     void VisitGotoStmt(const GotoStmt *S) {
536bf854f0fSBob Wilson       RecordStmtCount(S);
537bf854f0fSBob Wilson       PGO.setCurrentRegionUnreachable();
538bf854f0fSBob Wilson       RecordNextStmtCount = true;
539bf854f0fSBob Wilson     }
540bf854f0fSBob Wilson 
541bf854f0fSBob Wilson     void VisitLabelStmt(const LabelStmt *S) {
542bf854f0fSBob Wilson       RecordNextStmtCount = false;
543bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
544bf854f0fSBob Wilson       Cnt.beginRegion();
5453586be72SDuncan P. N. Exon Smith       CountMap[S] = PGO.getCurrentRegionCount();
546bf854f0fSBob Wilson       Visit(S->getSubStmt());
547bf854f0fSBob Wilson     }
548bf854f0fSBob Wilson 
549bf854f0fSBob Wilson     void VisitBreakStmt(const BreakStmt *S) {
550bf854f0fSBob Wilson       RecordStmtCount(S);
551bf854f0fSBob Wilson       assert(!BreakContinueStack.empty() && "break not in a loop or switch!");
552bf854f0fSBob Wilson       BreakContinueStack.back().BreakCount += PGO.getCurrentRegionCount();
553bf854f0fSBob Wilson       PGO.setCurrentRegionUnreachable();
554bf854f0fSBob Wilson       RecordNextStmtCount = true;
555bf854f0fSBob Wilson     }
556bf854f0fSBob Wilson 
557bf854f0fSBob Wilson     void VisitContinueStmt(const ContinueStmt *S) {
558bf854f0fSBob Wilson       RecordStmtCount(S);
559bf854f0fSBob Wilson       assert(!BreakContinueStack.empty() && "continue stmt not in a loop!");
560bf854f0fSBob Wilson       BreakContinueStack.back().ContinueCount += PGO.getCurrentRegionCount();
561bf854f0fSBob Wilson       PGO.setCurrentRegionUnreachable();
562bf854f0fSBob Wilson       RecordNextStmtCount = true;
563bf854f0fSBob Wilson     }
564bf854f0fSBob Wilson 
565bf854f0fSBob Wilson     void VisitWhileStmt(const WhileStmt *S) {
566bf854f0fSBob Wilson       RecordStmtCount(S);
567bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
568bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
569bf854f0fSBob Wilson       // Visit the body region first so the break/continue adjustments can be
570bf854f0fSBob Wilson       // included when visiting the condition.
571bf854f0fSBob Wilson       Cnt.beginRegion();
5723586be72SDuncan P. N. Exon Smith       CountMap[S->getBody()] = PGO.getCurrentRegionCount();
573bf854f0fSBob Wilson       Visit(S->getBody());
574bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
575bf854f0fSBob Wilson 
576bf854f0fSBob Wilson       // ...then go back and propagate counts through the condition. The count
577bf854f0fSBob Wilson       // at the start of the condition is the sum of the incoming edges,
578bf854f0fSBob Wilson       // the backedge from the end of the loop body, and the edges from
579bf854f0fSBob Wilson       // continue statements.
580bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
581bf854f0fSBob Wilson       Cnt.setCurrentRegionCount(Cnt.getParentCount() +
582bf854f0fSBob Wilson                                 Cnt.getAdjustedCount() + BC.ContinueCount);
5833586be72SDuncan P. N. Exon Smith       CountMap[S->getCond()] = PGO.getCurrentRegionCount();
584bf854f0fSBob Wilson       Visit(S->getCond());
585bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
586bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount);
587bf854f0fSBob Wilson       RecordNextStmtCount = true;
588bf854f0fSBob Wilson     }
589bf854f0fSBob Wilson 
590bf854f0fSBob Wilson     void VisitDoStmt(const DoStmt *S) {
591bf854f0fSBob Wilson       RecordStmtCount(S);
592bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
593bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
594bf854f0fSBob Wilson       Cnt.beginRegion(/*AddIncomingFallThrough=*/true);
5953586be72SDuncan P. N. Exon Smith       CountMap[S->getBody()] = PGO.getCurrentRegionCount();
596bf854f0fSBob Wilson       Visit(S->getBody());
597bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
598bf854f0fSBob Wilson 
599bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
600bf854f0fSBob Wilson       // The count at the start of the condition is equal to the count at the
601bf854f0fSBob Wilson       // end of the body. The adjusted count does not include either the
602bf854f0fSBob Wilson       // fall-through count coming into the loop or the continue count, so add
603bf854f0fSBob Wilson       // both of those separately. This is coincidentally the same equation as
604bf854f0fSBob Wilson       // with while loops but for different reasons.
605bf854f0fSBob Wilson       Cnt.setCurrentRegionCount(Cnt.getParentCount() +
606bf854f0fSBob Wilson                                 Cnt.getAdjustedCount() + BC.ContinueCount);
6073586be72SDuncan P. N. Exon Smith       CountMap[S->getCond()] = PGO.getCurrentRegionCount();
608bf854f0fSBob Wilson       Visit(S->getCond());
609bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
610bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount);
611bf854f0fSBob Wilson       RecordNextStmtCount = true;
612bf854f0fSBob Wilson     }
613bf854f0fSBob Wilson 
614bf854f0fSBob Wilson     void VisitForStmt(const ForStmt *S) {
615bf854f0fSBob Wilson       RecordStmtCount(S);
616bf854f0fSBob Wilson       if (S->getInit())
617bf854f0fSBob Wilson         Visit(S->getInit());
618bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
619bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
620bf854f0fSBob Wilson       // Visit the body region first. (This is basically the same as a while
621bf854f0fSBob Wilson       // loop; see further comments in VisitWhileStmt.)
622bf854f0fSBob Wilson       Cnt.beginRegion();
6233586be72SDuncan P. N. Exon Smith       CountMap[S->getBody()] = PGO.getCurrentRegionCount();
624bf854f0fSBob Wilson       Visit(S->getBody());
625bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
626bf854f0fSBob Wilson 
627bf854f0fSBob Wilson       // The increment is essentially part of the body but it needs to include
628bf854f0fSBob Wilson       // the count for all the continue statements.
629bf854f0fSBob Wilson       if (S->getInc()) {
630bf854f0fSBob Wilson         Cnt.setCurrentRegionCount(PGO.getCurrentRegionCount() +
631bf854f0fSBob Wilson                                   BreakContinueStack.back().ContinueCount);
6323586be72SDuncan P. N. Exon Smith         CountMap[S->getInc()] = PGO.getCurrentRegionCount();
633bf854f0fSBob Wilson         Visit(S->getInc());
634bf854f0fSBob Wilson         Cnt.adjustForControlFlow();
635bf854f0fSBob Wilson       }
636bf854f0fSBob Wilson 
637bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
638bf854f0fSBob Wilson 
639bf854f0fSBob Wilson       // ...then go back and propagate counts through the condition.
640bf854f0fSBob Wilson       if (S->getCond()) {
641bf854f0fSBob Wilson         Cnt.setCurrentRegionCount(Cnt.getParentCount() +
642bf854f0fSBob Wilson                                   Cnt.getAdjustedCount() +
643bf854f0fSBob Wilson                                   BC.ContinueCount);
6443586be72SDuncan P. N. Exon Smith         CountMap[S->getCond()] = PGO.getCurrentRegionCount();
645bf854f0fSBob Wilson         Visit(S->getCond());
646bf854f0fSBob Wilson         Cnt.adjustForControlFlow();
647bf854f0fSBob Wilson       }
648bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount);
649bf854f0fSBob Wilson       RecordNextStmtCount = true;
650bf854f0fSBob Wilson     }
651bf854f0fSBob Wilson 
652bf854f0fSBob Wilson     void VisitCXXForRangeStmt(const CXXForRangeStmt *S) {
653bf854f0fSBob Wilson       RecordStmtCount(S);
654bf854f0fSBob Wilson       Visit(S->getRangeStmt());
655bf854f0fSBob Wilson       Visit(S->getBeginEndStmt());
656bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
657bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
658bf854f0fSBob Wilson       // Visit the body region first. (This is basically the same as a while
659bf854f0fSBob Wilson       // loop; see further comments in VisitWhileStmt.)
660bf854f0fSBob Wilson       Cnt.beginRegion();
6613586be72SDuncan P. N. Exon Smith       CountMap[S->getLoopVarStmt()] = PGO.getCurrentRegionCount();
662bf854f0fSBob Wilson       Visit(S->getLoopVarStmt());
663bf854f0fSBob Wilson       Visit(S->getBody());
664bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
665bf854f0fSBob Wilson 
666bf854f0fSBob Wilson       // The increment is essentially part of the body but it needs to include
667bf854f0fSBob Wilson       // the count for all the continue statements.
668bf854f0fSBob Wilson       Cnt.setCurrentRegionCount(PGO.getCurrentRegionCount() +
669bf854f0fSBob Wilson                                 BreakContinueStack.back().ContinueCount);
6703586be72SDuncan P. N. Exon Smith       CountMap[S->getInc()] = PGO.getCurrentRegionCount();
671bf854f0fSBob Wilson       Visit(S->getInc());
672bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
673bf854f0fSBob Wilson 
674bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
675bf854f0fSBob Wilson 
676bf854f0fSBob Wilson       // ...then go back and propagate counts through the condition.
677bf854f0fSBob Wilson       Cnt.setCurrentRegionCount(Cnt.getParentCount() +
678bf854f0fSBob Wilson                                 Cnt.getAdjustedCount() +
679bf854f0fSBob Wilson                                 BC.ContinueCount);
6803586be72SDuncan P. N. Exon Smith       CountMap[S->getCond()] = PGO.getCurrentRegionCount();
681bf854f0fSBob Wilson       Visit(S->getCond());
682bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
683bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount);
684bf854f0fSBob Wilson       RecordNextStmtCount = true;
685bf854f0fSBob Wilson     }
686bf854f0fSBob Wilson 
687bf854f0fSBob Wilson     void VisitObjCForCollectionStmt(const ObjCForCollectionStmt *S) {
688bf854f0fSBob Wilson       RecordStmtCount(S);
689bf854f0fSBob Wilson       Visit(S->getElement());
690bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
691bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
692bf854f0fSBob Wilson       Cnt.beginRegion();
6933586be72SDuncan P. N. Exon Smith       CountMap[S->getBody()] = PGO.getCurrentRegionCount();
694bf854f0fSBob Wilson       Visit(S->getBody());
695bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
696bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
697bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(BC.BreakCount + BC.ContinueCount);
698bf854f0fSBob Wilson       RecordNextStmtCount = true;
699bf854f0fSBob Wilson     }
700bf854f0fSBob Wilson 
701bf854f0fSBob Wilson     void VisitSwitchStmt(const SwitchStmt *S) {
702bf854f0fSBob Wilson       RecordStmtCount(S);
703bf854f0fSBob Wilson       Visit(S->getCond());
704bf854f0fSBob Wilson       PGO.setCurrentRegionUnreachable();
705bf854f0fSBob Wilson       BreakContinueStack.push_back(BreakContinue());
706bf854f0fSBob Wilson       Visit(S->getBody());
707bf854f0fSBob Wilson       // If the switch is inside a loop, add the continue counts.
708bf854f0fSBob Wilson       BreakContinue BC = BreakContinueStack.pop_back_val();
709bf854f0fSBob Wilson       if (!BreakContinueStack.empty())
710bf854f0fSBob Wilson         BreakContinueStack.back().ContinueCount += BC.ContinueCount;
711bf854f0fSBob Wilson       RegionCounter ExitCnt(PGO, S);
712bf854f0fSBob Wilson       ExitCnt.beginRegion();
713bf854f0fSBob Wilson       RecordNextStmtCount = true;
714bf854f0fSBob Wilson     }
715bf854f0fSBob Wilson 
716bf854f0fSBob Wilson     void VisitCaseStmt(const CaseStmt *S) {
717bf854f0fSBob Wilson       RecordNextStmtCount = false;
718bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
719bf854f0fSBob Wilson       Cnt.beginRegion(/*AddIncomingFallThrough=*/true);
7203586be72SDuncan P. N. Exon Smith       CountMap[S] = Cnt.getCount();
721bf854f0fSBob Wilson       RecordNextStmtCount = true;
722bf854f0fSBob Wilson       Visit(S->getSubStmt());
723bf854f0fSBob Wilson     }
724bf854f0fSBob Wilson 
725bf854f0fSBob Wilson     void VisitDefaultStmt(const DefaultStmt *S) {
726bf854f0fSBob Wilson       RecordNextStmtCount = false;
727bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
728bf854f0fSBob Wilson       Cnt.beginRegion(/*AddIncomingFallThrough=*/true);
7293586be72SDuncan P. N. Exon Smith       CountMap[S] = Cnt.getCount();
730bf854f0fSBob Wilson       RecordNextStmtCount = true;
731bf854f0fSBob Wilson       Visit(S->getSubStmt());
732bf854f0fSBob Wilson     }
733bf854f0fSBob Wilson 
734bf854f0fSBob Wilson     void VisitIfStmt(const IfStmt *S) {
735bf854f0fSBob Wilson       RecordStmtCount(S);
736bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
737bf854f0fSBob Wilson       Visit(S->getCond());
738bf854f0fSBob Wilson 
739bf854f0fSBob Wilson       Cnt.beginRegion();
7403586be72SDuncan P. N. Exon Smith       CountMap[S->getThen()] = PGO.getCurrentRegionCount();
741bf854f0fSBob Wilson       Visit(S->getThen());
742bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
743bf854f0fSBob Wilson 
744bf854f0fSBob Wilson       if (S->getElse()) {
745bf854f0fSBob Wilson         Cnt.beginElseRegion();
7463586be72SDuncan P. N. Exon Smith         CountMap[S->getElse()] = PGO.getCurrentRegionCount();
747bf854f0fSBob Wilson         Visit(S->getElse());
748bf854f0fSBob Wilson         Cnt.adjustForControlFlow();
749bf854f0fSBob Wilson       }
750bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(0);
751bf854f0fSBob Wilson       RecordNextStmtCount = true;
752bf854f0fSBob Wilson     }
753bf854f0fSBob Wilson 
754bf854f0fSBob Wilson     void VisitCXXTryStmt(const CXXTryStmt *S) {
755bf854f0fSBob Wilson       RecordStmtCount(S);
756bf854f0fSBob Wilson       Visit(S->getTryBlock());
757bf854f0fSBob Wilson       for (unsigned I = 0, E = S->getNumHandlers(); I < E; ++I)
758bf854f0fSBob Wilson         Visit(S->getHandler(I));
759bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
760bf854f0fSBob Wilson       Cnt.beginRegion();
761bf854f0fSBob Wilson       RecordNextStmtCount = true;
762bf854f0fSBob Wilson     }
763bf854f0fSBob Wilson 
764bf854f0fSBob Wilson     void VisitCXXCatchStmt(const CXXCatchStmt *S) {
765bf854f0fSBob Wilson       RecordNextStmtCount = false;
766bf854f0fSBob Wilson       RegionCounter Cnt(PGO, S);
767bf854f0fSBob Wilson       Cnt.beginRegion();
7683586be72SDuncan P. N. Exon Smith       CountMap[S] = PGO.getCurrentRegionCount();
769bf854f0fSBob Wilson       Visit(S->getHandlerBlock());
770bf854f0fSBob Wilson     }
771bf854f0fSBob Wilson 
772bf854f0fSBob Wilson     void VisitConditionalOperator(const ConditionalOperator *E) {
773bf854f0fSBob Wilson       RecordStmtCount(E);
774bf854f0fSBob Wilson       RegionCounter Cnt(PGO, E);
775bf854f0fSBob Wilson       Visit(E->getCond());
776bf854f0fSBob Wilson 
777bf854f0fSBob Wilson       Cnt.beginRegion();
7783586be72SDuncan P. N. Exon Smith       CountMap[E->getTrueExpr()] = PGO.getCurrentRegionCount();
779bf854f0fSBob Wilson       Visit(E->getTrueExpr());
780bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
781bf854f0fSBob Wilson 
782bf854f0fSBob Wilson       Cnt.beginElseRegion();
7833586be72SDuncan P. N. Exon Smith       CountMap[E->getFalseExpr()] = PGO.getCurrentRegionCount();
784bf854f0fSBob Wilson       Visit(E->getFalseExpr());
785bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
786bf854f0fSBob Wilson 
787bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(0);
788bf854f0fSBob Wilson       RecordNextStmtCount = true;
789bf854f0fSBob Wilson     }
790bf854f0fSBob Wilson 
791bf854f0fSBob Wilson     void VisitBinLAnd(const BinaryOperator *E) {
792bf854f0fSBob Wilson       RecordStmtCount(E);
793bf854f0fSBob Wilson       RegionCounter Cnt(PGO, E);
794bf854f0fSBob Wilson       Visit(E->getLHS());
795bf854f0fSBob Wilson       Cnt.beginRegion();
7963586be72SDuncan P. N. Exon Smith       CountMap[E->getRHS()] = PGO.getCurrentRegionCount();
797bf854f0fSBob Wilson       Visit(E->getRHS());
798bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
799bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(0);
800bf854f0fSBob Wilson       RecordNextStmtCount = true;
801bf854f0fSBob Wilson     }
802bf854f0fSBob Wilson 
803bf854f0fSBob Wilson     void VisitBinLOr(const BinaryOperator *E) {
804bf854f0fSBob Wilson       RecordStmtCount(E);
805bf854f0fSBob Wilson       RegionCounter Cnt(PGO, E);
806bf854f0fSBob Wilson       Visit(E->getLHS());
807bf854f0fSBob Wilson       Cnt.beginRegion();
8083586be72SDuncan P. N. Exon Smith       CountMap[E->getRHS()] = PGO.getCurrentRegionCount();
809bf854f0fSBob Wilson       Visit(E->getRHS());
810bf854f0fSBob Wilson       Cnt.adjustForControlFlow();
811bf854f0fSBob Wilson       Cnt.applyAdjustmentsToRegion(0);
812bf854f0fSBob Wilson       RecordNextStmtCount = true;
813bf854f0fSBob Wilson     }
814bf854f0fSBob Wilson   };
815ef512b99SJustin Bogner }
816ef512b99SJustin Bogner 
817*d971cd1bSDuncan P. N. Exon Smith static void emitRuntimeHook(CodeGenModule &CGM) {
818*d971cd1bSDuncan P. N. Exon Smith   constexpr const char *RuntimeVarName = "__llvm_profile_runtime";
819*d971cd1bSDuncan P. N. Exon Smith   constexpr const char *RuntimeUserName = "__llvm_profile_runtime_user";
820*d971cd1bSDuncan P. N. Exon Smith   if (CGM.getModule().getGlobalVariable(RuntimeVarName))
821*d971cd1bSDuncan P. N. Exon Smith     return;
822*d971cd1bSDuncan P. N. Exon Smith 
823*d971cd1bSDuncan P. N. Exon Smith   // Declare the runtime hook.
824*d971cd1bSDuncan P. N. Exon Smith   llvm::LLVMContext &Ctx = CGM.getLLVMContext();
825*d971cd1bSDuncan P. N. Exon Smith   auto *Int32Ty = llvm::Type::getInt32Ty(Ctx);
826*d971cd1bSDuncan P. N. Exon Smith   auto *Var = new llvm::GlobalVariable(CGM.getModule(), Int32Ty, false,
827*d971cd1bSDuncan P. N. Exon Smith                                        llvm::GlobalValue::ExternalLinkage,
828*d971cd1bSDuncan P. N. Exon Smith                                        nullptr, RuntimeVarName);
829*d971cd1bSDuncan P. N. Exon Smith 
830*d971cd1bSDuncan P. N. Exon Smith   // Make a function that uses it.
831*d971cd1bSDuncan P. N. Exon Smith   auto *User = llvm::Function::Create(llvm::FunctionType::get(Int32Ty, false),
832*d971cd1bSDuncan P. N. Exon Smith                                       llvm::GlobalValue::LinkOnceODRLinkage,
833*d971cd1bSDuncan P. N. Exon Smith                                       RuntimeUserName, &CGM.getModule());
834*d971cd1bSDuncan P. N. Exon Smith   User->addFnAttr(llvm::Attribute::NoInline);
835*d971cd1bSDuncan P. N. Exon Smith   if (CGM.getCodeGenOpts().DisableRedZone)
836*d971cd1bSDuncan P. N. Exon Smith     User->addFnAttr(llvm::Attribute::NoRedZone);
837*d971cd1bSDuncan P. N. Exon Smith   CGBuilderTy Builder(llvm::BasicBlock::Create(CGM.getLLVMContext(), "", User));
838*d971cd1bSDuncan P. N. Exon Smith   auto *Load = Builder.CreateLoad(Var);
839*d971cd1bSDuncan P. N. Exon Smith   Builder.CreateRet(Load);
840*d971cd1bSDuncan P. N. Exon Smith 
841*d971cd1bSDuncan P. N. Exon Smith   // Create a use of the function.  Now the definition of the runtime variable
842*d971cd1bSDuncan P. N. Exon Smith   // should get pulled in, along with any static initializears.
843*d971cd1bSDuncan P. N. Exon Smith   CGM.addUsedGlobal(User);
844*d971cd1bSDuncan P. N. Exon Smith }
845*d971cd1bSDuncan P. N. Exon Smith 
846da1ebedeSBob Wilson void CodeGenPGO::assignRegionCounters(const Decl *D, llvm::Function *Fn) {
847ef512b99SJustin Bogner   bool InstrumentRegions = CGM.getCodeGenOpts().ProfileInstrGenerate;
848d66a17d0SJustin Bogner   PGOProfileData *PGOData = CGM.getPGOData();
849d66a17d0SJustin Bogner   if (!InstrumentRegions && !PGOData)
850ef512b99SJustin Bogner     return;
851ef512b99SJustin Bogner   if (!D)
852ef512b99SJustin Bogner     return;
853da1ebedeSBob Wilson   setFuncName(Fn);
8547c41451bSDuncan P. N. Exon Smith 
8557c41451bSDuncan P. N. Exon Smith   // Set the linkage for variables based on the function linkage.  Usually, we
8567c41451bSDuncan P. N. Exon Smith   // want to match it, but available_externally and extern_weak both have the
8577c41451bSDuncan P. N. Exon Smith   // wrong semantics.
85873f78627SDuncan P. N. Exon Smith   VarLinkage = Fn->getLinkage();
8597c41451bSDuncan P. N. Exon Smith   switch (VarLinkage) {
8607c41451bSDuncan P. N. Exon Smith   case llvm::GlobalValue::ExternalWeakLinkage:
8617c41451bSDuncan P. N. Exon Smith     VarLinkage = llvm::GlobalValue::LinkOnceAnyLinkage;
8627c41451bSDuncan P. N. Exon Smith     break;
8637c41451bSDuncan P. N. Exon Smith   case llvm::GlobalValue::AvailableExternallyLinkage:
8647c41451bSDuncan P. N. Exon Smith     VarLinkage = llvm::GlobalValue::LinkOnceODRLinkage;
8657c41451bSDuncan P. N. Exon Smith     break;
8667c41451bSDuncan P. N. Exon Smith   default:
8677c41451bSDuncan P. N. Exon Smith     break;
8687c41451bSDuncan P. N. Exon Smith   }
8697c41451bSDuncan P. N. Exon Smith 
870ef512b99SJustin Bogner   mapRegionCounters(D);
871*d971cd1bSDuncan P. N. Exon Smith   if (InstrumentRegions) {
872*d971cd1bSDuncan P. N. Exon Smith     emitRuntimeHook(CGM);
873ef512b99SJustin Bogner     emitCounterVariables();
874*d971cd1bSDuncan P. N. Exon Smith   }
875d66a17d0SJustin Bogner   if (PGOData) {
876d66a17d0SJustin Bogner     loadRegionCounts(PGOData);
877bf854f0fSBob Wilson     computeRegionCounts(D);
878d66a17d0SJustin Bogner     applyFunctionAttributes(PGOData, Fn);
879bf854f0fSBob Wilson   }
880ef512b99SJustin Bogner }
881ef512b99SJustin Bogner 
882ef512b99SJustin Bogner void CodeGenPGO::mapRegionCounters(const Decl *D) {
8831b67cfd4SDuncan P. N. Exon Smith   RegionCounterMap.reset(new llvm::DenseMap<const Stmt *, unsigned>);
8843586be72SDuncan P. N. Exon Smith   MapRegionCounters Walker(*RegionCounterMap);
885ef512b99SJustin Bogner   if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(D))
886ef512b99SJustin Bogner     Walker.VisitFunctionDecl(FD);
8875ec8fe19SBob Wilson   else if (const ObjCMethodDecl *MD = dyn_cast_or_null<ObjCMethodDecl>(D))
8885ec8fe19SBob Wilson     Walker.VisitObjCMethodDecl(MD);
889c845c00aSBob Wilson   else if (const BlockDecl *BD = dyn_cast_or_null<BlockDecl>(D))
890c845c00aSBob Wilson     Walker.VisitBlockDecl(BD);
891ef512b99SJustin Bogner   NumRegionCounters = Walker.NextCounter;
892b4416f58SJustin Bogner   // FIXME: The number of counters isn't sufficient for the hash
893b4416f58SJustin Bogner   FunctionHash = NumRegionCounters;
894ef512b99SJustin Bogner }
895ef512b99SJustin Bogner 
896bf854f0fSBob Wilson void CodeGenPGO::computeRegionCounts(const Decl *D) {
8971b67cfd4SDuncan P. N. Exon Smith   StmtCountMap.reset(new llvm::DenseMap<const Stmt *, uint64_t>);
8983586be72SDuncan P. N. Exon Smith   ComputeRegionCounts Walker(*StmtCountMap, *this);
899bf854f0fSBob Wilson   if (const FunctionDecl *FD = dyn_cast_or_null<FunctionDecl>(D))
900bf854f0fSBob Wilson     Walker.VisitFunctionDecl(FD);
9015ec8fe19SBob Wilson   else if (const ObjCMethodDecl *MD = dyn_cast_or_null<ObjCMethodDecl>(D))
9025ec8fe19SBob Wilson     Walker.VisitObjCMethodDecl(MD);
903c845c00aSBob Wilson   else if (const BlockDecl *BD = dyn_cast_or_null<BlockDecl>(D))
904c845c00aSBob Wilson     Walker.VisitBlockDecl(BD);
905bf854f0fSBob Wilson }
906bf854f0fSBob Wilson 
907d66a17d0SJustin Bogner void CodeGenPGO::applyFunctionAttributes(PGOProfileData *PGOData,
9084c9c45c0SJustin Bogner                                          llvm::Function *Fn) {
9094c9c45c0SJustin Bogner   if (!haveRegionCounts())
9104c9c45c0SJustin Bogner     return;
9114c9c45c0SJustin Bogner 
912d66a17d0SJustin Bogner   uint64_t MaxFunctionCount = PGOData->getMaximumFunctionCount();
9134c9c45c0SJustin Bogner   uint64_t FunctionCount = getRegionCount(0);
9144c9c45c0SJustin Bogner   if (FunctionCount >= (uint64_t)(0.3 * (double)MaxFunctionCount))
9154c9c45c0SJustin Bogner     // Turn on InlineHint attribute for hot functions.
9164c9c45c0SJustin Bogner     // FIXME: 30% is from preliminary tuning on SPEC, it may not be optimal.
9174c9c45c0SJustin Bogner     Fn->addFnAttr(llvm::Attribute::InlineHint);
9184c9c45c0SJustin Bogner   else if (FunctionCount <= (uint64_t)(0.01 * (double)MaxFunctionCount))
9194c9c45c0SJustin Bogner     // Turn on Cold attribute for cold functions.
9204c9c45c0SJustin Bogner     // FIXME: 1% is from preliminary tuning on SPEC, it may not be optimal.
9214c9c45c0SJustin Bogner     Fn->addFnAttr(llvm::Attribute::Cold);
9224c9c45c0SJustin Bogner }
9234c9c45c0SJustin Bogner 
924ef512b99SJustin Bogner void CodeGenPGO::emitCounterVariables() {
925ef512b99SJustin Bogner   llvm::LLVMContext &Ctx = CGM.getLLVMContext();
926ef512b99SJustin Bogner   llvm::ArrayType *CounterTy = llvm::ArrayType::get(llvm::Type::getInt64Ty(Ctx),
927ef512b99SJustin Bogner                                                     NumRegionCounters);
928ef512b99SJustin Bogner   RegionCounters =
92973f78627SDuncan P. N. Exon Smith     new llvm::GlobalVariable(CGM.getModule(), CounterTy, false, VarLinkage,
930ef512b99SJustin Bogner                              llvm::Constant::getNullValue(CounterTy),
9312fe531cbSDuncan P. N. Exon Smith                              getFuncVarName("counters"));
9322fe531cbSDuncan P. N. Exon Smith   RegionCounters->setAlignment(8);
9332fe531cbSDuncan P. N. Exon Smith   RegionCounters->setSection(getCountersSection(CGM));
934ef512b99SJustin Bogner }
935ef512b99SJustin Bogner 
936ef512b99SJustin Bogner void CodeGenPGO::emitCounterIncrement(CGBuilderTy &Builder, unsigned Counter) {
937749ebc7fSBob Wilson   if (!RegionCounters)
938ef512b99SJustin Bogner     return;
939ef512b99SJustin Bogner   llvm::Value *Addr =
940ef512b99SJustin Bogner     Builder.CreateConstInBoundsGEP2_64(RegionCounters, 0, Counter);
941ef512b99SJustin Bogner   llvm::Value *Count = Builder.CreateLoad(Addr, "pgocount");
942ef512b99SJustin Bogner   Count = Builder.CreateAdd(Count, Builder.getInt64(1));
943ef512b99SJustin Bogner   Builder.CreateStore(Count, Addr);
944ef512b99SJustin Bogner }
945ef512b99SJustin Bogner 
946d66a17d0SJustin Bogner void CodeGenPGO::loadRegionCounts(PGOProfileData *PGOData) {
947ef512b99SJustin Bogner   // For now, ignore the counts from the PGO data file only if the number of
948ef512b99SJustin Bogner   // counters does not match. This could be tightened down in the future to
949ef512b99SJustin Bogner   // ignore counts when the input changes in various ways, e.g., by comparing a
950ef512b99SJustin Bogner   // hash value based on some characteristics of the input.
9511b67cfd4SDuncan P. N. Exon Smith   RegionCounts.reset(new std::vector<uint64_t>);
952b4416f58SJustin Bogner   uint64_t Hash;
953b4416f58SJustin Bogner   if (PGOData->getFunctionCounts(getFuncName(), Hash, *RegionCounts) ||
9541b67cfd4SDuncan P. N. Exon Smith       Hash != FunctionHash || RegionCounts->size() != NumRegionCounters)
9551b67cfd4SDuncan P. N. Exon Smith     RegionCounts.reset();
956ef512b99SJustin Bogner }
957ef512b99SJustin Bogner 
958ef512b99SJustin Bogner void CodeGenPGO::destroyRegionCounters() {
9591b67cfd4SDuncan P. N. Exon Smith   RegionCounterMap.reset();
9601b67cfd4SDuncan P. N. Exon Smith   StmtCountMap.reset();
9611b67cfd4SDuncan P. N. Exon Smith   RegionCounts.reset();
962ef512b99SJustin Bogner }
963ef512b99SJustin Bogner 
96438402dc9SDuncan P. N. Exon Smith /// \brief Calculate what to divide by to scale weights.
96538402dc9SDuncan P. N. Exon Smith ///
96638402dc9SDuncan P. N. Exon Smith /// Given the maximum weight, calculate a divisor that will scale all the
96738402dc9SDuncan P. N. Exon Smith /// weights to strictly less than UINT32_MAX.
96838402dc9SDuncan P. N. Exon Smith static uint64_t calculateWeightScale(uint64_t MaxWeight) {
96938402dc9SDuncan P. N. Exon Smith   return MaxWeight < UINT32_MAX ? 1 : MaxWeight / UINT32_MAX + 1;
97038402dc9SDuncan P. N. Exon Smith }
97138402dc9SDuncan P. N. Exon Smith 
97238402dc9SDuncan P. N. Exon Smith /// \brief Scale an individual branch weight (and add 1).
97338402dc9SDuncan P. N. Exon Smith ///
97438402dc9SDuncan P. N. Exon Smith /// Scale a 64-bit weight down to 32-bits using \c Scale.
97538402dc9SDuncan P. N. Exon Smith ///
97638402dc9SDuncan P. N. Exon Smith /// According to Laplace's Rule of Succession, it is better to compute the
97738402dc9SDuncan P. N. Exon Smith /// weight based on the count plus 1, so universally add 1 to the value.
97838402dc9SDuncan P. N. Exon Smith ///
97938402dc9SDuncan P. N. Exon Smith /// \pre \c Scale was calculated by \a calculateWeightScale() with a weight no
98038402dc9SDuncan P. N. Exon Smith /// greater than \c Weight.
98138402dc9SDuncan P. N. Exon Smith static uint32_t scaleBranchWeight(uint64_t Weight, uint64_t Scale) {
98238402dc9SDuncan P. N. Exon Smith   assert(Scale && "scale by 0?");
98338402dc9SDuncan P. N. Exon Smith   uint64_t Scaled = Weight / Scale + 1;
98438402dc9SDuncan P. N. Exon Smith   assert(Scaled <= UINT32_MAX && "overflow 32-bits");
98538402dc9SDuncan P. N. Exon Smith   return Scaled;
98638402dc9SDuncan P. N. Exon Smith }
98738402dc9SDuncan P. N. Exon Smith 
988ef512b99SJustin Bogner llvm::MDNode *CodeGenPGO::createBranchWeights(uint64_t TrueCount,
989ef512b99SJustin Bogner                                               uint64_t FalseCount) {
99038402dc9SDuncan P. N. Exon Smith   // Check for empty weights.
991ef512b99SJustin Bogner   if (!TrueCount && !FalseCount)
992a5f804a7SDuncan P. N. Exon Smith     return nullptr;
993ef512b99SJustin Bogner 
99438402dc9SDuncan P. N. Exon Smith   // Calculate how to scale down to 32-bits.
99538402dc9SDuncan P. N. Exon Smith   uint64_t Scale = calculateWeightScale(std::max(TrueCount, FalseCount));
99638402dc9SDuncan P. N. Exon Smith 
997ef512b99SJustin Bogner   llvm::MDBuilder MDHelper(CGM.getLLVMContext());
99838402dc9SDuncan P. N. Exon Smith   return MDHelper.createBranchWeights(scaleBranchWeight(TrueCount, Scale),
99938402dc9SDuncan P. N. Exon Smith                                       scaleBranchWeight(FalseCount, Scale));
1000ef512b99SJustin Bogner }
1001ef512b99SJustin Bogner 
100295a27b0eSBob Wilson llvm::MDNode *CodeGenPGO::createBranchWeights(ArrayRef<uint64_t> Weights) {
100338402dc9SDuncan P. N. Exon Smith   // We need at least two elements to create meaningful weights.
100438402dc9SDuncan P. N. Exon Smith   if (Weights.size() < 2)
1005a5f804a7SDuncan P. N. Exon Smith     return nullptr;
100638402dc9SDuncan P. N. Exon Smith 
100738402dc9SDuncan P. N. Exon Smith   // Calculate how to scale down to 32-bits.
100838402dc9SDuncan P. N. Exon Smith   uint64_t Scale = calculateWeightScale(*std::max_element(Weights.begin(),
100938402dc9SDuncan P. N. Exon Smith                                                           Weights.end()));
101038402dc9SDuncan P. N. Exon Smith 
1011ef512b99SJustin Bogner   SmallVector<uint32_t, 16> ScaledWeights;
1012ef512b99SJustin Bogner   ScaledWeights.reserve(Weights.size());
101338402dc9SDuncan P. N. Exon Smith   for (uint64_t W : Weights)
101438402dc9SDuncan P. N. Exon Smith     ScaledWeights.push_back(scaleBranchWeight(W, Scale));
101538402dc9SDuncan P. N. Exon Smith 
101638402dc9SDuncan P. N. Exon Smith   llvm::MDBuilder MDHelper(CGM.getLLVMContext());
1017ef512b99SJustin Bogner   return MDHelper.createBranchWeights(ScaledWeights);
1018ef512b99SJustin Bogner }
1019bf854f0fSBob Wilson 
1020bf854f0fSBob Wilson llvm::MDNode *CodeGenPGO::createLoopWeights(const Stmt *Cond,
1021bf854f0fSBob Wilson                                             RegionCounter &Cnt) {
1022bf854f0fSBob Wilson   if (!haveRegionCounts())
1023a5f804a7SDuncan P. N. Exon Smith     return nullptr;
1024bf854f0fSBob Wilson   uint64_t LoopCount = Cnt.getCount();
1025bf854f0fSBob Wilson   uint64_t CondCount = 0;
1026bf854f0fSBob Wilson   bool Found = getStmtCount(Cond, CondCount);
1027bf854f0fSBob Wilson   assert(Found && "missing expected loop condition count");
1028bf854f0fSBob Wilson   (void)Found;
1029bf854f0fSBob Wilson   if (CondCount == 0)
1030a5f804a7SDuncan P. N. Exon Smith     return nullptr;
1031bf854f0fSBob Wilson   return createBranchWeights(LoopCount,
1032bf854f0fSBob Wilson                              std::max(CondCount, LoopCount) - LoopCount);
1033bf854f0fSBob Wilson }
1034