1 //===-- InstrProfiling.cpp - Frontend instrumentation based profiling -----===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This pass lowers instrprof_* intrinsics emitted by a frontend for profiling.
11 // It also builds the data structures and initialization code needed for
12 // updating execution counts and emitting the profile at runtime.
13 //
14 //===----------------------------------------------------------------------===//
15 
16 #include "llvm/ADT/Triple.h"
17 #include "llvm/IR/IRBuilder.h"
18 #include "llvm/IR/IntrinsicInst.h"
19 #include "llvm/IR/Module.h"
20 #include "llvm/ProfileData/InstrProf.h"
21 #include "llvm/Transforms/InstrProfiling.h"
22 #include "llvm/Transforms/Utils/ModuleUtils.h"
23 
24 using namespace llvm;
25 
26 #define DEBUG_TYPE "instrprof"
27 
28 namespace {
29 
30 cl::opt<bool> DoNameCompression("enable-name-compression",
31                                 cl::desc("Enable name string compression"),
32                                 cl::init(true));
33 
34 class InstrProfilingLegacyPass : public ModulePass {
35   InstrProfiling InstrProf;
36 
37 public:
38   static char ID;
39   InstrProfilingLegacyPass() : ModulePass(ID), InstrProf() {}
40   InstrProfilingLegacyPass(const InstrProfOptions &Options)
41       : ModulePass(ID), InstrProf(Options) {}
42   const char *getPassName() const override {
43     return "Frontend instrumentation-based coverage lowering";
44   }
45 
46   bool runOnModule(Module &M) override { return InstrProf.run(M); }
47 
48   void getAnalysisUsage(AnalysisUsage &AU) const override {
49     AU.setPreservesCFG();
50   }
51 };
52 
53 } // anonymous namespace
54 
55 PreservedAnalyses InstrProfiling::run(Module &M, AnalysisManager<Module> &AM) {
56   if (!run(M))
57     return PreservedAnalyses::all();
58 
59   return PreservedAnalyses::none();
60 }
61 
62 char InstrProfilingLegacyPass::ID = 0;
63 INITIALIZE_PASS(InstrProfilingLegacyPass, "instrprof",
64                 "Frontend instrumentation-based coverage lowering.", false,
65                 false)
66 
67 ModulePass *llvm::createInstrProfilingLegacyPass(const InstrProfOptions &Options) {
68   return new InstrProfilingLegacyPass(Options);
69 }
70 
71 bool InstrProfiling::isMachO() const {
72   return Triple(M->getTargetTriple()).isOSBinFormatMachO();
73 }
74 
75 /// Get the section name for the counter variables.
76 StringRef InstrProfiling::getCountersSection() const {
77   return getInstrProfCountersSectionName(isMachO());
78 }
79 
80 /// Get the section name for the name variables.
81 StringRef InstrProfiling::getNameSection() const {
82   return getInstrProfNameSectionName(isMachO());
83 }
84 
85 /// Get the section name for the profile data variables.
86 StringRef InstrProfiling::getDataSection() const {
87   return getInstrProfDataSectionName(isMachO());
88 }
89 
90 /// Get the section name for the coverage mapping data.
91 StringRef InstrProfiling::getCoverageSection() const {
92   return getInstrProfCoverageSectionName(isMachO());
93 }
94 
95 bool InstrProfiling::run(Module &M) {
96   bool MadeChange = false;
97 
98   this->M = &M;
99   NamesVar = nullptr;
100   NamesSize = 0;
101   ProfileDataMap.clear();
102   UsedVars.clear();
103 
104   // We did not know how many value sites there would be inside
105   // the instrumented function. This is counting the number of instrumented
106   // target value sites to enter it as field in the profile data variable.
107   for (Function &F : M) {
108     InstrProfIncrementInst *FirstProfIncInst = nullptr;
109     for (BasicBlock &BB : F)
110       for (auto I = BB.begin(), E = BB.end(); I != E; I++)
111         if (auto *Ind = dyn_cast<InstrProfValueProfileInst>(I))
112           computeNumValueSiteCounts(Ind);
113         else if (FirstProfIncInst == nullptr)
114           FirstProfIncInst = dyn_cast<InstrProfIncrementInst>(I);
115 
116     // Value profiling intrinsic lowering requires per-function profile data
117     // variable to be created first.
118     if (FirstProfIncInst != nullptr)
119       static_cast<void>(getOrCreateRegionCounters(FirstProfIncInst));
120   }
121 
122   for (Function &F : M)
123     for (BasicBlock &BB : F)
124       for (auto I = BB.begin(), E = BB.end(); I != E;) {
125         auto Instr = I++;
126         if (auto *Inc = dyn_cast<InstrProfIncrementInst>(Instr)) {
127           lowerIncrement(Inc);
128           MadeChange = true;
129         } else if (auto *Ind = dyn_cast<InstrProfValueProfileInst>(Instr)) {
130           lowerValueProfileInst(Ind);
131           MadeChange = true;
132         }
133       }
134 
135   if (GlobalVariable *CoverageNamesVar =
136           M.getNamedGlobal(getCoverageUnusedNamesVarName())) {
137     lowerCoverageData(CoverageNamesVar);
138     MadeChange = true;
139   }
140 
141   if (!MadeChange)
142     return false;
143 
144   emitNameData();
145   emitRegistration();
146   emitRuntimeHook();
147   emitUses();
148   emitInitialization();
149   return true;
150 }
151 
152 static Constant *getOrInsertValueProfilingCall(Module &M) {
153   LLVMContext &Ctx = M.getContext();
154   auto *ReturnTy = Type::getVoidTy(M.getContext());
155   Type *ParamTypes[] = {
156 #define VALUE_PROF_FUNC_PARAM(ParamType, ParamName, ParamLLVMType) ParamLLVMType
157 #include "llvm/ProfileData/InstrProfData.inc"
158   };
159   auto *ValueProfilingCallTy =
160       FunctionType::get(ReturnTy, makeArrayRef(ParamTypes), false);
161   return M.getOrInsertFunction(getInstrProfValueProfFuncName(),
162                                ValueProfilingCallTy);
163 }
164 
165 void InstrProfiling::computeNumValueSiteCounts(InstrProfValueProfileInst *Ind) {
166 
167   GlobalVariable *Name = Ind->getName();
168   uint64_t ValueKind = Ind->getValueKind()->getZExtValue();
169   uint64_t Index = Ind->getIndex()->getZExtValue();
170   auto It = ProfileDataMap.find(Name);
171   if (It == ProfileDataMap.end()) {
172     PerFunctionProfileData PD;
173     PD.NumValueSites[ValueKind] = Index + 1;
174     ProfileDataMap[Name] = PD;
175   } else if (It->second.NumValueSites[ValueKind] <= Index)
176     It->second.NumValueSites[ValueKind] = Index + 1;
177 }
178 
179 void InstrProfiling::lowerValueProfileInst(InstrProfValueProfileInst *Ind) {
180 
181   GlobalVariable *Name = Ind->getName();
182   auto It = ProfileDataMap.find(Name);
183   assert(It != ProfileDataMap.end() && It->second.DataVar &&
184     "value profiling detected in function with no counter incerement");
185 
186   GlobalVariable *DataVar = It->second.DataVar;
187   uint64_t ValueKind = Ind->getValueKind()->getZExtValue();
188   uint64_t Index = Ind->getIndex()->getZExtValue();
189   for (uint32_t Kind = IPVK_First; Kind < ValueKind; ++Kind)
190     Index += It->second.NumValueSites[Kind];
191 
192   IRBuilder<> Builder(Ind);
193   Value* Args[3] = {Ind->getTargetValue(),
194       Builder.CreateBitCast(DataVar, Builder.getInt8PtrTy()),
195       Builder.getInt32(Index)};
196   Ind->replaceAllUsesWith(
197       Builder.CreateCall(getOrInsertValueProfilingCall(*M), Args));
198   Ind->eraseFromParent();
199 }
200 
201 void InstrProfiling::lowerIncrement(InstrProfIncrementInst *Inc) {
202   GlobalVariable *Counters = getOrCreateRegionCounters(Inc);
203 
204   IRBuilder<> Builder(Inc);
205   uint64_t Index = Inc->getIndex()->getZExtValue();
206   Value *Addr = Builder.CreateConstInBoundsGEP2_64(Counters, 0, Index);
207   Value *Count = Builder.CreateLoad(Addr, "pgocount");
208   Count = Builder.CreateAdd(Count, Builder.getInt64(1));
209   Inc->replaceAllUsesWith(Builder.CreateStore(Count, Addr));
210   Inc->eraseFromParent();
211 }
212 
213 void InstrProfiling::lowerCoverageData(GlobalVariable *CoverageNamesVar) {
214 
215   ConstantArray *Names =
216       cast<ConstantArray>(CoverageNamesVar->getInitializer());
217   for (unsigned I = 0, E = Names->getNumOperands(); I < E; ++I) {
218     Constant *NC = Names->getOperand(I);
219     Value *V = NC->stripPointerCasts();
220     assert(isa<GlobalVariable>(V) && "Missing reference to function name");
221     GlobalVariable *Name = cast<GlobalVariable>(V);
222 
223     Name->setLinkage(GlobalValue::PrivateLinkage);
224     ReferencedNames.push_back(Name);
225   }
226 }
227 
228 /// Get the name of a profiling variable for a particular function.
229 static std::string getVarName(InstrProfIncrementInst *Inc, StringRef Prefix) {
230   StringRef NamePrefix = getInstrProfNameVarPrefix();
231   StringRef Name = Inc->getName()->getName().substr(NamePrefix.size());
232   return (Prefix + Name).str();
233 }
234 
235 static inline bool shouldRecordFunctionAddr(Function *F) {
236   // Check the linkage
237   if (!F->hasLinkOnceLinkage() && !F->hasLocalLinkage() &&
238       !F->hasAvailableExternallyLinkage())
239     return true;
240   // Prohibit function address recording if the function is both internal and
241   // COMDAT. This avoids the profile data variable referencing internal symbols
242   // in COMDAT.
243   if (F->hasLocalLinkage() && F->hasComdat())
244     return false;
245   // Check uses of this function for other than direct calls or invokes to it.
246   return F->hasAddressTaken();
247 }
248 
249 static inline bool needsComdatForCounter(Function &F, Module &M) {
250 
251   if (F.hasComdat())
252     return true;
253 
254   Triple TT(M.getTargetTriple());
255   if (!TT.isOSBinFormatELF())
256     return false;
257 
258   // See createPGOFuncNameVar for more details. To avoid link errors, profile
259   // counters for function with available_externally linkage needs to be changed
260   // to linkonce linkage. On ELF based systems, this leads to weak symbols to be
261   // created. Without using comdat, duplicate entries won't be removed by the
262   // linker leading to increased data segement size and raw profile size. Even
263   // worse, since the referenced counter from profile per-function data object
264   // will be resolved to the common strong definition, the profile counts for
265   // available_externally functions will end up being duplicated in raw profile
266   // data. This can result in distorted profile as the counts of those dups
267   // will be accumulated by the profile merger.
268   GlobalValue::LinkageTypes Linkage = F.getLinkage();
269   if (Linkage != GlobalValue::ExternalWeakLinkage &&
270       Linkage != GlobalValue::AvailableExternallyLinkage)
271     return false;
272 
273   return true;
274 }
275 
276 static inline Comdat *getOrCreateProfileComdat(Module &M, Function &F,
277                                                InstrProfIncrementInst *Inc) {
278   if (!needsComdatForCounter(F, M))
279     return nullptr;
280 
281   // COFF format requires a COMDAT section to have a key symbol with the same
282   // name. The linker targeting COFF also requires that the COMDAT
283   // a section is associated to must precede the associating section. For this
284   // reason, we must choose the counter var's name as the name of the comdat.
285   StringRef ComdatPrefix = (Triple(M.getTargetTriple()).isOSBinFormatCOFF()
286                                 ? getInstrProfCountersVarPrefix()
287                                 : getInstrProfComdatPrefix());
288   return M.getOrInsertComdat(StringRef(getVarName(Inc, ComdatPrefix)));
289 }
290 
291 GlobalVariable *
292 InstrProfiling::getOrCreateRegionCounters(InstrProfIncrementInst *Inc) {
293   GlobalVariable *NamePtr = Inc->getName();
294   auto It = ProfileDataMap.find(NamePtr);
295   PerFunctionProfileData PD;
296   if (It != ProfileDataMap.end()) {
297     if (It->second.RegionCounters)
298       return It->second.RegionCounters;
299     PD = It->second;
300   }
301 
302   // Move the name variable to the right section. Place them in a COMDAT group
303   // if the associated function is a COMDAT. This will make sure that
304   // only one copy of counters of the COMDAT function will be emitted after
305   // linking.
306   Function *Fn = Inc->getParent()->getParent();
307   Comdat *ProfileVarsComdat = nullptr;
308   ProfileVarsComdat = getOrCreateProfileComdat(*M, *Fn, Inc);
309 
310   uint64_t NumCounters = Inc->getNumCounters()->getZExtValue();
311   LLVMContext &Ctx = M->getContext();
312   ArrayType *CounterTy = ArrayType::get(Type::getInt64Ty(Ctx), NumCounters);
313 
314   // Create the counters variable.
315   auto *CounterPtr =
316       new GlobalVariable(*M, CounterTy, false, NamePtr->getLinkage(),
317                          Constant::getNullValue(CounterTy),
318                          getVarName(Inc, getInstrProfCountersVarPrefix()));
319   CounterPtr->setVisibility(NamePtr->getVisibility());
320   CounterPtr->setSection(getCountersSection());
321   CounterPtr->setAlignment(8);
322   CounterPtr->setComdat(ProfileVarsComdat);
323 
324   // Create data variable.
325   auto *Int8PtrTy = Type::getInt8PtrTy(Ctx);
326   auto *Int16Ty = Type::getInt16Ty(Ctx);
327   auto *Int16ArrayTy = ArrayType::get(Int16Ty, IPVK_Last+1);
328   Type *DataTypes[] = {
329     #define INSTR_PROF_DATA(Type, LLVMType, Name, Init) LLVMType,
330     #include "llvm/ProfileData/InstrProfData.inc"
331   };
332   auto *DataTy = StructType::get(Ctx, makeArrayRef(DataTypes));
333 
334   Constant *FunctionAddr = shouldRecordFunctionAddr(Fn) ?
335                            ConstantExpr::getBitCast(Fn, Int8PtrTy) :
336                            ConstantPointerNull::get(Int8PtrTy);
337 
338   Constant *Int16ArrayVals[IPVK_Last+1];
339   for (uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind)
340     Int16ArrayVals[Kind] = ConstantInt::get(Int16Ty, PD.NumValueSites[Kind]);
341 
342   Constant *DataVals[] = {
343     #define INSTR_PROF_DATA(Type, LLVMType, Name, Init) Init,
344     #include "llvm/ProfileData/InstrProfData.inc"
345   };
346   auto *Data = new GlobalVariable(*M, DataTy, false, NamePtr->getLinkage(),
347                                   ConstantStruct::get(DataTy, DataVals),
348                                   getVarName(Inc, getInstrProfDataVarPrefix()));
349   Data->setVisibility(NamePtr->getVisibility());
350   Data->setSection(getDataSection());
351   Data->setAlignment(INSTR_PROF_DATA_ALIGNMENT);
352   Data->setComdat(ProfileVarsComdat);
353 
354   PD.RegionCounters = CounterPtr;
355   PD.DataVar = Data;
356   ProfileDataMap[NamePtr] = PD;
357 
358   // Mark the data variable as used so that it isn't stripped out.
359   UsedVars.push_back(Data);
360   // Now that the linkage set by the FE has been passed to the data and counter
361   // variables, reset Name variable's linkage and visibility to private so that
362   // it can be removed later by the compiler.
363   NamePtr->setLinkage(GlobalValue::PrivateLinkage);
364   // Collect the referenced names to be used by emitNameData.
365   ReferencedNames.push_back(NamePtr);
366 
367   return CounterPtr;
368 }
369 
370 void InstrProfiling::emitNameData() {
371   std::string UncompressedData;
372 
373   if (ReferencedNames.empty())
374     return;
375 
376   std::string CompressedNameStr;
377   if (auto EC = collectPGOFuncNameStrings(ReferencedNames, CompressedNameStr,
378                                           DoNameCompression)) {
379     llvm::report_fatal_error(EC.message(), false);
380   }
381 
382   auto &Ctx = M->getContext();
383   auto *NamesVal = llvm::ConstantDataArray::getString(
384       Ctx, StringRef(CompressedNameStr), false);
385   NamesVar = new llvm::GlobalVariable(*M, NamesVal->getType(), true,
386                                       llvm::GlobalValue::PrivateLinkage,
387                                       NamesVal, getInstrProfNamesVarName());
388   NamesSize = CompressedNameStr.size();
389   NamesVar->setSection(getNameSection());
390   UsedVars.push_back(NamesVar);
391 }
392 
393 void InstrProfiling::emitRegistration() {
394   // Don't do this for Darwin.  compiler-rt uses linker magic.
395   if (Triple(M->getTargetTriple()).isOSDarwin())
396     return;
397 
398   // Use linker script magic to get data/cnts/name start/end.
399   if (Triple(M->getTargetTriple()).isOSLinux() ||
400       Triple(M->getTargetTriple()).isOSFreeBSD() ||
401       Triple(M->getTargetTriple()).isPS4CPU())
402     return;
403 
404   // Construct the function.
405   auto *VoidTy = Type::getVoidTy(M->getContext());
406   auto *VoidPtrTy = Type::getInt8PtrTy(M->getContext());
407   auto *Int64Ty = Type::getInt64Ty(M->getContext());
408   auto *RegisterFTy = FunctionType::get(VoidTy, false);
409   auto *RegisterF = Function::Create(RegisterFTy, GlobalValue::InternalLinkage,
410                                      getInstrProfRegFuncsName(), M);
411   RegisterF->setUnnamedAddr(true);
412   if (Options.NoRedZone) RegisterF->addFnAttr(Attribute::NoRedZone);
413 
414   auto *RuntimeRegisterTy = FunctionType::get(VoidTy, VoidPtrTy, false);
415   auto *RuntimeRegisterF =
416       Function::Create(RuntimeRegisterTy, GlobalVariable::ExternalLinkage,
417                        getInstrProfRegFuncName(), M);
418 
419   IRBuilder<> IRB(BasicBlock::Create(M->getContext(), "", RegisterF));
420   for (Value *Data : UsedVars)
421     if (Data != NamesVar)
422       IRB.CreateCall(RuntimeRegisterF, IRB.CreateBitCast(Data, VoidPtrTy));
423 
424   if (NamesVar) {
425     Type *ParamTypes[] = {VoidPtrTy, Int64Ty};
426     auto *NamesRegisterTy =
427         FunctionType::get(VoidTy, makeArrayRef(ParamTypes), false);
428     auto *NamesRegisterF =
429         Function::Create(NamesRegisterTy, GlobalVariable::ExternalLinkage,
430                          getInstrProfNamesRegFuncName(), M);
431     IRB.CreateCall(NamesRegisterF, {IRB.CreateBitCast(NamesVar, VoidPtrTy),
432                                     IRB.getInt64(NamesSize)});
433   }
434 
435   IRB.CreateRetVoid();
436 }
437 
438 void InstrProfiling::emitRuntimeHook() {
439 
440   // We expect the linker to be invoked with -u<hook_var> flag for linux,
441   // for which case there is no need to emit the user function.
442   if (Triple(M->getTargetTriple()).isOSLinux())
443     return;
444 
445   // If the module's provided its own runtime, we don't need to do anything.
446   if (M->getGlobalVariable(getInstrProfRuntimeHookVarName())) return;
447 
448   // Declare an external variable that will pull in the runtime initialization.
449   auto *Int32Ty = Type::getInt32Ty(M->getContext());
450   auto *Var =
451       new GlobalVariable(*M, Int32Ty, false, GlobalValue::ExternalLinkage,
452                          nullptr, getInstrProfRuntimeHookVarName());
453 
454   // Make a function that uses it.
455   auto *User = Function::Create(FunctionType::get(Int32Ty, false),
456                                 GlobalValue::LinkOnceODRLinkage,
457                                 getInstrProfRuntimeHookVarUseFuncName(), M);
458   User->addFnAttr(Attribute::NoInline);
459   if (Options.NoRedZone) User->addFnAttr(Attribute::NoRedZone);
460   User->setVisibility(GlobalValue::HiddenVisibility);
461 
462   IRBuilder<> IRB(BasicBlock::Create(M->getContext(), "", User));
463   auto *Load = IRB.CreateLoad(Var);
464   IRB.CreateRet(Load);
465 
466   // Mark the user variable as used so that it isn't stripped out.
467   UsedVars.push_back(User);
468 }
469 
470 void InstrProfiling::emitUses() {
471   if (UsedVars.empty())
472     return;
473 
474   GlobalVariable *LLVMUsed = M->getGlobalVariable("llvm.used");
475   std::vector<Constant *> MergedVars;
476   if (LLVMUsed) {
477     // Collect the existing members of llvm.used.
478     ConstantArray *Inits = cast<ConstantArray>(LLVMUsed->getInitializer());
479     for (unsigned I = 0, E = Inits->getNumOperands(); I != E; ++I)
480       MergedVars.push_back(Inits->getOperand(I));
481     LLVMUsed->eraseFromParent();
482   }
483 
484   Type *i8PTy = Type::getInt8PtrTy(M->getContext());
485   // Add uses for our data.
486   for (auto *Value : UsedVars)
487     MergedVars.push_back(
488         ConstantExpr::getBitCast(cast<Constant>(Value), i8PTy));
489 
490   // Recreate llvm.used.
491   ArrayType *ATy = ArrayType::get(i8PTy, MergedVars.size());
492   LLVMUsed =
493       new GlobalVariable(*M, ATy, false, GlobalValue::AppendingLinkage,
494                          ConstantArray::get(ATy, MergedVars), "llvm.used");
495   LLVMUsed->setSection("llvm.metadata");
496 }
497 
498 void InstrProfiling::emitInitialization() {
499   std::string InstrProfileOutput = Options.InstrProfileOutput;
500 
501   Constant *RegisterF = M->getFunction(getInstrProfRegFuncsName());
502   if (!RegisterF && InstrProfileOutput.empty()) return;
503 
504   // Create the initialization function.
505   auto *VoidTy = Type::getVoidTy(M->getContext());
506   auto *F = Function::Create(FunctionType::get(VoidTy, false),
507                              GlobalValue::InternalLinkage,
508                              getInstrProfInitFuncName(), M);
509   F->setUnnamedAddr(true);
510   F->addFnAttr(Attribute::NoInline);
511   if (Options.NoRedZone) F->addFnAttr(Attribute::NoRedZone);
512 
513   // Add the basic block and the necessary calls.
514   IRBuilder<> IRB(BasicBlock::Create(M->getContext(), "", F));
515   if (RegisterF)
516     IRB.CreateCall(RegisterF, {});
517   if (!InstrProfileOutput.empty()) {
518     auto *Int8PtrTy = Type::getInt8PtrTy(M->getContext());
519     auto *SetNameTy = FunctionType::get(VoidTy, Int8PtrTy, false);
520     auto *SetNameF = Function::Create(SetNameTy, GlobalValue::ExternalLinkage,
521                                       getInstrProfFileOverriderFuncName(), M);
522 
523     // Create variable for profile name.
524     Constant *ProfileNameConst =
525         ConstantDataArray::getString(M->getContext(), InstrProfileOutput, true);
526     GlobalVariable *ProfileName =
527         new GlobalVariable(*M, ProfileNameConst->getType(), true,
528                            GlobalValue::PrivateLinkage, ProfileNameConst);
529 
530     IRB.CreateCall(SetNameF, IRB.CreatePointerCast(ProfileName, Int8PtrTy));
531   }
532   IRB.CreateRetVoid();
533 
534   appendToGlobalCtors(*M, F, 0);
535 }
536