1 //===-- InstrProfiling.cpp - Frontend instrumentation based profiling -----===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This pass lowers instrprof_* intrinsics emitted by a frontend for profiling. 11 // It also builds the data structures and initialization code needed for 12 // updating execution counts and emitting the profile at runtime. 13 // 14 //===----------------------------------------------------------------------===// 15 16 #include "llvm/ADT/Triple.h" 17 #include "llvm/IR/IRBuilder.h" 18 #include "llvm/IR/IntrinsicInst.h" 19 #include "llvm/IR/Module.h" 20 #include "llvm/ProfileData/InstrProf.h" 21 #include "llvm/Transforms/InstrProfiling.h" 22 #include "llvm/Transforms/Utils/ModuleUtils.h" 23 24 using namespace llvm; 25 26 #define DEBUG_TYPE "instrprof" 27 28 namespace { 29 30 cl::opt<bool> DoNameCompression("enable-name-compression", 31 cl::desc("Enable name string compression"), 32 cl::init(true)); 33 34 class InstrProfilingLegacyPass : public ModulePass { 35 InstrProfiling InstrProf; 36 37 public: 38 static char ID; 39 InstrProfilingLegacyPass() : ModulePass(ID), InstrProf() {} 40 InstrProfilingLegacyPass(const InstrProfOptions &Options) 41 : ModulePass(ID), InstrProf(Options) {} 42 const char *getPassName() const override { 43 return "Frontend instrumentation-based coverage lowering"; 44 } 45 46 bool runOnModule(Module &M) override { return InstrProf.run(M); } 47 48 void getAnalysisUsage(AnalysisUsage &AU) const override { 49 AU.setPreservesCFG(); 50 } 51 }; 52 53 } // anonymous namespace 54 55 PreservedAnalyses InstrProfiling::run(Module &M, AnalysisManager<Module> &AM) { 56 if (!run(M)) 57 return PreservedAnalyses::all(); 58 59 return PreservedAnalyses::none(); 60 } 61 62 char InstrProfilingLegacyPass::ID = 0; 63 INITIALIZE_PASS(InstrProfilingLegacyPass, "instrprof", 64 "Frontend instrumentation-based coverage lowering.", false, 65 false) 66 67 ModulePass *llvm::createInstrProfilingLegacyPass(const InstrProfOptions &Options) { 68 return new InstrProfilingLegacyPass(Options); 69 } 70 71 bool InstrProfiling::isMachO() const { 72 return Triple(M->getTargetTriple()).isOSBinFormatMachO(); 73 } 74 75 /// Get the section name for the counter variables. 76 StringRef InstrProfiling::getCountersSection() const { 77 return getInstrProfCountersSectionName(isMachO()); 78 } 79 80 /// Get the section name for the name variables. 81 StringRef InstrProfiling::getNameSection() const { 82 return getInstrProfNameSectionName(isMachO()); 83 } 84 85 /// Get the section name for the profile data variables. 86 StringRef InstrProfiling::getDataSection() const { 87 return getInstrProfDataSectionName(isMachO()); 88 } 89 90 /// Get the section name for the coverage mapping data. 91 StringRef InstrProfiling::getCoverageSection() const { 92 return getInstrProfCoverageSectionName(isMachO()); 93 } 94 95 bool InstrProfiling::run(Module &M) { 96 bool MadeChange = false; 97 98 this->M = &M; 99 NamesVar = nullptr; 100 NamesSize = 0; 101 ProfileDataMap.clear(); 102 UsedVars.clear(); 103 104 // We did not know how many value sites there would be inside 105 // the instrumented function. This is counting the number of instrumented 106 // target value sites to enter it as field in the profile data variable. 107 for (Function &F : M) { 108 InstrProfIncrementInst *FirstProfIncInst = nullptr; 109 for (BasicBlock &BB : F) 110 for (auto I = BB.begin(), E = BB.end(); I != E; I++) 111 if (auto *Ind = dyn_cast<InstrProfValueProfileInst>(I)) 112 computeNumValueSiteCounts(Ind); 113 else if (FirstProfIncInst == nullptr) 114 FirstProfIncInst = dyn_cast<InstrProfIncrementInst>(I); 115 116 // Value profiling intrinsic lowering requires per-function profile data 117 // variable to be created first. 118 if (FirstProfIncInst != nullptr) 119 static_cast<void>(getOrCreateRegionCounters(FirstProfIncInst)); 120 } 121 122 for (Function &F : M) 123 for (BasicBlock &BB : F) 124 for (auto I = BB.begin(), E = BB.end(); I != E;) { 125 auto Instr = I++; 126 if (auto *Inc = dyn_cast<InstrProfIncrementInst>(Instr)) { 127 lowerIncrement(Inc); 128 MadeChange = true; 129 } else if (auto *Ind = dyn_cast<InstrProfValueProfileInst>(Instr)) { 130 lowerValueProfileInst(Ind); 131 MadeChange = true; 132 } 133 } 134 135 if (GlobalVariable *CoverageNamesVar = 136 M.getNamedGlobal(getCoverageUnusedNamesVarName())) { 137 lowerCoverageData(CoverageNamesVar); 138 MadeChange = true; 139 } 140 141 if (!MadeChange) 142 return false; 143 144 emitNameData(); 145 emitRegistration(); 146 emitRuntimeHook(); 147 emitUses(); 148 emitInitialization(); 149 return true; 150 } 151 152 static Constant *getOrInsertValueProfilingCall(Module &M) { 153 LLVMContext &Ctx = M.getContext(); 154 auto *ReturnTy = Type::getVoidTy(M.getContext()); 155 Type *ParamTypes[] = { 156 #define VALUE_PROF_FUNC_PARAM(ParamType, ParamName, ParamLLVMType) ParamLLVMType 157 #include "llvm/ProfileData/InstrProfData.inc" 158 }; 159 auto *ValueProfilingCallTy = 160 FunctionType::get(ReturnTy, makeArrayRef(ParamTypes), false); 161 return M.getOrInsertFunction(getInstrProfValueProfFuncName(), 162 ValueProfilingCallTy); 163 } 164 165 void InstrProfiling::computeNumValueSiteCounts(InstrProfValueProfileInst *Ind) { 166 167 GlobalVariable *Name = Ind->getName(); 168 uint64_t ValueKind = Ind->getValueKind()->getZExtValue(); 169 uint64_t Index = Ind->getIndex()->getZExtValue(); 170 auto It = ProfileDataMap.find(Name); 171 if (It == ProfileDataMap.end()) { 172 PerFunctionProfileData PD; 173 PD.NumValueSites[ValueKind] = Index + 1; 174 ProfileDataMap[Name] = PD; 175 } else if (It->second.NumValueSites[ValueKind] <= Index) 176 It->second.NumValueSites[ValueKind] = Index + 1; 177 } 178 179 void InstrProfiling::lowerValueProfileInst(InstrProfValueProfileInst *Ind) { 180 181 GlobalVariable *Name = Ind->getName(); 182 auto It = ProfileDataMap.find(Name); 183 assert(It != ProfileDataMap.end() && It->second.DataVar && 184 "value profiling detected in function with no counter incerement"); 185 186 GlobalVariable *DataVar = It->second.DataVar; 187 uint64_t ValueKind = Ind->getValueKind()->getZExtValue(); 188 uint64_t Index = Ind->getIndex()->getZExtValue(); 189 for (uint32_t Kind = IPVK_First; Kind < ValueKind; ++Kind) 190 Index += It->second.NumValueSites[Kind]; 191 192 IRBuilder<> Builder(Ind); 193 Value* Args[3] = {Ind->getTargetValue(), 194 Builder.CreateBitCast(DataVar, Builder.getInt8PtrTy()), 195 Builder.getInt32(Index)}; 196 Ind->replaceAllUsesWith( 197 Builder.CreateCall(getOrInsertValueProfilingCall(*M), Args)); 198 Ind->eraseFromParent(); 199 } 200 201 void InstrProfiling::lowerIncrement(InstrProfIncrementInst *Inc) { 202 GlobalVariable *Counters = getOrCreateRegionCounters(Inc); 203 204 IRBuilder<> Builder(Inc); 205 uint64_t Index = Inc->getIndex()->getZExtValue(); 206 Value *Addr = Builder.CreateConstInBoundsGEP2_64(Counters, 0, Index); 207 Value *Count = Builder.CreateLoad(Addr, "pgocount"); 208 Count = Builder.CreateAdd(Count, Builder.getInt64(1)); 209 Inc->replaceAllUsesWith(Builder.CreateStore(Count, Addr)); 210 Inc->eraseFromParent(); 211 } 212 213 void InstrProfiling::lowerCoverageData(GlobalVariable *CoverageNamesVar) { 214 215 ConstantArray *Names = 216 cast<ConstantArray>(CoverageNamesVar->getInitializer()); 217 for (unsigned I = 0, E = Names->getNumOperands(); I < E; ++I) { 218 Constant *NC = Names->getOperand(I); 219 Value *V = NC->stripPointerCasts(); 220 assert(isa<GlobalVariable>(V) && "Missing reference to function name"); 221 GlobalVariable *Name = cast<GlobalVariable>(V); 222 223 Name->setLinkage(GlobalValue::PrivateLinkage); 224 ReferencedNames.push_back(Name); 225 } 226 } 227 228 /// Get the name of a profiling variable for a particular function. 229 static std::string getVarName(InstrProfIncrementInst *Inc, StringRef Prefix) { 230 StringRef NamePrefix = getInstrProfNameVarPrefix(); 231 StringRef Name = Inc->getName()->getName().substr(NamePrefix.size()); 232 return (Prefix + Name).str(); 233 } 234 235 static inline bool shouldRecordFunctionAddr(Function *F) { 236 // Check the linkage 237 if (!F->hasLinkOnceLinkage() && !F->hasLocalLinkage() && 238 !F->hasAvailableExternallyLinkage()) 239 return true; 240 // Prohibit function address recording if the function is both internal and 241 // COMDAT. This avoids the profile data variable referencing internal symbols 242 // in COMDAT. 243 if (F->hasLocalLinkage() && F->hasComdat()) 244 return false; 245 // Check uses of this function for other than direct calls or invokes to it. 246 return F->hasAddressTaken(); 247 } 248 249 static inline bool needsComdatForCounter(Function &F, Module &M) { 250 251 if (F.hasComdat()) 252 return true; 253 254 Triple TT(M.getTargetTriple()); 255 if (!TT.isOSBinFormatELF()) 256 return false; 257 258 // See createPGOFuncNameVar for more details. To avoid link errors, profile 259 // counters for function with available_externally linkage needs to be changed 260 // to linkonce linkage. On ELF based systems, this leads to weak symbols to be 261 // created. Without using comdat, duplicate entries won't be removed by the 262 // linker leading to increased data segement size and raw profile size. Even 263 // worse, since the referenced counter from profile per-function data object 264 // will be resolved to the common strong definition, the profile counts for 265 // available_externally functions will end up being duplicated in raw profile 266 // data. This can result in distorted profile as the counts of those dups 267 // will be accumulated by the profile merger. 268 GlobalValue::LinkageTypes Linkage = F.getLinkage(); 269 if (Linkage != GlobalValue::ExternalWeakLinkage && 270 Linkage != GlobalValue::AvailableExternallyLinkage) 271 return false; 272 273 return true; 274 } 275 276 static inline Comdat *getOrCreateProfileComdat(Module &M, Function &F, 277 InstrProfIncrementInst *Inc) { 278 if (!needsComdatForCounter(F, M)) 279 return nullptr; 280 281 // COFF format requires a COMDAT section to have a key symbol with the same 282 // name. The linker targeting COFF also requires that the COMDAT 283 // a section is associated to must precede the associating section. For this 284 // reason, we must choose the counter var's name as the name of the comdat. 285 StringRef ComdatPrefix = (Triple(M.getTargetTriple()).isOSBinFormatCOFF() 286 ? getInstrProfCountersVarPrefix() 287 : getInstrProfComdatPrefix()); 288 return M.getOrInsertComdat(StringRef(getVarName(Inc, ComdatPrefix))); 289 } 290 291 GlobalVariable * 292 InstrProfiling::getOrCreateRegionCounters(InstrProfIncrementInst *Inc) { 293 GlobalVariable *NamePtr = Inc->getName(); 294 auto It = ProfileDataMap.find(NamePtr); 295 PerFunctionProfileData PD; 296 if (It != ProfileDataMap.end()) { 297 if (It->second.RegionCounters) 298 return It->second.RegionCounters; 299 PD = It->second; 300 } 301 302 // Move the name variable to the right section. Place them in a COMDAT group 303 // if the associated function is a COMDAT. This will make sure that 304 // only one copy of counters of the COMDAT function will be emitted after 305 // linking. 306 Function *Fn = Inc->getParent()->getParent(); 307 Comdat *ProfileVarsComdat = nullptr; 308 ProfileVarsComdat = getOrCreateProfileComdat(*M, *Fn, Inc); 309 310 uint64_t NumCounters = Inc->getNumCounters()->getZExtValue(); 311 LLVMContext &Ctx = M->getContext(); 312 ArrayType *CounterTy = ArrayType::get(Type::getInt64Ty(Ctx), NumCounters); 313 314 // Create the counters variable. 315 auto *CounterPtr = 316 new GlobalVariable(*M, CounterTy, false, NamePtr->getLinkage(), 317 Constant::getNullValue(CounterTy), 318 getVarName(Inc, getInstrProfCountersVarPrefix())); 319 CounterPtr->setVisibility(NamePtr->getVisibility()); 320 CounterPtr->setSection(getCountersSection()); 321 CounterPtr->setAlignment(8); 322 CounterPtr->setComdat(ProfileVarsComdat); 323 324 // Create data variable. 325 auto *Int8PtrTy = Type::getInt8PtrTy(Ctx); 326 auto *Int16Ty = Type::getInt16Ty(Ctx); 327 auto *Int16ArrayTy = ArrayType::get(Int16Ty, IPVK_Last+1); 328 Type *DataTypes[] = { 329 #define INSTR_PROF_DATA(Type, LLVMType, Name, Init) LLVMType, 330 #include "llvm/ProfileData/InstrProfData.inc" 331 }; 332 auto *DataTy = StructType::get(Ctx, makeArrayRef(DataTypes)); 333 334 Constant *FunctionAddr = shouldRecordFunctionAddr(Fn) ? 335 ConstantExpr::getBitCast(Fn, Int8PtrTy) : 336 ConstantPointerNull::get(Int8PtrTy); 337 338 Constant *Int16ArrayVals[IPVK_Last+1]; 339 for (uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind) 340 Int16ArrayVals[Kind] = ConstantInt::get(Int16Ty, PD.NumValueSites[Kind]); 341 342 Constant *DataVals[] = { 343 #define INSTR_PROF_DATA(Type, LLVMType, Name, Init) Init, 344 #include "llvm/ProfileData/InstrProfData.inc" 345 }; 346 auto *Data = new GlobalVariable(*M, DataTy, false, NamePtr->getLinkage(), 347 ConstantStruct::get(DataTy, DataVals), 348 getVarName(Inc, getInstrProfDataVarPrefix())); 349 Data->setVisibility(NamePtr->getVisibility()); 350 Data->setSection(getDataSection()); 351 Data->setAlignment(INSTR_PROF_DATA_ALIGNMENT); 352 Data->setComdat(ProfileVarsComdat); 353 354 PD.RegionCounters = CounterPtr; 355 PD.DataVar = Data; 356 ProfileDataMap[NamePtr] = PD; 357 358 // Mark the data variable as used so that it isn't stripped out. 359 UsedVars.push_back(Data); 360 // Now that the linkage set by the FE has been passed to the data and counter 361 // variables, reset Name variable's linkage and visibility to private so that 362 // it can be removed later by the compiler. 363 NamePtr->setLinkage(GlobalValue::PrivateLinkage); 364 // Collect the referenced names to be used by emitNameData. 365 ReferencedNames.push_back(NamePtr); 366 367 return CounterPtr; 368 } 369 370 void InstrProfiling::emitNameData() { 371 std::string UncompressedData; 372 373 if (ReferencedNames.empty()) 374 return; 375 376 std::string CompressedNameStr; 377 collectPGOFuncNameStrings(ReferencedNames, CompressedNameStr, 378 DoNameCompression); 379 380 auto &Ctx = M->getContext(); 381 auto *NamesVal = llvm::ConstantDataArray::getString( 382 Ctx, StringRef(CompressedNameStr), false); 383 NamesVar = new llvm::GlobalVariable(*M, NamesVal->getType(), true, 384 llvm::GlobalValue::PrivateLinkage, 385 NamesVal, getInstrProfNamesVarName()); 386 NamesSize = CompressedNameStr.size(); 387 NamesVar->setSection(getNameSection()); 388 UsedVars.push_back(NamesVar); 389 } 390 391 void InstrProfiling::emitRegistration() { 392 // Don't do this for Darwin. compiler-rt uses linker magic. 393 if (Triple(M->getTargetTriple()).isOSDarwin()) 394 return; 395 396 // Use linker script magic to get data/cnts/name start/end. 397 if (Triple(M->getTargetTriple()).isOSLinux() || 398 Triple(M->getTargetTriple()).isOSFreeBSD() || 399 Triple(M->getTargetTriple()).isPS4CPU()) 400 return; 401 402 // Construct the function. 403 auto *VoidTy = Type::getVoidTy(M->getContext()); 404 auto *VoidPtrTy = Type::getInt8PtrTy(M->getContext()); 405 auto *Int64Ty = Type::getInt64Ty(M->getContext()); 406 auto *RegisterFTy = FunctionType::get(VoidTy, false); 407 auto *RegisterF = Function::Create(RegisterFTy, GlobalValue::InternalLinkage, 408 getInstrProfRegFuncsName(), M); 409 RegisterF->setUnnamedAddr(true); 410 if (Options.NoRedZone) RegisterF->addFnAttr(Attribute::NoRedZone); 411 412 auto *RuntimeRegisterTy = FunctionType::get(VoidTy, VoidPtrTy, false); 413 auto *RuntimeRegisterF = 414 Function::Create(RuntimeRegisterTy, GlobalVariable::ExternalLinkage, 415 getInstrProfRegFuncName(), M); 416 417 IRBuilder<> IRB(BasicBlock::Create(M->getContext(), "", RegisterF)); 418 for (Value *Data : UsedVars) 419 if (Data != NamesVar) 420 IRB.CreateCall(RuntimeRegisterF, IRB.CreateBitCast(Data, VoidPtrTy)); 421 422 if (NamesVar) { 423 Type *ParamTypes[] = {VoidPtrTy, Int64Ty}; 424 auto *NamesRegisterTy = 425 FunctionType::get(VoidTy, makeArrayRef(ParamTypes), false); 426 auto *NamesRegisterF = 427 Function::Create(NamesRegisterTy, GlobalVariable::ExternalLinkage, 428 getInstrProfNamesRegFuncName(), M); 429 IRB.CreateCall(NamesRegisterF, {IRB.CreateBitCast(NamesVar, VoidPtrTy), 430 IRB.getInt64(NamesSize)}); 431 } 432 433 IRB.CreateRetVoid(); 434 } 435 436 void InstrProfiling::emitRuntimeHook() { 437 438 // We expect the linker to be invoked with -u<hook_var> flag for linux, 439 // for which case there is no need to emit the user function. 440 if (Triple(M->getTargetTriple()).isOSLinux()) 441 return; 442 443 // If the module's provided its own runtime, we don't need to do anything. 444 if (M->getGlobalVariable(getInstrProfRuntimeHookVarName())) return; 445 446 // Declare an external variable that will pull in the runtime initialization. 447 auto *Int32Ty = Type::getInt32Ty(M->getContext()); 448 auto *Var = 449 new GlobalVariable(*M, Int32Ty, false, GlobalValue::ExternalLinkage, 450 nullptr, getInstrProfRuntimeHookVarName()); 451 452 // Make a function that uses it. 453 auto *User = Function::Create(FunctionType::get(Int32Ty, false), 454 GlobalValue::LinkOnceODRLinkage, 455 getInstrProfRuntimeHookVarUseFuncName(), M); 456 User->addFnAttr(Attribute::NoInline); 457 if (Options.NoRedZone) User->addFnAttr(Attribute::NoRedZone); 458 User->setVisibility(GlobalValue::HiddenVisibility); 459 460 IRBuilder<> IRB(BasicBlock::Create(M->getContext(), "", User)); 461 auto *Load = IRB.CreateLoad(Var); 462 IRB.CreateRet(Load); 463 464 // Mark the user variable as used so that it isn't stripped out. 465 UsedVars.push_back(User); 466 } 467 468 void InstrProfiling::emitUses() { 469 if (UsedVars.empty()) 470 return; 471 472 GlobalVariable *LLVMUsed = M->getGlobalVariable("llvm.used"); 473 std::vector<Constant *> MergedVars; 474 if (LLVMUsed) { 475 // Collect the existing members of llvm.used. 476 ConstantArray *Inits = cast<ConstantArray>(LLVMUsed->getInitializer()); 477 for (unsigned I = 0, E = Inits->getNumOperands(); I != E; ++I) 478 MergedVars.push_back(Inits->getOperand(I)); 479 LLVMUsed->eraseFromParent(); 480 } 481 482 Type *i8PTy = Type::getInt8PtrTy(M->getContext()); 483 // Add uses for our data. 484 for (auto *Value : UsedVars) 485 MergedVars.push_back( 486 ConstantExpr::getBitCast(cast<Constant>(Value), i8PTy)); 487 488 // Recreate llvm.used. 489 ArrayType *ATy = ArrayType::get(i8PTy, MergedVars.size()); 490 LLVMUsed = 491 new GlobalVariable(*M, ATy, false, GlobalValue::AppendingLinkage, 492 ConstantArray::get(ATy, MergedVars), "llvm.used"); 493 LLVMUsed->setSection("llvm.metadata"); 494 } 495 496 void InstrProfiling::emitInitialization() { 497 std::string InstrProfileOutput = Options.InstrProfileOutput; 498 499 Constant *RegisterF = M->getFunction(getInstrProfRegFuncsName()); 500 if (!RegisterF && InstrProfileOutput.empty()) return; 501 502 // Create the initialization function. 503 auto *VoidTy = Type::getVoidTy(M->getContext()); 504 auto *F = Function::Create(FunctionType::get(VoidTy, false), 505 GlobalValue::InternalLinkage, 506 getInstrProfInitFuncName(), M); 507 F->setUnnamedAddr(true); 508 F->addFnAttr(Attribute::NoInline); 509 if (Options.NoRedZone) F->addFnAttr(Attribute::NoRedZone); 510 511 // Add the basic block and the necessary calls. 512 IRBuilder<> IRB(BasicBlock::Create(M->getContext(), "", F)); 513 if (RegisterF) 514 IRB.CreateCall(RegisterF, {}); 515 if (!InstrProfileOutput.empty()) { 516 auto *Int8PtrTy = Type::getInt8PtrTy(M->getContext()); 517 auto *SetNameTy = FunctionType::get(VoidTy, Int8PtrTy, false); 518 auto *SetNameF = Function::Create(SetNameTy, GlobalValue::ExternalLinkage, 519 getInstrProfFileOverriderFuncName(), M); 520 521 // Create variable for profile name. 522 Constant *ProfileNameConst = 523 ConstantDataArray::getString(M->getContext(), InstrProfileOutput, true); 524 GlobalVariable *ProfileName = 525 new GlobalVariable(*M, ProfileNameConst->getType(), true, 526 GlobalValue::PrivateLinkage, ProfileNameConst); 527 528 IRB.CreateCall(SetNameF, IRB.CreatePointerCast(ProfileName, Int8PtrTy)); 529 } 530 IRB.CreateRetVoid(); 531 532 appendToGlobalCtors(*M, F, 0); 533 } 534