1 //===-- InstrProfiling.cpp - Frontend instrumentation based profiling -----===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This pass lowers instrprof_* intrinsics emitted by a frontend for profiling. 11 // It also builds the data structures and initialization code needed for 12 // updating execution counts and emitting the profile at runtime. 13 // 14 //===----------------------------------------------------------------------===// 15 16 #include "llvm/ADT/Triple.h" 17 #include "llvm/IR/IRBuilder.h" 18 #include "llvm/IR/IntrinsicInst.h" 19 #include "llvm/IR/Module.h" 20 #include "llvm/ProfileData/InstrProf.h" 21 #include "llvm/Transforms/InstrProfiling.h" 22 #include "llvm/Transforms/Utils/ModuleUtils.h" 23 24 using namespace llvm; 25 26 #define DEBUG_TYPE "instrprof" 27 28 namespace { 29 30 cl::opt<bool> DoNameCompression("enable-name-compression", 31 cl::desc("Enable name string compression"), 32 cl::init(true)); 33 34 class InstrProfilingLegacyPass : public ModulePass { 35 InstrProfiling InstrProf; 36 37 public: 38 static char ID; 39 InstrProfilingLegacyPass() : ModulePass(ID), InstrProf() {} 40 InstrProfilingLegacyPass(const InstrProfOptions &Options) 41 : ModulePass(ID), InstrProf(Options) {} 42 const char *getPassName() const override { 43 return "Frontend instrumentation-based coverage lowering"; 44 } 45 46 bool runOnModule(Module &M) override { return InstrProf.run(M); } 47 48 void getAnalysisUsage(AnalysisUsage &AU) const override { 49 AU.setPreservesCFG(); 50 } 51 }; 52 53 } // anonymous namespace 54 55 PreservedAnalyses InstrProfiling::run(Module &M, AnalysisManager<Module> &AM) { 56 if (!run(M)) 57 return PreservedAnalyses::all(); 58 59 return PreservedAnalyses::none(); 60 } 61 62 char InstrProfilingLegacyPass::ID = 0; 63 INITIALIZE_PASS(InstrProfilingLegacyPass, "instrprof", 64 "Frontend instrumentation-based coverage lowering.", false, 65 false) 66 67 ModulePass *llvm::createInstrProfilingLegacyPass(const InstrProfOptions &Options) { 68 return new InstrProfilingLegacyPass(Options); 69 } 70 71 bool InstrProfiling::isMachO() const { 72 return Triple(M->getTargetTriple()).isOSBinFormatMachO(); 73 } 74 75 /// Get the section name for the counter variables. 76 StringRef InstrProfiling::getCountersSection() const { 77 return getInstrProfCountersSectionName(isMachO()); 78 } 79 80 /// Get the section name for the name variables. 81 StringRef InstrProfiling::getNameSection() const { 82 return getInstrProfNameSectionName(isMachO()); 83 } 84 85 /// Get the section name for the profile data variables. 86 StringRef InstrProfiling::getDataSection() const { 87 return getInstrProfDataSectionName(isMachO()); 88 } 89 90 /// Get the section name for the coverage mapping data. 91 StringRef InstrProfiling::getCoverageSection() const { 92 return getInstrProfCoverageSectionName(isMachO()); 93 } 94 95 bool InstrProfiling::run(Module &M) { 96 bool MadeChange = false; 97 98 this->M = &M; 99 NamesVar = nullptr; 100 NamesSize = 0; 101 ProfileDataMap.clear(); 102 UsedVars.clear(); 103 104 // We did not know how many value sites there would be inside 105 // the instrumented function. This is counting the number of instrumented 106 // target value sites to enter it as field in the profile data variable. 107 for (Function &F : M) { 108 InstrProfIncrementInst *FirstProfIncInst = nullptr; 109 for (BasicBlock &BB : F) 110 for (auto I = BB.begin(), E = BB.end(); I != E; I++) 111 if (auto *Ind = dyn_cast<InstrProfValueProfileInst>(I)) 112 computeNumValueSiteCounts(Ind); 113 else if (FirstProfIncInst == nullptr) 114 FirstProfIncInst = dyn_cast<InstrProfIncrementInst>(I); 115 116 // Value profiling intrinsic lowering requires per-function profile data 117 // variable to be created first. 118 if (FirstProfIncInst != nullptr) 119 static_cast<void>(getOrCreateRegionCounters(FirstProfIncInst)); 120 } 121 122 for (Function &F : M) 123 for (BasicBlock &BB : F) 124 for (auto I = BB.begin(), E = BB.end(); I != E;) { 125 auto Instr = I++; 126 if (auto *Inc = dyn_cast<InstrProfIncrementInst>(Instr)) { 127 lowerIncrement(Inc); 128 MadeChange = true; 129 } else if (auto *Ind = dyn_cast<InstrProfValueProfileInst>(Instr)) { 130 lowerValueProfileInst(Ind); 131 MadeChange = true; 132 } 133 } 134 135 if (GlobalVariable *CoverageNamesVar = 136 M.getNamedGlobal(getCoverageUnusedNamesVarName())) { 137 lowerCoverageData(CoverageNamesVar); 138 MadeChange = true; 139 } 140 141 if (!MadeChange) 142 return false; 143 144 emitNameData(); 145 emitRegistration(); 146 emitRuntimeHook(); 147 emitUses(); 148 emitInitialization(); 149 return true; 150 } 151 152 static Constant *getOrInsertValueProfilingCall(Module &M) { 153 LLVMContext &Ctx = M.getContext(); 154 auto *ReturnTy = Type::getVoidTy(M.getContext()); 155 Type *ParamTypes[] = { 156 #define VALUE_PROF_FUNC_PARAM(ParamType, ParamName, ParamLLVMType) ParamLLVMType 157 #include "llvm/ProfileData/InstrProfData.inc" 158 }; 159 auto *ValueProfilingCallTy = 160 FunctionType::get(ReturnTy, makeArrayRef(ParamTypes), false); 161 return M.getOrInsertFunction(getInstrProfValueProfFuncName(), 162 ValueProfilingCallTy); 163 } 164 165 void InstrProfiling::computeNumValueSiteCounts(InstrProfValueProfileInst *Ind) { 166 167 GlobalVariable *Name = Ind->getName(); 168 uint64_t ValueKind = Ind->getValueKind()->getZExtValue(); 169 uint64_t Index = Ind->getIndex()->getZExtValue(); 170 auto It = ProfileDataMap.find(Name); 171 if (It == ProfileDataMap.end()) { 172 PerFunctionProfileData PD; 173 PD.NumValueSites[ValueKind] = Index + 1; 174 ProfileDataMap[Name] = PD; 175 } else if (It->second.NumValueSites[ValueKind] <= Index) 176 It->second.NumValueSites[ValueKind] = Index + 1; 177 } 178 179 void InstrProfiling::lowerValueProfileInst(InstrProfValueProfileInst *Ind) { 180 181 GlobalVariable *Name = Ind->getName(); 182 auto It = ProfileDataMap.find(Name); 183 assert(It != ProfileDataMap.end() && It->second.DataVar && 184 "value profiling detected in function with no counter incerement"); 185 186 GlobalVariable *DataVar = It->second.DataVar; 187 uint64_t ValueKind = Ind->getValueKind()->getZExtValue(); 188 uint64_t Index = Ind->getIndex()->getZExtValue(); 189 for (uint32_t Kind = IPVK_First; Kind < ValueKind; ++Kind) 190 Index += It->second.NumValueSites[Kind]; 191 192 IRBuilder<> Builder(Ind); 193 Value* Args[3] = {Ind->getTargetValue(), 194 Builder.CreateBitCast(DataVar, Builder.getInt8PtrTy()), 195 Builder.getInt32(Index)}; 196 Ind->replaceAllUsesWith( 197 Builder.CreateCall(getOrInsertValueProfilingCall(*M), Args)); 198 Ind->eraseFromParent(); 199 } 200 201 void InstrProfiling::lowerIncrement(InstrProfIncrementInst *Inc) { 202 GlobalVariable *Counters = getOrCreateRegionCounters(Inc); 203 204 IRBuilder<> Builder(Inc); 205 uint64_t Index = Inc->getIndex()->getZExtValue(); 206 Value *Addr = Builder.CreateConstInBoundsGEP2_64(Counters, 0, Index); 207 Value *Count = Builder.CreateLoad(Addr, "pgocount"); 208 Count = Builder.CreateAdd(Count, Builder.getInt64(1)); 209 Inc->replaceAllUsesWith(Builder.CreateStore(Count, Addr)); 210 Inc->eraseFromParent(); 211 } 212 213 void InstrProfiling::lowerCoverageData(GlobalVariable *CoverageNamesVar) { 214 215 ConstantArray *Names = 216 cast<ConstantArray>(CoverageNamesVar->getInitializer()); 217 for (unsigned I = 0, E = Names->getNumOperands(); I < E; ++I) { 218 Constant *NC = Names->getOperand(I); 219 Value *V = NC->stripPointerCasts(); 220 assert(isa<GlobalVariable>(V) && "Missing reference to function name"); 221 GlobalVariable *Name = cast<GlobalVariable>(V); 222 223 Name->setLinkage(GlobalValue::PrivateLinkage); 224 ReferencedNames.push_back(Name); 225 } 226 } 227 228 /// Get the name of a profiling variable for a particular function. 229 static std::string getVarName(InstrProfIncrementInst *Inc, StringRef Prefix) { 230 StringRef NamePrefix = getInstrProfNameVarPrefix(); 231 StringRef Name = Inc->getName()->getName().substr(NamePrefix.size()); 232 return (Prefix + Name).str(); 233 } 234 235 static inline bool shouldRecordFunctionAddr(Function *F) { 236 // Check the linkage 237 if (!F->hasLinkOnceLinkage() && !F->hasLocalLinkage() && 238 !F->hasAvailableExternallyLinkage()) 239 return true; 240 // Prohibit function address recording if the function is both internal and 241 // COMDAT. This avoids the profile data variable referencing internal symbols 242 // in COMDAT. 243 if (F->hasLocalLinkage() && F->hasComdat()) 244 return false; 245 // Check uses of this function for other than direct calls or invokes to it. 246 return F->hasAddressTaken(); 247 } 248 249 static inline bool needsComdatForCounter(Function &F, Module &M) { 250 251 if (F.hasComdat()) 252 return true; 253 254 Triple TT(M.getTargetTriple()); 255 if (!TT.isOSBinFormatELF()) 256 return false; 257 258 // See createPGOFuncNameVar for more details. To avoid link errors, profile 259 // counters for function with available_externally linkage needs to be changed 260 // to linkonce linkage. On ELF based systems, this leads to weak symbols to be 261 // created. Without using comdat, duplicate entries won't be removed by the 262 // linker leading to increased data segement size and raw profile size. Even 263 // worse, since the referenced counter from profile per-function data object 264 // will be resolved to the common strong definition, the profile counts for 265 // available_externally functions will end up being duplicated in raw profile 266 // data. This can result in distorted profile as the counts of those dups 267 // will be accumulated by the profile merger. 268 GlobalValue::LinkageTypes Linkage = F.getLinkage(); 269 if (Linkage != GlobalValue::ExternalWeakLinkage && 270 Linkage != GlobalValue::AvailableExternallyLinkage) 271 return false; 272 273 return true; 274 } 275 276 static inline Comdat *getOrCreateProfileComdat(Module &M, Function &F, 277 InstrProfIncrementInst *Inc) { 278 if (!needsComdatForCounter(F, M)) 279 return nullptr; 280 281 // COFF format requires a COMDAT section to have a key symbol with the same 282 // name. The linker targeting COFF also requires that the COMDAT 283 // a section is associated to must precede the associating section. For this 284 // reason, we must choose the counter var's name as the name of the comdat. 285 StringRef ComdatPrefix = (Triple(M.getTargetTriple()).isOSBinFormatCOFF() 286 ? getInstrProfCountersVarPrefix() 287 : getInstrProfComdatPrefix()); 288 return M.getOrInsertComdat(StringRef(getVarName(Inc, ComdatPrefix))); 289 } 290 291 GlobalVariable * 292 InstrProfiling::getOrCreateRegionCounters(InstrProfIncrementInst *Inc) { 293 GlobalVariable *NamePtr = Inc->getName(); 294 auto It = ProfileDataMap.find(NamePtr); 295 PerFunctionProfileData PD; 296 if (It != ProfileDataMap.end()) { 297 if (It->second.RegionCounters) 298 return It->second.RegionCounters; 299 PD = It->second; 300 } 301 302 // Move the name variable to the right section. Place them in a COMDAT group 303 // if the associated function is a COMDAT. This will make sure that 304 // only one copy of counters of the COMDAT function will be emitted after 305 // linking. 306 Function *Fn = Inc->getParent()->getParent(); 307 Comdat *ProfileVarsComdat = nullptr; 308 ProfileVarsComdat = getOrCreateProfileComdat(*M, *Fn, Inc); 309 310 uint64_t NumCounters = Inc->getNumCounters()->getZExtValue(); 311 LLVMContext &Ctx = M->getContext(); 312 ArrayType *CounterTy = ArrayType::get(Type::getInt64Ty(Ctx), NumCounters); 313 314 // Create the counters variable. 315 auto *CounterPtr = 316 new GlobalVariable(*M, CounterTy, false, NamePtr->getLinkage(), 317 Constant::getNullValue(CounterTy), 318 getVarName(Inc, getInstrProfCountersVarPrefix())); 319 CounterPtr->setVisibility(NamePtr->getVisibility()); 320 CounterPtr->setSection(getCountersSection()); 321 CounterPtr->setAlignment(8); 322 CounterPtr->setComdat(ProfileVarsComdat); 323 324 // Create data variable. 325 auto *Int8PtrTy = Type::getInt8PtrTy(Ctx); 326 auto *Int16Ty = Type::getInt16Ty(Ctx); 327 auto *Int16ArrayTy = ArrayType::get(Int16Ty, IPVK_Last+1); 328 Type *DataTypes[] = { 329 #define INSTR_PROF_DATA(Type, LLVMType, Name, Init) LLVMType, 330 #include "llvm/ProfileData/InstrProfData.inc" 331 }; 332 auto *DataTy = StructType::get(Ctx, makeArrayRef(DataTypes)); 333 334 Constant *FunctionAddr = shouldRecordFunctionAddr(Fn) ? 335 ConstantExpr::getBitCast(Fn, Int8PtrTy) : 336 ConstantPointerNull::get(Int8PtrTy); 337 338 Constant *Int16ArrayVals[IPVK_Last+1]; 339 for (uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind) 340 Int16ArrayVals[Kind] = ConstantInt::get(Int16Ty, PD.NumValueSites[Kind]); 341 342 Constant *DataVals[] = { 343 #define INSTR_PROF_DATA(Type, LLVMType, Name, Init) Init, 344 #include "llvm/ProfileData/InstrProfData.inc" 345 }; 346 auto *Data = new GlobalVariable(*M, DataTy, false, NamePtr->getLinkage(), 347 ConstantStruct::get(DataTy, DataVals), 348 getVarName(Inc, getInstrProfDataVarPrefix())); 349 Data->setVisibility(NamePtr->getVisibility()); 350 Data->setSection(getDataSection()); 351 Data->setAlignment(INSTR_PROF_DATA_ALIGNMENT); 352 Data->setComdat(ProfileVarsComdat); 353 354 PD.RegionCounters = CounterPtr; 355 PD.DataVar = Data; 356 ProfileDataMap[NamePtr] = PD; 357 358 // Mark the data variable as used so that it isn't stripped out. 359 UsedVars.push_back(Data); 360 // Now that the linkage set by the FE has been passed to the data and counter 361 // variables, reset Name variable's linkage and visibility to private so that 362 // it can be removed later by the compiler. 363 NamePtr->setLinkage(GlobalValue::PrivateLinkage); 364 // Collect the referenced names to be used by emitNameData. 365 ReferencedNames.push_back(NamePtr); 366 367 return CounterPtr; 368 } 369 370 void InstrProfiling::emitNameData() { 371 std::string UncompressedData; 372 373 if (ReferencedNames.empty()) 374 return; 375 376 std::string CompressedNameStr; 377 if (auto EC = collectPGOFuncNameStrings(ReferencedNames, CompressedNameStr, 378 DoNameCompression)) { 379 llvm::report_fatal_error(EC.message(), false); 380 } 381 382 auto &Ctx = M->getContext(); 383 auto *NamesVal = llvm::ConstantDataArray::getString( 384 Ctx, StringRef(CompressedNameStr), false); 385 NamesVar = new llvm::GlobalVariable(*M, NamesVal->getType(), true, 386 llvm::GlobalValue::PrivateLinkage, 387 NamesVal, getInstrProfNamesVarName()); 388 NamesSize = CompressedNameStr.size(); 389 NamesVar->setSection(getNameSection()); 390 UsedVars.push_back(NamesVar); 391 } 392 393 void InstrProfiling::emitRegistration() { 394 // Don't do this for Darwin. compiler-rt uses linker magic. 395 if (Triple(M->getTargetTriple()).isOSDarwin()) 396 return; 397 398 // Use linker script magic to get data/cnts/name start/end. 399 if (Triple(M->getTargetTriple()).isOSLinux() || 400 Triple(M->getTargetTriple()).isOSFreeBSD() || 401 Triple(M->getTargetTriple()).isPS4CPU()) 402 return; 403 404 // Construct the function. 405 auto *VoidTy = Type::getVoidTy(M->getContext()); 406 auto *VoidPtrTy = Type::getInt8PtrTy(M->getContext()); 407 auto *Int64Ty = Type::getInt64Ty(M->getContext()); 408 auto *RegisterFTy = FunctionType::get(VoidTy, false); 409 auto *RegisterF = Function::Create(RegisterFTy, GlobalValue::InternalLinkage, 410 getInstrProfRegFuncsName(), M); 411 RegisterF->setUnnamedAddr(true); 412 if (Options.NoRedZone) RegisterF->addFnAttr(Attribute::NoRedZone); 413 414 auto *RuntimeRegisterTy = FunctionType::get(VoidTy, VoidPtrTy, false); 415 auto *RuntimeRegisterF = 416 Function::Create(RuntimeRegisterTy, GlobalVariable::ExternalLinkage, 417 getInstrProfRegFuncName(), M); 418 419 IRBuilder<> IRB(BasicBlock::Create(M->getContext(), "", RegisterF)); 420 for (Value *Data : UsedVars) 421 if (Data != NamesVar) 422 IRB.CreateCall(RuntimeRegisterF, IRB.CreateBitCast(Data, VoidPtrTy)); 423 424 if (NamesVar) { 425 Type *ParamTypes[] = {VoidPtrTy, Int64Ty}; 426 auto *NamesRegisterTy = 427 FunctionType::get(VoidTy, makeArrayRef(ParamTypes), false); 428 auto *NamesRegisterF = 429 Function::Create(NamesRegisterTy, GlobalVariable::ExternalLinkage, 430 getInstrProfNamesRegFuncName(), M); 431 IRB.CreateCall(NamesRegisterF, {IRB.CreateBitCast(NamesVar, VoidPtrTy), 432 IRB.getInt64(NamesSize)}); 433 } 434 435 IRB.CreateRetVoid(); 436 } 437 438 void InstrProfiling::emitRuntimeHook() { 439 440 // We expect the linker to be invoked with -u<hook_var> flag for linux, 441 // for which case there is no need to emit the user function. 442 if (Triple(M->getTargetTriple()).isOSLinux()) 443 return; 444 445 // If the module's provided its own runtime, we don't need to do anything. 446 if (M->getGlobalVariable(getInstrProfRuntimeHookVarName())) return; 447 448 // Declare an external variable that will pull in the runtime initialization. 449 auto *Int32Ty = Type::getInt32Ty(M->getContext()); 450 auto *Var = 451 new GlobalVariable(*M, Int32Ty, false, GlobalValue::ExternalLinkage, 452 nullptr, getInstrProfRuntimeHookVarName()); 453 454 // Make a function that uses it. 455 auto *User = Function::Create(FunctionType::get(Int32Ty, false), 456 GlobalValue::LinkOnceODRLinkage, 457 getInstrProfRuntimeHookVarUseFuncName(), M); 458 User->addFnAttr(Attribute::NoInline); 459 if (Options.NoRedZone) User->addFnAttr(Attribute::NoRedZone); 460 User->setVisibility(GlobalValue::HiddenVisibility); 461 462 IRBuilder<> IRB(BasicBlock::Create(M->getContext(), "", User)); 463 auto *Load = IRB.CreateLoad(Var); 464 IRB.CreateRet(Load); 465 466 // Mark the user variable as used so that it isn't stripped out. 467 UsedVars.push_back(User); 468 } 469 470 void InstrProfiling::emitUses() { 471 if (UsedVars.empty()) 472 return; 473 474 GlobalVariable *LLVMUsed = M->getGlobalVariable("llvm.used"); 475 std::vector<Constant *> MergedVars; 476 if (LLVMUsed) { 477 // Collect the existing members of llvm.used. 478 ConstantArray *Inits = cast<ConstantArray>(LLVMUsed->getInitializer()); 479 for (unsigned I = 0, E = Inits->getNumOperands(); I != E; ++I) 480 MergedVars.push_back(Inits->getOperand(I)); 481 LLVMUsed->eraseFromParent(); 482 } 483 484 Type *i8PTy = Type::getInt8PtrTy(M->getContext()); 485 // Add uses for our data. 486 for (auto *Value : UsedVars) 487 MergedVars.push_back( 488 ConstantExpr::getBitCast(cast<Constant>(Value), i8PTy)); 489 490 // Recreate llvm.used. 491 ArrayType *ATy = ArrayType::get(i8PTy, MergedVars.size()); 492 LLVMUsed = 493 new GlobalVariable(*M, ATy, false, GlobalValue::AppendingLinkage, 494 ConstantArray::get(ATy, MergedVars), "llvm.used"); 495 LLVMUsed->setSection("llvm.metadata"); 496 } 497 498 void InstrProfiling::emitInitialization() { 499 std::string InstrProfileOutput = Options.InstrProfileOutput; 500 501 Constant *RegisterF = M->getFunction(getInstrProfRegFuncsName()); 502 if (!RegisterF && InstrProfileOutput.empty()) return; 503 504 // Create the initialization function. 505 auto *VoidTy = Type::getVoidTy(M->getContext()); 506 auto *F = Function::Create(FunctionType::get(VoidTy, false), 507 GlobalValue::InternalLinkage, 508 getInstrProfInitFuncName(), M); 509 F->setUnnamedAddr(true); 510 F->addFnAttr(Attribute::NoInline); 511 if (Options.NoRedZone) F->addFnAttr(Attribute::NoRedZone); 512 513 // Add the basic block and the necessary calls. 514 IRBuilder<> IRB(BasicBlock::Create(M->getContext(), "", F)); 515 if (RegisterF) 516 IRB.CreateCall(RegisterF, {}); 517 if (!InstrProfileOutput.empty()) { 518 auto *Int8PtrTy = Type::getInt8PtrTy(M->getContext()); 519 auto *SetNameTy = FunctionType::get(VoidTy, Int8PtrTy, false); 520 auto *SetNameF = Function::Create(SetNameTy, GlobalValue::ExternalLinkage, 521 getInstrProfFileOverriderFuncName(), M); 522 523 // Create variable for profile name. 524 Constant *ProfileNameConst = 525 ConstantDataArray::getString(M->getContext(), InstrProfileOutput, true); 526 GlobalVariable *ProfileName = 527 new GlobalVariable(*M, ProfileNameConst->getType(), true, 528 GlobalValue::PrivateLinkage, ProfileNameConst); 529 530 IRB.CreateCall(SetNameF, IRB.CreatePointerCast(ProfileName, Int8PtrTy)); 531 } 532 IRB.CreateRetVoid(); 533 534 appendToGlobalCtors(*M, F, 0); 535 } 536