1 //===- llvm-profdata.cpp - LLVM profile data tool -------------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
// llvm-profdata merges and displays profile data (.profdata) files.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "llvm/ADT/SmallSet.h"
15 #include "llvm/ADT/SmallVector.h"
16 #include "llvm/ADT/StringRef.h"
17 #include "llvm/IR/LLVMContext.h"
18 #include "llvm/ProfileData/InstrProfReader.h"
19 #include "llvm/ProfileData/InstrProfWriter.h"
20 #include "llvm/ProfileData/ProfileCommon.h"
21 #include "llvm/ProfileData/SampleProfReader.h"
22 #include "llvm/ProfileData/SampleProfWriter.h"
23 #include "llvm/Support/CommandLine.h"
24 #include "llvm/Support/Errc.h"
25 #include "llvm/Support/FileSystem.h"
26 #include "llvm/Support/Format.h"
27 #include "llvm/Support/InitLLVM.h"
28 #include "llvm/Support/MemoryBuffer.h"
29 #include "llvm/Support/Path.h"
30 #include "llvm/Support/WithColor.h"
31 #include "llvm/Support/ThreadPool.h"
32 #include "llvm/Support/raw_ostream.h"
33 #include <algorithm>
34 
35 using namespace llvm;
36 
/// Profile encodings understood by this tool.
///
/// The numeric value of each enumerator is used as an index into FormatMap
/// when merging sample profiles, so the order here has to stay in sync with
/// that table.
enum ProfileFormat {
  PF_None = 0,
  PF_Text,
  PF_Compact_Binary,
  PF_GCC,
  PF_Binary
};
44 
45 static void warn(Twine Message, std::string Whence = "",
46                  std::string Hint = "") {
47   WithColor::warning();
48   if (!Whence.empty())
49     errs() << Whence << ": ";
50   errs() << Message << "\n";
51   if (!Hint.empty())
52     WithColor::note() << Hint << "\n";
53 }
54 
55 static void exitWithError(Twine Message, std::string Whence = "",
56                           std::string Hint = "") {
57   WithColor::error();
58   if (!Whence.empty())
59     errs() << Whence << ": ";
60   errs() << Message << "\n";
61   if (!Hint.empty())
62     WithColor::note() << Hint << "\n";
63   ::exit(1);
64 }
65 
66 static void exitWithError(Error E, StringRef Whence = "") {
67   if (E.isA<InstrProfError>()) {
68     handleAllErrors(std::move(E), [&](const InstrProfError &IPE) {
69       instrprof_error instrError = IPE.get();
70       StringRef Hint = "";
71       if (instrError == instrprof_error::unrecognized_format) {
72         // Hint for common error of forgetting -sample for sample profiles.
73         Hint = "Perhaps you forgot to use the -sample option?";
74       }
75       exitWithError(IPE.message(), Whence, Hint);
76     });
77   }
78 
79   exitWithError(toString(std::move(E)), Whence);
80 }
81 
82 static void exitWithErrorCode(std::error_code EC, StringRef Whence = "") {
83   exitWithError(EC.message(), Whence);
84 }
85 
namespace {
/// Kind of profile a command operates on. The enumerator names are also used
/// verbatim as command-line flag names (through clEnumVal in merge_main), so
/// renaming them changes the tool's interface.
enum ProfileKinds { instr, sample };
}
89 
90 static void handleMergeWriterError(Error E, StringRef WhenceFile = "",
91                                    StringRef WhenceFunction = "",
92                                    bool ShowHint = true) {
93   if (!WhenceFile.empty())
94     errs() << WhenceFile << ": ";
95   if (!WhenceFunction.empty())
96     errs() << WhenceFunction << ": ";
97 
98   auto IPE = instrprof_error::success;
99   E = handleErrors(std::move(E),
100                    [&IPE](std::unique_ptr<InstrProfError> E) -> Error {
101                      IPE = E->get();
102                      return Error(std::move(E));
103                    });
104   errs() << toString(std::move(E)) << "\n";
105 
106   if (ShowHint) {
107     StringRef Hint = "";
108     if (IPE != instrprof_error::success) {
109       switch (IPE) {
110       case instrprof_error::hash_mismatch:
111       case instrprof_error::count_mismatch:
112       case instrprof_error::value_site_count_mismatch:
113         Hint = "Make sure that all profile data to be merged is generated "
114                "from the same binary.";
115         break;
116       default:
117         break;
118       }
119     }
120 
121     if (!Hint.empty())
122       errs() << Hint << "\n";
123   }
124 }
125 
126 namespace {
127 /// A remapper from original symbol names to new symbol names based on a file
128 /// containing a list of mappings from old name to new name.
129 class SymbolRemapper {
130   std::unique_ptr<MemoryBuffer> File;
131   DenseMap<StringRef, StringRef> RemappingTable;
132 
133 public:
134   /// Build a SymbolRemapper from a file containing a list of old/new symbols.
135   static std::unique_ptr<SymbolRemapper> create(StringRef InputFile) {
136     auto BufOrError = MemoryBuffer::getFileOrSTDIN(InputFile);
137     if (!BufOrError)
138       exitWithErrorCode(BufOrError.getError(), InputFile);
139 
140     auto Remapper = llvm::make_unique<SymbolRemapper>();
141     Remapper->File = std::move(BufOrError.get());
142 
143     for (line_iterator LineIt(*Remapper->File, /*SkipBlanks=*/true, '#');
144          !LineIt.is_at_eof(); ++LineIt) {
145       std::pair<StringRef, StringRef> Parts = LineIt->split(' ');
146       if (Parts.first.empty() || Parts.second.empty() ||
147           Parts.second.count(' ')) {
148         exitWithError("unexpected line in remapping file",
149                       (InputFile + ":" + Twine(LineIt.line_number())).str(),
150                       "expected 'old_symbol new_symbol'");
151       }
152       Remapper->RemappingTable.insert(Parts);
153     }
154     return Remapper;
155   }
156 
157   /// Attempt to map the given old symbol into a new symbol.
158   ///
159   /// \return The new symbol, or \p Name if no such symbol was found.
160   StringRef operator()(StringRef Name) {
161     StringRef New = RemappingTable.lookup(Name);
162     return New.empty() ? Name : New;
163   }
164 };
165 }
166 
/// An input profile together with the weight given to it when merging.
struct WeightedFile {
  std::string Filename; // Path of the input; "-" is passed through as stdin.
  uint64_t Weight;      // Merge weight; unweighted inputs are added with 1.
};
/// List of inputs to merge.
typedef SmallVector<WeightedFile, 5> WeightedFileVector;
172 
/// Keep track of merged data and reported errors.
///
/// mergeInstrProfile creates one context per merge thread; loadInput fills a
/// context and mergeWriterContexts folds one context into another.
struct WriterContext {
  std::mutex Lock;        // Taken by loadInput for the duration of a load.
  InstrProfWriter Writer; // Accumulates the records loaded into this context.
  Error Err;              // Deferred hard error; success when none is pending.
  std::string ErrWhence;  // Name of the input most recently loaded here.
  std::mutex &ErrLock;    // Lock shared by all contexts; guards the set below.
  // Error codes already reported by any context; loadInput uses it to print
  // the hint only the first time a given code is seen.
  SmallSet<instrprof_error, 4> &WriterErrorCodes;

  WriterContext(bool IsSparse, std::mutex &ErrLock,
                SmallSet<instrprof_error, 4> &WriterErrorCodes)
      : Lock(), Writer(IsSparse), Err(Error::success()), ErrWhence(""),
        ErrLock(ErrLock), WriterErrorCodes(WriterErrorCodes) {}
};
187 
188 /// Determine whether an error is fatal for profile merging.
189 static bool isFatalError(instrprof_error IPE) {
190   switch (IPE) {
191   default:
192     return true;
193   case instrprof_error::success:
194   case instrprof_error::eof:
195   case instrprof_error::unknown_function:
196   case instrprof_error::hash_mismatch:
197   case instrprof_error::count_mismatch:
198   case instrprof_error::counter_overflow:
199   case instrprof_error::value_site_count_mismatch:
200     return false;
201   }
202 }
203 
/// Load an input into a writer context.
///
/// Every record read from \p Input is added to \p WC's writer together with
/// the input's weight; function names are first passed through \p Remapper
/// when one is supplied. Hard errors are stored in WC->Err for the caller to
/// report later, while per-record merge errors are printed right away through
/// handleMergeWriterError.
static void loadInput(const WeightedFile &Input, SymbolRemapper *Remapper,
                      WriterContext *WC) {
  // Held until the function returns, so loads into one context are serialized.
  std::unique_lock<std::mutex> CtxGuard{WC->Lock};

  // If there's a pending hard error, don't do more work.
  if (WC->Err)
    return;

  // Copy the filename, because llvm::ThreadPool copied the input "const
  // WeightedFile &" by value, making a reference to the filename within it
  // invalid outside of this packaged task.
  WC->ErrWhence = Input.Filename;

  auto ReaderOrErr = InstrProfReader::create(Input.Filename);
  if (Error E = ReaderOrErr.takeError()) {
    // Skip the empty profiles by returning silently.
    instrprof_error IPE = InstrProfError::take(std::move(E));
    if (IPE != instrprof_error::empty_raw_profile)
      WC->Err = make_error<InstrProfError>(IPE);
    return;
  }

  auto Reader = std::move(ReaderOrErr.get());
  bool IsIRProfile = Reader->isIRLevelProfile();
  // A truthy result from setIsIRLevelProfile is treated as a conflict between
  // this input's profile level and what the writer already holds.
  if (WC->Writer.setIsIRLevelProfile(IsIRProfile)) {
    WC->Err = make_error<StringError>(
        "Merge IR generated profile with Clang generated profile.",
        std::error_code());
    return;
  }

  for (auto &I : *Reader) {
    if (Remapper)
      I.Name = (*Remapper)(I.Name);
    // Captured before the record is moved into the writer below.
    const StringRef FuncName = I.Name;
    // Report at most one error per record; later ones are consumed silently.
    bool Reported = false;
    WC->Writer.addRecord(std::move(I), Input.Weight, [&](Error E) {
      if (Reported) {
        consumeError(std::move(E));
        return;
      }
      Reported = true;
      // Only show hint the first time an error occurs.
      instrprof_error IPE = InstrProfError::take(std::move(E));
      // ErrLock is shared by all contexts and protects WriterErrorCodes.
      std::unique_lock<std::mutex> ErrGuard{WC->ErrLock};
      bool firstTime = WC->WriterErrorCodes.insert(IPE).second;
      handleMergeWriterError(make_error<InstrProfError>(IPE), Input.Filename,
                             FuncName, firstTime);
    });
  }
  // Only reader errors that isFatalError classifies as fatal are kept.
  if (Reader->hasError()) {
    if (Error E = Reader->getError()) {
      instrprof_error IPE = InstrProfError::take(std::move(E));
      if (isFatalError(IPE))
        WC->Err = make_error<InstrProfError>(IPE);
    }
  }
}
263 
264 /// Merge the \p Src writer context into \p Dst.
265 static void mergeWriterContexts(WriterContext *Dst, WriterContext *Src) {
266   // If we've already seen a hard error, continuing with the merge would
267   // clobber it.
268   if (Dst->Err || Src->Err)
269     return;
270 
271   bool Reported = false;
272   Dst->Writer.mergeRecordsFromWriter(std::move(Src->Writer), [&](Error E) {
273     if (Reported) {
274       consumeError(std::move(E));
275       return;
276     }
277     Reported = true;
278     Dst->Err = std::move(E);
279   });
280 }
281 
282 static void mergeInstrProfile(const WeightedFileVector &Inputs,
283                               SymbolRemapper *Remapper,
284                               StringRef OutputFilename,
285                               ProfileFormat OutputFormat, bool OutputSparse,
286                               unsigned NumThreads) {
287   if (OutputFilename.compare("-") == 0)
288     exitWithError("Cannot write indexed profdata format to stdout.");
289 
290   if (OutputFormat != PF_Binary && OutputFormat != PF_Compact_Binary &&
291       OutputFormat != PF_Text)
292     exitWithError("Unknown format is specified.");
293 
294   std::error_code EC;
295   raw_fd_ostream Output(OutputFilename.data(), EC, sys::fs::F_None);
296   if (EC)
297     exitWithErrorCode(EC, OutputFilename);
298 
299   std::mutex ErrorLock;
300   SmallSet<instrprof_error, 4> WriterErrorCodes;
301 
302   // If NumThreads is not specified, auto-detect a good default.
303   if (NumThreads == 0)
304     NumThreads =
305         std::min(hardware_concurrency(), unsigned((Inputs.size() + 1) / 2));
306 
307   // Initialize the writer contexts.
308   SmallVector<std::unique_ptr<WriterContext>, 4> Contexts;
309   for (unsigned I = 0; I < NumThreads; ++I)
310     Contexts.emplace_back(llvm::make_unique<WriterContext>(
311         OutputSparse, ErrorLock, WriterErrorCodes));
312 
313   if (NumThreads == 1) {
314     for (const auto &Input : Inputs)
315       loadInput(Input, Remapper, Contexts[0].get());
316   } else {
317     ThreadPool Pool(NumThreads);
318 
319     // Load the inputs in parallel (N/NumThreads serial steps).
320     unsigned Ctx = 0;
321     for (const auto &Input : Inputs) {
322       Pool.async(loadInput, Input, Remapper, Contexts[Ctx].get());
323       Ctx = (Ctx + 1) % NumThreads;
324     }
325     Pool.wait();
326 
327     // Merge the writer contexts together (~ lg(NumThreads) serial steps).
328     unsigned Mid = Contexts.size() / 2;
329     unsigned End = Contexts.size();
330     assert(Mid > 0 && "Expected more than one context");
331     do {
332       for (unsigned I = 0; I < Mid; ++I)
333         Pool.async(mergeWriterContexts, Contexts[I].get(),
334                    Contexts[I + Mid].get());
335       Pool.wait();
336       if (End & 1) {
337         Pool.async(mergeWriterContexts, Contexts[0].get(),
338                    Contexts[End - 1].get());
339         Pool.wait();
340       }
341       End = Mid;
342       Mid /= 2;
343     } while (Mid > 0);
344   }
345 
346   // Handle deferred hard errors encountered during merging.
347   for (std::unique_ptr<WriterContext> &WC : Contexts) {
348     if (!WC->Err)
349       continue;
350     if (!WC->Err.isA<InstrProfError>())
351       exitWithError(std::move(WC->Err), WC->ErrWhence);
352 
353     instrprof_error IPE = InstrProfError::take(std::move(WC->Err));
354     if (isFatalError(IPE))
355       exitWithError(make_error<InstrProfError>(IPE), WC->ErrWhence);
356     else
357       warn(toString(make_error<InstrProfError>(IPE)),
358            WC->ErrWhence);
359   }
360 
361   InstrProfWriter &Writer = Contexts[0]->Writer;
362   if (OutputFormat == PF_Text) {
363     if (Error E = Writer.writeText(Output))
364       exitWithError(std::move(E));
365   } else {
366     Writer.write(Output);
367   }
368 }
369 
370 /// Make a copy of the given function samples with all symbol names remapped
371 /// by the provided symbol remapper.
372 static sampleprof::FunctionSamples
373 remapSamples(const sampleprof::FunctionSamples &Samples,
374              SymbolRemapper &Remapper, sampleprof_error &Error) {
375   sampleprof::FunctionSamples Result;
376   Result.setName(Remapper(Samples.getName()));
377   Result.addTotalSamples(Samples.getTotalSamples());
378   Result.addHeadSamples(Samples.getHeadSamples());
379   for (const auto &BodySample : Samples.getBodySamples()) {
380     Result.addBodySamples(BodySample.first.LineOffset,
381                           BodySample.first.Discriminator,
382                           BodySample.second.getSamples());
383     for (const auto &Target : BodySample.second.getCallTargets()) {
384       Result.addCalledTargetSamples(BodySample.first.LineOffset,
385                                     BodySample.first.Discriminator,
386                                     Remapper(Target.first()), Target.second);
387     }
388   }
389   for (const auto &CallsiteSamples : Samples.getCallsiteSamples()) {
390     sampleprof::FunctionSamplesMap &Target =
391         Result.functionSamplesAt(CallsiteSamples.first);
392     for (const auto &Callsite : CallsiteSamples.second) {
393       sampleprof::FunctionSamples Remapped =
394           remapSamples(Callsite.second, Remapper, Error);
395       MergeResult(Error, Target[Remapped.getName()].merge(Remapped));
396     }
397   }
398   return Result;
399 }
400 
/// Sample profile format corresponding to each ProfileFormat value. The table
/// is indexed with a ProfileFormat, so its entries follow the declaration
/// order of that enum.
static sampleprof::SampleProfileFormat FormatMap[] = {
    sampleprof::SPF_None, sampleprof::SPF_Text, sampleprof::SPF_Compact_Binary,
    sampleprof::SPF_GCC, sampleprof::SPF_Binary};
404 
405 static void mergeSampleProfile(const WeightedFileVector &Inputs,
406                                SymbolRemapper *Remapper,
407                                StringRef OutputFilename,
408                                ProfileFormat OutputFormat) {
409   using namespace sampleprof;
410   auto WriterOrErr =
411       SampleProfileWriter::create(OutputFilename, FormatMap[OutputFormat]);
412   if (std::error_code EC = WriterOrErr.getError())
413     exitWithErrorCode(EC, OutputFilename);
414 
415   auto Writer = std::move(WriterOrErr.get());
416   StringMap<FunctionSamples> ProfileMap;
417   SmallVector<std::unique_ptr<sampleprof::SampleProfileReader>, 5> Readers;
418   LLVMContext Context;
419   for (const auto &Input : Inputs) {
420     auto ReaderOrErr = SampleProfileReader::create(Input.Filename, Context);
421     if (std::error_code EC = ReaderOrErr.getError())
422       exitWithErrorCode(EC, Input.Filename);
423 
424     // We need to keep the readers around until after all the files are
425     // read so that we do not lose the function names stored in each
426     // reader's memory. The function names are needed to write out the
427     // merged profile map.
428     Readers.push_back(std::move(ReaderOrErr.get()));
429     const auto Reader = Readers.back().get();
430     if (std::error_code EC = Reader->read())
431       exitWithErrorCode(EC, Input.Filename);
432 
433     StringMap<FunctionSamples> &Profiles = Reader->getProfiles();
434     for (StringMap<FunctionSamples>::iterator I = Profiles.begin(),
435                                               E = Profiles.end();
436          I != E; ++I) {
437       sampleprof_error Result = sampleprof_error::success;
438       FunctionSamples Remapped =
439           Remapper ? remapSamples(I->second, *Remapper, Result)
440                    : FunctionSamples();
441       FunctionSamples &Samples = Remapper ? Remapped : I->second;
442       StringRef FName = Samples.getName();
443       MergeResult(Result, ProfileMap[FName].merge(Samples, Input.Weight));
444       if (Result != sampleprof_error::success) {
445         std::error_code EC = make_error_code(Result);
446         handleMergeWriterError(errorCodeToError(EC), Input.Filename, FName);
447       }
448     }
449   }
450   Writer->write(ProfileMap);
451 }
452 
453 static WeightedFile parseWeightedFile(const StringRef &WeightedFilename) {
454   StringRef WeightStr, FileName;
455   std::tie(WeightStr, FileName) = WeightedFilename.split(',');
456 
457   uint64_t Weight;
458   if (WeightStr.getAsInteger(10, Weight) || Weight < 1)
459     exitWithError("Input weight must be a positive integer.");
460 
461   return {FileName, Weight};
462 }
463 
464 static std::unique_ptr<MemoryBuffer>
465 getInputFilenamesFileBuf(const StringRef &InputFilenamesFile) {
466   if (InputFilenamesFile == "")
467     return {};
468 
469   auto BufOrError = MemoryBuffer::getFileOrSTDIN(InputFilenamesFile);
470   if (!BufOrError)
471     exitWithErrorCode(BufOrError.getError(), InputFilenamesFile);
472 
473   return std::move(*BufOrError);
474 }
475 
476 static void addWeightedInput(WeightedFileVector &WNI, const WeightedFile &WF) {
477   StringRef Filename = WF.Filename;
478   uint64_t Weight = WF.Weight;
479 
480   // If it's STDIN just pass it on.
481   if (Filename == "-") {
482     WNI.push_back({Filename, Weight});
483     return;
484   }
485 
486   llvm::sys::fs::file_status Status;
487   llvm::sys::fs::status(Filename, Status);
488   if (!llvm::sys::fs::exists(Status))
489     exitWithErrorCode(make_error_code(errc::no_such_file_or_directory),
490                       Filename);
491   // If it's a source file, collect it.
492   if (llvm::sys::fs::is_regular_file(Status)) {
493     WNI.push_back({Filename, Weight});
494     return;
495   }
496 
497   if (llvm::sys::fs::is_directory(Status)) {
498     std::error_code EC;
499     for (llvm::sys::fs::recursive_directory_iterator F(Filename, EC), E;
500          F != E && !EC; F.increment(EC)) {
501       if (llvm::sys::fs::is_regular_file(F->path())) {
502         addWeightedInput(WNI, {F->path(), Weight});
503       }
504     }
505     if (EC)
506       exitWithErrorCode(EC, Filename);
507   }
508 }
509 
510 static void parseInputFilenamesFile(MemoryBuffer *Buffer,
511                                     WeightedFileVector &WFV) {
512   if (!Buffer)
513     return;
514 
515   SmallVector<StringRef, 8> Entries;
516   StringRef Data = Buffer->getBuffer();
517   Data.split(Entries, '\n', /*MaxSplit=*/-1, /*KeepEmpty=*/false);
518   for (const StringRef &FileWeightEntry : Entries) {
519     StringRef SanitizedEntry = FileWeightEntry.trim(" \t\v\f\r");
520     // Skip comments.
521     if (SanitizedEntry.startswith("#"))
522       continue;
523     // If there's no comma, it's an unweighted profile.
524     else if (SanitizedEntry.find(',') == StringRef::npos)
525       addWeightedInput(WFV, {SanitizedEntry, 1});
526     else
527       addWeightedInput(WFV, parseWeightedFile(SanitizedEntry));
528   }
529 }
530 
/// Entry point of the merge command: parse the command line, collect the
/// weighted inputs and merge them as an instrumentation or a sample profile.
///
/// \return 0; every failure path terminates the process through one of the
/// exitWithError helpers.
static int merge_main(int argc, const char *argv[]) {
  // The options are declared as locals of this function and are parsed by
  // the ParseCommandLineOptions call below.
  cl::list<std::string> InputFilenames(cl::Positional,
                                       cl::desc("<filename...>"));
  cl::list<std::string> WeightedInputFilenames("weighted-input",
                                               cl::desc("<weight>,<filename>"));
  cl::opt<std::string> InputFilenamesFile(
      "input-files", cl::init(""),
      cl::desc("Path to file containing newline-separated "
               "[<weight>,]<filename> entries"));
  cl::alias InputFilenamesFileA("f", cl::desc("Alias for --input-files"),
                                cl::aliasopt(InputFilenamesFile));
  cl::opt<bool> DumpInputFileList(
      "dump-input-file-list", cl::init(false), cl::Hidden,
      cl::desc("Dump the list of input files and their weights, then exit"));
  cl::opt<std::string> RemappingFile("remapping-file", cl::value_desc("file"),
                                     cl::desc("Symbol remapping file"));
  cl::alias RemappingFileA("r", cl::desc("Alias for --remapping-file"),
                           cl::aliasopt(RemappingFile));
  cl::opt<std::string> OutputFilename("output", cl::value_desc("output"),
                                      cl::init("-"), cl::Required,
                                      cl::desc("Output file"));
  cl::alias OutputFilenameA("o", cl::desc("Alias for --output"),
                            cl::aliasopt(OutputFilename));
  cl::opt<ProfileKinds> ProfileKind(
      cl::desc("Profile kind:"), cl::init(instr),
      cl::values(clEnumVal(instr, "Instrumentation profile (default)"),
                 clEnumVal(sample, "Sample profile")));
  cl::opt<ProfileFormat> OutputFormat(
      cl::desc("Format of output profile"), cl::init(PF_Binary),
      cl::values(clEnumValN(PF_Binary, "binary", "Binary encoding (default)"),
                 clEnumValN(PF_Compact_Binary, "compbinary",
                            "Compact binary encoding"),
                 clEnumValN(PF_Text, "text", "Text encoding"),
                 clEnumValN(PF_GCC, "gcc",
                            "GCC encoding (only meaningful for -sample)")));
  cl::opt<bool> OutputSparse("sparse", cl::init(false),
      cl::desc("Generate a sparse profile (only meaningful for -instr)"));
  cl::opt<unsigned> NumThreads(
      "num-threads", cl::init(0),
      cl::desc("Number of merge threads to use (default: autodetect)"));
  cl::alias NumThreadsA("j", cl::desc("Alias for --num-threads"),
                        cl::aliasopt(NumThreads));

  cl::ParseCommandLineOptions(argc, argv, "LLVM profile data merger\n");

  // Inputs come from three places: positional arguments (weight 1),
  // -weighted-input options, and the -input-files list file.
  WeightedFileVector WeightedInputs;
  for (StringRef Filename : InputFilenames)
    addWeightedInput(WeightedInputs, {Filename, 1});
  for (StringRef WeightedFilename : WeightedInputFilenames)
    addWeightedInput(WeightedInputs, parseWeightedFile(WeightedFilename));

  // Make sure that the file buffer stays alive for the duration of the
  // weighted input vector's lifetime.
  auto Buffer = getInputFilenamesFileBuf(InputFilenamesFile);
  parseInputFilenamesFile(Buffer.get(), WeightedInputs);

  if (WeightedInputs.empty())
    exitWithError("No input files specified. See " +
                  sys::path::filename(argv[0]) + " -help");

  // Hidden option: print "<weight>,<filename>" for every input and stop
  // without merging anything.
  if (DumpInputFileList) {
    for (auto &WF : WeightedInputs)
      outs() << WF.Weight << "," << WF.Filename << "\n";
    return 0;
  }

  // The remapper is optional; a null pointer is passed on when no remapping
  // file was given.
  std::unique_ptr<SymbolRemapper> Remapper;
  if (!RemappingFile.empty())
    Remapper = SymbolRemapper::create(RemappingFile);

  if (ProfileKind == instr)
    mergeInstrProfile(WeightedInputs, Remapper.get(), OutputFilename,
                      OutputFormat, OutputSparse, NumThreads);
  else
    mergeSampleProfile(WeightedInputs, Remapper.get(), OutputFilename,
                       OutputFormat);

  return 0;
}
610 
/// Running totals collected while walking the value sites of one value kind.
struct ValueSitesStats {
  /// Number of value sites seen.
  uint64_t TotalNumValueSites = 0;
  /// Number of value sites that recorded at least one value.
  uint64_t TotalNumValueSitesWithValueProfile = 0;
  /// Number of values recorded over all sites.
  uint64_t TotalNumValues = 0;
  /// Entry I counts the sites that recorded exactly I + 1 values.
  std::vector<unsigned> ValueSitesHistogram;
};
620 
621 static void traverseAllValueSites(const InstrProfRecord &Func, uint32_t VK,
622                                   ValueSitesStats &Stats, raw_fd_ostream &OS,
623                                   InstrProfSymtab *Symtab) {
624   uint32_t NS = Func.getNumValueSites(VK);
625   Stats.TotalNumValueSites += NS;
626   for (size_t I = 0; I < NS; ++I) {
627     uint32_t NV = Func.getNumValueDataForSite(VK, I);
628     std::unique_ptr<InstrProfValueData[]> VD = Func.getValueForSite(VK, I);
629     Stats.TotalNumValues += NV;
630     if (NV) {
631       Stats.TotalNumValueSitesWithValueProfile++;
632       if (NV > Stats.ValueSitesHistogram.size())
633         Stats.ValueSitesHistogram.resize(NV, 0);
634       Stats.ValueSitesHistogram[NV - 1]++;
635     }
636     for (uint32_t V = 0; V < NV; V++) {
637       OS << "\t[ " << I << ", ";
638       if (Symtab == nullptr)
639         OS << VD[V].Value;
640       else
641         OS << Symtab->getFuncName(VD[V].Value);
642       OS << ", " << VD[V].Count << " ]\n";
643     }
644   }
645 }
646 
647 static void showValueSitesStats(raw_fd_ostream &OS, uint32_t VK,
648                                 ValueSitesStats &Stats) {
649   OS << "  Total number of sites: " << Stats.TotalNumValueSites << "\n";
650   OS << "  Total number of sites with values: "
651      << Stats.TotalNumValueSitesWithValueProfile << "\n";
652   OS << "  Total number of profiled values: " << Stats.TotalNumValues << "\n";
653 
654   OS << "  Value sites histogram:\n\tNumTargets, SiteCount\n";
655   for (unsigned I = 0; I < Stats.ValueSitesHistogram.size(); I++) {
656     if (Stats.ValueSitesHistogram[I] > 0)
657       OS << "\t" << I + 1 << ", " << Stats.ValueSitesHistogram[I] << "\n";
658   }
659 }
660 
/// Print the contents of the instrumentation profile \p Filename to \p OS.
///
/// With \p TextFormat set, only the ":ir" marker (for IR-level profiles) and
/// the selected records, written through InstrProfWriter::writeRecordInText,
/// are emitted. Otherwise the selected functions are printed in detail,
/// followed by a summary of the whole profile.
///
/// \param ShowCounts              print the counter values of shown functions.
/// \param TopN                    when non-zero, list the TopN functions with
///                                the largest counter value.
/// \param ShowIndirectCallTargets print indirect call value profiles.
/// \param ShowMemOPSizes          print memory intrinsic size value profiles.
/// \param ShowDetailedSummary     print the detailed summary section.
/// \param DetailedSummaryCutoffs  cutoffs for the summary builder; when empty
///                                and ShowDetailedSummary is set, a built-in
///                                list is used.
/// \param ShowAllFunctions        select every function.
/// \param ShowFunction            when non-empty, select the functions whose
///                                name contains this substring.
/// \return 0; failing to open or read the profile terminates the process.
static int showInstrProfile(const std::string &Filename, bool ShowCounts,
                            uint32_t TopN, bool ShowIndirectCallTargets,
                            bool ShowMemOPSizes, bool ShowDetailedSummary,
                            std::vector<uint32_t> DetailedSummaryCutoffs,
                            bool ShowAllFunctions,
                            const std::string &ShowFunction, bool TextFormat,
                            raw_fd_ostream &OS) {
  auto ReaderOrErr = InstrProfReader::create(Filename);
  std::vector<uint32_t> Cutoffs = std::move(DetailedSummaryCutoffs);
  if (ShowDetailedSummary && Cutoffs.empty()) {
    Cutoffs = {800000, 900000, 950000, 990000, 999000, 999900, 999990};
  }
  InstrProfSummaryBuilder Builder(std::move(Cutoffs));
  if (Error E = ReaderOrErr.takeError())
    exitWithError(std::move(E), Filename);

  auto Reader = std::move(ReaderOrErr.get());
  bool IsIRInstr = Reader->isIRLevelProfile();
  size_t ShownFunctions = 0;
  // One statistics slot per value kind, indexed directly by the kind.
  int NumVPKind = IPVK_Last - IPVK_First + 1;
  std::vector<ValueSitesStats> VPStats(NumVPKind);

  // Ordering by "greater count" turns the priority queue into a min-heap:
  // top() is the coldest of the functions currently kept.
  auto MinCmp = [](const std::pair<std::string, uint64_t> &v1,
                   const std::pair<std::string, uint64_t> &v2) {
    return v1.second > v2.second;
  };

  std::priority_queue<std::pair<std::string, uint64_t>,
                      std::vector<std::pair<std::string, uint64_t>>,
                      decltype(MinCmp)>
      HottestFuncs(MinCmp);

  // Add marker so that IR-level instrumentation round-trips properly.
  if (TextFormat && IsIRInstr)
    OS << ":ir\n";

  for (const auto &Func : *Reader) {
    bool Show =
        ShowAllFunctions || (!ShowFunction.empty() &&
                             Func.Name.find(ShowFunction) != Func.Name.npos);

    bool doTextFormatDump = (Show && TextFormat);

    // In text mode a selected record is written out and takes no part in the
    // summary or top-N bookkeeping below.
    if (doTextFormatDump) {
      InstrProfSymtab &Symtab = Reader->getSymtab();
      InstrProfWriter::writeRecordInText(Func.Name, Func.Hash, Func, Symtab,
                                         OS);
      continue;
    }

    assert(Func.Counts.size() > 0 && "function missing entry counter");
    Builder.addRecord(Func);

    if (TopN) {
      // Rank the function by its largest counter.
      uint64_t FuncMax = 0;
      for (size_t I = 0, E = Func.Counts.size(); I < E; ++I)
        FuncMax = std::max(FuncMax, Func.Counts[I]);

      // Keep at most TopN entries: once full, replace the coldest entry only
      // when this function is strictly hotter.
      if (HottestFuncs.size() == TopN) {
        if (HottestFuncs.top().second < FuncMax) {
          HottestFuncs.pop();
          HottestFuncs.emplace(std::make_pair(std::string(Func.Name), FuncMax));
        }
      } else
        HottestFuncs.emplace(std::make_pair(std::string(Func.Name), FuncMax));
    }

    if (Show) {

      // Print the section header before the first shown function only.
      if (!ShownFunctions)
        OS << "Counters:\n";

      ++ShownFunctions;

      OS << "  " << Func.Name << ":\n"
         << "    Hash: " << format("0x%016" PRIx64, Func.Hash) << "\n"
         << "    Counters: " << Func.Counts.size() << "\n";
      if (!IsIRInstr)
        OS << "    Function count: " << Func.Counts[0] << "\n";

      if (ShowIndirectCallTargets)
        OS << "    Indirect Call Site Count: "
           << Func.getNumValueSites(IPVK_IndirectCallTarget) << "\n";

      uint32_t NumMemOPCalls = Func.getNumValueSites(IPVK_MemOPSize);
      if (ShowMemOPSizes && NumMemOPCalls > 0)
        OS << "    Number of Memory Intrinsics Calls: " << NumMemOPCalls
           << "\n";

      if (ShowCounts) {
        OS << "    Block counts: [";
        // For non-IR profiles counter 0 was already printed above as the
        // function count, so the block list starts at index 1.
        size_t Start = (IsIRInstr ? 0 : 1);
        for (size_t I = Start, E = Func.Counts.size(); I < E; ++I) {
          OS << (I == Start ? "" : ", ") << Func.Counts[I];
        }
        OS << "]\n";
      }

      if (ShowIndirectCallTargets) {
        OS << "    Indirect Target Results:\n";
        traverseAllValueSites(Func, IPVK_IndirectCallTarget,
                              VPStats[IPVK_IndirectCallTarget], OS,
                              &(Reader->getSymtab()));
      }

      if (ShowMemOPSizes && NumMemOPCalls > 0) {
        OS << "    Memory Intrinsic Size Results:\n";
        traverseAllValueSites(Func, IPVK_MemOPSize, VPStats[IPVK_MemOPSize], OS,
                              nullptr);
      }
    }
  }
  if (Reader->hasError())
    exitWithError(Reader->getError(), Filename);

  // Text output consists of the records only; no summary follows.
  if (TextFormat)
    return 0;
  std::unique_ptr<ProfileSummary> PS(Builder.getSummary());
  OS << "Instrumentation level: "
     << (Reader->isIRLevelProfile() ? "IR" : "Front-end") << "\n";
  if (ShowAllFunctions || !ShowFunction.empty())
    OS << "Functions shown: " << ShownFunctions << "\n";
  OS << "Total functions: " << PS->getNumFunctions() << "\n";
  OS << "Maximum function count: " << PS->getMaxFunctionCount() << "\n";
  OS << "Maximum internal block count: " << PS->getMaxInternalCount() << "\n";

  if (TopN) {
    // Draining the min-heap yields coldest-first order; it is reversed when
    // printing so that the hottest function comes first.
    std::vector<std::pair<std::string, uint64_t>> SortedHottestFuncs;
    while (!HottestFuncs.empty()) {
      SortedHottestFuncs.emplace_back(HottestFuncs.top());
      HottestFuncs.pop();
    }
    OS << "Top " << TopN
       << " functions with the largest internal block counts: \n";
    for (auto &hotfunc : llvm::reverse(SortedHottestFuncs))
      OS << "  " << hotfunc.first << ", max count = " << hotfunc.second << "\n";
  }

  if (ShownFunctions && ShowIndirectCallTargets) {
    OS << "Statistics for indirect call sites profile:\n";
    showValueSitesStats(OS, IPVK_IndirectCallTarget,
                        VPStats[IPVK_IndirectCallTarget]);
  }

  if (ShownFunctions && ShowMemOPSizes) {
    OS << "Statistics for memory intrinsic calls sizes profile:\n";
    showValueSitesStats(OS, IPVK_MemOPSize, VPStats[IPVK_MemOPSize]);
  }

  if (ShowDetailedSummary) {
    OS << "Detailed summary:\n";
    OS << "Total number of blocks: " << PS->getNumCounts() << "\n";
    OS << "Total count: " << PS->getTotalCount() << "\n";
    for (auto Entry : PS->getDetailedSummary()) {
      // The cutoff is stored scaled by ProfileSummary::Scale; convert it to a
      // percentage for display.
      OS << Entry.NumCounts << " blocks with count >= " << Entry.MinCount
         << " account for "
         << format("%0.6g", (float)Entry.Cutoff / ProfileSummary::Scale * 100)
         << " percentage of the total counts.\n";
    }
  }
  return 0;
}
823 
824 static int showSampleProfile(const std::string &Filename, bool ShowCounts,
825                              bool ShowAllFunctions,
826                              const std::string &ShowFunction,
827                              raw_fd_ostream &OS) {
828   using namespace sampleprof;
829   LLVMContext Context;
830   auto ReaderOrErr = SampleProfileReader::create(Filename, Context);
831   if (std::error_code EC = ReaderOrErr.getError())
832     exitWithErrorCode(EC, Filename);
833 
834   auto Reader = std::move(ReaderOrErr.get());
835   if (std::error_code EC = Reader->read())
836     exitWithErrorCode(EC, Filename);
837 
838   if (ShowAllFunctions || ShowFunction.empty())
839     Reader->dump(OS);
840   else
841     Reader->dumpFunctionProfile(ShowFunction, OS);
842 
843   return 0;
844 }
845 
846 static int show_main(int argc, const char *argv[]) {
847   cl::opt<std::string> Filename(cl::Positional, cl::Required,
848                                 cl::desc("<profdata-file>"));
849 
850   cl::opt<bool> ShowCounts("counts", cl::init(false),
851                            cl::desc("Show counter values for shown functions"));
852   cl::opt<bool> TextFormat(
853       "text", cl::init(false),
854       cl::desc("Show instr profile data in text dump format"));
855   cl::opt<bool> ShowIndirectCallTargets(
856       "ic-targets", cl::init(false),
857       cl::desc("Show indirect call site target values for shown functions"));
858   cl::opt<bool> ShowMemOPSizes(
859       "memop-sizes", cl::init(false),
860       cl::desc("Show the profiled sizes of the memory intrinsic calls "
861                "for shown functions"));
862   cl::opt<bool> ShowDetailedSummary("detailed-summary", cl::init(false),
863                                     cl::desc("Show detailed profile summary"));
864   cl::list<uint32_t> DetailedSummaryCutoffs(
865       cl::CommaSeparated, "detailed-summary-cutoffs",
866       cl::desc(
867           "Cutoff percentages (times 10000) for generating detailed summary"),
868       cl::value_desc("800000,901000,999999"));
869   cl::opt<bool> ShowAllFunctions("all-functions", cl::init(false),
870                                  cl::desc("Details for every function"));
871   cl::opt<std::string> ShowFunction("function",
872                                     cl::desc("Details for matching functions"));
873 
874   cl::opt<std::string> OutputFilename("output", cl::value_desc("output"),
875                                       cl::init("-"), cl::desc("Output file"));
876   cl::alias OutputFilenameA("o", cl::desc("Alias for --output"),
877                             cl::aliasopt(OutputFilename));
878   cl::opt<ProfileKinds> ProfileKind(
879       cl::desc("Profile kind:"), cl::init(instr),
880       cl::values(clEnumVal(instr, "Instrumentation profile (default)"),
881                  clEnumVal(sample, "Sample profile")));
882   cl::opt<uint32_t> TopNFunctions(
883       "topn", cl::init(0),
884       cl::desc("Show the list of functions with the largest internal counts"));
885 
886   cl::ParseCommandLineOptions(argc, argv, "LLVM profile data summary\n");
887 
888   if (OutputFilename.empty())
889     OutputFilename = "-";
890 
891   std::error_code EC;
892   raw_fd_ostream OS(OutputFilename.data(), EC, sys::fs::F_Text);
893   if (EC)
894     exitWithErrorCode(EC, OutputFilename);
895 
896   if (ShowAllFunctions && !ShowFunction.empty())
897     WithColor::warning() << "-function argument ignored: showing all functions\n";
898 
899   std::vector<uint32_t> Cutoffs(DetailedSummaryCutoffs.begin(),
900                                 DetailedSummaryCutoffs.end());
901   if (ProfileKind == instr)
902     return showInstrProfile(Filename, ShowCounts, TopNFunctions,
903                             ShowIndirectCallTargets, ShowMemOPSizes,
904                             ShowDetailedSummary, DetailedSummaryCutoffs,
905                             ShowAllFunctions, ShowFunction, TextFormat, OS);
906   else
907     return showSampleProfile(Filename, ShowCounts, ShowAllFunctions,
908                              ShowFunction, OS);
909 }
910 
911 int main(int argc, const char *argv[]) {
912   InitLLVM X(argc, argv);
913 
914   StringRef ProgName(sys::path::filename(argv[0]));
915   if (argc > 1) {
916     int (*func)(int, const char *[]) = nullptr;
917 
918     if (strcmp(argv[1], "merge") == 0)
919       func = merge_main;
920     else if (strcmp(argv[1], "show") == 0)
921       func = show_main;
922 
923     if (func) {
924       std::string Invocation(ProgName.str() + " " + argv[1]);
925       argv[1] = Invocation.c_str();
926       return func(argc - 1, argv + 1);
927     }
928 
929     if (strcmp(argv[1], "-h") == 0 || strcmp(argv[1], "-help") == 0 ||
930         strcmp(argv[1], "--help") == 0) {
931 
932       errs() << "OVERVIEW: LLVM profile data tools\n\n"
933              << "USAGE: " << ProgName << " <command> [args...]\n"
934              << "USAGE: " << ProgName << " <command> -help\n\n"
935              << "See each individual command --help for more details.\n"
936              << "Available commands: merge, show\n";
937       return 0;
938     }
939   }
940 
941   if (argc < 2)
942     errs() << ProgName << ": No command specified!\n";
943   else
944     errs() << ProgName << ": Unknown command!\n";
945 
946   errs() << "USAGE: " << ProgName << " <merge|show> [args...]\n";
947   return 1;
948 }
949