1 //===- llvm-profdata.cpp - LLVM profile data tool -------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // llvm-profdata merges .profdata files.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "llvm/ADT/SmallSet.h"
14 #include "llvm/ADT/SmallVector.h"
15 #include "llvm/ADT/StringRef.h"
16 #include "llvm/IR/LLVMContext.h"
17 #include "llvm/ProfileData/InstrProfReader.h"
18 #include "llvm/ProfileData/InstrProfWriter.h"
19 #include "llvm/ProfileData/ProfileCommon.h"
20 #include "llvm/ProfileData/SampleProfReader.h"
21 #include "llvm/ProfileData/SampleProfWriter.h"
22 #include "llvm/Support/CommandLine.h"
23 #include "llvm/Support/Errc.h"
24 #include "llvm/Support/FileSystem.h"
25 #include "llvm/Support/Format.h"
26 #include "llvm/Support/InitLLVM.h"
27 #include "llvm/Support/MemoryBuffer.h"
28 #include "llvm/Support/Path.h"
29 #include "llvm/Support/ThreadPool.h"
30 #include "llvm/Support/WithColor.h"
31 #include "llvm/Support/raw_ostream.h"
32 #include <algorithm>
33 
34 using namespace llvm;
35 
/// Output encodings that can be requested for a merged profile.
///
/// The numeric values are used as indices into FormatMap, so the enumerators
/// must keep their current order and values.
enum ProfileFormat {
  PF_None = 0,
  PF_Text = 1,
  PF_Compact_Binary = 2,
  PF_GCC = 3,
  PF_Binary = 4
};
43 
44 static void warn(Twine Message, std::string Whence = "",
45                  std::string Hint = "") {
46   WithColor::warning();
47   if (!Whence.empty())
48     errs() << Whence << ": ";
49   errs() << Message << "\n";
50   if (!Hint.empty())
51     WithColor::note() << Hint << "\n";
52 }
53 
54 static void exitWithError(Twine Message, std::string Whence = "",
55                           std::string Hint = "") {
56   WithColor::error();
57   if (!Whence.empty())
58     errs() << Whence << ": ";
59   errs() << Message << "\n";
60   if (!Hint.empty())
61     WithColor::note() << Hint << "\n";
62   ::exit(1);
63 }
64 
65 static void exitWithError(Error E, StringRef Whence = "") {
66   if (E.isA<InstrProfError>()) {
67     handleAllErrors(std::move(E), [&](const InstrProfError &IPE) {
68       instrprof_error instrError = IPE.get();
69       StringRef Hint = "";
70       if (instrError == instrprof_error::unrecognized_format) {
71         // Hint for common error of forgetting -sample for sample profiles.
72         Hint = "Perhaps you forgot to use the -sample option?";
73       }
74       exitWithError(IPE.message(), Whence, Hint);
75     });
76   }
77 
78   exitWithError(toString(std::move(E)), Whence);
79 }
80 
81 static void exitWithErrorCode(std::error_code EC, StringRef Whence = "") {
82   exitWithError(EC.message(), Whence);
83 }
84 
namespace {
/// Kind of profile a command operates on; selected on the command line.
enum ProfileKinds {
  instr, ///< Instrumentation profile.
  sample ///< Sample profile.
};
} // end anonymous namespace
88 
89 static void handleMergeWriterError(Error E, StringRef WhenceFile = "",
90                                    StringRef WhenceFunction = "",
91                                    bool ShowHint = true) {
92   if (!WhenceFile.empty())
93     errs() << WhenceFile << ": ";
94   if (!WhenceFunction.empty())
95     errs() << WhenceFunction << ": ";
96 
97   auto IPE = instrprof_error::success;
98   E = handleErrors(std::move(E),
99                    [&IPE](std::unique_ptr<InstrProfError> E) -> Error {
100                      IPE = E->get();
101                      return Error(std::move(E));
102                    });
103   errs() << toString(std::move(E)) << "\n";
104 
105   if (ShowHint) {
106     StringRef Hint = "";
107     if (IPE != instrprof_error::success) {
108       switch (IPE) {
109       case instrprof_error::hash_mismatch:
110       case instrprof_error::count_mismatch:
111       case instrprof_error::value_site_count_mismatch:
112         Hint = "Make sure that all profile data to be merged is generated "
113                "from the same binary.";
114         break;
115       default:
116         break;
117       }
118     }
119 
120     if (!Hint.empty())
121       errs() << Hint << "\n";
122   }
123 }
124 
125 namespace {
126 /// A remapper from original symbol names to new symbol names based on a file
127 /// containing a list of mappings from old name to new name.
128 class SymbolRemapper {
129   std::unique_ptr<MemoryBuffer> File;
130   DenseMap<StringRef, StringRef> RemappingTable;
131 
132 public:
133   /// Build a SymbolRemapper from a file containing a list of old/new symbols.
134   static std::unique_ptr<SymbolRemapper> create(StringRef InputFile) {
135     auto BufOrError = MemoryBuffer::getFileOrSTDIN(InputFile);
136     if (!BufOrError)
137       exitWithErrorCode(BufOrError.getError(), InputFile);
138 
139     auto Remapper = llvm::make_unique<SymbolRemapper>();
140     Remapper->File = std::move(BufOrError.get());
141 
142     for (line_iterator LineIt(*Remapper->File, /*SkipBlanks=*/true, '#');
143          !LineIt.is_at_eof(); ++LineIt) {
144       std::pair<StringRef, StringRef> Parts = LineIt->split(' ');
145       if (Parts.first.empty() || Parts.second.empty() ||
146           Parts.second.count(' ')) {
147         exitWithError("unexpected line in remapping file",
148                       (InputFile + ":" + Twine(LineIt.line_number())).str(),
149                       "expected 'old_symbol new_symbol'");
150       }
151       Remapper->RemappingTable.insert(Parts);
152     }
153     return Remapper;
154   }
155 
156   /// Attempt to map the given old symbol into a new symbol.
157   ///
158   /// \return The new symbol, or \p Name if no such symbol was found.
159   StringRef operator()(StringRef Name) {
160     StringRef New = RemappingTable.lookup(Name);
161     return New.empty() ? Name : New;
162   }
163 };
164 }
165 
166 struct WeightedFile {
167   std::string Filename;
168   uint64_t Weight;
169 };
170 typedef SmallVector<WeightedFile, 5> WeightedFileVector;
171 
172 /// Keep track of merged data and reported errors.
173 struct WriterContext {
174   std::mutex Lock;
175   InstrProfWriter Writer;
176   Error Err;
177   std::string ErrWhence;
178   std::mutex &ErrLock;
179   SmallSet<instrprof_error, 4> &WriterErrorCodes;
180 
181   WriterContext(bool IsSparse, std::mutex &ErrLock,
182                 SmallSet<instrprof_error, 4> &WriterErrorCodes)
183       : Lock(), Writer(IsSparse), Err(Error::success()), ErrWhence(""),
184         ErrLock(ErrLock), WriterErrorCodes(WriterErrorCodes) {}
185 };
186 
187 /// Determine whether an error is fatal for profile merging.
188 static bool isFatalError(instrprof_error IPE) {
189   switch (IPE) {
190   default:
191     return true;
192   case instrprof_error::success:
193   case instrprof_error::eof:
194   case instrprof_error::unknown_function:
195   case instrprof_error::hash_mismatch:
196   case instrprof_error::count_mismatch:
197   case instrprof_error::counter_overflow:
198   case instrprof_error::value_site_count_mismatch:
199     return false;
200   }
201 }
202 
203 /// Load an input into a writer context.
204 static void loadInput(const WeightedFile &Input, SymbolRemapper *Remapper,
205                       WriterContext *WC) {
206   std::unique_lock<std::mutex> CtxGuard{WC->Lock};
207 
208   // If there's a pending hard error, don't do more work.
209   if (WC->Err)
210     return;
211 
212   // Copy the filename, because llvm::ThreadPool copied the input "const
213   // WeightedFile &" by value, making a reference to the filename within it
214   // invalid outside of this packaged task.
215   WC->ErrWhence = Input.Filename;
216 
217   auto ReaderOrErr = InstrProfReader::create(Input.Filename);
218   if (Error E = ReaderOrErr.takeError()) {
219     // Skip the empty profiles by returning sliently.
220     instrprof_error IPE = InstrProfError::take(std::move(E));
221     if (IPE != instrprof_error::empty_raw_profile)
222       WC->Err = make_error<InstrProfError>(IPE);
223     return;
224   }
225 
226   auto Reader = std::move(ReaderOrErr.get());
227   bool IsIRProfile = Reader->isIRLevelProfile();
228   bool HasCSIRProfile = Reader->hasCSIRLevelProfile();
229   if (WC->Writer.setIsIRLevelProfile(IsIRProfile, HasCSIRProfile)) {
230     WC->Err = make_error<StringError>(
231         "Merge IR generated profile with Clang generated profile.",
232         std::error_code());
233     return;
234   }
235 
236   for (auto &I : *Reader) {
237     if (Remapper)
238       I.Name = (*Remapper)(I.Name);
239     const StringRef FuncName = I.Name;
240     bool Reported = false;
241     WC->Writer.addRecord(std::move(I), Input.Weight, [&](Error E) {
242       if (Reported) {
243         consumeError(std::move(E));
244         return;
245       }
246       Reported = true;
247       // Only show hint the first time an error occurs.
248       instrprof_error IPE = InstrProfError::take(std::move(E));
249       std::unique_lock<std::mutex> ErrGuard{WC->ErrLock};
250       bool firstTime = WC->WriterErrorCodes.insert(IPE).second;
251       handleMergeWriterError(make_error<InstrProfError>(IPE), Input.Filename,
252                              FuncName, firstTime);
253     });
254   }
255   if (Reader->hasError()) {
256     if (Error E = Reader->getError()) {
257       instrprof_error IPE = InstrProfError::take(std::move(E));
258       if (isFatalError(IPE))
259         WC->Err = make_error<InstrProfError>(IPE);
260     }
261   }
262 }
263 
264 /// Merge the \p Src writer context into \p Dst.
265 static void mergeWriterContexts(WriterContext *Dst, WriterContext *Src) {
266   // If we've already seen a hard error, continuing with the merge would
267   // clobber it.
268   if (Dst->Err || Src->Err)
269     return;
270 
271   bool Reported = false;
272   Dst->Writer.mergeRecordsFromWriter(std::move(Src->Writer), [&](Error E) {
273     if (Reported) {
274       consumeError(std::move(E));
275       return;
276     }
277     Reported = true;
278     Dst->Err = std::move(E);
279   });
280 }
281 
282 static void mergeInstrProfile(const WeightedFileVector &Inputs,
283                               SymbolRemapper *Remapper,
284                               StringRef OutputFilename,
285                               ProfileFormat OutputFormat, bool OutputSparse,
286                               unsigned NumThreads) {
287   if (OutputFilename.compare("-") == 0)
288     exitWithError("Cannot write indexed profdata format to stdout.");
289 
290   if (OutputFormat != PF_Binary && OutputFormat != PF_Compact_Binary &&
291       OutputFormat != PF_Text)
292     exitWithError("Unknown format is specified.");
293 
294   std::error_code EC;
295   raw_fd_ostream Output(OutputFilename.data(), EC, sys::fs::F_None);
296   if (EC)
297     exitWithErrorCode(EC, OutputFilename);
298 
299   std::mutex ErrorLock;
300   SmallSet<instrprof_error, 4> WriterErrorCodes;
301 
302   // If NumThreads is not specified, auto-detect a good default.
303   if (NumThreads == 0)
304     NumThreads =
305         std::min(hardware_concurrency(), unsigned((Inputs.size() + 1) / 2));
306 
307   // Initialize the writer contexts.
308   SmallVector<std::unique_ptr<WriterContext>, 4> Contexts;
309   for (unsigned I = 0; I < NumThreads; ++I)
310     Contexts.emplace_back(llvm::make_unique<WriterContext>(
311         OutputSparse, ErrorLock, WriterErrorCodes));
312 
313   if (NumThreads == 1) {
314     for (const auto &Input : Inputs)
315       loadInput(Input, Remapper, Contexts[0].get());
316   } else {
317     ThreadPool Pool(NumThreads);
318 
319     // Load the inputs in parallel (N/NumThreads serial steps).
320     unsigned Ctx = 0;
321     for (const auto &Input : Inputs) {
322       Pool.async(loadInput, Input, Remapper, Contexts[Ctx].get());
323       Ctx = (Ctx + 1) % NumThreads;
324     }
325     Pool.wait();
326 
327     // Merge the writer contexts together (~ lg(NumThreads) serial steps).
328     unsigned Mid = Contexts.size() / 2;
329     unsigned End = Contexts.size();
330     assert(Mid > 0 && "Expected more than one context");
331     do {
332       for (unsigned I = 0; I < Mid; ++I)
333         Pool.async(mergeWriterContexts, Contexts[I].get(),
334                    Contexts[I + Mid].get());
335       Pool.wait();
336       if (End & 1) {
337         Pool.async(mergeWriterContexts, Contexts[0].get(),
338                    Contexts[End - 1].get());
339         Pool.wait();
340       }
341       End = Mid;
342       Mid /= 2;
343     } while (Mid > 0);
344   }
345 
346   // Handle deferred hard errors encountered during merging.
347   for (std::unique_ptr<WriterContext> &WC : Contexts) {
348     if (!WC->Err)
349       continue;
350     if (!WC->Err.isA<InstrProfError>())
351       exitWithError(std::move(WC->Err), WC->ErrWhence);
352 
353     instrprof_error IPE = InstrProfError::take(std::move(WC->Err));
354     if (isFatalError(IPE))
355       exitWithError(make_error<InstrProfError>(IPE), WC->ErrWhence);
356     else
357       warn(toString(make_error<InstrProfError>(IPE)),
358            WC->ErrWhence);
359   }
360 
361   InstrProfWriter &Writer = Contexts[0]->Writer;
362   if (OutputFormat == PF_Text) {
363     if (Error E = Writer.writeText(Output))
364       exitWithError(std::move(E));
365   } else {
366     Writer.write(Output);
367   }
368 }
369 
370 /// Make a copy of the given function samples with all symbol names remapped
371 /// by the provided symbol remapper.
372 static sampleprof::FunctionSamples
373 remapSamples(const sampleprof::FunctionSamples &Samples,
374              SymbolRemapper &Remapper, sampleprof_error &Error) {
375   sampleprof::FunctionSamples Result;
376   Result.setName(Remapper(Samples.getName()));
377   Result.addTotalSamples(Samples.getTotalSamples());
378   Result.addHeadSamples(Samples.getHeadSamples());
379   for (const auto &BodySample : Samples.getBodySamples()) {
380     Result.addBodySamples(BodySample.first.LineOffset,
381                           BodySample.first.Discriminator,
382                           BodySample.second.getSamples());
383     for (const auto &Target : BodySample.second.getCallTargets()) {
384       Result.addCalledTargetSamples(BodySample.first.LineOffset,
385                                     BodySample.first.Discriminator,
386                                     Remapper(Target.first()), Target.second);
387     }
388   }
389   for (const auto &CallsiteSamples : Samples.getCallsiteSamples()) {
390     sampleprof::FunctionSamplesMap &Target =
391         Result.functionSamplesAt(CallsiteSamples.first);
392     for (const auto &Callsite : CallsiteSamples.second) {
393       sampleprof::FunctionSamples Remapped =
394           remapSamples(Callsite.second, Remapper, Error);
395       MergeResult(Error, Target[Remapped.getName()].merge(Remapped));
396     }
397   }
398   return Result;
399 }
400 
401 static sampleprof::SampleProfileFormat FormatMap[] = {
402     sampleprof::SPF_None, sampleprof::SPF_Text, sampleprof::SPF_Compact_Binary,
403     sampleprof::SPF_GCC, sampleprof::SPF_Binary};
404 
405 static void mergeSampleProfile(const WeightedFileVector &Inputs,
406                                SymbolRemapper *Remapper,
407                                StringRef OutputFilename,
408                                ProfileFormat OutputFormat) {
409   using namespace sampleprof;
410   auto WriterOrErr =
411       SampleProfileWriter::create(OutputFilename, FormatMap[OutputFormat]);
412   if (std::error_code EC = WriterOrErr.getError())
413     exitWithErrorCode(EC, OutputFilename);
414 
415   auto Writer = std::move(WriterOrErr.get());
416   StringMap<FunctionSamples> ProfileMap;
417   SmallVector<std::unique_ptr<sampleprof::SampleProfileReader>, 5> Readers;
418   LLVMContext Context;
419   for (const auto &Input : Inputs) {
420     auto ReaderOrErr = SampleProfileReader::create(Input.Filename, Context);
421     if (std::error_code EC = ReaderOrErr.getError())
422       exitWithErrorCode(EC, Input.Filename);
423 
424     // We need to keep the readers around until after all the files are
425     // read so that we do not lose the function names stored in each
426     // reader's memory. The function names are needed to write out the
427     // merged profile map.
428     Readers.push_back(std::move(ReaderOrErr.get()));
429     const auto Reader = Readers.back().get();
430     if (std::error_code EC = Reader->read())
431       exitWithErrorCode(EC, Input.Filename);
432 
433     StringMap<FunctionSamples> &Profiles = Reader->getProfiles();
434     for (StringMap<FunctionSamples>::iterator I = Profiles.begin(),
435                                               E = Profiles.end();
436          I != E; ++I) {
437       sampleprof_error Result = sampleprof_error::success;
438       FunctionSamples Remapped =
439           Remapper ? remapSamples(I->second, *Remapper, Result)
440                    : FunctionSamples();
441       FunctionSamples &Samples = Remapper ? Remapped : I->second;
442       StringRef FName = Samples.getName();
443       MergeResult(Result, ProfileMap[FName].merge(Samples, Input.Weight));
444       if (Result != sampleprof_error::success) {
445         std::error_code EC = make_error_code(Result);
446         handleMergeWriterError(errorCodeToError(EC), Input.Filename, FName);
447       }
448     }
449   }
450   Writer->write(ProfileMap);
451 }
452 
453 static WeightedFile parseWeightedFile(const StringRef &WeightedFilename) {
454   StringRef WeightStr, FileName;
455   std::tie(WeightStr, FileName) = WeightedFilename.split(',');
456 
457   uint64_t Weight;
458   if (WeightStr.getAsInteger(10, Weight) || Weight < 1)
459     exitWithError("Input weight must be a positive integer.");
460 
461   return {FileName, Weight};
462 }
463 
464 static std::unique_ptr<MemoryBuffer>
465 getInputFilenamesFileBuf(const StringRef &InputFilenamesFile) {
466   if (InputFilenamesFile == "")
467     return {};
468 
469   auto BufOrError = MemoryBuffer::getFileOrSTDIN(InputFilenamesFile);
470   if (!BufOrError)
471     exitWithErrorCode(BufOrError.getError(), InputFilenamesFile);
472 
473   return std::move(*BufOrError);
474 }
475 
476 static void addWeightedInput(WeightedFileVector &WNI, const WeightedFile &WF) {
477   StringRef Filename = WF.Filename;
478   uint64_t Weight = WF.Weight;
479 
480   // If it's STDIN just pass it on.
481   if (Filename == "-") {
482     WNI.push_back({Filename, Weight});
483     return;
484   }
485 
486   llvm::sys::fs::file_status Status;
487   llvm::sys::fs::status(Filename, Status);
488   if (!llvm::sys::fs::exists(Status))
489     exitWithErrorCode(make_error_code(errc::no_such_file_or_directory),
490                       Filename);
491   // If it's a source file, collect it.
492   if (llvm::sys::fs::is_regular_file(Status)) {
493     WNI.push_back({Filename, Weight});
494     return;
495   }
496 
497   if (llvm::sys::fs::is_directory(Status)) {
498     std::error_code EC;
499     for (llvm::sys::fs::recursive_directory_iterator F(Filename, EC), E;
500          F != E && !EC; F.increment(EC)) {
501       if (llvm::sys::fs::is_regular_file(F->path())) {
502         addWeightedInput(WNI, {F->path(), Weight});
503       }
504     }
505     if (EC)
506       exitWithErrorCode(EC, Filename);
507   }
508 }
509 
510 static void parseInputFilenamesFile(MemoryBuffer *Buffer,
511                                     WeightedFileVector &WFV) {
512   if (!Buffer)
513     return;
514 
515   SmallVector<StringRef, 8> Entries;
516   StringRef Data = Buffer->getBuffer();
517   Data.split(Entries, '\n', /*MaxSplit=*/-1, /*KeepEmpty=*/false);
518   for (const StringRef &FileWeightEntry : Entries) {
519     StringRef SanitizedEntry = FileWeightEntry.trim(" \t\v\f\r");
520     // Skip comments.
521     if (SanitizedEntry.startswith("#"))
522       continue;
523     // If there's no comma, it's an unweighted profile.
524     else if (SanitizedEntry.find(',') == StringRef::npos)
525       addWeightedInput(WFV, {SanitizedEntry, 1});
526     else
527       addWeightedInput(WFV, parseWeightedFile(SanitizedEntry));
528   }
529 }
530 
531 static int merge_main(int argc, const char *argv[]) {
532   cl::list<std::string> InputFilenames(cl::Positional,
533                                        cl::desc("<filename...>"));
534   cl::list<std::string> WeightedInputFilenames("weighted-input",
535                                                cl::desc("<weight>,<filename>"));
536   cl::opt<std::string> InputFilenamesFile(
537       "input-files", cl::init(""),
538       cl::desc("Path to file containing newline-separated "
539                "[<weight>,]<filename> entries"));
540   cl::alias InputFilenamesFileA("f", cl::desc("Alias for --input-files"),
541                                 cl::aliasopt(InputFilenamesFile));
542   cl::opt<bool> DumpInputFileList(
543       "dump-input-file-list", cl::init(false), cl::Hidden,
544       cl::desc("Dump the list of input files and their weights, then exit"));
545   cl::opt<std::string> RemappingFile("remapping-file", cl::value_desc("file"),
546                                      cl::desc("Symbol remapping file"));
547   cl::alias RemappingFileA("r", cl::desc("Alias for --remapping-file"),
548                            cl::aliasopt(RemappingFile));
549   cl::opt<std::string> OutputFilename("output", cl::value_desc("output"),
550                                       cl::init("-"), cl::Required,
551                                       cl::desc("Output file"));
552   cl::alias OutputFilenameA("o", cl::desc("Alias for --output"),
553                             cl::aliasopt(OutputFilename));
554   cl::opt<ProfileKinds> ProfileKind(
555       cl::desc("Profile kind:"), cl::init(instr),
556       cl::values(clEnumVal(instr, "Instrumentation profile (default)"),
557                  clEnumVal(sample, "Sample profile")));
558   cl::opt<ProfileFormat> OutputFormat(
559       cl::desc("Format of output profile"), cl::init(PF_Binary),
560       cl::values(clEnumValN(PF_Binary, "binary", "Binary encoding (default)"),
561                  clEnumValN(PF_Compact_Binary, "compbinary",
562                             "Compact binary encoding"),
563                  clEnumValN(PF_Text, "text", "Text encoding"),
564                  clEnumValN(PF_GCC, "gcc",
565                             "GCC encoding (only meaningful for -sample)")));
566   cl::opt<bool> OutputSparse("sparse", cl::init(false),
567       cl::desc("Generate a sparse profile (only meaningful for -instr)"));
568   cl::opt<unsigned> NumThreads(
569       "num-threads", cl::init(0),
570       cl::desc("Number of merge threads to use (default: autodetect)"));
571   cl::alias NumThreadsA("j", cl::desc("Alias for --num-threads"),
572                         cl::aliasopt(NumThreads));
573 
574   cl::ParseCommandLineOptions(argc, argv, "LLVM profile data merger\n");
575 
576   WeightedFileVector WeightedInputs;
577   for (StringRef Filename : InputFilenames)
578     addWeightedInput(WeightedInputs, {Filename, 1});
579   for (StringRef WeightedFilename : WeightedInputFilenames)
580     addWeightedInput(WeightedInputs, parseWeightedFile(WeightedFilename));
581 
582   // Make sure that the file buffer stays alive for the duration of the
583   // weighted input vector's lifetime.
584   auto Buffer = getInputFilenamesFileBuf(InputFilenamesFile);
585   parseInputFilenamesFile(Buffer.get(), WeightedInputs);
586 
587   if (WeightedInputs.empty())
588     exitWithError("No input files specified. See " +
589                   sys::path::filename(argv[0]) + " -help");
590 
591   if (DumpInputFileList) {
592     for (auto &WF : WeightedInputs)
593       outs() << WF.Weight << "," << WF.Filename << "\n";
594     return 0;
595   }
596 
597   std::unique_ptr<SymbolRemapper> Remapper;
598   if (!RemappingFile.empty())
599     Remapper = SymbolRemapper::create(RemappingFile);
600 
601   if (ProfileKind == instr)
602     mergeInstrProfile(WeightedInputs, Remapper.get(), OutputFilename,
603                       OutputFormat, OutputSparse, NumThreads);
604   else
605     mergeSampleProfile(WeightedInputs, Remapper.get(), OutputFilename,
606                        OutputFormat);
607 
608   return 0;
609 }
610 
/// Running totals gathered over the value sites of one value-profile kind.
struct ValueSitesStats {
  ValueSitesStats() = default;

  /// Number of value sites seen.
  uint64_t TotalNumValueSites = 0;
  /// Number of value sites that had at least one profiled value.
  uint64_t TotalNumValueSitesWithValueProfile = 0;
  /// Number of profiled values summed over all sites.
  uint64_t TotalNumValues = 0;
  /// Entry I counts the sites that had exactly I + 1 profiled values.
  std::vector<unsigned> ValueSitesHistogram;
};
620 
621 static void traverseAllValueSites(const InstrProfRecord &Func, uint32_t VK,
622                                   ValueSitesStats &Stats, raw_fd_ostream &OS,
623                                   InstrProfSymtab *Symtab) {
624   uint32_t NS = Func.getNumValueSites(VK);
625   Stats.TotalNumValueSites += NS;
626   for (size_t I = 0; I < NS; ++I) {
627     uint32_t NV = Func.getNumValueDataForSite(VK, I);
628     std::unique_ptr<InstrProfValueData[]> VD = Func.getValueForSite(VK, I);
629     Stats.TotalNumValues += NV;
630     if (NV) {
631       Stats.TotalNumValueSitesWithValueProfile++;
632       if (NV > Stats.ValueSitesHistogram.size())
633         Stats.ValueSitesHistogram.resize(NV, 0);
634       Stats.ValueSitesHistogram[NV - 1]++;
635     }
636 
637     uint64_t SiteSum = 0;
638     for (uint32_t V = 0; V < NV; V++)
639       SiteSum += VD[V].Count;
640     if (SiteSum == 0)
641       SiteSum = 1;
642 
643     for (uint32_t V = 0; V < NV; V++) {
644       OS << "\t[ " << format("%2u", I) << ", ";
645       if (Symtab == nullptr)
646         OS << format("%4" PRIu64, VD[V].Value);
647       else
648         OS << Symtab->getFuncName(VD[V].Value);
649       OS << ", " << format("%10" PRId64, VD[V].Count) << " ] ("
650          << format("%.2f%%", (VD[V].Count * 100.0 / SiteSum)) << ")\n";
651     }
652   }
653 }
654 
655 static void showValueSitesStats(raw_fd_ostream &OS, uint32_t VK,
656                                 ValueSitesStats &Stats) {
657   OS << "  Total number of sites: " << Stats.TotalNumValueSites << "\n";
658   OS << "  Total number of sites with values: "
659      << Stats.TotalNumValueSitesWithValueProfile << "\n";
660   OS << "  Total number of profiled values: " << Stats.TotalNumValues << "\n";
661 
662   OS << "  Value sites histogram:\n\tNumTargets, SiteCount\n";
663   for (unsigned I = 0; I < Stats.ValueSitesHistogram.size(); I++) {
664     if (Stats.ValueSitesHistogram[I] > 0)
665       OS << "\t" << I + 1 << ", " << Stats.ValueSitesHistogram[I] << "\n";
666   }
667 }
668 
669 static int showInstrProfile(const std::string &Filename, bool ShowCounts,
670                             uint32_t TopN, bool ShowIndirectCallTargets,
671                             bool ShowMemOPSizes, bool ShowDetailedSummary,
672                             std::vector<uint32_t> DetailedSummaryCutoffs,
673                             bool ShowAllFunctions, bool ShowCS,
674                             uint64_t ValueCutoff, bool OnlyListBelow,
675                             const std::string &ShowFunction, bool TextFormat,
676                             raw_fd_ostream &OS) {
677   auto ReaderOrErr = InstrProfReader::create(Filename);
678   std::vector<uint32_t> Cutoffs = std::move(DetailedSummaryCutoffs);
679   if (ShowDetailedSummary && Cutoffs.empty()) {
680     Cutoffs = {800000, 900000, 950000, 990000, 999000, 999900, 999990};
681   }
682   InstrProfSummaryBuilder Builder(std::move(Cutoffs));
683   if (Error E = ReaderOrErr.takeError())
684     exitWithError(std::move(E), Filename);
685 
686   auto Reader = std::move(ReaderOrErr.get());
687   bool IsIRInstr = Reader->isIRLevelProfile();
688   size_t ShownFunctions = 0;
689   size_t BelowCutoffFunctions = 0;
690   int NumVPKind = IPVK_Last - IPVK_First + 1;
691   std::vector<ValueSitesStats> VPStats(NumVPKind);
692 
693   auto MinCmp = [](const std::pair<std::string, uint64_t> &v1,
694                    const std::pair<std::string, uint64_t> &v2) {
695     return v1.second > v2.second;
696   };
697 
698   std::priority_queue<std::pair<std::string, uint64_t>,
699                       std::vector<std::pair<std::string, uint64_t>>,
700                       decltype(MinCmp)>
701       HottestFuncs(MinCmp);
702 
703   if (!TextFormat && OnlyListBelow) {
704     OS << "The list of functions with the maximum counter less than "
705        << ValueCutoff << ":\n";
706   }
707 
708   // Add marker so that IR-level instrumentation round-trips properly.
709   if (TextFormat && IsIRInstr)
710     OS << ":ir\n";
711 
712   for (const auto &Func : *Reader) {
713     if (Reader->isIRLevelProfile()) {
714       bool FuncIsCS = NamedInstrProfRecord::hasCSFlagInHash(Func.Hash);
715       if (FuncIsCS != ShowCS)
716         continue;
717     }
718     bool Show =
719         ShowAllFunctions || (!ShowFunction.empty() &&
720                              Func.Name.find(ShowFunction) != Func.Name.npos);
721 
722     bool doTextFormatDump = (Show && TextFormat);
723 
724     if (doTextFormatDump) {
725       InstrProfSymtab &Symtab = Reader->getSymtab();
726       InstrProfWriter::writeRecordInText(Func.Name, Func.Hash, Func, Symtab,
727                                          OS);
728       continue;
729     }
730 
731     assert(Func.Counts.size() > 0 && "function missing entry counter");
732     Builder.addRecord(Func);
733 
734     uint64_t FuncMax = 0;
735     uint64_t FuncSum = 0;
736     for (size_t I = 0, E = Func.Counts.size(); I < E; ++I) {
737       FuncMax = std::max(FuncMax, Func.Counts[I]);
738       FuncSum += Func.Counts[I];
739     }
740 
741     if (FuncMax < ValueCutoff) {
742       ++BelowCutoffFunctions;
743       if (OnlyListBelow) {
744         OS << "  " << Func.Name << ": (Max = " << FuncMax
745            << " Sum = " << FuncSum << ")\n";
746       }
747       continue;
748     } else if (OnlyListBelow)
749       continue;
750 
751     if (TopN) {
752       if (HottestFuncs.size() == TopN) {
753         if (HottestFuncs.top().second < FuncMax) {
754           HottestFuncs.pop();
755           HottestFuncs.emplace(std::make_pair(std::string(Func.Name), FuncMax));
756         }
757       } else
758         HottestFuncs.emplace(std::make_pair(std::string(Func.Name), FuncMax));
759     }
760 
761     if (Show) {
762       if (!ShownFunctions)
763         OS << "Counters:\n";
764 
765       ++ShownFunctions;
766 
767       OS << "  " << Func.Name << ":\n"
768          << "    Hash: " << format("0x%016" PRIx64, Func.Hash) << "\n"
769          << "    Counters: " << Func.Counts.size() << "\n";
770       if (!IsIRInstr)
771         OS << "    Function count: " << Func.Counts[0] << "\n";
772 
773       if (ShowIndirectCallTargets)
774         OS << "    Indirect Call Site Count: "
775            << Func.getNumValueSites(IPVK_IndirectCallTarget) << "\n";
776 
777       uint32_t NumMemOPCalls = Func.getNumValueSites(IPVK_MemOPSize);
778       if (ShowMemOPSizes && NumMemOPCalls > 0)
779         OS << "    Number of Memory Intrinsics Calls: " << NumMemOPCalls
780            << "\n";
781 
782       if (ShowCounts) {
783         OS << "    Block counts: [";
784         size_t Start = (IsIRInstr ? 0 : 1);
785         for (size_t I = Start, E = Func.Counts.size(); I < E; ++I) {
786           OS << (I == Start ? "" : ", ") << Func.Counts[I];
787         }
788         OS << "]\n";
789       }
790 
791       if (ShowIndirectCallTargets) {
792         OS << "    Indirect Target Results:\n";
793         traverseAllValueSites(Func, IPVK_IndirectCallTarget,
794                               VPStats[IPVK_IndirectCallTarget], OS,
795                               &(Reader->getSymtab()));
796       }
797 
798       if (ShowMemOPSizes && NumMemOPCalls > 0) {
799         OS << "    Memory Intrinsic Size Results:\n";
800         traverseAllValueSites(Func, IPVK_MemOPSize, VPStats[IPVK_MemOPSize], OS,
801                               nullptr);
802       }
803     }
804   }
805   if (Reader->hasError())
806     exitWithError(Reader->getError(), Filename);
807 
808   if (TextFormat)
809     return 0;
810   std::unique_ptr<ProfileSummary> PS(Builder.getSummary());
811   OS << "Instrumentation level: "
812      << (Reader->isIRLevelProfile() ? "IR" : "Front-end") << "\n";
813   if (ShowAllFunctions || !ShowFunction.empty())
814     OS << "Functions shown: " << ShownFunctions << "\n";
815   OS << "Total functions: " << PS->getNumFunctions() << "\n";
816   if (ValueCutoff > 0) {
817     OS << "Number of functions with maximum count (< " << ValueCutoff
818        << "): " << BelowCutoffFunctions << "\n";
819     OS << "Number of functions with maximum count (>= " << ValueCutoff
820        << "): " << PS->getNumFunctions() - BelowCutoffFunctions << "\n";
821   }
822   OS << "Maximum function count: " << PS->getMaxFunctionCount() << "\n";
823   OS << "Maximum internal block count: " << PS->getMaxInternalCount() << "\n";
824 
825   if (TopN) {
826     std::vector<std::pair<std::string, uint64_t>> SortedHottestFuncs;
827     while (!HottestFuncs.empty()) {
828       SortedHottestFuncs.emplace_back(HottestFuncs.top());
829       HottestFuncs.pop();
830     }
831     OS << "Top " << TopN
832        << " functions with the largest internal block counts: \n";
833     for (auto &hotfunc : llvm::reverse(SortedHottestFuncs))
834       OS << "  " << hotfunc.first << ", max count = " << hotfunc.second << "\n";
835   }
836 
837   if (ShownFunctions && ShowIndirectCallTargets) {
838     OS << "Statistics for indirect call sites profile:\n";
839     showValueSitesStats(OS, IPVK_IndirectCallTarget,
840                         VPStats[IPVK_IndirectCallTarget]);
841   }
842 
843   if (ShownFunctions && ShowMemOPSizes) {
844     OS << "Statistics for memory intrinsic calls sizes profile:\n";
845     showValueSitesStats(OS, IPVK_MemOPSize, VPStats[IPVK_MemOPSize]);
846   }
847 
848   if (ShowDetailedSummary) {
849     OS << "Detailed summary:\n";
850     OS << "Total number of blocks: " << PS->getNumCounts() << "\n";
851     OS << "Total count: " << PS->getTotalCount() << "\n";
852     for (auto Entry : PS->getDetailedSummary()) {
853       OS << Entry.NumCounts << " blocks with count >= " << Entry.MinCount
854          << " account for "
855          << format("%0.6g", (float)Entry.Cutoff / ProfileSummary::Scale * 100)
856          << " percentage of the total counts.\n";
857     }
858   }
859   return 0;
860 }
861 
862 static int showSampleProfile(const std::string &Filename, bool ShowCounts,
863                              bool ShowAllFunctions,
864                              const std::string &ShowFunction,
865                              raw_fd_ostream &OS) {
866   using namespace sampleprof;
867   LLVMContext Context;
868   auto ReaderOrErr = SampleProfileReader::create(Filename, Context);
869   if (std::error_code EC = ReaderOrErr.getError())
870     exitWithErrorCode(EC, Filename);
871 
872   auto Reader = std::move(ReaderOrErr.get());
873   if (std::error_code EC = Reader->read())
874     exitWithErrorCode(EC, Filename);
875 
876   if (ShowAllFunctions || ShowFunction.empty())
877     Reader->dump(OS);
878   else
879     Reader->dumpFunctionProfile(ShowFunction, OS);
880 
881   return 0;
882 }
883 
884 static int show_main(int argc, const char *argv[]) {
885   cl::opt<std::string> Filename(cl::Positional, cl::Required,
886                                 cl::desc("<profdata-file>"));
887 
888   cl::opt<bool> ShowCounts("counts", cl::init(false),
889                            cl::desc("Show counter values for shown functions"));
890   cl::opt<bool> TextFormat(
891       "text", cl::init(false),
892       cl::desc("Show instr profile data in text dump format"));
893   cl::opt<bool> ShowIndirectCallTargets(
894       "ic-targets", cl::init(false),
895       cl::desc("Show indirect call site target values for shown functions"));
896   cl::opt<bool> ShowMemOPSizes(
897       "memop-sizes", cl::init(false),
898       cl::desc("Show the profiled sizes of the memory intrinsic calls "
899                "for shown functions"));
900   cl::opt<bool> ShowDetailedSummary("detailed-summary", cl::init(false),
901                                     cl::desc("Show detailed profile summary"));
902   cl::list<uint32_t> DetailedSummaryCutoffs(
903       cl::CommaSeparated, "detailed-summary-cutoffs",
904       cl::desc(
905           "Cutoff percentages (times 10000) for generating detailed summary"),
906       cl::value_desc("800000,901000,999999"));
907   cl::opt<bool> ShowAllFunctions("all-functions", cl::init(false),
908                                  cl::desc("Details for every function"));
909   cl::opt<bool> ShowCS("showcs", cl::init(false),
910                        cl::desc("Show context sensitive counts"));
911   cl::opt<std::string> ShowFunction("function",
912                                     cl::desc("Details for matching functions"));
913 
914   cl::opt<std::string> OutputFilename("output", cl::value_desc("output"),
915                                       cl::init("-"), cl::desc("Output file"));
916   cl::alias OutputFilenameA("o", cl::desc("Alias for --output"),
917                             cl::aliasopt(OutputFilename));
918   cl::opt<ProfileKinds> ProfileKind(
919       cl::desc("Profile kind:"), cl::init(instr),
920       cl::values(clEnumVal(instr, "Instrumentation profile (default)"),
921                  clEnumVal(sample, "Sample profile")));
922   cl::opt<uint32_t> TopNFunctions(
923       "topn", cl::init(0),
924       cl::desc("Show the list of functions with the largest internal counts"));
925   cl::opt<uint32_t> ValueCutoff(
926       "value-cutoff", cl::init(0),
927       cl::desc("Set the count value cutoff. Functions with the maximum count "
928                "less than this value will not be printed out. (Default is 0)"));
929   cl::opt<bool> OnlyListBelow(
930       "list-below-cutoff", cl::init(false),
931       cl::desc("Only output names of functions whose max count values are "
932                "below the cutoff value"));
933   cl::ParseCommandLineOptions(argc, argv, "LLVM profile data summary\n");
934 
935   if (OutputFilename.empty())
936     OutputFilename = "-";
937 
938   std::error_code EC;
939   raw_fd_ostream OS(OutputFilename.data(), EC, sys::fs::F_Text);
940   if (EC)
941     exitWithErrorCode(EC, OutputFilename);
942 
943   if (ShowAllFunctions && !ShowFunction.empty())
944     WithColor::warning() << "-function argument ignored: showing all functions\n";
945 
946   std::vector<uint32_t> Cutoffs(DetailedSummaryCutoffs.begin(),
947                                 DetailedSummaryCutoffs.end());
948   if (ProfileKind == instr)
949     return showInstrProfile(Filename, ShowCounts, TopNFunctions,
950                             ShowIndirectCallTargets, ShowMemOPSizes,
951                             ShowDetailedSummary, DetailedSummaryCutoffs,
952                             ShowAllFunctions, ShowCS, ValueCutoff,
953                             OnlyListBelow, ShowFunction, TextFormat, OS);
954   else
955     return showSampleProfile(Filename, ShowCounts, ShowAllFunctions,
956                              ShowFunction, OS);
957 }
958 
959 int main(int argc, const char *argv[]) {
960   InitLLVM X(argc, argv);
961 
962   StringRef ProgName(sys::path::filename(argv[0]));
963   if (argc > 1) {
964     int (*func)(int, const char *[]) = nullptr;
965 
966     if (strcmp(argv[1], "merge") == 0)
967       func = merge_main;
968     else if (strcmp(argv[1], "show") == 0)
969       func = show_main;
970 
971     if (func) {
972       std::string Invocation(ProgName.str() + " " + argv[1]);
973       argv[1] = Invocation.c_str();
974       return func(argc - 1, argv + 1);
975     }
976 
977     if (strcmp(argv[1], "-h") == 0 || strcmp(argv[1], "-help") == 0 ||
978         strcmp(argv[1], "--help") == 0) {
979 
980       errs() << "OVERVIEW: LLVM profile data tools\n\n"
981              << "USAGE: " << ProgName << " <command> [args...]\n"
982              << "USAGE: " << ProgName << " <command> -help\n\n"
983              << "See each individual command --help for more details.\n"
984              << "Available commands: merge, show\n";
985       return 0;
986     }
987   }
988 
989   if (argc < 2)
990     errs() << ProgName << ": No command specified!\n";
991   else
992     errs() << ProgName << ": Unknown command!\n";
993 
994   errs() << "USAGE: " << ProgName << " <merge|show> [args...]\n";
995   return 1;
996 }
997