1de1ab26fSDiego Novillo //===- SampleProfReader.cpp - Read LLVM sample profile data ---------------===//
2de1ab26fSDiego Novillo //
32946cd70SChandler Carruth // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
42946cd70SChandler Carruth // See https://llvm.org/LICENSE.txt for license information.
52946cd70SChandler Carruth // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6de1ab26fSDiego Novillo //
7de1ab26fSDiego Novillo //===----------------------------------------------------------------------===//
8de1ab26fSDiego Novillo //
9de1ab26fSDiego Novillo // This file implements the class that reads LLVM sample profiles. It
10bb5605caSDiego Novillo // supports three file formats: text, binary and gcov.
11de1ab26fSDiego Novillo //
12bb5605caSDiego Novillo // The textual representation is useful for debugging and testing purposes. The
13bb5605caSDiego Novillo // binary representation is more compact, resulting in smaller file sizes.
14de1ab26fSDiego Novillo //
15bb5605caSDiego Novillo // The gcov encoding is the one generated by GCC's AutoFDO profile creation
16bb5605caSDiego Novillo // tool (https://github.com/google/autofdo)
17de1ab26fSDiego Novillo //
18bb5605caSDiego Novillo // All three encodings can be used interchangeably as an input sample profile.
19de1ab26fSDiego Novillo //
20de1ab26fSDiego Novillo //===----------------------------------------------------------------------===//
21de1ab26fSDiego Novillo 
22de1ab26fSDiego Novillo #include "llvm/ProfileData/SampleProfReader.h"
23b93483dbSDiego Novillo #include "llvm/ADT/DenseMap.h"
2440ee23dbSEaswaran Raman #include "llvm/ADT/STLExtras.h"
25e78d131aSEugene Zelenko #include "llvm/ADT/StringRef.h"
26e78d131aSEugene Zelenko #include "llvm/IR/ProfileSummary.h"
27e78d131aSEugene Zelenko #include "llvm/ProfileData/ProfileCommon.h"
28e78d131aSEugene Zelenko #include "llvm/ProfileData/SampleProf.h"
296745ffe4SRong Xu #include "llvm/Support/CommandLine.h"
30b523790aSWei Mi #include "llvm/Support/Compression.h"
31de1ab26fSDiego Novillo #include "llvm/Support/ErrorOr.h"
32c572e92cSDiego Novillo #include "llvm/Support/LEB128.h"
33de1ab26fSDiego Novillo #include "llvm/Support/LineIterator.h"
346a14325dSWei Mi #include "llvm/Support/MD5.h"
35c572e92cSDiego Novillo #include "llvm/Support/MemoryBuffer.h"
36e78d131aSEugene Zelenko #include "llvm/Support/raw_ostream.h"
37e78d131aSEugene Zelenko #include <algorithm>
38e78d131aSEugene Zelenko #include <cstddef>
39e78d131aSEugene Zelenko #include <cstdint>
40e78d131aSEugene Zelenko #include <limits>
41e78d131aSEugene Zelenko #include <memory>
42a5d30421SWenlei He #include <set>
43e78d131aSEugene Zelenko #include <system_error>
44e78d131aSEugene Zelenko #include <vector>
45de1ab26fSDiego Novillo 
46de1ab26fSDiego Novillo using namespace llvm;
47e78d131aSEugene Zelenko using namespace sampleprof;
48de1ab26fSDiego Novillo 
496745ffe4SRong Xu #define DEBUG_TYPE "samplepgo-reader"
506745ffe4SRong Xu 
516745ffe4SRong Xu // This internal option specifies if the profile uses FS discriminators.
526745ffe4SRong Xu // It only applies to text, binary and compact binary format profiles.
536745ffe4SRong Xu // For ext-binary format profiles, the flag is set in the summary.
546745ffe4SRong Xu static cl::opt<bool> ProfileIsFSDisciminator(
556745ffe4SRong Xu     "profile-isfs", cl::Hidden, cl::init(false),
569b8425e4SRong Xu     cl::desc("Profile uses flow sensitive discriminators"));
576745ffe4SRong Xu 
585f8f34e4SAdrian Prantl /// Dump the function profile for \p FName.
59de1ab26fSDiego Novillo ///
60cb8d96e7SSimon Pilgrim /// \param FContext Name + context of the function to print.
61d5336ae2SDiego Novillo /// \param OS Stream to emit the output to.
62b9db7036SHongtao Yu void SampleProfileReader::dumpFunctionProfile(SampleContext FContext,
63d5336ae2SDiego Novillo                                               raw_ostream &OS) {
64b9db7036SHongtao Yu   OS << "Function: " << FContext.toString() << ": " << Profiles[FContext];
65de1ab26fSDiego Novillo }
66de1ab26fSDiego Novillo 
675f8f34e4SAdrian Prantl /// Dump all the function profiles found on stream \p OS.
68d5336ae2SDiego Novillo void SampleProfileReader::dump(raw_ostream &OS) {
69f27fee62SHongtao Yu   std::vector<NameFunctionSamples> V;
70f27fee62SHongtao Yu   sortFuncProfiles(Profiles, V);
71f27fee62SHongtao Yu   for (const auto &I : V)
72f27fee62SHongtao Yu     dumpFunctionProfile(I.first, OS);
73de1ab26fSDiego Novillo }
74de1ab26fSDiego Novillo 
755f8f34e4SAdrian Prantl /// Parse \p Input as function head.
766722688eSDehao Chen ///
776722688eSDehao Chen /// Parse one line of \p Input, and update function name in \p FName,
786722688eSDehao Chen /// function's total sample count in \p NumSamples, function's entry
796722688eSDehao Chen /// count in \p NumHeadSamples.
806722688eSDehao Chen ///
816722688eSDehao Chen /// \returns true if parsing is successful.
826722688eSDehao Chen static bool ParseHead(const StringRef &Input, StringRef &FName,
8338be3330SDiego Novillo                       uint64_t &NumSamples, uint64_t &NumHeadSamples) {
846722688eSDehao Chen   if (Input[0] == ' ')
856722688eSDehao Chen     return false;
866722688eSDehao Chen   size_t n2 = Input.rfind(':');
876722688eSDehao Chen   size_t n1 = Input.rfind(':', n2 - 1);
886722688eSDehao Chen   FName = Input.substr(0, n1);
896722688eSDehao Chen   if (Input.substr(n1 + 1, n2 - n1 - 1).getAsInteger(10, NumSamples))
906722688eSDehao Chen     return false;
916722688eSDehao Chen   if (Input.substr(n2 + 1).getAsInteger(10, NumHeadSamples))
926722688eSDehao Chen     return false;
936722688eSDehao Chen   return true;
946722688eSDehao Chen }
956722688eSDehao Chen 
/// Returns true if line offset \p L is legal (only has 16 bits).
///
/// The parameter is 64 bits wide so that offsets decoded as uint64_t are
/// validated in full instead of being narrowed to 32 bits at the call, which
/// could make an out-of-range value look legal.
static bool isOffsetLegal(uint64_t L) { return (L & 0xffff) == L; }
9810042412SDehao Chen 
99ac068e01SHongtao Yu /// Parse \p Input that contains metadata.
100ac068e01SHongtao Yu /// Possible metadata:
101ac068e01SHongtao Yu /// - CFG Checksum information:
102ac068e01SHongtao Yu ///     !CFGChecksum: 12345
1031410db70SWenlei He /// - CFG Checksum information:
1041410db70SWenlei He ///     !Attributes: 1
105ac068e01SHongtao Yu /// Stores the FunctionHash (a.k.a. CFG Checksum) into \p FunctionHash.
1061410db70SWenlei He static bool parseMetadata(const StringRef &Input, uint64_t &FunctionHash,
1071410db70SWenlei He                           uint32_t &Attributes) {
1081410db70SWenlei He   if (Input.startswith("!CFGChecksum:")) {
109ac068e01SHongtao Yu     StringRef CFGInfo = Input.substr(strlen("!CFGChecksum:")).trim();
110ac068e01SHongtao Yu     return !CFGInfo.getAsInteger(10, FunctionHash);
111ac068e01SHongtao Yu   }
112ac068e01SHongtao Yu 
1131410db70SWenlei He   if (Input.startswith("!Attributes:")) {
1141410db70SWenlei He     StringRef Attrib = Input.substr(strlen("!Attributes:")).trim();
1151410db70SWenlei He     return !Attrib.getAsInteger(10, Attributes);
1161410db70SWenlei He   }
1171410db70SWenlei He 
1181410db70SWenlei He   return false;
1191410db70SWenlei He }
1201410db70SWenlei He 
/// Classification of the indented lines that follow a function header in a
/// text profile.
enum class LineType {
  /// "OFFSET[.DISC]: CALLEE:NUM" -- samples of an inlined callee.
  CallSiteProfile,
  /// "OFFSET[.DISC]: NUM[ TARGET:NUM]*" -- samples of a source line.
  BodyProfile,
  /// "!KEY: VALUE" -- per-function metadata.
  Metadata,
};
126ac068e01SHongtao Yu 
1275f8f34e4SAdrian Prantl /// Parse \p Input as line sample.
1286722688eSDehao Chen ///
1296722688eSDehao Chen /// \param Input input line.
130ac068e01SHongtao Yu /// \param LineTy Type of this line.
1316722688eSDehao Chen /// \param Depth the depth of the inline stack.
1326722688eSDehao Chen /// \param NumSamples total samples of the line/inlined callsite.
1336722688eSDehao Chen /// \param LineOffset line offset to the start of the function.
1346722688eSDehao Chen /// \param Discriminator discriminator of the line.
1356722688eSDehao Chen /// \param TargetCountMap map from indirect call target to count.
136ac068e01SHongtao Yu /// \param FunctionHash the function's CFG hash, used by pseudo probe.
1376722688eSDehao Chen ///
1386722688eSDehao Chen /// returns true if parsing is successful.
139ac068e01SHongtao Yu static bool ParseLine(const StringRef &Input, LineType &LineTy, uint32_t &Depth,
14038be3330SDiego Novillo                       uint64_t &NumSamples, uint32_t &LineOffset,
14138be3330SDiego Novillo                       uint32_t &Discriminator, StringRef &CalleeName,
142ac068e01SHongtao Yu                       DenseMap<StringRef, uint64_t> &TargetCountMap,
1431410db70SWenlei He                       uint64_t &FunctionHash, uint32_t &Attributes) {
1446722688eSDehao Chen   for (Depth = 0; Input[Depth] == ' '; Depth++)
1456722688eSDehao Chen     ;
1466722688eSDehao Chen   if (Depth == 0)
1476722688eSDehao Chen     return false;
1486722688eSDehao Chen 
149ac068e01SHongtao Yu   if (Depth == 1 && Input[Depth] == '!') {
150ac068e01SHongtao Yu     LineTy = LineType::Metadata;
1511410db70SWenlei He     return parseMetadata(Input.substr(Depth), FunctionHash, Attributes);
152ac068e01SHongtao Yu   }
153ac068e01SHongtao Yu 
1546722688eSDehao Chen   size_t n1 = Input.find(':');
1556722688eSDehao Chen   StringRef Loc = Input.substr(Depth, n1 - Depth);
1566722688eSDehao Chen   size_t n2 = Loc.find('.');
1576722688eSDehao Chen   if (n2 == StringRef::npos) {
15810042412SDehao Chen     if (Loc.getAsInteger(10, LineOffset) || !isOffsetLegal(LineOffset))
1596722688eSDehao Chen       return false;
1606722688eSDehao Chen     Discriminator = 0;
1616722688eSDehao Chen   } else {
1626722688eSDehao Chen     if (Loc.substr(0, n2).getAsInteger(10, LineOffset))
1636722688eSDehao Chen       return false;
1646722688eSDehao Chen     if (Loc.substr(n2 + 1).getAsInteger(10, Discriminator))
1656722688eSDehao Chen       return false;
1666722688eSDehao Chen   }
1676722688eSDehao Chen 
1686722688eSDehao Chen   StringRef Rest = Input.substr(n1 + 2);
169551aaa24SKazu Hirata   if (isDigit(Rest[0])) {
170ac068e01SHongtao Yu     LineTy = LineType::BodyProfile;
1716722688eSDehao Chen     size_t n3 = Rest.find(' ');
1726722688eSDehao Chen     if (n3 == StringRef::npos) {
1736722688eSDehao Chen       if (Rest.getAsInteger(10, NumSamples))
1746722688eSDehao Chen         return false;
1756722688eSDehao Chen     } else {
1766722688eSDehao Chen       if (Rest.substr(0, n3).getAsInteger(10, NumSamples))
1776722688eSDehao Chen         return false;
1786722688eSDehao Chen     }
179984ab0f1SWei Mi     // Find call targets and their sample counts.
180984ab0f1SWei Mi     // Note: In some cases, there are symbols in the profile which are not
181984ab0f1SWei Mi     // mangled. To accommodate such cases, use colon + integer pairs as the
182984ab0f1SWei Mi     // anchor points.
183984ab0f1SWei Mi     // An example:
184984ab0f1SWei Mi     // _M_construct<char *>:1000 string_view<std::allocator<char> >:437
185984ab0f1SWei Mi     // ":1000" and ":437" are used as anchor points so the string above will
186984ab0f1SWei Mi     // be interpreted as
187984ab0f1SWei Mi     // target: _M_construct<char *>
188984ab0f1SWei Mi     // count: 1000
189984ab0f1SWei Mi     // target: string_view<std::allocator<char> >
190984ab0f1SWei Mi     // count: 437
1916722688eSDehao Chen     while (n3 != StringRef::npos) {
1926722688eSDehao Chen       n3 += Rest.substr(n3).find_first_not_of(' ');
1936722688eSDehao Chen       Rest = Rest.substr(n3);
194984ab0f1SWei Mi       n3 = Rest.find_first_of(':');
195984ab0f1SWei Mi       if (n3 == StringRef::npos || n3 == 0)
1966722688eSDehao Chen         return false;
197984ab0f1SWei Mi 
198984ab0f1SWei Mi       StringRef Target;
199984ab0f1SWei Mi       uint64_t count, n4;
200984ab0f1SWei Mi       while (true) {
201984ab0f1SWei Mi         // Get the segment after the current colon.
202984ab0f1SWei Mi         StringRef AfterColon = Rest.substr(n3 + 1);
203984ab0f1SWei Mi         // Get the target symbol before the current colon.
204984ab0f1SWei Mi         Target = Rest.substr(0, n3);
205984ab0f1SWei Mi         // Check if the word after the current colon is an integer.
206984ab0f1SWei Mi         n4 = AfterColon.find_first_of(' ');
207984ab0f1SWei Mi         n4 = (n4 != StringRef::npos) ? n3 + n4 + 1 : Rest.size();
208984ab0f1SWei Mi         StringRef WordAfterColon = Rest.substr(n3 + 1, n4 - n3 - 1);
209984ab0f1SWei Mi         if (!WordAfterColon.getAsInteger(10, count))
210984ab0f1SWei Mi           break;
211984ab0f1SWei Mi 
212984ab0f1SWei Mi         // Try to find the next colon.
213984ab0f1SWei Mi         uint64_t n5 = AfterColon.find_first_of(':');
214984ab0f1SWei Mi         if (n5 == StringRef::npos)
215984ab0f1SWei Mi           return false;
216984ab0f1SWei Mi         n3 += n5 + 1;
217984ab0f1SWei Mi       }
218984ab0f1SWei Mi 
219984ab0f1SWei Mi       // An anchor point is found. Save the {target, count} pair
220984ab0f1SWei Mi       TargetCountMap[Target] = count;
221984ab0f1SWei Mi       if (n4 == Rest.size())
222984ab0f1SWei Mi         break;
223984ab0f1SWei Mi       // Change n3 to the next blank space after colon + integer pair.
224984ab0f1SWei Mi       n3 = n4;
2256722688eSDehao Chen     }
2266722688eSDehao Chen   } else {
227ac068e01SHongtao Yu     LineTy = LineType::CallSiteProfile;
22838be3330SDiego Novillo     size_t n3 = Rest.find_last_of(':');
2296722688eSDehao Chen     CalleeName = Rest.substr(0, n3);
2306722688eSDehao Chen     if (Rest.substr(n3 + 1).getAsInteger(10, NumSamples))
2316722688eSDehao Chen       return false;
2326722688eSDehao Chen   }
2336722688eSDehao Chen   return true;
2346722688eSDehao Chen }
2356722688eSDehao Chen 
2365f8f34e4SAdrian Prantl /// Load samples from a text file.
237de1ab26fSDiego Novillo ///
238de1ab26fSDiego Novillo /// See the documentation at the top of the file for an explanation of
239de1ab26fSDiego Novillo /// the expected format.
240de1ab26fSDiego Novillo ///
241de1ab26fSDiego Novillo /// \returns true if the file was loaded successfully, false otherwise.
2428c8ec1f6SWei Mi std::error_code SampleProfileReaderText::readImpl() {
243c572e92cSDiego Novillo   line_iterator LineIt(*Buffer, /*SkipBlanks=*/true, '#');
24448dd080cSNathan Slingerland   sampleprof_error Result = sampleprof_error::success;
245de1ab26fSDiego Novillo 
246aae1ed8eSDiego Novillo   InlineCallStack InlineStack;
247ac068e01SHongtao Yu   uint32_t ProbeProfileCount = 0;
248ac068e01SHongtao Yu 
249ac068e01SHongtao Yu   // SeenMetadata tracks whether we have processed metadata for the current
250ac068e01SHongtao Yu   // top-level function profile.
251ac068e01SHongtao Yu   bool SeenMetadata = false;
2526722688eSDehao Chen 
2536745ffe4SRong Xu   ProfileIsFS = ProfileIsFSDisciminator;
25424201b64SRong Xu   FunctionSamples::ProfileIsFS = ProfileIsFS;
2556722688eSDehao Chen   for (; !LineIt.is_at_eof(); ++LineIt) {
2566722688eSDehao Chen     if ((*LineIt)[(*LineIt).find_first_not_of(' ')] == '#')
2576722688eSDehao Chen       continue;
258de1ab26fSDiego Novillo     // Read the header of each function.
259de1ab26fSDiego Novillo     //
260de1ab26fSDiego Novillo     // Note that for function identifiers we are actually expecting
261de1ab26fSDiego Novillo     // mangled names, but we may not always get them. This happens when
262de1ab26fSDiego Novillo     // the compiler decides not to emit the function (e.g., it was inlined
263de1ab26fSDiego Novillo     // and removed). In this case, the binary will not have the linkage
264de1ab26fSDiego Novillo     // name for the function, so the profiler will emit the function's
265de1ab26fSDiego Novillo     // unmangled name, which may contain characters like ':' and '>' in its
266de1ab26fSDiego Novillo     // name (member functions, templates, etc).
267de1ab26fSDiego Novillo     //
268de1ab26fSDiego Novillo     // The only requirement we place on the identifier, then, is that it
269de1ab26fSDiego Novillo     // should not begin with a number.
2706722688eSDehao Chen     if ((*LineIt)[0] != ' ') {
27138be3330SDiego Novillo       uint64_t NumSamples, NumHeadSamples;
2726722688eSDehao Chen       StringRef FName;
2736722688eSDehao Chen       if (!ParseHead(*LineIt, FName, NumSamples, NumHeadSamples)) {
2743376a787SDiego Novillo         reportError(LineIt.line_number(),
275de1ab26fSDiego Novillo                     "Expected 'mangled_name:NUM:NUM', found " + *LineIt);
276c572e92cSDiego Novillo         return sampleprof_error::malformed;
277de1ab26fSDiego Novillo       }
278ac068e01SHongtao Yu       SeenMetadata = false;
279b9db7036SHongtao Yu       SampleContext FContext(FName, CSNameTable);
2806b989a17SWenlei He       if (FContext.hasContext())
2816b989a17SWenlei He         ++CSProfileCount;
2826b989a17SWenlei He       Profiles[FContext] = FunctionSamples();
2836b989a17SWenlei He       FunctionSamples &FProfile = Profiles[FContext];
2846b989a17SWenlei He       FProfile.setContext(FContext);
28548dd080cSNathan Slingerland       MergeResult(Result, FProfile.addTotalSamples(NumSamples));
28648dd080cSNathan Slingerland       MergeResult(Result, FProfile.addHeadSamples(NumHeadSamples));
2876722688eSDehao Chen       InlineStack.clear();
2886722688eSDehao Chen       InlineStack.push_back(&FProfile);
2896722688eSDehao Chen     } else {
29038be3330SDiego Novillo       uint64_t NumSamples;
2916722688eSDehao Chen       StringRef FName;
29238be3330SDiego Novillo       DenseMap<StringRef, uint64_t> TargetCountMap;
29338be3330SDiego Novillo       uint32_t Depth, LineOffset, Discriminator;
294ac068e01SHongtao Yu       LineType LineTy;
2951410db70SWenlei He       uint64_t FunctionHash = 0;
2961410db70SWenlei He       uint32_t Attributes = 0;
297ac068e01SHongtao Yu       if (!ParseLine(*LineIt, LineTy, Depth, NumSamples, LineOffset,
2981410db70SWenlei He                      Discriminator, FName, TargetCountMap, FunctionHash,
2991410db70SWenlei He                      Attributes)) {
3003376a787SDiego Novillo         reportError(LineIt.line_number(),
3013376a787SDiego Novillo                     "Expected 'NUM[.NUM]: NUM[ mangled_name:NUM]*', found " +
3023376a787SDiego Novillo                         *LineIt);
303c572e92cSDiego Novillo         return sampleprof_error::malformed;
304de1ab26fSDiego Novillo       }
305ac068e01SHongtao Yu       if (SeenMetadata && LineTy != LineType::Metadata) {
306ac068e01SHongtao Yu         // Metadata must be put at the end of a function profile.
307ac068e01SHongtao Yu         reportError(LineIt.line_number(),
308ac068e01SHongtao Yu                     "Found non-metadata after metadata: " + *LineIt);
309ac068e01SHongtao Yu         return sampleprof_error::malformed;
310ac068e01SHongtao Yu       }
3116745ffe4SRong Xu 
3126745ffe4SRong Xu       // Here we handle FS discriminators.
3136745ffe4SRong Xu       Discriminator &= getDiscriminatorMask();
3146745ffe4SRong Xu 
3156722688eSDehao Chen       while (InlineStack.size() > Depth) {
3166722688eSDehao Chen         InlineStack.pop_back();
317c572e92cSDiego Novillo       }
318ac068e01SHongtao Yu       switch (LineTy) {
319ac068e01SHongtao Yu       case LineType::CallSiteProfile: {
3206722688eSDehao Chen         FunctionSamples &FSamples = InlineStack.back()->functionSamplesAt(
321adcd0268SBenjamin Kramer             LineLocation(LineOffset, Discriminator))[std::string(FName)];
32257d1dda5SDehao Chen         FSamples.setName(FName);
32348dd080cSNathan Slingerland         MergeResult(Result, FSamples.addTotalSamples(NumSamples));
3246722688eSDehao Chen         InlineStack.push_back(&FSamples);
325ac068e01SHongtao Yu         break;
326ac068e01SHongtao Yu       }
327ac068e01SHongtao Yu       case LineType::BodyProfile: {
3286722688eSDehao Chen         while (InlineStack.size() > Depth) {
3296722688eSDehao Chen           InlineStack.pop_back();
3306722688eSDehao Chen         }
3316722688eSDehao Chen         FunctionSamples &FProfile = *InlineStack.back();
3326722688eSDehao Chen         for (const auto &name_count : TargetCountMap) {
33348dd080cSNathan Slingerland           MergeResult(Result, FProfile.addCalledTargetSamples(
33448dd080cSNathan Slingerland                                   LineOffset, Discriminator, name_count.first,
33548dd080cSNathan Slingerland                                   name_count.second));
336c572e92cSDiego Novillo         }
33748dd080cSNathan Slingerland         MergeResult(Result, FProfile.addBodySamples(LineOffset, Discriminator,
33848dd080cSNathan Slingerland                                                     NumSamples));
339ac068e01SHongtao Yu         break;
340ac068e01SHongtao Yu       }
341ac068e01SHongtao Yu       case LineType::Metadata: {
342ac068e01SHongtao Yu         FunctionSamples &FProfile = *InlineStack.back();
3431410db70SWenlei He         if (FunctionHash) {
344ac068e01SHongtao Yu           FProfile.setFunctionHash(FunctionHash);
345ac068e01SHongtao Yu           ++ProbeProfileCount;
3461410db70SWenlei He         }
3471410db70SWenlei He         if (Attributes)
3481410db70SWenlei He           FProfile.getContext().setAllAttributes(Attributes);
349ac068e01SHongtao Yu         SeenMetadata = true;
350ac068e01SHongtao Yu         break;
351ac068e01SHongtao Yu       }
3526722688eSDehao Chen       }
353de1ab26fSDiego Novillo     }
354de1ab26fSDiego Novillo   }
3556b989a17SWenlei He 
3567e99bddfSHongtao Yu   assert((CSProfileCount == 0 || CSProfileCount == Profiles.size()) &&
3576b989a17SWenlei He          "Cannot have both context-sensitive and regular profile");
3586b989a17SWenlei He   ProfileIsCS = (CSProfileCount > 0);
359ac068e01SHongtao Yu   assert((ProbeProfileCount == 0 || ProbeProfileCount == Profiles.size()) &&
360ac068e01SHongtao Yu          "Cannot have both probe-based profiles and regular profiles");
361ac068e01SHongtao Yu   ProfileIsProbeBased = (ProbeProfileCount > 0);
362ac068e01SHongtao Yu   FunctionSamples::ProfileIsProbeBased = ProfileIsProbeBased;
3637e99bddfSHongtao Yu   FunctionSamples::ProfileIsCS = ProfileIsCS;
3646b989a17SWenlei He 
36540ee23dbSEaswaran Raman   if (Result == sampleprof_error::success)
36640ee23dbSEaswaran Raman     computeSummary();
367de1ab26fSDiego Novillo 
36848dd080cSNathan Slingerland   return Result;
369de1ab26fSDiego Novillo }
370de1ab26fSDiego Novillo 
3714f823667SNathan Slingerland bool SampleProfileReaderText::hasFormat(const MemoryBuffer &Buffer) {
3724f823667SNathan Slingerland   bool result = false;
3734f823667SNathan Slingerland 
3744f823667SNathan Slingerland   // Check that the first non-comment line is a valid function header.
3754f823667SNathan Slingerland   line_iterator LineIt(Buffer, /*SkipBlanks=*/true, '#');
3764f823667SNathan Slingerland   if (!LineIt.is_at_eof()) {
3774f823667SNathan Slingerland     if ((*LineIt)[0] != ' ') {
3784f823667SNathan Slingerland       uint64_t NumSamples, NumHeadSamples;
3794f823667SNathan Slingerland       StringRef FName;
3804f823667SNathan Slingerland       result = ParseHead(*LineIt, FName, NumSamples, NumHeadSamples);
3814f823667SNathan Slingerland     }
3824f823667SNathan Slingerland   }
3834f823667SNathan Slingerland 
3844f823667SNathan Slingerland   return result;
3854f823667SNathan Slingerland }
3864f823667SNathan Slingerland 
387d5336ae2SDiego Novillo template <typename T> ErrorOr<T> SampleProfileReaderBinary::readNumber() {
388c572e92cSDiego Novillo   unsigned NumBytesRead = 0;
389c572e92cSDiego Novillo   std::error_code EC;
390c572e92cSDiego Novillo   uint64_t Val = decodeULEB128(Data, &NumBytesRead);
391c572e92cSDiego Novillo 
392c572e92cSDiego Novillo   if (Val > std::numeric_limits<T>::max())
393c572e92cSDiego Novillo     EC = sampleprof_error::malformed;
394c572e92cSDiego Novillo   else if (Data + NumBytesRead > End)
395c572e92cSDiego Novillo     EC = sampleprof_error::truncated;
396c572e92cSDiego Novillo   else
397c572e92cSDiego Novillo     EC = sampleprof_error::success;
398c572e92cSDiego Novillo 
399c572e92cSDiego Novillo   if (EC) {
4003376a787SDiego Novillo     reportError(0, EC.message());
401c572e92cSDiego Novillo     return EC;
402c572e92cSDiego Novillo   }
403c572e92cSDiego Novillo 
404c572e92cSDiego Novillo   Data += NumBytesRead;
405c572e92cSDiego Novillo   return static_cast<T>(Val);
406c572e92cSDiego Novillo }
407c572e92cSDiego Novillo 
408c572e92cSDiego Novillo ErrorOr<StringRef> SampleProfileReaderBinary::readString() {
409c572e92cSDiego Novillo   std::error_code EC;
410c572e92cSDiego Novillo   StringRef Str(reinterpret_cast<const char *>(Data));
411c572e92cSDiego Novillo   if (Data + Str.size() + 1 > End) {
412c572e92cSDiego Novillo     EC = sampleprof_error::truncated;
4133376a787SDiego Novillo     reportError(0, EC.message());
414c572e92cSDiego Novillo     return EC;
415c572e92cSDiego Novillo   }
416c572e92cSDiego Novillo 
417c572e92cSDiego Novillo   Data += Str.size() + 1;
418c572e92cSDiego Novillo   return Str;
419c572e92cSDiego Novillo }
420c572e92cSDiego Novillo 
421a0c0857eSWei Mi template <typename T>
4226a14325dSWei Mi ErrorOr<T> SampleProfileReaderBinary::readUnencodedNumber() {
4236a14325dSWei Mi   std::error_code EC;
4246a14325dSWei Mi 
4256a14325dSWei Mi   if (Data + sizeof(T) > End) {
4266a14325dSWei Mi     EC = sampleprof_error::truncated;
4276a14325dSWei Mi     reportError(0, EC.message());
4286a14325dSWei Mi     return EC;
4296a14325dSWei Mi   }
4306a14325dSWei Mi 
4316a14325dSWei Mi   using namespace support;
4326a14325dSWei Mi   T Val = endian::readNext<T, little, unaligned>(Data);
4336a14325dSWei Mi   return Val;
4346a14325dSWei Mi }
4356a14325dSWei Mi 
4366a14325dSWei Mi template <typename T>
437a0c0857eSWei Mi inline ErrorOr<uint32_t> SampleProfileReaderBinary::readStringIndex(T &Table) {
438760c5a8fSDiego Novillo   std::error_code EC;
43938be3330SDiego Novillo   auto Idx = readNumber<uint32_t>();
440760c5a8fSDiego Novillo   if (std::error_code EC = Idx.getError())
441760c5a8fSDiego Novillo     return EC;
442a0c0857eSWei Mi   if (*Idx >= Table.size())
443760c5a8fSDiego Novillo     return sampleprof_error::truncated_name_table;
444a0c0857eSWei Mi   return *Idx;
445a0c0857eSWei Mi }
446a0c0857eSWei Mi 
447be907324SWei Mi ErrorOr<StringRef> SampleProfileReaderBinary::readStringFromTable() {
448a0c0857eSWei Mi   auto Idx = readStringIndex(NameTable);
449a0c0857eSWei Mi   if (std::error_code EC = Idx.getError())
450a0c0857eSWei Mi     return EC;
451a0c0857eSWei Mi 
452760c5a8fSDiego Novillo   return NameTable[*Idx];
453760c5a8fSDiego Novillo }
454760c5a8fSDiego Novillo 
455b9db7036SHongtao Yu ErrorOr<SampleContext> SampleProfileReaderBinary::readSampleContextFromTable() {
456b9db7036SHongtao Yu   auto FName(readStringFromTable());
457b9db7036SHongtao Yu   if (std::error_code EC = FName.getError())
458b9db7036SHongtao Yu     return EC;
459b9db7036SHongtao Yu   return SampleContext(*FName);
460b9db7036SHongtao Yu }
461b9db7036SHongtao Yu 
46264e76853SWei Mi ErrorOr<StringRef> SampleProfileReaderExtBinaryBase::readStringFromTable() {
46364e76853SWei Mi   if (!FixedLengthMD5)
46464e76853SWei Mi     return SampleProfileReaderBinary::readStringFromTable();
46564e76853SWei Mi 
46664e76853SWei Mi   // read NameTable index.
46764e76853SWei Mi   auto Idx = readStringIndex(NameTable);
46864e76853SWei Mi   if (std::error_code EC = Idx.getError())
46964e76853SWei Mi     return EC;
47064e76853SWei Mi 
47164e76853SWei Mi   // Check whether the name to be accessed has been accessed before,
47264e76853SWei Mi   // if not, read it from memory directly.
47364e76853SWei Mi   StringRef &SR = NameTable[*Idx];
47464e76853SWei Mi   if (SR.empty()) {
47564e76853SWei Mi     const uint8_t *SavedData = Data;
47664e76853SWei Mi     Data = MD5NameMemStart + ((*Idx) * sizeof(uint64_t));
47764e76853SWei Mi     auto FID = readUnencodedNumber<uint64_t>();
47864e76853SWei Mi     if (std::error_code EC = FID.getError())
47964e76853SWei Mi       return EC;
48064e76853SWei Mi     // Save the string converted from uint64_t in MD5StringBuf. All the
48164e76853SWei Mi     // references to the name are all StringRefs refering to the string
48264e76853SWei Mi     // in MD5StringBuf.
48364e76853SWei Mi     MD5StringBuf->push_back(std::to_string(*FID));
48464e76853SWei Mi     SR = MD5StringBuf->back();
48564e76853SWei Mi     Data = SavedData;
48664e76853SWei Mi   }
48764e76853SWei Mi   return SR;
48864e76853SWei Mi }
48964e76853SWei Mi 
490a0c0857eSWei Mi ErrorOr<StringRef> SampleProfileReaderCompactBinary::readStringFromTable() {
491a0c0857eSWei Mi   auto Idx = readStringIndex(NameTable);
492a0c0857eSWei Mi   if (std::error_code EC = Idx.getError())
493a0c0857eSWei Mi     return EC;
494a0c0857eSWei Mi 
495a0c0857eSWei Mi   return StringRef(NameTable[*Idx]);
496a0c0857eSWei Mi }
497a0c0857eSWei Mi 
498a7f1e8efSDiego Novillo std::error_code
499a7f1e8efSDiego Novillo SampleProfileReaderBinary::readProfile(FunctionSamples &FProfile) {
500b93483dbSDiego Novillo   auto NumSamples = readNumber<uint64_t>();
501b93483dbSDiego Novillo   if (std::error_code EC = NumSamples.getError())
502c572e92cSDiego Novillo     return EC;
503b93483dbSDiego Novillo   FProfile.addTotalSamples(*NumSamples);
504c572e92cSDiego Novillo 
505c572e92cSDiego Novillo   // Read the samples in the body.
50638be3330SDiego Novillo   auto NumRecords = readNumber<uint32_t>();
507c572e92cSDiego Novillo   if (std::error_code EC = NumRecords.getError())
508c572e92cSDiego Novillo     return EC;
509a7f1e8efSDiego Novillo 
51038be3330SDiego Novillo   for (uint32_t I = 0; I < *NumRecords; ++I) {
511c572e92cSDiego Novillo     auto LineOffset = readNumber<uint64_t>();
512c572e92cSDiego Novillo     if (std::error_code EC = LineOffset.getError())
513c572e92cSDiego Novillo       return EC;
514c572e92cSDiego Novillo 
51510042412SDehao Chen     if (!isOffsetLegal(*LineOffset)) {
51610042412SDehao Chen       return std::error_code();
51710042412SDehao Chen     }
51810042412SDehao Chen 
519c572e92cSDiego Novillo     auto Discriminator = readNumber<uint64_t>();
520c572e92cSDiego Novillo     if (std::error_code EC = Discriminator.getError())
521c572e92cSDiego Novillo       return EC;
522c572e92cSDiego Novillo 
523c572e92cSDiego Novillo     auto NumSamples = readNumber<uint64_t>();
524c572e92cSDiego Novillo     if (std::error_code EC = NumSamples.getError())
525c572e92cSDiego Novillo       return EC;
526c572e92cSDiego Novillo 
52738be3330SDiego Novillo     auto NumCalls = readNumber<uint32_t>();
528c572e92cSDiego Novillo     if (std::error_code EC = NumCalls.getError())
529c572e92cSDiego Novillo       return EC;
530c572e92cSDiego Novillo 
5316745ffe4SRong Xu     // Here we handle FS discriminators:
5326745ffe4SRong Xu     uint32_t DiscriminatorVal = (*Discriminator) & getDiscriminatorMask();
5336745ffe4SRong Xu 
53438be3330SDiego Novillo     for (uint32_t J = 0; J < *NumCalls; ++J) {
535760c5a8fSDiego Novillo       auto CalledFunction(readStringFromTable());
536c572e92cSDiego Novillo       if (std::error_code EC = CalledFunction.getError())
537c572e92cSDiego Novillo         return EC;
538c572e92cSDiego Novillo 
539c572e92cSDiego Novillo       auto CalledFunctionSamples = readNumber<uint64_t>();
540c572e92cSDiego Novillo       if (std::error_code EC = CalledFunctionSamples.getError())
541c572e92cSDiego Novillo         return EC;
542c572e92cSDiego Novillo 
5436745ffe4SRong Xu       FProfile.addCalledTargetSamples(*LineOffset, DiscriminatorVal,
544a7f1e8efSDiego Novillo                                       *CalledFunction, *CalledFunctionSamples);
545c572e92cSDiego Novillo     }
546c572e92cSDiego Novillo 
5476745ffe4SRong Xu     FProfile.addBodySamples(*LineOffset, DiscriminatorVal, *NumSamples);
548c572e92cSDiego Novillo   }
549a7f1e8efSDiego Novillo 
550a7f1e8efSDiego Novillo   // Read all the samples for inlined function calls.
55138be3330SDiego Novillo   auto NumCallsites = readNumber<uint32_t>();
552a7f1e8efSDiego Novillo   if (std::error_code EC = NumCallsites.getError())
553a7f1e8efSDiego Novillo     return EC;
554a7f1e8efSDiego Novillo 
55538be3330SDiego Novillo   for (uint32_t J = 0; J < *NumCallsites; ++J) {
556a7f1e8efSDiego Novillo     auto LineOffset = readNumber<uint64_t>();
557a7f1e8efSDiego Novillo     if (std::error_code EC = LineOffset.getError())
558a7f1e8efSDiego Novillo       return EC;
559a7f1e8efSDiego Novillo 
560a7f1e8efSDiego Novillo     auto Discriminator = readNumber<uint64_t>();
561a7f1e8efSDiego Novillo     if (std::error_code EC = Discriminator.getError())
562a7f1e8efSDiego Novillo       return EC;
563a7f1e8efSDiego Novillo 
564760c5a8fSDiego Novillo     auto FName(readStringFromTable());
565a7f1e8efSDiego Novillo     if (std::error_code EC = FName.getError())
566a7f1e8efSDiego Novillo       return EC;
567a7f1e8efSDiego Novillo 
5686745ffe4SRong Xu     // Here we handle FS discriminators:
5696745ffe4SRong Xu     uint32_t DiscriminatorVal = (*Discriminator) & getDiscriminatorMask();
5706745ffe4SRong Xu 
5712c7ca9b5SDehao Chen     FunctionSamples &CalleeProfile = FProfile.functionSamplesAt(
5726745ffe4SRong Xu         LineLocation(*LineOffset, DiscriminatorVal))[std::string(*FName)];
57357d1dda5SDehao Chen     CalleeProfile.setName(*FName);
574a7f1e8efSDiego Novillo     if (std::error_code EC = readProfile(CalleeProfile))
575a7f1e8efSDiego Novillo       return EC;
576a7f1e8efSDiego Novillo   }
577a7f1e8efSDiego Novillo 
578a7f1e8efSDiego Novillo   return sampleprof_error::success;
579a7f1e8efSDiego Novillo }
580a7f1e8efSDiego Novillo 
58109dcfe68SWei Mi std::error_code
58209dcfe68SWei Mi SampleProfileReaderBinary::readFuncProfile(const uint8_t *Start) {
58309dcfe68SWei Mi   Data = Start;
584b93483dbSDiego Novillo   auto NumHeadSamples = readNumber<uint64_t>();
585b93483dbSDiego Novillo   if (std::error_code EC = NumHeadSamples.getError())
586b93483dbSDiego Novillo     return EC;
587b93483dbSDiego Novillo 
588b9db7036SHongtao Yu   ErrorOr<SampleContext> FContext(readSampleContextFromTable());
589b9db7036SHongtao Yu   if (std::error_code EC = FContext.getError())
590a7f1e8efSDiego Novillo     return EC;
591a7f1e8efSDiego Novillo 
592b9db7036SHongtao Yu   Profiles[*FContext] = FunctionSamples();
593b9db7036SHongtao Yu   FunctionSamples &FProfile = Profiles[*FContext];
594b9db7036SHongtao Yu   FProfile.setContext(*FContext);
595b93483dbSDiego Novillo   FProfile.addHeadSamples(*NumHeadSamples);
596b93483dbSDiego Novillo 
597b9db7036SHongtao Yu   if (FContext->hasContext())
5987e99bddfSHongtao Yu     CSProfileCount++;
5997e99bddfSHongtao Yu 
600a7f1e8efSDiego Novillo   if (std::error_code EC = readProfile(FProfile))
601a7f1e8efSDiego Novillo     return EC;
6026a14325dSWei Mi   return sampleprof_error::success;
603c572e92cSDiego Novillo }
604c572e92cSDiego Novillo 
6058c8ec1f6SWei Mi std::error_code SampleProfileReaderBinary::readImpl() {
6066745ffe4SRong Xu   ProfileIsFS = ProfileIsFSDisciminator;
60724201b64SRong Xu   FunctionSamples::ProfileIsFS = ProfileIsFS;
6086a14325dSWei Mi   while (!at_eof()) {
60909dcfe68SWei Mi     if (std::error_code EC = readFuncProfile(Data))
6106a14325dSWei Mi       return EC;
6116a14325dSWei Mi   }
6126a14325dSWei Mi 
6136a14325dSWei Mi   return sampleprof_error::success;
6146a14325dSWei Mi }
6156a14325dSWei Mi 
616b9db7036SHongtao Yu ErrorOr<SampleContextFrames>
617b9db7036SHongtao Yu SampleProfileReaderExtBinaryBase::readContextFromTable() {
618b9db7036SHongtao Yu   auto ContextIdx = readNumber<uint32_t>();
619b9db7036SHongtao Yu   if (std::error_code EC = ContextIdx.getError())
620b9db7036SHongtao Yu     return EC;
621b9db7036SHongtao Yu   if (*ContextIdx >= CSNameTable->size())
622b9db7036SHongtao Yu     return sampleprof_error::truncated_name_table;
623b9db7036SHongtao Yu   return (*CSNameTable)[*ContextIdx];
624b9db7036SHongtao Yu }
625b9db7036SHongtao Yu 
626b9db7036SHongtao Yu ErrorOr<SampleContext>
627b9db7036SHongtao Yu SampleProfileReaderExtBinaryBase::readSampleContextFromTable() {
628b9db7036SHongtao Yu   if (ProfileIsCS) {
629b9db7036SHongtao Yu     auto FContext(readContextFromTable());
630b9db7036SHongtao Yu     if (std::error_code EC = FContext.getError())
631b9db7036SHongtao Yu       return EC;
632b9db7036SHongtao Yu     return SampleContext(*FContext);
633b9db7036SHongtao Yu   } else {
634b9db7036SHongtao Yu     auto FName(readStringFromTable());
635b9db7036SHongtao Yu     if (std::error_code EC = FName.getError())
636b9db7036SHongtao Yu       return EC;
637b9db7036SHongtao Yu     return SampleContext(*FName);
638b9db7036SHongtao Yu   }
639b9db7036SHongtao Yu }
640b9db7036SHongtao Yu 
64193953d41SWei Mi std::error_code SampleProfileReaderExtBinaryBase::readOneSection(
642ebad6788SWei Mi     const uint8_t *Start, uint64_t Size, const SecHdrTableEntry &Entry) {
643077a9c70SWei Mi   Data = Start;
644b523790aSWei Mi   End = Start + Size;
645ebad6788SWei Mi   switch (Entry.Type) {
646be907324SWei Mi   case SecProfSummary:
647be907324SWei Mi     if (std::error_code EC = readSummary())
648be907324SWei Mi       return EC;
649b49eac71SWei Mi     if (hasSecFlag(Entry, SecProfSummaryFlags::SecFlagPartial))
650b49eac71SWei Mi       Summary->setPartialProfile(true);
651a5d30421SWenlei He     if (hasSecFlag(Entry, SecProfSummaryFlags::SecFlagFullContext))
652a5d30421SWenlei He       FunctionSamples::ProfileIsCS = ProfileIsCS = true;
6536745ffe4SRong Xu     if (hasSecFlag(Entry, SecProfSummaryFlags::SecFlagFSDiscriminator))
6546745ffe4SRong Xu       FunctionSamples::ProfileIsFS = ProfileIsFS = true;
655be907324SWei Mi     break;
65664e76853SWei Mi   case SecNameTable: {
65764e76853SWei Mi     FixedLengthMD5 =
65864e76853SWei Mi         hasSecFlag(Entry, SecNameTableFlags::SecFlagFixedLengthMD5);
65964e76853SWei Mi     bool UseMD5 = hasSecFlag(Entry, SecNameTableFlags::SecFlagMD5Name);
66064e76853SWei Mi     assert((!FixedLengthMD5 || UseMD5) &&
66164e76853SWei Mi            "If FixedLengthMD5 is true, UseMD5 has to be true");
662ee35784aSWei Mi     FunctionSamples::HasUniqSuffix =
663ee35784aSWei Mi         hasSecFlag(Entry, SecNameTableFlags::SecFlagUniqSuffix);
66464e76853SWei Mi     if (std::error_code EC = readNameTableSec(UseMD5))
665be907324SWei Mi       return EC;
666be907324SWei Mi     break;
66764e76853SWei Mi   }
668b9db7036SHongtao Yu   case SecCSNameTable: {
669b9db7036SHongtao Yu     if (std::error_code EC = readCSNameTableSec())
670b9db7036SHongtao Yu       return EC;
671b9db7036SHongtao Yu     break;
672b9db7036SHongtao Yu   }
673be907324SWei Mi   case SecLBRProfile:
67409dcfe68SWei Mi     if (std::error_code EC = readFuncProfiles())
675be907324SWei Mi       return EC;
676be907324SWei Mi     break;
67709dcfe68SWei Mi   case SecFuncOffsetTable:
678f4711e0dSHongtao Yu     FuncOffsetsOrdered = hasSecFlag(Entry, SecFuncOffsetFlags::SecFlagOrdered);
67909dcfe68SWei Mi     if (std::error_code EC = readFuncOffsetTable())
680798e59b8SWei Mi       return EC;
681798e59b8SWei Mi     break;
6821410db70SWenlei He   case SecFuncMetadata: {
683ac068e01SHongtao Yu     ProfileIsProbeBased =
684ac068e01SHongtao Yu         hasSecFlag(Entry, SecFuncMetadataFlags::SecFlagIsProbeBased);
685ac068e01SHongtao Yu     FunctionSamples::ProfileIsProbeBased = ProfileIsProbeBased;
6861410db70SWenlei He     bool HasAttribute =
6871410db70SWenlei He         hasSecFlag(Entry, SecFuncMetadataFlags::SecFlagHasAttribute);
6881410db70SWenlei He     if (std::error_code EC = readFuncMetadata(HasAttribute))
689ac068e01SHongtao Yu       return EC;
690ac068e01SHongtao Yu     break;
6911410db70SWenlei He   }
69293953d41SWei Mi   case SecProfileSymbolList:
69393953d41SWei Mi     if (std::error_code EC = readProfileSymbolList())
69493953d41SWei Mi       return EC;
69593953d41SWei Mi     break;
696be907324SWei Mi   default:
69793953d41SWei Mi     if (std::error_code EC = readCustomSection(Entry))
69893953d41SWei Mi       return EC;
699077a9c70SWei Mi     break;
700be907324SWei Mi   }
701077a9c70SWei Mi   return sampleprof_error::success;
702077a9c70SWei Mi }
703077a9c70SWei Mi 
704ee35784aSWei Mi bool SampleProfileReaderExtBinaryBase::collectFuncsFromModule() {
705ee35784aSWei Mi   if (!M)
706ee35784aSWei Mi     return false;
70709dcfe68SWei Mi   FuncsToUse.clear();
708ee35784aSWei Mi   for (auto &F : *M)
70909dcfe68SWei Mi     FuncsToUse.insert(FunctionSamples::getCanonicalFnName(F));
710ee35784aSWei Mi   return true;
71109dcfe68SWei Mi }
71209dcfe68SWei Mi 
71393953d41SWei Mi std::error_code SampleProfileReaderExtBinaryBase::readFuncOffsetTable() {
714a906e3ecSWei Mi   // If there are more than one FuncOffsetTable, the profile read associated
715a906e3ecSWei Mi   // with previous FuncOffsetTable has to be done before next FuncOffsetTable
716a906e3ecSWei Mi   // is read.
717a906e3ecSWei Mi   FuncOffsetTable.clear();
718a906e3ecSWei Mi 
71909dcfe68SWei Mi   auto Size = readNumber<uint64_t>();
72009dcfe68SWei Mi   if (std::error_code EC = Size.getError())
72109dcfe68SWei Mi     return EC;
72209dcfe68SWei Mi 
72309dcfe68SWei Mi   FuncOffsetTable.reserve(*Size);
724f4711e0dSHongtao Yu 
725f4711e0dSHongtao Yu   if (FuncOffsetsOrdered) {
726f4711e0dSHongtao Yu     OrderedFuncOffsets =
727f4711e0dSHongtao Yu         std::make_unique<std::vector<std::pair<SampleContext, uint64_t>>>();
728f4711e0dSHongtao Yu     OrderedFuncOffsets->reserve(*Size);
729f4711e0dSHongtao Yu   }
730f4711e0dSHongtao Yu 
73109dcfe68SWei Mi   for (uint32_t I = 0; I < *Size; ++I) {
732f4711e0dSHongtao Yu     auto FContext(readSampleContextFromTable());
733f4711e0dSHongtao Yu     if (std::error_code EC = FContext.getError())
73409dcfe68SWei Mi       return EC;
73509dcfe68SWei Mi 
73609dcfe68SWei Mi     auto Offset = readNumber<uint64_t>();
73709dcfe68SWei Mi     if (std::error_code EC = Offset.getError())
73809dcfe68SWei Mi       return EC;
73909dcfe68SWei Mi 
740f4711e0dSHongtao Yu     FuncOffsetTable[*FContext] = *Offset;
741f4711e0dSHongtao Yu     if (FuncOffsetsOrdered)
742f4711e0dSHongtao Yu       OrderedFuncOffsets->emplace_back(*FContext, *Offset);
74309dcfe68SWei Mi   }
744f4711e0dSHongtao Yu 
74509dcfe68SWei Mi   return sampleprof_error::success;
74609dcfe68SWei Mi }
74709dcfe68SWei Mi 
74893953d41SWei Mi std::error_code SampleProfileReaderExtBinaryBase::readFuncProfiles() {
749ee35784aSWei Mi   // Collect functions used by current module if the Reader has been
750ee35784aSWei Mi   // given a module.
751ee35784aSWei Mi   // collectFuncsFromModule uses FunctionSamples::getCanonicalFnName
752ee35784aSWei Mi   // which will query FunctionSamples::HasUniqSuffix, so it has to be
753ee35784aSWei Mi   // called after FunctionSamples::HasUniqSuffix is set, i.e. after
754ee35784aSWei Mi   // NameTable section is read.
755ee35784aSWei Mi   bool LoadFuncsToBeUsed = collectFuncsFromModule();
756ee35784aSWei Mi 
757ee35784aSWei Mi   // When LoadFuncsToBeUsed is false, load all the function profiles.
75809dcfe68SWei Mi   const uint8_t *Start = Data;
759ee35784aSWei Mi   if (!LoadFuncsToBeUsed) {
76009dcfe68SWei Mi     while (Data < End) {
76109dcfe68SWei Mi       if (std::error_code EC = readFuncProfile(Data))
76209dcfe68SWei Mi         return EC;
76309dcfe68SWei Mi     }
76409dcfe68SWei Mi     assert(Data == End && "More data is read than expected");
7657e99bddfSHongtao Yu   } else {
766ee35784aSWei Mi     // Load function profiles on demand.
7678c8ec1f6SWei Mi     if (Remapper) {
76809dcfe68SWei Mi       for (auto Name : FuncsToUse) {
7698c8ec1f6SWei Mi         Remapper->insert(Name);
7708c8ec1f6SWei Mi       }
7718c8ec1f6SWei Mi     }
7728c8ec1f6SWei Mi 
7737ca80300SHongtao Yu     if (ProfileIsCS) {
7747ca80300SHongtao Yu       DenseSet<uint64_t> FuncGuidsToUse;
7757ca80300SHongtao Yu       if (useMD5()) {
7767ca80300SHongtao Yu         for (auto Name : FuncsToUse)
7777ca80300SHongtao Yu           FuncGuidsToUse.insert(Function::getGUID(Name));
7787ca80300SHongtao Yu       }
7797ca80300SHongtao Yu 
780f4711e0dSHongtao Yu       // For each function in current module, load all context profiles for
781f4711e0dSHongtao Yu       // the function as well as their callee contexts which can help profile
782f4711e0dSHongtao Yu       // guided importing for ThinLTO. This can be achieved by walking
783f4711e0dSHongtao Yu       // through an ordered context container, where contexts are laid out
784f4711e0dSHongtao Yu       // as if they were walked in preorder of a context trie. While
785f4711e0dSHongtao Yu       // traversing the trie, a link to the highest common ancestor node is
786f4711e0dSHongtao Yu       // kept so that all of its decendants will be loaded.
787f4711e0dSHongtao Yu       assert(OrderedFuncOffsets.get() &&
788f4711e0dSHongtao Yu              "func offset table should always be sorted in CS profile");
789f4711e0dSHongtao Yu       const SampleContext *CommonContext = nullptr;
790f4711e0dSHongtao Yu       for (const auto &NameOffset : *OrderedFuncOffsets) {
791f4711e0dSHongtao Yu         const auto &FContext = NameOffset.first;
792f4711e0dSHongtao Yu         auto FName = FContext.getName();
793f4711e0dSHongtao Yu         // For function in the current module, keep its farthest ancestor
794f4711e0dSHongtao Yu         // context. This can be used to load itself and its child and
795f4711e0dSHongtao Yu         // sibling contexts.
796f4711e0dSHongtao Yu         if ((useMD5() && FuncGuidsToUse.count(std::stoull(FName.data()))) ||
797f4711e0dSHongtao Yu             (!useMD5() && (FuncsToUse.count(FName) ||
798f4711e0dSHongtao Yu                            (Remapper && Remapper->exist(FName))))) {
799f4711e0dSHongtao Yu           if (!CommonContext || !CommonContext->IsPrefixOf(FContext))
800f4711e0dSHongtao Yu             CommonContext = &FContext;
801f4711e0dSHongtao Yu         }
802a5d30421SWenlei He 
803f4711e0dSHongtao Yu         if (CommonContext == &FContext ||
804f4711e0dSHongtao Yu             (CommonContext && CommonContext->IsPrefixOf(FContext))) {
805f4711e0dSHongtao Yu           // Load profile for the current context which originated from
806f4711e0dSHongtao Yu           // the common ancestor.
807f4711e0dSHongtao Yu           const uint8_t *FuncProfileAddr = Start + NameOffset.second;
808a5d30421SWenlei He           assert(FuncProfileAddr < End && "out of LBRProfile section");
809a5d30421SWenlei He           if (std::error_code EC = readFuncProfile(FuncProfileAddr))
810a5d30421SWenlei He             return EC;
811a5d30421SWenlei He         }
812a5d30421SWenlei He       }
813ebad6788SWei Mi     } else {
8147ca80300SHongtao Yu       if (useMD5()) {
8157ca80300SHongtao Yu         for (auto Name : FuncsToUse) {
8167ca80300SHongtao Yu           auto GUID = std::to_string(MD5Hash(Name));
8177ca80300SHongtao Yu           auto iter = FuncOffsetTable.find(StringRef(GUID));
8187ca80300SHongtao Yu           if (iter == FuncOffsetTable.end())
8197ca80300SHongtao Yu             continue;
8207ca80300SHongtao Yu           const uint8_t *FuncProfileAddr = Start + iter->second;
8217ca80300SHongtao Yu           assert(FuncProfileAddr < End && "out of LBRProfile section");
8227ca80300SHongtao Yu           if (std::error_code EC = readFuncProfile(FuncProfileAddr))
8237ca80300SHongtao Yu             return EC;
8247ca80300SHongtao Yu         }
8257ca80300SHongtao Yu       } else {
8268c8ec1f6SWei Mi         for (auto NameOffset : FuncOffsetTable) {
8277e99bddfSHongtao Yu           SampleContext FContext(NameOffset.first);
828b9db7036SHongtao Yu           auto FuncName = FContext.getName();
8298c8ec1f6SWei Mi           if (!FuncsToUse.count(FuncName) &&
8308c8ec1f6SWei Mi               (!Remapper || !Remapper->exist(FuncName)))
83109dcfe68SWei Mi             continue;
8328c8ec1f6SWei Mi           const uint8_t *FuncProfileAddr = Start + NameOffset.second;
83309dcfe68SWei Mi           assert(FuncProfileAddr < End && "out of LBRProfile section");
83409dcfe68SWei Mi           if (std::error_code EC = readFuncProfile(FuncProfileAddr))
83509dcfe68SWei Mi             return EC;
83609dcfe68SWei Mi         }
837ebad6788SWei Mi       }
8387ca80300SHongtao Yu     }
83909dcfe68SWei Mi     Data = End;
8407e99bddfSHongtao Yu   }
8417e99bddfSHongtao Yu   assert((CSProfileCount == 0 || CSProfileCount == Profiles.size()) &&
8427e99bddfSHongtao Yu          "Cannot have both context-sensitive and regular profile");
843a45d72e0SWenlei He   assert((!CSProfileCount || ProfileIsCS) &&
844a5d30421SWenlei He          "Section flag should be consistent with actual profile");
84509dcfe68SWei Mi   return sampleprof_error::success;
84609dcfe68SWei Mi }
84709dcfe68SWei Mi 
84893953d41SWei Mi std::error_code SampleProfileReaderExtBinaryBase::readProfileSymbolList() {
849b523790aSWei Mi   if (!ProfSymList)
850b523790aSWei Mi     ProfSymList = std::make_unique<ProfileSymbolList>();
851b523790aSWei Mi 
85209dcfe68SWei Mi   if (std::error_code EC = ProfSymList->read(Data, End - Data))
853798e59b8SWei Mi     return EC;
854798e59b8SWei Mi 
85509dcfe68SWei Mi   Data = End;
856b523790aSWei Mi   return sampleprof_error::success;
857b523790aSWei Mi }
858b523790aSWei Mi 
859b523790aSWei Mi std::error_code SampleProfileReaderExtBinaryBase::decompressSection(
860b523790aSWei Mi     const uint8_t *SecStart, const uint64_t SecSize,
861b523790aSWei Mi     const uint8_t *&DecompressBuf, uint64_t &DecompressBufSize) {
862b523790aSWei Mi   Data = SecStart;
863b523790aSWei Mi   End = SecStart + SecSize;
864b523790aSWei Mi   auto DecompressSize = readNumber<uint64_t>();
865b523790aSWei Mi   if (std::error_code EC = DecompressSize.getError())
866b523790aSWei Mi     return EC;
867b523790aSWei Mi   DecompressBufSize = *DecompressSize;
868b523790aSWei Mi 
869798e59b8SWei Mi   auto CompressSize = readNumber<uint64_t>();
870798e59b8SWei Mi   if (std::error_code EC = CompressSize.getError())
871798e59b8SWei Mi     return EC;
872798e59b8SWei Mi 
873b523790aSWei Mi   if (!llvm::zlib::isAvailable())
874b523790aSWei Mi     return sampleprof_error::zlib_unavailable;
875798e59b8SWei Mi 
876b523790aSWei Mi   StringRef CompressedStrings(reinterpret_cast<const char *>(Data),
877b523790aSWei Mi                               *CompressSize);
878b523790aSWei Mi   char *Buffer = Allocator.Allocate<char>(DecompressBufSize);
879283df8cfSWei Mi   size_t UCSize = DecompressBufSize;
880b523790aSWei Mi   llvm::Error E =
881283df8cfSWei Mi       zlib::uncompress(CompressedStrings, Buffer, UCSize);
882b523790aSWei Mi   if (E)
883b523790aSWei Mi     return sampleprof_error::uncompress_failed;
884b523790aSWei Mi   DecompressBuf = reinterpret_cast<const uint8_t *>(Buffer);
885798e59b8SWei Mi   return sampleprof_error::success;
886798e59b8SWei Mi }
887798e59b8SWei Mi 
8888c8ec1f6SWei Mi std::error_code SampleProfileReaderExtBinaryBase::readImpl() {
889077a9c70SWei Mi   const uint8_t *BufStart =
890077a9c70SWei Mi       reinterpret_cast<const uint8_t *>(Buffer->getBufferStart());
891077a9c70SWei Mi 
892077a9c70SWei Mi   for (auto &Entry : SecHdrTable) {
893077a9c70SWei Mi     // Skip empty section.
894077a9c70SWei Mi     if (!Entry.Size)
895077a9c70SWei Mi       continue;
896b523790aSWei Mi 
89721b1ad03SWei Mi     // Skip sections without context when SkipFlatProf is true.
89821b1ad03SWei Mi     if (SkipFlatProf && hasSecFlag(Entry, SecCommonFlags::SecFlagFlat))
89921b1ad03SWei Mi       continue;
90021b1ad03SWei Mi 
901077a9c70SWei Mi     const uint8_t *SecStart = BufStart + Entry.Offset;
902b523790aSWei Mi     uint64_t SecSize = Entry.Size;
903b523790aSWei Mi 
904b523790aSWei Mi     // If the section is compressed, decompress it into a buffer
905b523790aSWei Mi     // DecompressBuf before reading the actual data. The pointee of
906b523790aSWei Mi     // 'Data' will be changed to buffer hold by DecompressBuf
907b523790aSWei Mi     // temporarily when reading the actual data.
908ebad6788SWei Mi     bool isCompressed = hasSecFlag(Entry, SecCommonFlags::SecFlagCompress);
909b523790aSWei Mi     if (isCompressed) {
910b523790aSWei Mi       const uint8_t *DecompressBuf;
911b523790aSWei Mi       uint64_t DecompressBufSize;
912b523790aSWei Mi       if (std::error_code EC = decompressSection(
913b523790aSWei Mi               SecStart, SecSize, DecompressBuf, DecompressBufSize))
914077a9c70SWei Mi         return EC;
915b523790aSWei Mi       SecStart = DecompressBuf;
916b523790aSWei Mi       SecSize = DecompressBufSize;
917b523790aSWei Mi     }
918b523790aSWei Mi 
919ebad6788SWei Mi     if (std::error_code EC = readOneSection(SecStart, SecSize, Entry))
920b523790aSWei Mi       return EC;
921b523790aSWei Mi     if (Data != SecStart + SecSize)
922be907324SWei Mi       return sampleprof_error::malformed;
923b523790aSWei Mi 
924b523790aSWei Mi     // Change the pointee of 'Data' from DecompressBuf to original Buffer.
925b523790aSWei Mi     if (isCompressed) {
926b523790aSWei Mi       Data = BufStart + Entry.Offset;
927b523790aSWei Mi       End = BufStart + Buffer->getBufferSize();
928b523790aSWei Mi     }
929be907324SWei Mi   }
930be907324SWei Mi 
931be907324SWei Mi   return sampleprof_error::success;
932be907324SWei Mi }
933be907324SWei Mi 
9348c8ec1f6SWei Mi std::error_code SampleProfileReaderCompactBinary::readImpl() {
935ee35784aSWei Mi   // Collect functions used by current module if the Reader has been
936ee35784aSWei Mi   // given a module.
937ee35784aSWei Mi   bool LoadFuncsToBeUsed = collectFuncsFromModule();
9386745ffe4SRong Xu   ProfileIsFS = ProfileIsFSDisciminator;
93924201b64SRong Xu   FunctionSamples::ProfileIsFS = ProfileIsFS;
940d3289544SWenlei He   std::vector<uint64_t> OffsetsToUse;
941ee35784aSWei Mi   if (!LoadFuncsToBeUsed) {
942ee35784aSWei Mi     // load all the function profiles.
943d3289544SWenlei He     for (auto FuncEntry : FuncOffsetTable) {
944d3289544SWenlei He       OffsetsToUse.push_back(FuncEntry.second);
945d3289544SWenlei He     }
946ee35784aSWei Mi   } else {
947ee35784aSWei Mi     // load function profiles on demand.
9486a14325dSWei Mi     for (auto Name : FuncsToUse) {
9496a14325dSWei Mi       auto GUID = std::to_string(MD5Hash(Name));
9506a14325dSWei Mi       auto iter = FuncOffsetTable.find(StringRef(GUID));
9516a14325dSWei Mi       if (iter == FuncOffsetTable.end())
9526a14325dSWei Mi         continue;
953d3289544SWenlei He       OffsetsToUse.push_back(iter->second);
954d3289544SWenlei He     }
955d3289544SWenlei He   }
956d3289544SWenlei He 
957d3289544SWenlei He   for (auto Offset : OffsetsToUse) {
9586a14325dSWei Mi     const uint8_t *SavedData = Data;
95909dcfe68SWei Mi     if (std::error_code EC = readFuncProfile(
96009dcfe68SWei Mi             reinterpret_cast<const uint8_t *>(Buffer->getBufferStart()) +
96109dcfe68SWei Mi             Offset))
9626a14325dSWei Mi       return EC;
9636a14325dSWei Mi     Data = SavedData;
9646a14325dSWei Mi   }
965c572e92cSDiego Novillo   return sampleprof_error::success;
966c572e92cSDiego Novillo }
967c572e92cSDiego Novillo 
968a0c0857eSWei Mi std::error_code SampleProfileReaderRawBinary::verifySPMagic(uint64_t Magic) {
969a0c0857eSWei Mi   if (Magic == SPMagic())
970a0c0857eSWei Mi     return sampleprof_error::success;
971a0c0857eSWei Mi   return sampleprof_error::bad_magic;
972a0c0857eSWei Mi }
973a0c0857eSWei Mi 
974be907324SWei Mi std::error_code SampleProfileReaderExtBinary::verifySPMagic(uint64_t Magic) {
975be907324SWei Mi   if (Magic == SPMagic(SPF_Ext_Binary))
976be907324SWei Mi     return sampleprof_error::success;
977be907324SWei Mi   return sampleprof_error::bad_magic;
978be907324SWei Mi }
979be907324SWei Mi 
980a0c0857eSWei Mi std::error_code
981a0c0857eSWei Mi SampleProfileReaderCompactBinary::verifySPMagic(uint64_t Magic) {
982a0c0857eSWei Mi   if (Magic == SPMagic(SPF_Compact_Binary))
983a0c0857eSWei Mi     return sampleprof_error::success;
984a0c0857eSWei Mi   return sampleprof_error::bad_magic;
985a0c0857eSWei Mi }
986a0c0857eSWei Mi 
987be907324SWei Mi std::error_code SampleProfileReaderBinary::readNameTable() {
988a0c0857eSWei Mi   auto Size = readNumber<uint32_t>();
989a0c0857eSWei Mi   if (std::error_code EC = Size.getError())
990a0c0857eSWei Mi     return EC;
991a906e3ecSWei Mi   NameTable.reserve(*Size + NameTable.size());
992a0c0857eSWei Mi   for (uint32_t I = 0; I < *Size; ++I) {
993a0c0857eSWei Mi     auto Name(readString());
994a0c0857eSWei Mi     if (std::error_code EC = Name.getError())
995a0c0857eSWei Mi       return EC;
996a0c0857eSWei Mi     NameTable.push_back(*Name);
997a0c0857eSWei Mi   }
998a0c0857eSWei Mi 
999a0c0857eSWei Mi   return sampleprof_error::success;
1000a0c0857eSWei Mi }
1001a0c0857eSWei Mi 
100293953d41SWei Mi std::error_code SampleProfileReaderExtBinaryBase::readMD5NameTable() {
1003ebad6788SWei Mi   auto Size = readNumber<uint64_t>();
1004ebad6788SWei Mi   if (std::error_code EC = Size.getError())
1005ebad6788SWei Mi     return EC;
1006ebad6788SWei Mi   MD5StringBuf = std::make_unique<std::vector<std::string>>();
1007ebad6788SWei Mi   MD5StringBuf->reserve(*Size);
100864e76853SWei Mi   if (FixedLengthMD5) {
100964e76853SWei Mi     // Preallocate and initialize NameTable so we can check whether a name
101064e76853SWei Mi     // index has been read before by checking whether the element in the
101164e76853SWei Mi     // NameTable is empty, meanwhile readStringIndex can do the boundary
101264e76853SWei Mi     // check using the size of NameTable.
101364e76853SWei Mi     NameTable.resize(*Size + NameTable.size());
101464e76853SWei Mi 
101564e76853SWei Mi     MD5NameMemStart = Data;
101664e76853SWei Mi     Data = Data + (*Size) * sizeof(uint64_t);
101764e76853SWei Mi     return sampleprof_error::success;
101864e76853SWei Mi   }
101964e76853SWei Mi   NameTable.reserve(*Size);
1020ebad6788SWei Mi   for (uint32_t I = 0; I < *Size; ++I) {
1021ebad6788SWei Mi     auto FID = readNumber<uint64_t>();
1022ebad6788SWei Mi     if (std::error_code EC = FID.getError())
1023ebad6788SWei Mi       return EC;
1024ebad6788SWei Mi     MD5StringBuf->push_back(std::to_string(*FID));
1025ebad6788SWei Mi     // NameTable is a vector of StringRef. Here it is pushing back a
1026ebad6788SWei Mi     // StringRef initialized with the last string in MD5stringBuf.
1027ebad6788SWei Mi     NameTable.push_back(MD5StringBuf->back());
1028ebad6788SWei Mi   }
1029ebad6788SWei Mi   return sampleprof_error::success;
1030ebad6788SWei Mi }
1031ebad6788SWei Mi 
103293953d41SWei Mi std::error_code SampleProfileReaderExtBinaryBase::readNameTableSec(bool IsMD5) {
1033ebad6788SWei Mi   if (IsMD5)
1034ebad6788SWei Mi     return readMD5NameTable();
1035ebad6788SWei Mi   return SampleProfileReaderBinary::readNameTable();
1036ebad6788SWei Mi }
1037ebad6788SWei Mi 
1038b9db7036SHongtao Yu // Read in the CS name table section, which basically contains a list of context
1039b9db7036SHongtao Yu // vectors. Each element of a context vector, aka a frame, refers to the
1040b9db7036SHongtao Yu // underlying raw function names that are stored in the name table, as well as
1041b9db7036SHongtao Yu // a callsite identifier that only makes sense for non-leaf frames.
1042b9db7036SHongtao Yu std::error_code SampleProfileReaderExtBinaryBase::readCSNameTableSec() {
1043b9db7036SHongtao Yu   auto Size = readNumber<uint32_t>();
1044b9db7036SHongtao Yu   if (std::error_code EC = Size.getError())
1045b9db7036SHongtao Yu     return EC;
1046b9db7036SHongtao Yu 
1047b9db7036SHongtao Yu   std::vector<SampleContextFrameVector> *PNameVec =
1048b9db7036SHongtao Yu       new std::vector<SampleContextFrameVector>();
1049b9db7036SHongtao Yu   PNameVec->reserve(*Size);
1050b9db7036SHongtao Yu   for (uint32_t I = 0; I < *Size; ++I) {
1051b9db7036SHongtao Yu     PNameVec->emplace_back(SampleContextFrameVector());
1052b9db7036SHongtao Yu     auto ContextSize = readNumber<uint32_t>();
1053b9db7036SHongtao Yu     if (std::error_code EC = ContextSize.getError())
1054b9db7036SHongtao Yu       return EC;
1055b9db7036SHongtao Yu     for (uint32_t J = 0; J < *ContextSize; ++J) {
1056ac068e01SHongtao Yu       auto FName(readStringFromTable());
1057ac068e01SHongtao Yu       if (std::error_code EC = FName.getError())
1058ac068e01SHongtao Yu         return EC;
1059b9db7036SHongtao Yu       auto LineOffset = readNumber<uint64_t>();
1060b9db7036SHongtao Yu       if (std::error_code EC = LineOffset.getError())
1061b9db7036SHongtao Yu         return EC;
1062ac068e01SHongtao Yu 
1063b9db7036SHongtao Yu       if (!isOffsetLegal(*LineOffset))
1064b9db7036SHongtao Yu         return std::error_code();
10651410db70SWenlei He 
1066b9db7036SHongtao Yu       auto Discriminator = readNumber<uint64_t>();
1067b9db7036SHongtao Yu       if (std::error_code EC = Discriminator.getError())
1068b9db7036SHongtao Yu         return EC;
1069b9db7036SHongtao Yu 
1070b9db7036SHongtao Yu       PNameVec->back().emplace_back(
1071b9db7036SHongtao Yu           FName.get(), LineLocation(LineOffset.get(), Discriminator.get()));
1072b9db7036SHongtao Yu     }
1073b9db7036SHongtao Yu   }
1074b9db7036SHongtao Yu 
1075b9db7036SHongtao Yu   // From this point the underlying object of CSNameTable should be immutable.
1076b9db7036SHongtao Yu   CSNameTable.reset(PNameVec);
1077b9db7036SHongtao Yu   return sampleprof_error::success;
1078b9db7036SHongtao Yu }
1079b9db7036SHongtao Yu 
1080b9db7036SHongtao Yu std::error_code
1081b9db7036SHongtao Yu SampleProfileReaderExtBinaryBase::readFuncMetadata(bool ProfileHasAttribute) {
1082b9db7036SHongtao Yu   while (Data < End) {
1083b9db7036SHongtao Yu     auto FContext(readSampleContextFromTable());
1084b9db7036SHongtao Yu     if (std::error_code EC = FContext.getError())
1085b9db7036SHongtao Yu       return EC;
1086b9db7036SHongtao Yu 
1087b9db7036SHongtao Yu     bool ProfileInMap = Profiles.count(*FContext);
10881410db70SWenlei He     if (ProfileIsProbeBased) {
1089ac068e01SHongtao Yu       auto Checksum = readNumber<uint64_t>();
1090ac068e01SHongtao Yu       if (std::error_code EC = Checksum.getError())
1091ac068e01SHongtao Yu         return EC;
10921410db70SWenlei He       if (ProfileInMap)
1093b9db7036SHongtao Yu         Profiles[*FContext].setFunctionHash(*Checksum);
1094ac068e01SHongtao Yu     }
1095224fee82SHongtao Yu 
10961410db70SWenlei He     if (ProfileHasAttribute) {
10971410db70SWenlei He       auto Attributes = readNumber<uint32_t>();
10981410db70SWenlei He       if (std::error_code EC = Attributes.getError())
10991410db70SWenlei He         return EC;
11001410db70SWenlei He       if (ProfileInMap)
1101b9db7036SHongtao Yu         Profiles[*FContext].getContext().setAllAttributes(*Attributes);
11021410db70SWenlei He     }
11031410db70SWenlei He   }
11041410db70SWenlei He 
1105224fee82SHongtao Yu   assert(Data == End && "More data is read than expected");
1106ac068e01SHongtao Yu   return sampleprof_error::success;
1107ac068e01SHongtao Yu }
1108ac068e01SHongtao Yu 
1109a0c0857eSWei Mi std::error_code SampleProfileReaderCompactBinary::readNameTable() {
1110a0c0857eSWei Mi   auto Size = readNumber<uint64_t>();
1111a0c0857eSWei Mi   if (std::error_code EC = Size.getError())
1112a0c0857eSWei Mi     return EC;
1113a0c0857eSWei Mi   NameTable.reserve(*Size);
1114a0c0857eSWei Mi   for (uint32_t I = 0; I < *Size; ++I) {
1115a0c0857eSWei Mi     auto FID = readNumber<uint64_t>();
1116a0c0857eSWei Mi     if (std::error_code EC = FID.getError())
1117a0c0857eSWei Mi       return EC;
1118a0c0857eSWei Mi     NameTable.push_back(std::to_string(*FID));
1119a0c0857eSWei Mi   }
1120a0c0857eSWei Mi   return sampleprof_error::success;
1121a0c0857eSWei Mi }
1122a0c0857eSWei Mi 
1123a906e3ecSWei Mi std::error_code
1124a906e3ecSWei Mi SampleProfileReaderExtBinaryBase::readSecHdrTableEntry(uint32_t Idx) {
1125be907324SWei Mi   SecHdrTableEntry Entry;
1126be907324SWei Mi   auto Type = readUnencodedNumber<uint64_t>();
1127be907324SWei Mi   if (std::error_code EC = Type.getError())
1128be907324SWei Mi     return EC;
1129be907324SWei Mi   Entry.Type = static_cast<SecType>(*Type);
1130c572e92cSDiego Novillo 
1131b523790aSWei Mi   auto Flags = readUnencodedNumber<uint64_t>();
1132b523790aSWei Mi   if (std::error_code EC = Flags.getError())
1133be907324SWei Mi     return EC;
1134b523790aSWei Mi   Entry.Flags = *Flags;
1135be907324SWei Mi 
1136be907324SWei Mi   auto Offset = readUnencodedNumber<uint64_t>();
1137be907324SWei Mi   if (std::error_code EC = Offset.getError())
1138be907324SWei Mi     return EC;
1139be907324SWei Mi   Entry.Offset = *Offset;
1140be907324SWei Mi 
1141be907324SWei Mi   auto Size = readUnencodedNumber<uint64_t>();
1142be907324SWei Mi   if (std::error_code EC = Size.getError())
1143be907324SWei Mi     return EC;
1144be907324SWei Mi   Entry.Size = *Size;
1145be907324SWei Mi 
1146a906e3ecSWei Mi   Entry.LayoutIndex = Idx;
1147be907324SWei Mi   SecHdrTable.push_back(std::move(Entry));
1148be907324SWei Mi   return sampleprof_error::success;
1149be907324SWei Mi }
1150be907324SWei Mi 
1151be907324SWei Mi std::error_code SampleProfileReaderExtBinaryBase::readSecHdrTable() {
1152be907324SWei Mi   auto EntryNum = readUnencodedNumber<uint64_t>();
1153be907324SWei Mi   if (std::error_code EC = EntryNum.getError())
1154be907324SWei Mi     return EC;
1155be907324SWei Mi 
1156be907324SWei Mi   for (uint32_t i = 0; i < (*EntryNum); i++)
1157a906e3ecSWei Mi     if (std::error_code EC = readSecHdrTableEntry(i))
1158be907324SWei Mi       return EC;
1159be907324SWei Mi 
1160be907324SWei Mi   return sampleprof_error::success;
1161be907324SWei Mi }
1162be907324SWei Mi 
1163be907324SWei Mi std::error_code SampleProfileReaderExtBinaryBase::readHeader() {
1164be907324SWei Mi   const uint8_t *BufStart =
1165be907324SWei Mi       reinterpret_cast<const uint8_t *>(Buffer->getBufferStart());
1166be907324SWei Mi   Data = BufStart;
1167be907324SWei Mi   End = BufStart + Buffer->getBufferSize();
1168be907324SWei Mi 
1169be907324SWei Mi   if (std::error_code EC = readMagicIdent())
1170be907324SWei Mi     return EC;
1171be907324SWei Mi 
1172be907324SWei Mi   if (std::error_code EC = readSecHdrTable())
1173be907324SWei Mi     return EC;
1174be907324SWei Mi 
1175be907324SWei Mi   return sampleprof_error::success;
1176be907324SWei Mi }
1177be907324SWei Mi 
1178eee532cdSWei Mi uint64_t SampleProfileReaderExtBinaryBase::getSectionSize(SecType Type) {
1179a906e3ecSWei Mi   uint64_t Size = 0;
1180eee532cdSWei Mi   for (auto &Entry : SecHdrTable) {
1181eee532cdSWei Mi     if (Entry.Type == Type)
1182a906e3ecSWei Mi       Size += Entry.Size;
1183eee532cdSWei Mi   }
1184a906e3ecSWei Mi   return Size;
1185eee532cdSWei Mi }
1186eee532cdSWei Mi 
1187eee532cdSWei Mi uint64_t SampleProfileReaderExtBinaryBase::getFileSize() {
118809dcfe68SWei Mi   // Sections in SecHdrTable is not necessarily in the same order as
118909dcfe68SWei Mi   // sections in the profile because section like FuncOffsetTable needs
119009dcfe68SWei Mi   // to be written after section LBRProfile but needs to be read before
119109dcfe68SWei Mi   // section LBRProfile, so we cannot simply use the last entry in
119209dcfe68SWei Mi   // SecHdrTable to calculate the file size.
119309dcfe68SWei Mi   uint64_t FileSize = 0;
119409dcfe68SWei Mi   for (auto &Entry : SecHdrTable) {
119509dcfe68SWei Mi     FileSize = std::max(Entry.Offset + Entry.Size, FileSize);
119609dcfe68SWei Mi   }
119709dcfe68SWei Mi   return FileSize;
1198eee532cdSWei Mi }
1199eee532cdSWei Mi 
1200b49eac71SWei Mi static std::string getSecFlagsStr(const SecHdrTableEntry &Entry) {
1201b49eac71SWei Mi   std::string Flags;
1202b49eac71SWei Mi   if (hasSecFlag(Entry, SecCommonFlags::SecFlagCompress))
1203b49eac71SWei Mi     Flags.append("{compressed,");
1204b49eac71SWei Mi   else
1205b49eac71SWei Mi     Flags.append("{");
1206b49eac71SWei Mi 
120721b1ad03SWei Mi   if (hasSecFlag(Entry, SecCommonFlags::SecFlagFlat))
120821b1ad03SWei Mi     Flags.append("flat,");
120921b1ad03SWei Mi 
1210b49eac71SWei Mi   switch (Entry.Type) {
1211b49eac71SWei Mi   case SecNameTable:
121264e76853SWei Mi     if (hasSecFlag(Entry, SecNameTableFlags::SecFlagFixedLengthMD5))
121364e76853SWei Mi       Flags.append("fixlenmd5,");
121464e76853SWei Mi     else if (hasSecFlag(Entry, SecNameTableFlags::SecFlagMD5Name))
1215b49eac71SWei Mi       Flags.append("md5,");
1216ee35784aSWei Mi     if (hasSecFlag(Entry, SecNameTableFlags::SecFlagUniqSuffix))
1217ee35784aSWei Mi       Flags.append("uniq,");
1218b49eac71SWei Mi     break;
1219b49eac71SWei Mi   case SecProfSummary:
1220b49eac71SWei Mi     if (hasSecFlag(Entry, SecProfSummaryFlags::SecFlagPartial))
1221b49eac71SWei Mi       Flags.append("partial,");
1222a5d30421SWenlei He     if (hasSecFlag(Entry, SecProfSummaryFlags::SecFlagFullContext))
1223a5d30421SWenlei He       Flags.append("context,");
12246745ffe4SRong Xu     if (hasSecFlag(Entry, SecProfSummaryFlags::SecFlagFSDiscriminator))
12256745ffe4SRong Xu       Flags.append("fs-discriminator,");
1226b49eac71SWei Mi     break;
1227f4711e0dSHongtao Yu   case SecFuncOffsetTable:
1228f4711e0dSHongtao Yu     if (hasSecFlag(Entry, SecFuncOffsetFlags::SecFlagOrdered))
1229f4711e0dSHongtao Yu       Flags.append("ordered,");
1230f4711e0dSHongtao Yu     break;
1231*d0eb472fSHongtao Yu   case SecFuncMetadata:
1232*d0eb472fSHongtao Yu     if (hasSecFlag(Entry, SecFuncMetadataFlags::SecFlagIsProbeBased))
1233*d0eb472fSHongtao Yu       Flags.append("probe,");
1234*d0eb472fSHongtao Yu     if (hasSecFlag(Entry, SecFuncMetadataFlags::SecFlagHasAttribute))
1235*d0eb472fSHongtao Yu       Flags.append("attr,");
1236*d0eb472fSHongtao Yu     break;
1237b49eac71SWei Mi   default:
1238b49eac71SWei Mi     break;
1239b49eac71SWei Mi   }
1240b49eac71SWei Mi   char &last = Flags.back();
1241b49eac71SWei Mi   if (last == ',')
1242b49eac71SWei Mi     last = '}';
1243b49eac71SWei Mi   else
1244b49eac71SWei Mi     Flags.append("}");
1245b49eac71SWei Mi   return Flags;
1246b49eac71SWei Mi }
1247b49eac71SWei Mi 
1248eee532cdSWei Mi bool SampleProfileReaderExtBinaryBase::dumpSectionInfo(raw_ostream &OS) {
1249eee532cdSWei Mi   uint64_t TotalSecsSize = 0;
1250eee532cdSWei Mi   for (auto &Entry : SecHdrTable) {
1251eee532cdSWei Mi     OS << getSecName(Entry.Type) << " - Offset: " << Entry.Offset
1252b49eac71SWei Mi        << ", Size: " << Entry.Size << ", Flags: " << getSecFlagsStr(Entry)
1253b49eac71SWei Mi        << "\n";
1254b49eac71SWei Mi     ;
1255a906e3ecSWei Mi     TotalSecsSize += Entry.Size;
1256eee532cdSWei Mi   }
1257eee532cdSWei Mi   uint64_t HeaderSize = SecHdrTable.front().Offset;
1258eee532cdSWei Mi   assert(HeaderSize + TotalSecsSize == getFileSize() &&
1259eee532cdSWei Mi          "Size of 'header + sections' doesn't match the total size of profile");
1260eee532cdSWei Mi 
1261eee532cdSWei Mi   OS << "Header Size: " << HeaderSize << "\n";
1262eee532cdSWei Mi   OS << "Total Sections Size: " << TotalSecsSize << "\n";
1263eee532cdSWei Mi   OS << "File Size: " << getFileSize() << "\n";
1264eee532cdSWei Mi   return true;
1265eee532cdSWei Mi }
1266eee532cdSWei Mi 
1267be907324SWei Mi std::error_code SampleProfileReaderBinary::readMagicIdent() {
1268c572e92cSDiego Novillo   // Read and check the magic identifier.
1269c572e92cSDiego Novillo   auto Magic = readNumber<uint64_t>();
1270c572e92cSDiego Novillo   if (std::error_code EC = Magic.getError())
1271c572e92cSDiego Novillo     return EC;
1272a0c0857eSWei Mi   else if (std::error_code EC = verifySPMagic(*Magic))
1273c6b96c8dSWei Mi     return EC;
1274c572e92cSDiego Novillo 
1275c572e92cSDiego Novillo   // Read the version number.
1276c572e92cSDiego Novillo   auto Version = readNumber<uint64_t>();
1277c572e92cSDiego Novillo   if (std::error_code EC = Version.getError())
1278c572e92cSDiego Novillo     return EC;
1279c572e92cSDiego Novillo   else if (*Version != SPVersion())
1280c572e92cSDiego Novillo     return sampleprof_error::unsupported_version;
1281c572e92cSDiego Novillo 
1282be907324SWei Mi   return sampleprof_error::success;
1283be907324SWei Mi }
1284be907324SWei Mi 
1285be907324SWei Mi std::error_code SampleProfileReaderBinary::readHeader() {
1286be907324SWei Mi   Data = reinterpret_cast<const uint8_t *>(Buffer->getBufferStart());
1287be907324SWei Mi   End = Data + Buffer->getBufferSize();
1288be907324SWei Mi 
1289be907324SWei Mi   if (std::error_code EC = readMagicIdent())
1290be907324SWei Mi     return EC;
1291be907324SWei Mi 
129240ee23dbSEaswaran Raman   if (std::error_code EC = readSummary())
129340ee23dbSEaswaran Raman     return EC;
129440ee23dbSEaswaran Raman 
1295a0c0857eSWei Mi   if (std::error_code EC = readNameTable())
1296760c5a8fSDiego Novillo     return EC;
1297c572e92cSDiego Novillo   return sampleprof_error::success;
1298c572e92cSDiego Novillo }
1299c572e92cSDiego Novillo 
13006a14325dSWei Mi std::error_code SampleProfileReaderCompactBinary::readHeader() {
13016a14325dSWei Mi   SampleProfileReaderBinary::readHeader();
13026a14325dSWei Mi   if (std::error_code EC = readFuncOffsetTable())
13036a14325dSWei Mi     return EC;
13046a14325dSWei Mi   return sampleprof_error::success;
13056a14325dSWei Mi }
13066a14325dSWei Mi 
13076a14325dSWei Mi std::error_code SampleProfileReaderCompactBinary::readFuncOffsetTable() {
13086a14325dSWei Mi   auto TableOffset = readUnencodedNumber<uint64_t>();
13096a14325dSWei Mi   if (std::error_code EC = TableOffset.getError())
13106a14325dSWei Mi     return EC;
13116a14325dSWei Mi 
13126a14325dSWei Mi   const uint8_t *SavedData = Data;
13136a14325dSWei Mi   const uint8_t *TableStart =
13146a14325dSWei Mi       reinterpret_cast<const uint8_t *>(Buffer->getBufferStart()) +
13156a14325dSWei Mi       *TableOffset;
13166a14325dSWei Mi   Data = TableStart;
13176a14325dSWei Mi 
13186a14325dSWei Mi   auto Size = readNumber<uint64_t>();
13196a14325dSWei Mi   if (std::error_code EC = Size.getError())
13206a14325dSWei Mi     return EC;
13216a14325dSWei Mi 
13226a14325dSWei Mi   FuncOffsetTable.reserve(*Size);
13236a14325dSWei Mi   for (uint32_t I = 0; I < *Size; ++I) {
13246a14325dSWei Mi     auto FName(readStringFromTable());
13256a14325dSWei Mi     if (std::error_code EC = FName.getError())
13266a14325dSWei Mi       return EC;
13276a14325dSWei Mi 
13286a14325dSWei Mi     auto Offset = readNumber<uint64_t>();
13296a14325dSWei Mi     if (std::error_code EC = Offset.getError())
13306a14325dSWei Mi       return EC;
13316a14325dSWei Mi 
13326a14325dSWei Mi     FuncOffsetTable[*FName] = *Offset;
13336a14325dSWei Mi   }
13346a14325dSWei Mi   End = TableStart;
13356a14325dSWei Mi   Data = SavedData;
13366a14325dSWei Mi   return sampleprof_error::success;
13376a14325dSWei Mi }
13386a14325dSWei Mi 
1339ee35784aSWei Mi bool SampleProfileReaderCompactBinary::collectFuncsFromModule() {
1340ee35784aSWei Mi   if (!M)
1341ee35784aSWei Mi     return false;
13426a14325dSWei Mi   FuncsToUse.clear();
1343ee35784aSWei Mi   for (auto &F : *M)
134409dcfe68SWei Mi     FuncsToUse.insert(FunctionSamples::getCanonicalFnName(F));
1345ee35784aSWei Mi   return true;
13466a14325dSWei Mi }
13476a14325dSWei Mi 
134840ee23dbSEaswaran Raman std::error_code SampleProfileReaderBinary::readSummaryEntry(
134940ee23dbSEaswaran Raman     std::vector<ProfileSummaryEntry> &Entries) {
135040ee23dbSEaswaran Raman   auto Cutoff = readNumber<uint64_t>();
135140ee23dbSEaswaran Raman   if (std::error_code EC = Cutoff.getError())
135240ee23dbSEaswaran Raman     return EC;
135340ee23dbSEaswaran Raman 
135440ee23dbSEaswaran Raman   auto MinBlockCount = readNumber<uint64_t>();
135540ee23dbSEaswaran Raman   if (std::error_code EC = MinBlockCount.getError())
135640ee23dbSEaswaran Raman     return EC;
135740ee23dbSEaswaran Raman 
135840ee23dbSEaswaran Raman   auto NumBlocks = readNumber<uint64_t>();
135940ee23dbSEaswaran Raman   if (std::error_code EC = NumBlocks.getError())
136040ee23dbSEaswaran Raman     return EC;
136140ee23dbSEaswaran Raman 
136240ee23dbSEaswaran Raman   Entries.emplace_back(*Cutoff, *MinBlockCount, *NumBlocks);
136340ee23dbSEaswaran Raman   return sampleprof_error::success;
136440ee23dbSEaswaran Raman }
136540ee23dbSEaswaran Raman 
136640ee23dbSEaswaran Raman std::error_code SampleProfileReaderBinary::readSummary() {
136740ee23dbSEaswaran Raman   auto TotalCount = readNumber<uint64_t>();
136840ee23dbSEaswaran Raman   if (std::error_code EC = TotalCount.getError())
136940ee23dbSEaswaran Raman     return EC;
137040ee23dbSEaswaran Raman 
137140ee23dbSEaswaran Raman   auto MaxBlockCount = readNumber<uint64_t>();
137240ee23dbSEaswaran Raman   if (std::error_code EC = MaxBlockCount.getError())
137340ee23dbSEaswaran Raman     return EC;
137440ee23dbSEaswaran Raman 
137540ee23dbSEaswaran Raman   auto MaxFunctionCount = readNumber<uint64_t>();
137640ee23dbSEaswaran Raman   if (std::error_code EC = MaxFunctionCount.getError())
137740ee23dbSEaswaran Raman     return EC;
137840ee23dbSEaswaran Raman 
137940ee23dbSEaswaran Raman   auto NumBlocks = readNumber<uint64_t>();
138040ee23dbSEaswaran Raman   if (std::error_code EC = NumBlocks.getError())
138140ee23dbSEaswaran Raman     return EC;
138240ee23dbSEaswaran Raman 
138340ee23dbSEaswaran Raman   auto NumFunctions = readNumber<uint64_t>();
138440ee23dbSEaswaran Raman   if (std::error_code EC = NumFunctions.getError())
138540ee23dbSEaswaran Raman     return EC;
138640ee23dbSEaswaran Raman 
138740ee23dbSEaswaran Raman   auto NumSummaryEntries = readNumber<uint64_t>();
138840ee23dbSEaswaran Raman   if (std::error_code EC = NumSummaryEntries.getError())
138940ee23dbSEaswaran Raman     return EC;
139040ee23dbSEaswaran Raman 
139140ee23dbSEaswaran Raman   std::vector<ProfileSummaryEntry> Entries;
139240ee23dbSEaswaran Raman   for (unsigned i = 0; i < *NumSummaryEntries; i++) {
139340ee23dbSEaswaran Raman     std::error_code EC = readSummaryEntry(Entries);
139440ee23dbSEaswaran Raman     if (EC != sampleprof_error::success)
139540ee23dbSEaswaran Raman       return EC;
139640ee23dbSEaswaran Raman   }
13970eaee545SJonas Devlieghere   Summary = std::make_unique<ProfileSummary>(
13987cefdb81SEaswaran Raman       ProfileSummary::PSK_Sample, Entries, *TotalCount, *MaxBlockCount, 0,
13997cefdb81SEaswaran Raman       *MaxFunctionCount, *NumBlocks, *NumFunctions);
140040ee23dbSEaswaran Raman 
140140ee23dbSEaswaran Raman   return sampleprof_error::success;
140240ee23dbSEaswaran Raman }
140340ee23dbSEaswaran Raman 
1404a0c0857eSWei Mi bool SampleProfileReaderRawBinary::hasFormat(const MemoryBuffer &Buffer) {
1405c572e92cSDiego Novillo   const uint8_t *Data =
1406c572e92cSDiego Novillo       reinterpret_cast<const uint8_t *>(Buffer.getBufferStart());
1407c572e92cSDiego Novillo   uint64_t Magic = decodeULEB128(Data);
1408c572e92cSDiego Novillo   return Magic == SPMagic();
1409c572e92cSDiego Novillo }
1410c572e92cSDiego Novillo 
1411be907324SWei Mi bool SampleProfileReaderExtBinary::hasFormat(const MemoryBuffer &Buffer) {
1412be907324SWei Mi   const uint8_t *Data =
1413be907324SWei Mi       reinterpret_cast<const uint8_t *>(Buffer.getBufferStart());
1414be907324SWei Mi   uint64_t Magic = decodeULEB128(Data);
1415be907324SWei Mi   return Magic == SPMagic(SPF_Ext_Binary);
1416be907324SWei Mi }
1417be907324SWei Mi 
1418a0c0857eSWei Mi bool SampleProfileReaderCompactBinary::hasFormat(const MemoryBuffer &Buffer) {
1419a0c0857eSWei Mi   const uint8_t *Data =
1420a0c0857eSWei Mi       reinterpret_cast<const uint8_t *>(Buffer.getBufferStart());
1421a0c0857eSWei Mi   uint64_t Magic = decodeULEB128(Data);
1422a0c0857eSWei Mi   return Magic == SPMagic(SPF_Compact_Binary);
1423a0c0857eSWei Mi }
1424a0c0857eSWei Mi 
14253376a787SDiego Novillo std::error_code SampleProfileReaderGCC::skipNextWord() {
14263376a787SDiego Novillo   uint32_t dummy;
14273376a787SDiego Novillo   if (!GcovBuffer.readInt(dummy))
14283376a787SDiego Novillo     return sampleprof_error::truncated;
14293376a787SDiego Novillo   return sampleprof_error::success;
14303376a787SDiego Novillo }
14313376a787SDiego Novillo 
14323376a787SDiego Novillo template <typename T> ErrorOr<T> SampleProfileReaderGCC::readNumber() {
14333376a787SDiego Novillo   if (sizeof(T) <= sizeof(uint32_t)) {
14343376a787SDiego Novillo     uint32_t Val;
14353376a787SDiego Novillo     if (GcovBuffer.readInt(Val) && Val <= std::numeric_limits<T>::max())
14363376a787SDiego Novillo       return static_cast<T>(Val);
14373376a787SDiego Novillo   } else if (sizeof(T) <= sizeof(uint64_t)) {
14383376a787SDiego Novillo     uint64_t Val;
14393376a787SDiego Novillo     if (GcovBuffer.readInt64(Val) && Val <= std::numeric_limits<T>::max())
14403376a787SDiego Novillo       return static_cast<T>(Val);
14413376a787SDiego Novillo   }
14423376a787SDiego Novillo 
14433376a787SDiego Novillo   std::error_code EC = sampleprof_error::malformed;
14443376a787SDiego Novillo   reportError(0, EC.message());
14453376a787SDiego Novillo   return EC;
14463376a787SDiego Novillo }
14473376a787SDiego Novillo 
14483376a787SDiego Novillo ErrorOr<StringRef> SampleProfileReaderGCC::readString() {
14493376a787SDiego Novillo   StringRef Str;
14503376a787SDiego Novillo   if (!GcovBuffer.readString(Str))
14513376a787SDiego Novillo     return sampleprof_error::truncated;
14523376a787SDiego Novillo   return Str;
14533376a787SDiego Novillo }
14543376a787SDiego Novillo 
14553376a787SDiego Novillo std::error_code SampleProfileReaderGCC::readHeader() {
14563376a787SDiego Novillo   // Read the magic identifier.
14573376a787SDiego Novillo   if (!GcovBuffer.readGCDAFormat())
14583376a787SDiego Novillo     return sampleprof_error::unrecognized_format;
14593376a787SDiego Novillo 
14603376a787SDiego Novillo   // Read the version number. Note - the GCC reader does not validate this
14613376a787SDiego Novillo   // version, but the profile creator generates v704.
14623376a787SDiego Novillo   GCOV::GCOVVersion version;
14633376a787SDiego Novillo   if (!GcovBuffer.readGCOVVersion(version))
14643376a787SDiego Novillo     return sampleprof_error::unrecognized_format;
14653376a787SDiego Novillo 
14662d00eb17SFangrui Song   if (version != GCOV::V407)
14673376a787SDiego Novillo     return sampleprof_error::unsupported_version;
14683376a787SDiego Novillo 
14693376a787SDiego Novillo   // Skip the empty integer.
14703376a787SDiego Novillo   if (std::error_code EC = skipNextWord())
14713376a787SDiego Novillo     return EC;
14723376a787SDiego Novillo 
14733376a787SDiego Novillo   return sampleprof_error::success;
14743376a787SDiego Novillo }
14753376a787SDiego Novillo 
14763376a787SDiego Novillo std::error_code SampleProfileReaderGCC::readSectionTag(uint32_t Expected) {
14773376a787SDiego Novillo   uint32_t Tag;
14783376a787SDiego Novillo   if (!GcovBuffer.readInt(Tag))
14793376a787SDiego Novillo     return sampleprof_error::truncated;
14803376a787SDiego Novillo 
14813376a787SDiego Novillo   if (Tag != Expected)
14823376a787SDiego Novillo     return sampleprof_error::malformed;
14833376a787SDiego Novillo 
14843376a787SDiego Novillo   if (std::error_code EC = skipNextWord())
14853376a787SDiego Novillo     return EC;
14863376a787SDiego Novillo 
14873376a787SDiego Novillo   return sampleprof_error::success;
14883376a787SDiego Novillo }
14893376a787SDiego Novillo 
14903376a787SDiego Novillo std::error_code SampleProfileReaderGCC::readNameTable() {
14913376a787SDiego Novillo   if (std::error_code EC = readSectionTag(GCOVTagAFDOFileNames))
14923376a787SDiego Novillo     return EC;
14933376a787SDiego Novillo 
14943376a787SDiego Novillo   uint32_t Size;
14953376a787SDiego Novillo   if (!GcovBuffer.readInt(Size))
14963376a787SDiego Novillo     return sampleprof_error::truncated;
14973376a787SDiego Novillo 
14983376a787SDiego Novillo   for (uint32_t I = 0; I < Size; ++I) {
14993376a787SDiego Novillo     StringRef Str;
15003376a787SDiego Novillo     if (!GcovBuffer.readString(Str))
15013376a787SDiego Novillo       return sampleprof_error::truncated;
1502adcd0268SBenjamin Kramer     Names.push_back(std::string(Str));
15033376a787SDiego Novillo   }
15043376a787SDiego Novillo 
15053376a787SDiego Novillo   return sampleprof_error::success;
15063376a787SDiego Novillo }
15073376a787SDiego Novillo 
15083376a787SDiego Novillo std::error_code SampleProfileReaderGCC::readFunctionProfiles() {
15093376a787SDiego Novillo   if (std::error_code EC = readSectionTag(GCOVTagAFDOFunction))
15103376a787SDiego Novillo     return EC;
15113376a787SDiego Novillo 
15123376a787SDiego Novillo   uint32_t NumFunctions;
15133376a787SDiego Novillo   if (!GcovBuffer.readInt(NumFunctions))
15143376a787SDiego Novillo     return sampleprof_error::truncated;
15153376a787SDiego Novillo 
1516aae1ed8eSDiego Novillo   InlineCallStack Stack;
15173376a787SDiego Novillo   for (uint32_t I = 0; I < NumFunctions; ++I)
1518aae1ed8eSDiego Novillo     if (std::error_code EC = readOneFunctionProfile(Stack, true, 0))
15193376a787SDiego Novillo       return EC;
15203376a787SDiego Novillo 
152140ee23dbSEaswaran Raman   computeSummary();
15223376a787SDiego Novillo   return sampleprof_error::success;
15233376a787SDiego Novillo }
15243376a787SDiego Novillo 
1525aae1ed8eSDiego Novillo std::error_code SampleProfileReaderGCC::readOneFunctionProfile(
1526aae1ed8eSDiego Novillo     const InlineCallStack &InlineStack, bool Update, uint32_t Offset) {
15273376a787SDiego Novillo   uint64_t HeadCount = 0;
1528aae1ed8eSDiego Novillo   if (InlineStack.size() == 0)
15293376a787SDiego Novillo     if (!GcovBuffer.readInt64(HeadCount))
15303376a787SDiego Novillo       return sampleprof_error::truncated;
15313376a787SDiego Novillo 
15323376a787SDiego Novillo   uint32_t NameIdx;
15333376a787SDiego Novillo   if (!GcovBuffer.readInt(NameIdx))
15343376a787SDiego Novillo     return sampleprof_error::truncated;
15353376a787SDiego Novillo 
15363376a787SDiego Novillo   StringRef Name(Names[NameIdx]);
15373376a787SDiego Novillo 
15383376a787SDiego Novillo   uint32_t NumPosCounts;
15393376a787SDiego Novillo   if (!GcovBuffer.readInt(NumPosCounts))
15403376a787SDiego Novillo     return sampleprof_error::truncated;
15413376a787SDiego Novillo 
1542aae1ed8eSDiego Novillo   uint32_t NumCallsites;
1543aae1ed8eSDiego Novillo   if (!GcovBuffer.readInt(NumCallsites))
15443376a787SDiego Novillo     return sampleprof_error::truncated;
15453376a787SDiego Novillo 
1546aae1ed8eSDiego Novillo   FunctionSamples *FProfile = nullptr;
1547aae1ed8eSDiego Novillo   if (InlineStack.size() == 0) {
1548aae1ed8eSDiego Novillo     // If this is a top function that we have already processed, do not
1549aae1ed8eSDiego Novillo     // update its profile again.  This happens in the presence of
1550aae1ed8eSDiego Novillo     // function aliases.  Since these aliases share the same function
1551aae1ed8eSDiego Novillo     // body, there will be identical replicated profiles for the
1552aae1ed8eSDiego Novillo     // original function.  In this case, we simply not bother updating
1553aae1ed8eSDiego Novillo     // the profile of the original function.
1554aae1ed8eSDiego Novillo     FProfile = &Profiles[Name];
1555aae1ed8eSDiego Novillo     FProfile->addHeadSamples(HeadCount);
1556aae1ed8eSDiego Novillo     if (FProfile->getTotalSamples() > 0)
15573376a787SDiego Novillo       Update = false;
1558aae1ed8eSDiego Novillo   } else {
1559aae1ed8eSDiego Novillo     // Otherwise, we are reading an inlined instance. The top of the
1560aae1ed8eSDiego Novillo     // inline stack contains the profile of the caller. Insert this
1561aae1ed8eSDiego Novillo     // callee in the caller's CallsiteMap.
1562aae1ed8eSDiego Novillo     FunctionSamples *CallerProfile = InlineStack.front();
1563aae1ed8eSDiego Novillo     uint32_t LineOffset = Offset >> 16;
1564aae1ed8eSDiego Novillo     uint32_t Discriminator = Offset & 0xffff;
1565aae1ed8eSDiego Novillo     FProfile = &CallerProfile->functionSamplesAt(
1566adcd0268SBenjamin Kramer         LineLocation(LineOffset, Discriminator))[std::string(Name)];
15673376a787SDiego Novillo   }
156857d1dda5SDehao Chen   FProfile->setName(Name);
15693376a787SDiego Novillo 
15703376a787SDiego Novillo   for (uint32_t I = 0; I < NumPosCounts; ++I) {
15713376a787SDiego Novillo     uint32_t Offset;
15723376a787SDiego Novillo     if (!GcovBuffer.readInt(Offset))
15733376a787SDiego Novillo       return sampleprof_error::truncated;
15743376a787SDiego Novillo 
15753376a787SDiego Novillo     uint32_t NumTargets;
15763376a787SDiego Novillo     if (!GcovBuffer.readInt(NumTargets))
15773376a787SDiego Novillo       return sampleprof_error::truncated;
15783376a787SDiego Novillo 
15793376a787SDiego Novillo     uint64_t Count;
15803376a787SDiego Novillo     if (!GcovBuffer.readInt64(Count))
15813376a787SDiego Novillo       return sampleprof_error::truncated;
15823376a787SDiego Novillo 
1583aae1ed8eSDiego Novillo     // The line location is encoded in the offset as:
1584aae1ed8eSDiego Novillo     //   high 16 bits: line offset to the start of the function.
1585aae1ed8eSDiego Novillo     //   low 16 bits: discriminator.
1586aae1ed8eSDiego Novillo     uint32_t LineOffset = Offset >> 16;
1587aae1ed8eSDiego Novillo     uint32_t Discriminator = Offset & 0xffff;
15883376a787SDiego Novillo 
1589aae1ed8eSDiego Novillo     InlineCallStack NewStack;
1590aae1ed8eSDiego Novillo     NewStack.push_back(FProfile);
15911d0bc055SKazu Hirata     llvm::append_range(NewStack, InlineStack);
1592aae1ed8eSDiego Novillo     if (Update) {
1593aae1ed8eSDiego Novillo       // Walk up the inline stack, adding the samples on this line to
1594aae1ed8eSDiego Novillo       // the total sample count of the callers in the chain.
1595aae1ed8eSDiego Novillo       for (auto CallerProfile : NewStack)
1596aae1ed8eSDiego Novillo         CallerProfile->addTotalSamples(Count);
1597aae1ed8eSDiego Novillo 
1598aae1ed8eSDiego Novillo       // Update the body samples for the current profile.
1599aae1ed8eSDiego Novillo       FProfile->addBodySamples(LineOffset, Discriminator, Count);
1600aae1ed8eSDiego Novillo     }
1601aae1ed8eSDiego Novillo 
1602aae1ed8eSDiego Novillo     // Process the list of functions called at an indirect call site.
1603aae1ed8eSDiego Novillo     // These are all the targets that a function pointer (or virtual
1604aae1ed8eSDiego Novillo     // function) resolved at runtime.
16053376a787SDiego Novillo     for (uint32_t J = 0; J < NumTargets; J++) {
16063376a787SDiego Novillo       uint32_t HistVal;
16073376a787SDiego Novillo       if (!GcovBuffer.readInt(HistVal))
16083376a787SDiego Novillo         return sampleprof_error::truncated;
16093376a787SDiego Novillo 
16103376a787SDiego Novillo       if (HistVal != HIST_TYPE_INDIR_CALL_TOPN)
16113376a787SDiego Novillo         return sampleprof_error::malformed;
16123376a787SDiego Novillo 
16133376a787SDiego Novillo       uint64_t TargetIdx;
16143376a787SDiego Novillo       if (!GcovBuffer.readInt64(TargetIdx))
16153376a787SDiego Novillo         return sampleprof_error::truncated;
16163376a787SDiego Novillo       StringRef TargetName(Names[TargetIdx]);
16173376a787SDiego Novillo 
16183376a787SDiego Novillo       uint64_t TargetCount;
16193376a787SDiego Novillo       if (!GcovBuffer.readInt64(TargetCount))
16203376a787SDiego Novillo         return sampleprof_error::truncated;
16213376a787SDiego Novillo 
1622920677a9SDehao Chen       if (Update)
1623920677a9SDehao Chen         FProfile->addCalledTargetSamples(LineOffset, Discriminator,
1624aae1ed8eSDiego Novillo                                          TargetName, TargetCount);
16253376a787SDiego Novillo     }
16263376a787SDiego Novillo   }
16273376a787SDiego Novillo 
1628aae1ed8eSDiego Novillo   // Process all the inlined callers into the current function. These
1629aae1ed8eSDiego Novillo   // are all the callsites that were inlined into this function.
1630aae1ed8eSDiego Novillo   for (uint32_t I = 0; I < NumCallsites; I++) {
16313376a787SDiego Novillo     // The offset is encoded as:
16323376a787SDiego Novillo     //   high 16 bits: line offset to the start of the function.
16333376a787SDiego Novillo     //   low 16 bits: discriminator.
16343376a787SDiego Novillo     uint32_t Offset;
16353376a787SDiego Novillo     if (!GcovBuffer.readInt(Offset))
16363376a787SDiego Novillo       return sampleprof_error::truncated;
1637aae1ed8eSDiego Novillo     InlineCallStack NewStack;
1638aae1ed8eSDiego Novillo     NewStack.push_back(FProfile);
16391d0bc055SKazu Hirata     llvm::append_range(NewStack, InlineStack);
1640aae1ed8eSDiego Novillo     if (std::error_code EC = readOneFunctionProfile(NewStack, Update, Offset))
16413376a787SDiego Novillo       return EC;
16423376a787SDiego Novillo   }
16433376a787SDiego Novillo 
16443376a787SDiego Novillo   return sampleprof_error::success;
16453376a787SDiego Novillo }
16463376a787SDiego Novillo 
16475f8f34e4SAdrian Prantl /// Read a GCC AutoFDO profile.
16483376a787SDiego Novillo ///
16493376a787SDiego Novillo /// This format is generated by the Linux Perf conversion tool at
16503376a787SDiego Novillo /// https://github.com/google/autofdo.
16518c8ec1f6SWei Mi std::error_code SampleProfileReaderGCC::readImpl() {
16526745ffe4SRong Xu   assert(!ProfileIsFSDisciminator && "Gcc profiles not support FSDisciminator");
16533376a787SDiego Novillo   // Read the string table.
16543376a787SDiego Novillo   if (std::error_code EC = readNameTable())
16553376a787SDiego Novillo     return EC;
16563376a787SDiego Novillo 
16573376a787SDiego Novillo   // Read the source profile.
16583376a787SDiego Novillo   if (std::error_code EC = readFunctionProfiles())
16593376a787SDiego Novillo     return EC;
16603376a787SDiego Novillo 
16613376a787SDiego Novillo   return sampleprof_error::success;
16623376a787SDiego Novillo }
16633376a787SDiego Novillo 
16643376a787SDiego Novillo bool SampleProfileReaderGCC::hasFormat(const MemoryBuffer &Buffer) {
16653376a787SDiego Novillo   StringRef Magic(reinterpret_cast<const char *>(Buffer.getBufferStart()));
16663376a787SDiego Novillo   return Magic == "adcg*704";
16673376a787SDiego Novillo }
16683376a787SDiego Novillo 
16698c8ec1f6SWei Mi void SampleProfileReaderItaniumRemapper::applyRemapping(LLVMContext &Ctx) {
1670ebad6788SWei Mi   // If the reader uses MD5 to represent string, we can't remap it because
167128436358SRichard Smith   // we don't know what the original function names were.
1672ebad6788SWei Mi   if (Reader.useMD5()) {
167328436358SRichard Smith     Ctx.diagnose(DiagnosticInfoSampleProfile(
16748c8ec1f6SWei Mi         Reader.getBuffer()->getBufferIdentifier(),
167528436358SRichard Smith         "Profile data remapping cannot be applied to profile data "
167628436358SRichard Smith         "in compact format (original mangled names are not available).",
167728436358SRichard Smith         DS_Warning));
16788c8ec1f6SWei Mi     return;
167928436358SRichard Smith   }
168028436358SRichard Smith 
16816b989a17SWenlei He   // CSSPGO-TODO: Remapper is not yet supported.
16826b989a17SWenlei He   // We will need to remap the entire context string.
16838c8ec1f6SWei Mi   assert(Remappings && "should be initialized while creating remapper");
1684c67ccf5fSWei Mi   for (auto &Sample : Reader.getProfiles()) {
1685c67ccf5fSWei Mi     DenseSet<StringRef> NamesInSample;
1686c67ccf5fSWei Mi     Sample.second.findAllNames(NamesInSample);
1687c67ccf5fSWei Mi     for (auto &Name : NamesInSample)
1688c67ccf5fSWei Mi       if (auto Key = Remappings->insert(Name))
1689c67ccf5fSWei Mi         NameMap.insert({Key, Name});
1690c67ccf5fSWei Mi   }
169128436358SRichard Smith 
16928c8ec1f6SWei Mi   RemappingApplied = true;
169328436358SRichard Smith }
169428436358SRichard Smith 
1695c67ccf5fSWei Mi Optional<StringRef>
1696c67ccf5fSWei Mi SampleProfileReaderItaniumRemapper::lookUpNameInProfile(StringRef Fname) {
16978c8ec1f6SWei Mi   if (auto Key = Remappings->lookup(Fname))
1698c67ccf5fSWei Mi     return NameMap.lookup(Key);
1699c67ccf5fSWei Mi   return None;
170028436358SRichard Smith }
170128436358SRichard Smith 
17025f8f34e4SAdrian Prantl /// Prepare a memory buffer for the contents of \p Filename.
1703de1ab26fSDiego Novillo ///
1704c572e92cSDiego Novillo /// \returns an error code indicating the status of the buffer.
1705fcd55607SDiego Novillo static ErrorOr<std::unique_ptr<MemoryBuffer>>
17060da23a27SBenjamin Kramer setupMemoryBuffer(const Twine &Filename) {
1707e71994a2SJonathan Crowther   auto BufferOrErr = MemoryBuffer::getFileOrSTDIN(Filename, /*IsText=*/true);
1708c572e92cSDiego Novillo   if (std::error_code EC = BufferOrErr.getError())
1709c572e92cSDiego Novillo     return EC;
1710fcd55607SDiego Novillo   auto Buffer = std::move(BufferOrErr.get());
1711c572e92cSDiego Novillo 
1712c572e92cSDiego Novillo   // Sanity check the file.
1713260fe3ecSZachary Turner   if (uint64_t(Buffer->getBufferSize()) > std::numeric_limits<uint32_t>::max())
1714c572e92cSDiego Novillo     return sampleprof_error::too_large;
1715c572e92cSDiego Novillo 
1716c55cf4afSBill Wendling   return std::move(Buffer);
1717c572e92cSDiego Novillo }
1718c572e92cSDiego Novillo 
17195f8f34e4SAdrian Prantl /// Create a sample profile reader based on the format of the input file.
1720c572e92cSDiego Novillo ///
1721c572e92cSDiego Novillo /// \param Filename The file to open.
1722c572e92cSDiego Novillo ///
1723c572e92cSDiego Novillo /// \param C The LLVM context to use to emit diagnostics.
1724c572e92cSDiego Novillo ///
17258d581857SRong Xu /// \param P The FSDiscriminatorPass.
17268d581857SRong Xu ///
17278c8ec1f6SWei Mi /// \param RemapFilename The file used for profile remapping.
17288c8ec1f6SWei Mi ///
1729c572e92cSDiego Novillo /// \returns an error code indicating the status of the created reader.
1730fcd55607SDiego Novillo ErrorOr<std::unique_ptr<SampleProfileReader>>
17318c8ec1f6SWei Mi SampleProfileReader::create(const std::string Filename, LLVMContext &C,
17328d581857SRong Xu                             FSDiscriminatorPass P,
17338c8ec1f6SWei Mi                             const std::string RemapFilename) {
1734fcd55607SDiego Novillo   auto BufferOrError = setupMemoryBuffer(Filename);
1735fcd55607SDiego Novillo   if (std::error_code EC = BufferOrError.getError())
1736c572e92cSDiego Novillo     return EC;
17378d581857SRong Xu   return create(BufferOrError.get(), C, P, RemapFilename);
173851abea74SNathan Slingerland }
1739c572e92cSDiego Novillo 
174028436358SRichard Smith /// Create a sample profile remapper from the given input, to remap the
174128436358SRichard Smith /// function names in the given profile data.
174228436358SRichard Smith ///
174328436358SRichard Smith /// \param Filename The file to open.
174428436358SRichard Smith ///
17458c8ec1f6SWei Mi /// \param Reader The profile reader the remapper is going to be applied to.
17468c8ec1f6SWei Mi ///
174728436358SRichard Smith /// \param C The LLVM context to use to emit diagnostics.
174828436358SRichard Smith ///
174928436358SRichard Smith /// \returns an error code indicating the status of the created reader.
17508c8ec1f6SWei Mi ErrorOr<std::unique_ptr<SampleProfileReaderItaniumRemapper>>
17518c8ec1f6SWei Mi SampleProfileReaderItaniumRemapper::create(const std::string Filename,
17528c8ec1f6SWei Mi                                            SampleProfileReader &Reader,
17538c8ec1f6SWei Mi                                            LLVMContext &C) {
175428436358SRichard Smith   auto BufferOrError = setupMemoryBuffer(Filename);
175528436358SRichard Smith   if (std::error_code EC = BufferOrError.getError())
175628436358SRichard Smith     return EC;
17578c8ec1f6SWei Mi   return create(BufferOrError.get(), Reader, C);
17588c8ec1f6SWei Mi }
17598c8ec1f6SWei Mi 
17608c8ec1f6SWei Mi /// Create a sample profile remapper from the given input, to remap the
17618c8ec1f6SWei Mi /// function names in the given profile data.
17628c8ec1f6SWei Mi ///
17638c8ec1f6SWei Mi /// \param B The memory buffer to create the reader from (assumes ownership).
17648c8ec1f6SWei Mi ///
17658c8ec1f6SWei Mi /// \param C The LLVM context to use to emit diagnostics.
17668c8ec1f6SWei Mi ///
17678c8ec1f6SWei Mi /// \param Reader The profile reader the remapper is going to be applied to.
17688c8ec1f6SWei Mi ///
17698c8ec1f6SWei Mi /// \returns an error code indicating the status of the created reader.
17708c8ec1f6SWei Mi ErrorOr<std::unique_ptr<SampleProfileReaderItaniumRemapper>>
17718c8ec1f6SWei Mi SampleProfileReaderItaniumRemapper::create(std::unique_ptr<MemoryBuffer> &B,
17728c8ec1f6SWei Mi                                            SampleProfileReader &Reader,
17738c8ec1f6SWei Mi                                            LLVMContext &C) {
17748c8ec1f6SWei Mi   auto Remappings = std::make_unique<SymbolRemappingReader>();
17758c8ec1f6SWei Mi   if (Error E = Remappings->read(*B.get())) {
17768c8ec1f6SWei Mi     handleAllErrors(
17778c8ec1f6SWei Mi         std::move(E), [&](const SymbolRemappingParseError &ParseError) {
17788c8ec1f6SWei Mi           C.diagnose(DiagnosticInfoSampleProfile(B->getBufferIdentifier(),
17798c8ec1f6SWei Mi                                                  ParseError.getLineNum(),
17808c8ec1f6SWei Mi                                                  ParseError.getMessage()));
17818c8ec1f6SWei Mi         });
17828c8ec1f6SWei Mi     return sampleprof_error::malformed;
17838c8ec1f6SWei Mi   }
17848c8ec1f6SWei Mi 
17850eaee545SJonas Devlieghere   return std::make_unique<SampleProfileReaderItaniumRemapper>(
17868c8ec1f6SWei Mi       std::move(B), std::move(Remappings), Reader);
178728436358SRichard Smith }
178828436358SRichard Smith 
17895f8f34e4SAdrian Prantl /// Create a sample profile reader based on the format of the input data.
179051abea74SNathan Slingerland ///
179151abea74SNathan Slingerland /// \param B The memory buffer to create the reader from (assumes ownership).
179251abea74SNathan Slingerland ///
179351abea74SNathan Slingerland /// \param C The LLVM context to use to emit diagnostics.
179451abea74SNathan Slingerland ///
17958d581857SRong Xu /// \param P The FSDiscriminatorPass.
17968d581857SRong Xu ///
17978c8ec1f6SWei Mi /// \param RemapFilename The file used for profile remapping.
17988c8ec1f6SWei Mi ///
179951abea74SNathan Slingerland /// \returns an error code indicating the status of the created reader.
180051abea74SNathan Slingerland ErrorOr<std::unique_ptr<SampleProfileReader>>
18018c8ec1f6SWei Mi SampleProfileReader::create(std::unique_ptr<MemoryBuffer> &B, LLVMContext &C,
18028d581857SRong Xu                             FSDiscriminatorPass P,
18038c8ec1f6SWei Mi                             const std::string RemapFilename) {
1804fcd55607SDiego Novillo   std::unique_ptr<SampleProfileReader> Reader;
1805a0c0857eSWei Mi   if (SampleProfileReaderRawBinary::hasFormat(*B))
1806a0c0857eSWei Mi     Reader.reset(new SampleProfileReaderRawBinary(std::move(B), C));
1807be907324SWei Mi   else if (SampleProfileReaderExtBinary::hasFormat(*B))
1808be907324SWei Mi     Reader.reset(new SampleProfileReaderExtBinary(std::move(B), C));
1809a0c0857eSWei Mi   else if (SampleProfileReaderCompactBinary::hasFormat(*B))
1810a0c0857eSWei Mi     Reader.reset(new SampleProfileReaderCompactBinary(std::move(B), C));
181151abea74SNathan Slingerland   else if (SampleProfileReaderGCC::hasFormat(*B))
181251abea74SNathan Slingerland     Reader.reset(new SampleProfileReaderGCC(std::move(B), C));
181351abea74SNathan Slingerland   else if (SampleProfileReaderText::hasFormat(*B))
181451abea74SNathan Slingerland     Reader.reset(new SampleProfileReaderText(std::move(B), C));
18154f823667SNathan Slingerland   else
18164f823667SNathan Slingerland     return sampleprof_error::unrecognized_format;
1817c572e92cSDiego Novillo 
18188c8ec1f6SWei Mi   if (!RemapFilename.empty()) {
18198c8ec1f6SWei Mi     auto ReaderOrErr =
18208c8ec1f6SWei Mi         SampleProfileReaderItaniumRemapper::create(RemapFilename, *Reader, C);
18218c8ec1f6SWei Mi     if (std::error_code EC = ReaderOrErr.getError()) {
18228c8ec1f6SWei Mi       std::string Msg = "Could not create remapper: " + EC.message();
18238c8ec1f6SWei Mi       C.diagnose(DiagnosticInfoSampleProfile(RemapFilename, Msg));
18248c8ec1f6SWei Mi       return EC;
18258c8ec1f6SWei Mi     }
18268c8ec1f6SWei Mi     Reader->Remapper = std::move(ReaderOrErr.get());
18278c8ec1f6SWei Mi   }
18288c8ec1f6SWei Mi 
182994d44c97SWei Mi   FunctionSamples::Format = Reader->getFormat();
1830be907324SWei Mi   if (std::error_code EC = Reader->readHeader()) {
1831fcd55607SDiego Novillo     return EC;
1832be907324SWei Mi   }
1833fcd55607SDiego Novillo 
18348d581857SRong Xu   Reader->setDiscriminatorMaskedBitFrom(P);
18358d581857SRong Xu 
1836c55cf4afSBill Wendling   return std::move(Reader);
1837de1ab26fSDiego Novillo }
183840ee23dbSEaswaran Raman 
183940ee23dbSEaswaran Raman // For text and GCC file formats, we compute the summary after reading the
184040ee23dbSEaswaran Raman // profile. Binary format has the profile summary in its header.
184140ee23dbSEaswaran Raman void SampleProfileReader::computeSummary() {
1842e5a17e3fSEaswaran Raman   SampleProfileSummaryBuilder Builder(ProfileSummaryBuilder::DefaultCutoffs);
1843801d9cc7SWenlei He   Summary = Builder.computeSummaryForProfiles(Profiles);
184440ee23dbSEaswaran Raman }
1845