xref: /llvm-project-15.0.7/llvm/lib/XRay/Trace.cpp (revision 957151bd)
1 //===- Trace.cpp - XRay Trace Loading implementation. ---------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // XRay log reader implementation.
11 //
12 //===----------------------------------------------------------------------===//
13 #include "llvm/XRay/Trace.h"
14 #include "llvm/ADT/STLExtras.h"
15 #include "llvm/Support/DataExtractor.h"
16 #include "llvm/Support/Error.h"
17 #include "llvm/Support/FileSystem.h"
18 #include "llvm/XRay/YAMLXRayRecord.h"
19 
20 using namespace llvm;
21 using namespace llvm::xray;
22 using llvm::yaml::Input;
23 
24 namespace {
25 using XRayRecordStorage =
26     std::aligned_storage<sizeof(XRayRecord), alignof(XRayRecord)>::type;
27 
28 // Populates the FileHeader reference by reading the first 32 bytes of the file.
29 Error readBinaryFormatHeader(StringRef Data, XRayFileHeader &FileHeader) {
30   // FIXME: Maybe deduce whether the data is little or big-endian using some
31   // magic bytes in the beginning of the file?
32 
33   // First 32 bytes of the file will always be the header. We assume a certain
34   // format here:
35   //
36   //   (2)   uint16 : version
37   //   (2)   uint16 : type
38   //   (4)   uint32 : bitfield
39   //   (8)   uint64 : cycle frequency
40   //   (16)  -      : padding
41 
42   DataExtractor HeaderExtractor(Data, true, 8);
43   uint32_t OffsetPtr = 0;
44   FileHeader.Version = HeaderExtractor.getU16(&OffsetPtr);
45   FileHeader.Type = HeaderExtractor.getU16(&OffsetPtr);
46   uint32_t Bitfield = HeaderExtractor.getU32(&OffsetPtr);
47   FileHeader.ConstantTSC = Bitfield & 1uL;
48   FileHeader.NonstopTSC = Bitfield & 1uL << 1;
49   FileHeader.CycleFrequency = HeaderExtractor.getU64(&OffsetPtr);
50   std::memcpy(&FileHeader.FreeFormData, Data.bytes_begin() + OffsetPtr, 16);
51   if (FileHeader.Version != 1 && FileHeader.Version != 2)
52     return make_error<StringError>(
53         Twine("Unsupported XRay file version: ") + Twine(FileHeader.Version),
54         std::make_error_code(std::errc::invalid_argument));
55   return Error::success();
56 }
57 
58 Error loadNaiveFormatLog(StringRef Data, XRayFileHeader &FileHeader,
59                          std::vector<XRayRecord> &Records) {
60   if (Data.size() < 32)
61     return make_error<StringError>(
62         "Not enough bytes for an XRay log.",
63         std::make_error_code(std::errc::invalid_argument));
64 
65   if (Data.size() - 32 == 0 || Data.size() % 32 != 0)
66     return make_error<StringError>(
67         "Invalid-sized XRay data.",
68         std::make_error_code(std::errc::invalid_argument));
69 
70   if (auto E = readBinaryFormatHeader(Data, FileHeader))
71     return E;
72 
73   // Each record after the header will be 32 bytes, in the following format:
74   //
75   //   (2)   uint16 : record type
76   //   (1)   uint8  : cpu id
77   //   (1)   uint8  : type
78   //   (4)   sint32 : function id
79   //   (8)   uint64 : tsc
80   //   (4)   uint32 : thread id
81   //   (12)  -      : padding
82   for (auto S = Data.drop_front(32); !S.empty(); S = S.drop_front(32)) {
83     DataExtractor RecordExtractor(S, true, 8);
84     uint32_t OffsetPtr = 0;
85     switch (auto RecordType = RecordExtractor.getU16(&OffsetPtr)) {
86     case 0: { // Normal records.
87       Records.emplace_back();
88       auto &Record = Records.back();
89       Record.RecordType = RecordType;
90       Record.CPU = RecordExtractor.getU8(&OffsetPtr);
91       auto Type = RecordExtractor.getU8(&OffsetPtr);
92       switch (Type) {
93       case 0:
94         Record.Type = RecordTypes::ENTER;
95         break;
96       case 1:
97         Record.Type = RecordTypes::EXIT;
98         break;
99       case 2:
100         Record.Type = RecordTypes::TAIL_EXIT;
101         break;
102       case 3:
103         Record.Type = RecordTypes::ENTER_ARG;
104         break;
105       default:
106         return make_error<StringError>(
107             Twine("Unknown record type '") + Twine(int{Type}) + "'",
108             std::make_error_code(std::errc::executable_format_error));
109       }
110       Record.FuncId = RecordExtractor.getSigned(&OffsetPtr, sizeof(int32_t));
111       Record.TSC = RecordExtractor.getU64(&OffsetPtr);
112       Record.TId = RecordExtractor.getU32(&OffsetPtr);
113       break;
114     }
115     case 1: { // Arg payload record.
116       auto &Record = Records.back();
117       // Advance two bytes to avoid padding.
118       OffsetPtr += 2;
119       int32_t FuncId = RecordExtractor.getSigned(&OffsetPtr, sizeof(int32_t));
120       auto TId = RecordExtractor.getU32(&OffsetPtr);
121       if (Record.FuncId != FuncId || Record.TId != TId)
122         return make_error<StringError>(
123             Twine("Corrupted log, found payload following non-matching "
124                   "function + thread record. Record for ") +
125                 Twine(Record.FuncId) + " != " + Twine(FuncId),
126             std::make_error_code(std::errc::executable_format_error));
127       // Advance another four bytes to avoid padding.
128       OffsetPtr += 4;
129       auto Arg = RecordExtractor.getU64(&OffsetPtr);
130       Record.CallArgs.push_back(Arg);
131       break;
132     }
133     default:
134       return make_error<StringError>(
135           Twine("Unknown record type == ") + Twine(RecordType),
136           std::make_error_code(std::errc::executable_format_error));
137     }
138   }
139   return Error::success();
140 }
141 
142 /// When reading from a Flight Data Recorder mode log, metadata records are
143 /// sparse compared to packed function records, so we must maintain state as we
144 /// read through the sequence of entries. This allows the reader to denormalize
145 /// the CPUId and Thread Id onto each Function Record and transform delta
146 /// encoded TSC values into absolute encodings on each record.
147 struct FDRState {
148   uint16_t CPUId;
149   uint16_t ThreadId;
150   uint64_t BaseTSC;
151 
152   /// Encode some of the state transitions for the FDR log reader as explicit
153   /// checks. These are expectations for the next Record in the stream.
154   enum class Token {
155     NEW_BUFFER_RECORD_OR_EOF,
156     WALLCLOCK_RECORD,
157     NEW_CPU_ID_RECORD,
158     FUNCTION_SEQUENCE,
159     SCAN_TO_END_OF_THREAD_BUF,
160     CUSTOM_EVENT_DATA,
161     CALL_ARGUMENT,
162   };
163   Token Expects;
164 
165   // Each threads buffer may have trailing garbage to scan over, so we track our
166   // progress.
167   uint64_t CurrentBufferSize;
168   uint64_t CurrentBufferConsumed;
169 };
170 
171 const char *fdrStateToTwine(const FDRState::Token &state) {
172   switch (state) {
173   case FDRState::Token::NEW_BUFFER_RECORD_OR_EOF:
174     return "NEW_BUFFER_RECORD_OR_EOF";
175   case FDRState::Token::WALLCLOCK_RECORD:
176     return "WALLCLOCK_RECORD";
177   case FDRState::Token::NEW_CPU_ID_RECORD:
178     return "NEW_CPU_ID_RECORD";
179   case FDRState::Token::FUNCTION_SEQUENCE:
180     return "FUNCTION_SEQUENCE";
181   case FDRState::Token::SCAN_TO_END_OF_THREAD_BUF:
182     return "SCAN_TO_END_OF_THREAD_BUF";
183   case FDRState::Token::CUSTOM_EVENT_DATA:
184     return "CUSTOM_EVENT_DATA";
185   case FDRState::Token::CALL_ARGUMENT:
186     return "CALL_ARGUMENT";
187   }
188   return "UNKNOWN";
189 }
190 
191 /// State transition when a NewBufferRecord is encountered.
192 Error processFDRNewBufferRecord(FDRState &State, uint8_t RecordFirstByte,
193                                 DataExtractor &RecordExtractor) {
194 
195   if (State.Expects != FDRState::Token::NEW_BUFFER_RECORD_OR_EOF)
196     return make_error<StringError>(
197         "Malformed log. Read New Buffer record kind out of sequence",
198         std::make_error_code(std::errc::executable_format_error));
199   uint32_t OffsetPtr = 1; // 1 byte into record.
200   State.ThreadId = RecordExtractor.getU16(&OffsetPtr);
201   State.Expects = FDRState::Token::WALLCLOCK_RECORD;
202   return Error::success();
203 }
204 
205 /// State transition when an EndOfBufferRecord is encountered.
206 Error processFDREndOfBufferRecord(FDRState &State, uint8_t RecordFirstByte,
207                                   DataExtractor &RecordExtractor) {
208   if (State.Expects == FDRState::Token::NEW_BUFFER_RECORD_OR_EOF)
209     return make_error<StringError>(
210         "Malformed log. Received EOB message without current buffer.",
211         std::make_error_code(std::errc::executable_format_error));
212   State.Expects = FDRState::Token::SCAN_TO_END_OF_THREAD_BUF;
213   return Error::success();
214 }
215 
216 /// State transition when a NewCPUIdRecord is encountered.
217 Error processFDRNewCPUIdRecord(FDRState &State, uint8_t RecordFirstByte,
218                                DataExtractor &RecordExtractor) {
219   if (State.Expects != FDRState::Token::FUNCTION_SEQUENCE &&
220       State.Expects != FDRState::Token::NEW_CPU_ID_RECORD)
221     return make_error<StringError>(
222         "Malformed log. Read NewCPUId record kind out of sequence",
223         std::make_error_code(std::errc::executable_format_error));
224   uint32_t OffsetPtr = 1; // Read starting after the first byte.
225   State.CPUId = RecordExtractor.getU16(&OffsetPtr);
226   State.BaseTSC = RecordExtractor.getU64(&OffsetPtr);
227   State.Expects = FDRState::Token::FUNCTION_SEQUENCE;
228   return Error::success();
229 }
230 
231 /// State transition when a TSCWrapRecord (overflow detection) is encountered.
232 Error processFDRTSCWrapRecord(FDRState &State, uint8_t RecordFirstByte,
233                               DataExtractor &RecordExtractor) {
234   if (State.Expects != FDRState::Token::FUNCTION_SEQUENCE)
235     return make_error<StringError>(
236         "Malformed log. Read TSCWrap record kind out of sequence",
237         std::make_error_code(std::errc::executable_format_error));
238   uint32_t OffsetPtr = 1; // Read starting after the first byte.
239   State.BaseTSC = RecordExtractor.getU64(&OffsetPtr);
240   return Error::success();
241 }
242 
243 /// State transition when a WallTimeMarkerRecord is encountered.
244 Error processFDRWallTimeRecord(FDRState &State, uint8_t RecordFirstByte,
245                                DataExtractor &RecordExtractor) {
246   if (State.Expects != FDRState::Token::WALLCLOCK_RECORD)
247     return make_error<StringError>(
248         "Malformed log. Read Wallclock record kind out of sequence",
249         std::make_error_code(std::errc::executable_format_error));
250   // We don't encode the wall time into any of the records.
251   // XRayRecords are concerned with the TSC instead.
252   State.Expects = FDRState::Token::NEW_CPU_ID_RECORD;
253   return Error::success();
254 }
255 
256 /// State transition when a CustomEventMarker is encountered.
257 Error processCustomEventMarker(FDRState &State, uint8_t RecordFirstByte,
258                                DataExtractor &RecordExtractor,
259                                size_t &RecordSize) {
260   // We can encounter a CustomEventMarker anywhere in the log, so we can handle
261   // it regardless of the expectation. However, we do set the expectation to
262   // read a set number of fixed bytes, as described in the metadata.
263   uint32_t OffsetPtr = 1; // Read after the first byte.
264   uint32_t DataSize = RecordExtractor.getU32(&OffsetPtr);
265   uint64_t TSC = RecordExtractor.getU64(&OffsetPtr);
266 
267   // FIXME: Actually represent the record through the API. For now we only
268   // skip through the data.
269   (void)TSC;
270   RecordSize = 16 + DataSize;
271   return Error::success();
272 }
273 
274 /// State transition when a CallArgumentRecord is encountered.
275 Error processFDRCallArgumentRecord(FDRState &State, uint8_t RecordFirstByte,
276                                    DataExtractor &RecordExtractor,
277                                    std::vector<XRayRecord> &Records) {
278   uint32_t OffsetPtr = 1; // Read starting after the first byte.
279   auto &Enter = Records.back();
280 
281   if (Enter.Type != RecordTypes::ENTER)
282     return make_error<StringError>(
283         "CallArgument needs to be right after a function entry",
284         std::make_error_code(std::errc::executable_format_error));
285   Enter.Type = RecordTypes::ENTER_ARG;
286   Enter.CallArgs.emplace_back(RecordExtractor.getU64(&OffsetPtr));
287   return Error::success();
288 }
289 
290 /// Advances the state machine for reading the FDR record type by reading one
291 /// Metadata Record and updating the State appropriately based on the kind of
292 /// record encountered. The RecordKind is encoded in the first byte of the
293 /// Record, which the caller should pass in because they have already read it
294 /// to determine that this is a metadata record as opposed to a function record.
295 Error processFDRMetadataRecord(FDRState &State, uint8_t RecordFirstByte,
296                                DataExtractor &RecordExtractor,
297                                size_t &RecordSize,
298                                std::vector<XRayRecord> &Records) {
299   // The remaining 7 bits are the RecordKind enum.
300   uint8_t RecordKind = RecordFirstByte >> 1;
301   switch (RecordKind) {
302   case 0: // NewBuffer
303     if (auto E =
304             processFDRNewBufferRecord(State, RecordFirstByte, RecordExtractor))
305       return E;
306     break;
307   case 1: // EndOfBuffer
308     if (auto E = processFDREndOfBufferRecord(State, RecordFirstByte,
309                                              RecordExtractor))
310       return E;
311     break;
312   case 2: // NewCPUId
313     if (auto E =
314             processFDRNewCPUIdRecord(State, RecordFirstByte, RecordExtractor))
315       return E;
316     break;
317   case 3: // TSCWrap
318     if (auto E =
319             processFDRTSCWrapRecord(State, RecordFirstByte, RecordExtractor))
320       return E;
321     break;
322   case 4: // WallTimeMarker
323     if (auto E =
324             processFDRWallTimeRecord(State, RecordFirstByte, RecordExtractor))
325       return E;
326     break;
327   case 5: // CustomEventMarker
328     if (auto E = processCustomEventMarker(State, RecordFirstByte,
329                                           RecordExtractor, RecordSize))
330       return E;
331     break;
332   case 6: // CallArgument
333     if (auto E = processFDRCallArgumentRecord(State, RecordFirstByte,
334                                               RecordExtractor, Records))
335       return E;
336     break;
337   default:
338     // Widen the record type to uint16_t to prevent conversion to char.
339     return make_error<StringError>(
340         Twine("Illegal metadata record type: ")
341             .concat(Twine(static_cast<unsigned>(RecordKind))),
342         std::make_error_code(std::errc::executable_format_error));
343   }
344   return Error::success();
345 }
346 
347 /// Reads a function record from an FDR format log, appending a new XRayRecord
348 /// to the vector being populated and updating the State with a new value
349 /// reference value to interpret TSC deltas.
350 ///
351 /// The XRayRecord constructed includes information from the function record
352 /// processed here as well as Thread ID and CPU ID formerly extracted into
353 /// State.
354 Error processFDRFunctionRecord(FDRState &State, uint8_t RecordFirstByte,
355                                DataExtractor &RecordExtractor,
356                                std::vector<XRayRecord> &Records) {
357   switch (State.Expects) {
358   case FDRState::Token::NEW_BUFFER_RECORD_OR_EOF:
359     return make_error<StringError>(
360         "Malformed log. Received Function Record before new buffer setup.",
361         std::make_error_code(std::errc::executable_format_error));
362   case FDRState::Token::WALLCLOCK_RECORD:
363     return make_error<StringError>(
364         "Malformed log. Received Function Record when expecting wallclock.",
365         std::make_error_code(std::errc::executable_format_error));
366   case FDRState::Token::NEW_CPU_ID_RECORD:
367     return make_error<StringError>(
368         "Malformed log. Received Function Record before first CPU record.",
369         std::make_error_code(std::errc::executable_format_error));
370   default:
371     Records.emplace_back();
372     auto &Record = Records.back();
373     Record.RecordType = 0; // Record is type NORMAL.
374     // Strip off record type bit and use the next three bits.
375     uint8_t RecordType = (RecordFirstByte >> 1) & 0x07;
376     switch (RecordType) {
377     case static_cast<uint8_t>(RecordTypes::ENTER):
378       Record.Type = RecordTypes::ENTER;
379       break;
380     case static_cast<uint8_t>(RecordTypes::EXIT):
381       Record.Type = RecordTypes::EXIT;
382       break;
383     case static_cast<uint8_t>(RecordTypes::TAIL_EXIT):
384       Record.Type = RecordTypes::TAIL_EXIT;
385       break;
386     default:
387       // Cast to an unsigned integer to not interpret the record type as a char.
388       return make_error<StringError>(
389           Twine("Illegal function record type: ")
390               .concat(Twine(static_cast<unsigned>(RecordType))),
391           std::make_error_code(std::errc::executable_format_error));
392     }
393     Record.CPU = State.CPUId;
394     Record.TId = State.ThreadId;
395     // Back up to read first 32 bits, including the 4 we pulled RecordType
396     // and RecordKind out of. The remaining 28 are FunctionId.
397     uint32_t OffsetPtr = 0;
398     // Despite function Id being a signed int on XRayRecord,
399     // when it is written to an FDR format, the top bits are truncated,
400     // so it is effectively an unsigned value. When we shift off the
401     // top four bits, we want the shift to be logical, so we read as
402     // uint32_t.
403     uint32_t FuncIdBitField = RecordExtractor.getU32(&OffsetPtr);
404     Record.FuncId = FuncIdBitField >> 4;
405     // FunctionRecords have a 32 bit delta from the previous absolute TSC
406     // or TSC delta. If this would overflow, we should read a TSCWrap record
407     // with an absolute TSC reading.
408     uint64_t NewTSC = State.BaseTSC + RecordExtractor.getU32(&OffsetPtr);
409     State.BaseTSC = NewTSC;
410     Record.TSC = NewTSC;
411   }
412   return Error::success();
413 }
414 
415 /// Reads a log in FDR mode for version 1 of this binary format. FDR mode is
416 /// defined as part of the compiler-rt project in xray_fdr_logging.h, and such
417 /// a log consists of the familiar 32 bit XRayHeader, followed by sequences of
418 /// of interspersed 16 byte Metadata Records and 8 byte Function Records.
419 ///
420 /// The following is an attempt to document the grammar of the format, which is
421 /// parsed by this function for little-endian machines. Since the format makes
422 /// use of BitFields, when we support big-endian architectures, we will need to
423 /// adjust not only the endianness parameter to llvm's RecordExtractor, but also
424 /// the bit twiddling logic, which is consistent with the little-endian
425 /// convention that BitFields within a struct will first be packed into the
426 /// least significant bits the address they belong to.
427 ///
428 /// We expect a format complying with the grammar in the following pseudo-EBNF.
429 ///
430 /// FDRLog: XRayFileHeader ThreadBuffer*
431 /// XRayFileHeader: 32 bytes to identify the log as FDR with machine metadata.
432 ///     Includes BufferSize
433 /// ThreadBuffer: NewBuffer WallClockTime NewCPUId FunctionSequence EOB
434 /// BufSize: 8 byte unsigned integer indicating how large the buffer is.
435 /// NewBuffer: 16 byte metadata record with Thread Id.
436 /// WallClockTime: 16 byte metadata record with human readable time.
437 /// NewCPUId: 16 byte metadata record with CPUId and a 64 bit TSC reading.
438 /// EOB: 16 byte record in a thread buffer plus mem garbage to fill BufSize.
439 /// FunctionSequence: NewCPUId | TSCWrap | FunctionRecord
440 /// TSCWrap: 16 byte metadata record with a full 64 bit TSC reading.
441 /// FunctionRecord: 8 byte record with FunctionId, entry/exit, and TSC delta.
442 Error loadFDRLog(StringRef Data, XRayFileHeader &FileHeader,
443                  std::vector<XRayRecord> &Records) {
444   if (Data.size() < 32)
445     return make_error<StringError>(
446         "Not enough bytes for an XRay log.",
447         std::make_error_code(std::errc::invalid_argument));
448 
449   // For an FDR log, there are records sized 16 and 8 bytes.
450   // There actually may be no records if no non-trivial functions are
451   // instrumented.
452   if (Data.size() % 8 != 0)
453     return make_error<StringError>(
454         "Invalid-sized XRay data.",
455         std::make_error_code(std::errc::invalid_argument));
456 
457   if (auto E = readBinaryFormatHeader(Data, FileHeader))
458     return E;
459 
460   uint64_t BufferSize = 0;
461   {
462     StringRef ExtraDataRef(FileHeader.FreeFormData, 16);
463     DataExtractor ExtraDataExtractor(ExtraDataRef, true, 8);
464     uint32_t ExtraDataOffset = 0;
465     BufferSize = ExtraDataExtractor.getU64(&ExtraDataOffset);
466   }
467   FDRState State{0,          0, 0, FDRState::Token::NEW_BUFFER_RECORD_OR_EOF,
468                  BufferSize, 0};
469   // RecordSize will tell the loop how far to seek ahead based on the record
470   // type that we have just read.
471   size_t RecordSize = 0;
472   for (auto S = Data.drop_front(32); !S.empty(); S = S.drop_front(RecordSize)) {
473     DataExtractor RecordExtractor(S, true, 8);
474     uint32_t OffsetPtr = 0;
475     if (State.Expects == FDRState::Token::SCAN_TO_END_OF_THREAD_BUF) {
476       RecordSize = State.CurrentBufferSize - State.CurrentBufferConsumed;
477       if (S.size() < RecordSize) {
478         return make_error<StringError>(
479             Twine("Incomplete thread buffer. Expected at least ") +
480                 Twine(RecordSize) + " bytes but found " + Twine(S.size()),
481             make_error_code(std::errc::invalid_argument));
482       }
483       State.CurrentBufferConsumed = 0;
484       State.Expects = FDRState::Token::NEW_BUFFER_RECORD_OR_EOF;
485       continue;
486     }
487     uint8_t BitField = RecordExtractor.getU8(&OffsetPtr);
488     bool isMetadataRecord = BitField & 0x01uL;
489     if (isMetadataRecord) {
490       RecordSize = 16;
491       if (auto E = processFDRMetadataRecord(State, BitField, RecordExtractor,
492                                             RecordSize, Records))
493         return E;
494     } else { // Process Function Record
495       RecordSize = 8;
496       if (auto E = processFDRFunctionRecord(State, BitField, RecordExtractor,
497                                             Records))
498         return E;
499     }
500     State.CurrentBufferConsumed += RecordSize;
501   }
502 
503   // Having iterated over everything we've been given, we've either consumed
504   // everything and ended up in the end state, or were told to skip the rest.
505   bool Finished = State.Expects == FDRState::Token::SCAN_TO_END_OF_THREAD_BUF &&
506                   State.CurrentBufferSize == State.CurrentBufferConsumed;
507   if (State.Expects != FDRState::Token::NEW_BUFFER_RECORD_OR_EOF && !Finished)
508     return make_error<StringError>(
509         Twine("Encountered EOF with unexpected state expectation ") +
510             fdrStateToTwine(State.Expects) +
511             ". Remaining expected bytes in thread buffer total " +
512             Twine(State.CurrentBufferSize - State.CurrentBufferConsumed),
513         std::make_error_code(std::errc::executable_format_error));
514 
515   return Error::success();
516 }
517 
518 Error loadYAMLLog(StringRef Data, XRayFileHeader &FileHeader,
519                   std::vector<XRayRecord> &Records) {
520   YAMLXRayTrace Trace;
521   Input In(Data);
522   In >> Trace;
523   if (In.error())
524     return make_error<StringError>("Failed loading YAML Data.", In.error());
525 
526   FileHeader.Version = Trace.Header.Version;
527   FileHeader.Type = Trace.Header.Type;
528   FileHeader.ConstantTSC = Trace.Header.ConstantTSC;
529   FileHeader.NonstopTSC = Trace.Header.NonstopTSC;
530   FileHeader.CycleFrequency = Trace.Header.CycleFrequency;
531 
532   if (FileHeader.Version != 1)
533     return make_error<StringError>(
534         Twine("Unsupported XRay file version: ") + Twine(FileHeader.Version),
535         std::make_error_code(std::errc::invalid_argument));
536 
537   Records.clear();
538   std::transform(Trace.Records.begin(), Trace.Records.end(),
539                  std::back_inserter(Records), [&](const YAMLXRayRecord &R) {
540                    return XRayRecord{R.RecordType, R.CPU, R.Type,    R.FuncId,
541                                      R.TSC,        R.TId, R.CallArgs};
542                  });
543   return Error::success();
544 }
545 } // namespace
546 
547 Expected<Trace> llvm::xray::loadTraceFile(StringRef Filename, bool Sort) {
548   int Fd;
549   if (auto EC = sys::fs::openFileForRead(Filename, Fd)) {
550     return make_error<StringError>(
551         Twine("Cannot read log from '") + Filename + "'", EC);
552   }
553 
554   uint64_t FileSize;
555   if (auto EC = sys::fs::file_size(Filename, FileSize)) {
556     return make_error<StringError>(
557         Twine("Cannot read log from '") + Filename + "'", EC);
558   }
559   if (FileSize < 4) {
560     return make_error<StringError>(
561         Twine("File '") + Filename + "' too small for XRay.",
562         std::make_error_code(std::errc::executable_format_error));
563   }
564 
565   // Map the opened file into memory and use a StringRef to access it later.
566   std::error_code EC;
567   sys::fs::mapped_file_region MappedFile(
568       Fd, sys::fs::mapped_file_region::mapmode::readonly, FileSize, 0, EC);
569   if (EC) {
570     return make_error<StringError>(
571         Twine("Cannot read log from '") + Filename + "'", EC);
572   }
573   auto Data = StringRef(MappedFile.data(), MappedFile.size());
574 
575   // Attempt to detect the file type using file magic. We have a slight bias
576   // towards the binary format, and we do this by making sure that the first 4
577   // bytes of the binary file is some combination of the following byte
578   // patterns: (observe the code loading them assumes they're little endian)
579   //
580   //   0x01 0x00 0x00 0x00 - version 1, "naive" format
581   //   0x01 0x00 0x01 0x00 - version 1, "flight data recorder" format
582   //
583   // YAML files don't typically have those first four bytes as valid text so we
584   // try loading assuming YAML if we don't find these bytes.
585   //
586   // Only if we can't load either the binary or the YAML format will we yield an
587   // error.
588   StringRef Magic(MappedFile.data(), 4);
589   DataExtractor HeaderExtractor(Magic, true, 8);
590   uint32_t OffsetPtr = 0;
591   uint16_t Version = HeaderExtractor.getU16(&OffsetPtr);
592   uint16_t Type = HeaderExtractor.getU16(&OffsetPtr);
593 
594   enum BinaryFormatType { NAIVE_FORMAT = 0, FLIGHT_DATA_RECORDER_FORMAT = 1 };
595 
596   Trace T;
597   if (Type == NAIVE_FORMAT && (Version == 1 || Version == 2)) {
598     if (auto E = loadNaiveFormatLog(Data, T.FileHeader, T.Records))
599       return std::move(E);
600   } else if (Version == 1 && Type == FLIGHT_DATA_RECORDER_FORMAT) {
601     if (auto E = loadFDRLog(Data, T.FileHeader, T.Records))
602       return std::move(E);
603   } else {
604     if (auto E = loadYAMLLog(Data, T.FileHeader, T.Records))
605       return std::move(E);
606   }
607 
608   if (Sort)
609     std::sort(T.Records.begin(), T.Records.end(),
610               [&](const XRayRecord &L, const XRayRecord &R) {
611                 return L.TSC < R.TSC;
612               });
613 
614   return std::move(T);
615 }
616