1 //===- Trace.cpp - XRay Trace Loading implementation. ---------------------===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // XRay log reader implementation. 11 // 12 //===----------------------------------------------------------------------===// 13 #include "llvm/XRay/Trace.h" 14 #include "llvm/ADT/STLExtras.h" 15 #include "llvm/Support/DataExtractor.h" 16 #include "llvm/Support/Error.h" 17 #include "llvm/Support/FileSystem.h" 18 #include "llvm/XRay/YAMLXRayRecord.h" 19 20 using namespace llvm; 21 using namespace llvm::xray; 22 using llvm::yaml::Input; 23 24 namespace { 25 using XRayRecordStorage = 26 std::aligned_storage<sizeof(XRayRecord), alignof(XRayRecord)>::type; 27 28 // Populates the FileHeader reference by reading the first 32 bytes of the file. 29 Error readBinaryFormatHeader(StringRef Data, XRayFileHeader &FileHeader) { 30 // FIXME: Maybe deduce whether the data is little or big-endian using some 31 // magic bytes in the beginning of the file? 32 33 // First 32 bytes of the file will always be the header. We assume a certain 34 // format here: 35 // 36 // (2) uint16 : version 37 // (2) uint16 : type 38 // (4) uint32 : bitfield 39 // (8) uint64 : cycle frequency 40 // (16) - : padding 41 42 DataExtractor HeaderExtractor(Data, true, 8); 43 uint32_t OffsetPtr = 0; 44 FileHeader.Version = HeaderExtractor.getU16(&OffsetPtr); 45 FileHeader.Type = HeaderExtractor.getU16(&OffsetPtr); 46 uint32_t Bitfield = HeaderExtractor.getU32(&OffsetPtr); 47 FileHeader.ConstantTSC = Bitfield & 1uL; 48 FileHeader.NonstopTSC = Bitfield & 1uL << 1; 49 FileHeader.CycleFrequency = HeaderExtractor.getU64(&OffsetPtr); 50 std::memcpy(&FileHeader.FreeFormData, Data.bytes_begin() + OffsetPtr, 16); 51 if (FileHeader.Version != 1 && FileHeader.Version != 2) 52 return make_error<StringError>( 53 Twine("Unsupported XRay file version: ") + Twine(FileHeader.Version), 54 std::make_error_code(std::errc::invalid_argument)); 55 return Error::success(); 56 } 57 58 Error loadNaiveFormatLog(StringRef Data, XRayFileHeader &FileHeader, 59 std::vector<XRayRecord> &Records) { 60 if (Data.size() < 32) 61 return make_error<StringError>( 62 "Not enough bytes for an XRay log.", 63 std::make_error_code(std::errc::invalid_argument)); 64 65 if (Data.size() - 32 == 0 || Data.size() % 32 != 0) 66 return make_error<StringError>( 67 "Invalid-sized XRay data.", 68 std::make_error_code(std::errc::invalid_argument)); 69 70 if (auto E = readBinaryFormatHeader(Data, FileHeader)) 71 return E; 72 73 // Each record after the header will be 32 bytes, in the following format: 74 // 75 // (2) uint16 : record type 76 // (1) uint8 : cpu id 77 // (1) uint8 : type 78 // (4) sint32 : function id 79 // (8) uint64 : tsc 80 // (4) uint32 : thread id 81 // (12) - : padding 82 for (auto S = Data.drop_front(32); !S.empty(); S = S.drop_front(32)) { 83 DataExtractor RecordExtractor(S, true, 8); 84 uint32_t OffsetPtr = 0; 85 switch (auto RecordType = RecordExtractor.getU16(&OffsetPtr)) { 86 case 0: { // Normal records. 87 Records.emplace_back(); 88 auto &Record = Records.back(); 89 Record.RecordType = RecordType; 90 Record.CPU = RecordExtractor.getU8(&OffsetPtr); 91 auto Type = RecordExtractor.getU8(&OffsetPtr); 92 switch (Type) { 93 case 0: 94 Record.Type = RecordTypes::ENTER; 95 break; 96 case 1: 97 Record.Type = RecordTypes::EXIT; 98 break; 99 case 2: 100 Record.Type = RecordTypes::TAIL_EXIT; 101 break; 102 case 3: 103 Record.Type = RecordTypes::ENTER_ARG; 104 break; 105 default: 106 return make_error<StringError>( 107 Twine("Unknown record type '") + Twine(int{Type}) + "'", 108 std::make_error_code(std::errc::executable_format_error)); 109 } 110 Record.FuncId = RecordExtractor.getSigned(&OffsetPtr, sizeof(int32_t)); 111 Record.TSC = RecordExtractor.getU64(&OffsetPtr); 112 Record.TId = RecordExtractor.getU32(&OffsetPtr); 113 break; 114 } 115 case 1: { // Arg payload record. 116 auto &Record = Records.back(); 117 // Advance two bytes to avoid padding. 118 OffsetPtr += 2; 119 int32_t FuncId = RecordExtractor.getSigned(&OffsetPtr, sizeof(int32_t)); 120 auto TId = RecordExtractor.getU32(&OffsetPtr); 121 if (Record.FuncId != FuncId || Record.TId != TId) 122 return make_error<StringError>( 123 Twine("Corrupted log, found arg payload following non-matching " 124 "function + thread record. Record for function ") + 125 Twine(Record.FuncId) + " != " + Twine(FuncId) + "; offset: " + 126 Twine(S.data() - Data.data()), 127 std::make_error_code(std::errc::executable_format_error)); 128 // Advance another four bytes to avoid padding. 129 OffsetPtr += 4; 130 auto Arg = RecordExtractor.getU64(&OffsetPtr); 131 Record.CallArgs.push_back(Arg); 132 break; 133 } 134 default: 135 return make_error<StringError>( 136 Twine("Unknown record type == ") + Twine(RecordType), 137 std::make_error_code(std::errc::executable_format_error)); 138 } 139 } 140 return Error::success(); 141 } 142 143 /// When reading from a Flight Data Recorder mode log, metadata records are 144 /// sparse compared to packed function records, so we must maintain state as we 145 /// read through the sequence of entries. This allows the reader to denormalize 146 /// the CPUId and Thread Id onto each Function Record and transform delta 147 /// encoded TSC values into absolute encodings on each record. 148 struct FDRState { 149 uint16_t CPUId; 150 uint16_t ThreadId; 151 uint64_t BaseTSC; 152 153 /// Encode some of the state transitions for the FDR log reader as explicit 154 /// checks. These are expectations for the next Record in the stream. 155 enum class Token { 156 NEW_BUFFER_RECORD_OR_EOF, 157 WALLCLOCK_RECORD, 158 NEW_CPU_ID_RECORD, 159 FUNCTION_SEQUENCE, 160 SCAN_TO_END_OF_THREAD_BUF, 161 CUSTOM_EVENT_DATA, 162 CALL_ARGUMENT, 163 BUFFER_EXTENTS, 164 }; 165 Token Expects; 166 167 // Each threads buffer may have trailing garbage to scan over, so we track our 168 // progress. 169 uint64_t CurrentBufferSize; 170 uint64_t CurrentBufferConsumed; 171 }; 172 173 const char *fdrStateToTwine(const FDRState::Token &state) { 174 switch (state) { 175 case FDRState::Token::NEW_BUFFER_RECORD_OR_EOF: 176 return "NEW_BUFFER_RECORD_OR_EOF"; 177 case FDRState::Token::WALLCLOCK_RECORD: 178 return "WALLCLOCK_RECORD"; 179 case FDRState::Token::NEW_CPU_ID_RECORD: 180 return "NEW_CPU_ID_RECORD"; 181 case FDRState::Token::FUNCTION_SEQUENCE: 182 return "FUNCTION_SEQUENCE"; 183 case FDRState::Token::SCAN_TO_END_OF_THREAD_BUF: 184 return "SCAN_TO_END_OF_THREAD_BUF"; 185 case FDRState::Token::CUSTOM_EVENT_DATA: 186 return "CUSTOM_EVENT_DATA"; 187 case FDRState::Token::CALL_ARGUMENT: 188 return "CALL_ARGUMENT"; 189 case FDRState::Token::BUFFER_EXTENTS: 190 return "BUFFER_EXTENTS"; 191 } 192 return "UNKNOWN"; 193 } 194 195 /// State transition when a NewBufferRecord is encountered. 196 Error processFDRNewBufferRecord(FDRState &State, uint8_t RecordFirstByte, 197 DataExtractor &RecordExtractor) { 198 199 if (State.Expects != FDRState::Token::NEW_BUFFER_RECORD_OR_EOF) 200 return make_error<StringError>( 201 Twine("Malformed log. Read New Buffer record kind out of sequence; " 202 "expected: ") + 203 fdrStateToTwine(State.Expects), 204 std::make_error_code(std::errc::executable_format_error)); 205 uint32_t OffsetPtr = 1; // 1 byte into record. 206 State.ThreadId = RecordExtractor.getU16(&OffsetPtr); 207 State.Expects = FDRState::Token::WALLCLOCK_RECORD; 208 return Error::success(); 209 } 210 211 /// State transition when an EndOfBufferRecord is encountered. 212 Error processFDREndOfBufferRecord(FDRState &State, uint8_t RecordFirstByte, 213 DataExtractor &RecordExtractor) { 214 if (State.Expects == FDRState::Token::NEW_BUFFER_RECORD_OR_EOF) 215 return make_error<StringError>( 216 Twine("Malformed log. Received EOB message without current buffer; " 217 "expected: ") + 218 fdrStateToTwine(State.Expects), 219 std::make_error_code(std::errc::executable_format_error)); 220 State.Expects = FDRState::Token::SCAN_TO_END_OF_THREAD_BUF; 221 return Error::success(); 222 } 223 224 /// State transition when a NewCPUIdRecord is encountered. 225 Error processFDRNewCPUIdRecord(FDRState &State, uint8_t RecordFirstByte, 226 DataExtractor &RecordExtractor) { 227 if (State.Expects != FDRState::Token::FUNCTION_SEQUENCE && 228 State.Expects != FDRState::Token::NEW_CPU_ID_RECORD) 229 return make_error<StringError>( 230 Twine("Malformed log. Read NewCPUId record kind out of sequence; " 231 "expected: ") + 232 fdrStateToTwine(State.Expects), 233 std::make_error_code(std::errc::executable_format_error)); 234 uint32_t OffsetPtr = 1; // Read starting after the first byte. 235 State.CPUId = RecordExtractor.getU16(&OffsetPtr); 236 State.BaseTSC = RecordExtractor.getU64(&OffsetPtr); 237 State.Expects = FDRState::Token::FUNCTION_SEQUENCE; 238 return Error::success(); 239 } 240 241 /// State transition when a TSCWrapRecord (overflow detection) is encountered. 242 Error processFDRTSCWrapRecord(FDRState &State, uint8_t RecordFirstByte, 243 DataExtractor &RecordExtractor) { 244 if (State.Expects != FDRState::Token::FUNCTION_SEQUENCE) 245 return make_error<StringError>( 246 Twine("Malformed log. Read TSCWrap record kind out of sequence; " 247 "expecting: ") + 248 fdrStateToTwine(State.Expects), 249 std::make_error_code(std::errc::executable_format_error)); 250 uint32_t OffsetPtr = 1; // Read starting after the first byte. 251 State.BaseTSC = RecordExtractor.getU64(&OffsetPtr); 252 return Error::success(); 253 } 254 255 /// State transition when a WallTimeMarkerRecord is encountered. 256 Error processFDRWallTimeRecord(FDRState &State, uint8_t RecordFirstByte, 257 DataExtractor &RecordExtractor) { 258 if (State.Expects != FDRState::Token::WALLCLOCK_RECORD) 259 return make_error<StringError>( 260 Twine("Malformed log. Read Wallclock record kind out of sequence; " 261 "expecting: ") + 262 fdrStateToTwine(State.Expects), 263 std::make_error_code(std::errc::executable_format_error)); 264 265 // TODO: Someday, reconcile the TSC ticks to wall clock time for presentation 266 // purposes. For now, we're ignoring these records. 267 State.Expects = FDRState::Token::NEW_CPU_ID_RECORD; 268 return Error::success(); 269 } 270 271 /// State transition when a CustomEventMarker is encountered. 272 Error processCustomEventMarker(FDRState &State, uint8_t RecordFirstByte, 273 DataExtractor &RecordExtractor, 274 size_t &RecordSize) { 275 // We can encounter a CustomEventMarker anywhere in the log, so we can handle 276 // it regardless of the expectation. However, we do set the expectation to 277 // read a set number of fixed bytes, as described in the metadata. 278 uint32_t OffsetPtr = 1; // Read after the first byte. 279 uint32_t DataSize = RecordExtractor.getU32(&OffsetPtr); 280 uint64_t TSC = RecordExtractor.getU64(&OffsetPtr); 281 282 // FIXME: Actually represent the record through the API. For now we only 283 // skip through the data. 284 (void)TSC; 285 RecordSize = 16 + DataSize; 286 return Error::success(); 287 } 288 289 /// State transition when an BufferExtents record is encountered. 290 Error processBufferExtents(FDRState &State, uint8_t RecordFirstByte, 291 DataExtractor &RecordExtractor) { 292 if (State.Expects != FDRState::Token::BUFFER_EXTENTS) 293 return make_error<StringError>( 294 Twine("Malformed log. Buffer Extents unexpected; expected: ") + 295 fdrStateToTwine(State.Expects), 296 std::make_error_code(std::errc::executable_format_error)); 297 uint32_t OffsetPtr = 1; // Read after the first byte. 298 State.CurrentBufferSize = RecordExtractor.getU64(&OffsetPtr); 299 State.Expects = FDRState::Token::NEW_BUFFER_RECORD_OR_EOF; 300 return Error::success(); 301 } 302 303 /// State transition when a CallArgumentRecord is encountered. 304 Error processFDRCallArgumentRecord(FDRState &State, uint8_t RecordFirstByte, 305 DataExtractor &RecordExtractor, 306 std::vector<XRayRecord> &Records) { 307 uint32_t OffsetPtr = 1; // Read starting after the first byte. 308 auto &Enter = Records.back(); 309 310 if (Enter.Type != RecordTypes::ENTER) 311 return make_error<StringError>( 312 "CallArgument needs to be right after a function entry", 313 std::make_error_code(std::errc::executable_format_error)); 314 Enter.Type = RecordTypes::ENTER_ARG; 315 Enter.CallArgs.emplace_back(RecordExtractor.getU64(&OffsetPtr)); 316 return Error::success(); 317 } 318 319 /// Advances the state machine for reading the FDR record type by reading one 320 /// Metadata Record and updating the State appropriately based on the kind of 321 /// record encountered. The RecordKind is encoded in the first byte of the 322 /// Record, which the caller should pass in because they have already read it 323 /// to determine that this is a metadata record as opposed to a function record. 324 /// 325 /// Beginning with Version 2 of the FDR log, we do not depend on the size of the 326 /// buffer, but rather use the extents to determine how far to read in the log 327 /// for this particular buffer. 328 Error processFDRMetadataRecord(FDRState &State, uint8_t RecordFirstByte, 329 DataExtractor &RecordExtractor, 330 size_t &RecordSize, 331 std::vector<XRayRecord> &Records, 332 uint16_t Version) { 333 // The remaining 7 bits are the RecordKind enum. 334 uint8_t RecordKind = RecordFirstByte >> 1; 335 switch (RecordKind) { 336 case 0: // NewBuffer 337 if (auto E = 338 processFDRNewBufferRecord(State, RecordFirstByte, RecordExtractor)) 339 return E; 340 break; 341 case 1: // EndOfBuffer 342 if (Version >= 2) 343 return make_error<StringError>( 344 "Since Version 2 of FDR logging, we no longer support EOB records.", 345 std::make_error_code(std::errc::executable_format_error)); 346 if (auto E = processFDREndOfBufferRecord(State, RecordFirstByte, 347 RecordExtractor)) 348 return E; 349 break; 350 case 2: // NewCPUId 351 if (auto E = 352 processFDRNewCPUIdRecord(State, RecordFirstByte, RecordExtractor)) 353 return E; 354 break; 355 case 3: // TSCWrap 356 if (auto E = 357 processFDRTSCWrapRecord(State, RecordFirstByte, RecordExtractor)) 358 return E; 359 break; 360 case 4: // WallTimeMarker 361 if (auto E = 362 processFDRWallTimeRecord(State, RecordFirstByte, RecordExtractor)) 363 return E; 364 break; 365 case 5: // CustomEventMarker 366 if (auto E = processCustomEventMarker(State, RecordFirstByte, 367 RecordExtractor, RecordSize)) 368 return E; 369 break; 370 case 6: // CallArgument 371 if (auto E = processFDRCallArgumentRecord(State, RecordFirstByte, 372 RecordExtractor, Records)) 373 return E; 374 break; 375 case 7: // BufferExtents 376 if (auto E = processBufferExtents(State, RecordFirstByte, RecordExtractor)) 377 return E; 378 break; 379 default: 380 // Widen the record type to uint16_t to prevent conversion to char. 381 return make_error<StringError>( 382 Twine("Illegal metadata record type: ") 383 .concat(Twine(static_cast<unsigned>(RecordKind))), 384 std::make_error_code(std::errc::executable_format_error)); 385 } 386 return Error::success(); 387 } 388 389 /// Reads a function record from an FDR format log, appending a new XRayRecord 390 /// to the vector being populated and updating the State with a new value 391 /// reference value to interpret TSC deltas. 392 /// 393 /// The XRayRecord constructed includes information from the function record 394 /// processed here as well as Thread ID and CPU ID formerly extracted into 395 /// State. 396 Error processFDRFunctionRecord(FDRState &State, uint8_t RecordFirstByte, 397 DataExtractor &RecordExtractor, 398 std::vector<XRayRecord> &Records) { 399 switch (State.Expects) { 400 case FDRState::Token::NEW_BUFFER_RECORD_OR_EOF: 401 return make_error<StringError>( 402 "Malformed log. Received Function Record before new buffer setup.", 403 std::make_error_code(std::errc::executable_format_error)); 404 case FDRState::Token::WALLCLOCK_RECORD: 405 return make_error<StringError>( 406 "Malformed log. Received Function Record when expecting wallclock.", 407 std::make_error_code(std::errc::executable_format_error)); 408 case FDRState::Token::NEW_CPU_ID_RECORD: 409 return make_error<StringError>( 410 "Malformed log. Received Function Record before first CPU record.", 411 std::make_error_code(std::errc::executable_format_error)); 412 default: 413 Records.emplace_back(); 414 auto &Record = Records.back(); 415 Record.RecordType = 0; // Record is type NORMAL. 416 // Strip off record type bit and use the next three bits. 417 uint8_t RecordType = (RecordFirstByte >> 1) & 0x07; 418 switch (RecordType) { 419 case static_cast<uint8_t>(RecordTypes::ENTER): 420 Record.Type = RecordTypes::ENTER; 421 break; 422 case static_cast<uint8_t>(RecordTypes::EXIT): 423 Record.Type = RecordTypes::EXIT; 424 break; 425 case static_cast<uint8_t>(RecordTypes::TAIL_EXIT): 426 Record.Type = RecordTypes::TAIL_EXIT; 427 break; 428 default: 429 // Cast to an unsigned integer to not interpret the record type as a char. 430 return make_error<StringError>( 431 Twine("Illegal function record type: ") 432 .concat(Twine(static_cast<unsigned>(RecordType))), 433 std::make_error_code(std::errc::executable_format_error)); 434 } 435 Record.CPU = State.CPUId; 436 Record.TId = State.ThreadId; 437 // Back up to read first 32 bits, including the 4 we pulled RecordType 438 // and RecordKind out of. The remaining 28 are FunctionId. 439 uint32_t OffsetPtr = 0; 440 // Despite function Id being a signed int on XRayRecord, 441 // when it is written to an FDR format, the top bits are truncated, 442 // so it is effectively an unsigned value. When we shift off the 443 // top four bits, we want the shift to be logical, so we read as 444 // uint32_t. 445 uint32_t FuncIdBitField = RecordExtractor.getU32(&OffsetPtr); 446 Record.FuncId = FuncIdBitField >> 4; 447 // FunctionRecords have a 32 bit delta from the previous absolute TSC 448 // or TSC delta. If this would overflow, we should read a TSCWrap record 449 // with an absolute TSC reading. 450 uint64_t NewTSC = State.BaseTSC + RecordExtractor.getU32(&OffsetPtr); 451 State.BaseTSC = NewTSC; 452 Record.TSC = NewTSC; 453 } 454 return Error::success(); 455 } 456 457 /// Reads a log in FDR mode for version 1 of this binary format. FDR mode is 458 /// defined as part of the compiler-rt project in xray_fdr_logging.h, and such 459 /// a log consists of the familiar 32 bit XRayHeader, followed by sequences of 460 /// of interspersed 16 byte Metadata Records and 8 byte Function Records. 461 /// 462 /// The following is an attempt to document the grammar of the format, which is 463 /// parsed by this function for little-endian machines. Since the format makes 464 /// use of BitFields, when we support big-endian architectures, we will need to 465 /// adjust not only the endianness parameter to llvm's RecordExtractor, but also 466 /// the bit twiddling logic, which is consistent with the little-endian 467 /// convention that BitFields within a struct will first be packed into the 468 /// least significant bits the address they belong to. 469 /// 470 /// We expect a format complying with the grammar in the following pseudo-EBNF 471 /// in Version 1 of the FDR log. 472 /// 473 /// FDRLog: XRayFileHeader ThreadBuffer* 474 /// XRayFileHeader: 32 bytes to identify the log as FDR with machine metadata. 475 /// Includes BufferSize 476 /// ThreadBuffer: NewBuffer WallClockTime NewCPUId FunctionSequence EOB 477 /// BufSize: 8 byte unsigned integer indicating how large the buffer is. 478 /// NewBuffer: 16 byte metadata record with Thread Id. 479 /// WallClockTime: 16 byte metadata record with human readable time. 480 /// NewCPUId: 16 byte metadata record with CPUId and a 64 bit TSC reading. 481 /// EOB: 16 byte record in a thread buffer plus mem garbage to fill BufSize. 482 /// FunctionSequence: NewCPUId | TSCWrap | FunctionRecord 483 /// TSCWrap: 16 byte metadata record with a full 64 bit TSC reading. 484 /// FunctionRecord: 8 byte record with FunctionId, entry/exit, and TSC delta. 485 /// 486 /// In Version 2, we make the following changes: 487 /// 488 /// ThreadBuffer: BufferExtents NewBuffer WallClockTime NewCPUId 489 /// FunctionSequence 490 /// BufferExtents: 16 byte metdata record describing how many usable bytes are 491 /// in the buffer. This is measured from the start of the buffer 492 /// and must always be at least 48 (bytes). 493 /// EOB: *deprecated* 494 Error loadFDRLog(StringRef Data, XRayFileHeader &FileHeader, 495 std::vector<XRayRecord> &Records) { 496 if (Data.size() < 32) 497 return make_error<StringError>( 498 "Not enough bytes for an XRay log.", 499 std::make_error_code(std::errc::invalid_argument)); 500 501 // For an FDR log, there are records sized 16 and 8 bytes. 502 // There actually may be no records if no non-trivial functions are 503 // instrumented. 504 if (Data.size() % 8 != 0) 505 return make_error<StringError>( 506 "Invalid-sized XRay data.", 507 std::make_error_code(std::errc::invalid_argument)); 508 509 if (auto E = readBinaryFormatHeader(Data, FileHeader)) 510 return E; 511 512 uint64_t BufferSize = 0; 513 { 514 StringRef ExtraDataRef(FileHeader.FreeFormData, 16); 515 DataExtractor ExtraDataExtractor(ExtraDataRef, true, 8); 516 uint32_t ExtraDataOffset = 0; 517 BufferSize = ExtraDataExtractor.getU64(&ExtraDataOffset); 518 } 519 520 FDRState::Token InitialExpectation; 521 switch (FileHeader.Version) { 522 case 1: 523 InitialExpectation = FDRState::Token::NEW_BUFFER_RECORD_OR_EOF; 524 break; 525 case 2: 526 InitialExpectation = FDRState::Token::BUFFER_EXTENTS; 527 break; 528 default: 529 return make_error<StringError>( 530 Twine("Unsupported version '") + Twine(FileHeader.Version) + "'", 531 std::make_error_code(std::errc::executable_format_error)); 532 } 533 FDRState State{0, 0, 0, InitialExpectation, BufferSize, 0}; 534 535 // RecordSize will tell the loop how far to seek ahead based on the record 536 // type that we have just read. 537 size_t RecordSize = 0; 538 for (auto S = Data.drop_front(32); !S.empty(); S = S.drop_front(RecordSize)) { 539 DataExtractor RecordExtractor(S, true, 8); 540 uint32_t OffsetPtr = 0; 541 if (State.Expects == FDRState::Token::SCAN_TO_END_OF_THREAD_BUF) { 542 RecordSize = State.CurrentBufferSize - State.CurrentBufferConsumed; 543 if (S.size() < RecordSize) { 544 return make_error<StringError>( 545 Twine("Incomplete thread buffer. Expected at least ") + 546 Twine(RecordSize) + " bytes but found " + Twine(S.size()), 547 make_error_code(std::errc::invalid_argument)); 548 } 549 State.CurrentBufferConsumed = 0; 550 State.Expects = FDRState::Token::NEW_BUFFER_RECORD_OR_EOF; 551 continue; 552 } 553 uint8_t BitField = RecordExtractor.getU8(&OffsetPtr); 554 bool isMetadataRecord = BitField & 0x01uL; 555 bool isBufferExtents = 556 (BitField >> 1) == 7; // BufferExtents record kind == 7 557 if (isMetadataRecord) { 558 RecordSize = 16; 559 if (auto E = 560 processFDRMetadataRecord(State, BitField, RecordExtractor, 561 RecordSize, Records, FileHeader.Version)) 562 return E; 563 } else { // Process Function Record 564 RecordSize = 8; 565 if (auto E = processFDRFunctionRecord(State, BitField, RecordExtractor, 566 Records)) 567 return E; 568 } 569 570 // The BufferExtents record is technically not part of the buffer, so we 571 // don't count the size of that record against the buffer's actual size. 572 if (!isBufferExtents) 573 State.CurrentBufferConsumed += RecordSize; 574 assert(State.CurrentBufferConsumed <= State.CurrentBufferSize); 575 if (FileHeader.Version == 2 && 576 State.CurrentBufferSize == State.CurrentBufferConsumed) { 577 // In Version 2 of the log, we don't need to scan to the end of the thread 578 // buffer if we've already consumed all the bytes we need to. 579 State.Expects = FDRState::Token::BUFFER_EXTENTS; 580 State.CurrentBufferSize = BufferSize; 581 State.CurrentBufferConsumed = 0; 582 } 583 } 584 585 // Having iterated over everything we've been given, we've either consumed 586 // everything and ended up in the end state, or were told to skip the rest. 587 bool Finished = State.Expects == FDRState::Token::SCAN_TO_END_OF_THREAD_BUF && 588 State.CurrentBufferSize == State.CurrentBufferConsumed; 589 if ((State.Expects != FDRState::Token::NEW_BUFFER_RECORD_OR_EOF && 590 State.Expects != FDRState::Token::BUFFER_EXTENTS) && 591 !Finished) 592 return make_error<StringError>( 593 Twine("Encountered EOF with unexpected state expectation ") + 594 fdrStateToTwine(State.Expects) + 595 ". Remaining expected bytes in thread buffer total " + 596 Twine(State.CurrentBufferSize - State.CurrentBufferConsumed), 597 std::make_error_code(std::errc::executable_format_error)); 598 599 return Error::success(); 600 } 601 602 Error loadYAMLLog(StringRef Data, XRayFileHeader &FileHeader, 603 std::vector<XRayRecord> &Records) { 604 YAMLXRayTrace Trace; 605 Input In(Data); 606 In >> Trace; 607 if (In.error()) 608 return make_error<StringError>("Failed loading YAML Data.", In.error()); 609 610 FileHeader.Version = Trace.Header.Version; 611 FileHeader.Type = Trace.Header.Type; 612 FileHeader.ConstantTSC = Trace.Header.ConstantTSC; 613 FileHeader.NonstopTSC = Trace.Header.NonstopTSC; 614 FileHeader.CycleFrequency = Trace.Header.CycleFrequency; 615 616 if (FileHeader.Version != 1) 617 return make_error<StringError>( 618 Twine("Unsupported XRay file version: ") + Twine(FileHeader.Version), 619 std::make_error_code(std::errc::invalid_argument)); 620 621 Records.clear(); 622 std::transform(Trace.Records.begin(), Trace.Records.end(), 623 std::back_inserter(Records), [&](const YAMLXRayRecord &R) { 624 return XRayRecord{R.RecordType, R.CPU, R.Type, R.FuncId, 625 R.TSC, R.TId, R.CallArgs}; 626 }); 627 return Error::success(); 628 } 629 } // namespace 630 631 Expected<Trace> llvm::xray::loadTraceFile(StringRef Filename, bool Sort) { 632 int Fd; 633 if (auto EC = sys::fs::openFileForRead(Filename, Fd)) { 634 return make_error<StringError>( 635 Twine("Cannot read log from '") + Filename + "'", EC); 636 } 637 638 uint64_t FileSize; 639 if (auto EC = sys::fs::file_size(Filename, FileSize)) { 640 return make_error<StringError>( 641 Twine("Cannot read log from '") + Filename + "'", EC); 642 } 643 if (FileSize < 4) { 644 return make_error<StringError>( 645 Twine("File '") + Filename + "' too small for XRay.", 646 std::make_error_code(std::errc::executable_format_error)); 647 } 648 649 // Map the opened file into memory and use a StringRef to access it later. 650 std::error_code EC; 651 sys::fs::mapped_file_region MappedFile( 652 Fd, sys::fs::mapped_file_region::mapmode::readonly, FileSize, 0, EC); 653 if (EC) { 654 return make_error<StringError>( 655 Twine("Cannot read log from '") + Filename + "'", EC); 656 } 657 auto Data = StringRef(MappedFile.data(), MappedFile.size()); 658 659 // Attempt to detect the file type using file magic. We have a slight bias 660 // towards the binary format, and we do this by making sure that the first 4 661 // bytes of the binary file is some combination of the following byte 662 // patterns: (observe the code loading them assumes they're little endian) 663 // 664 // 0x01 0x00 0x00 0x00 - version 1, "naive" format 665 // 0x01 0x00 0x01 0x00 - version 1, "flight data recorder" format 666 // 0x02 0x00 0x01 0x00 - version 2, "flight data recorder" format 667 // 668 // YAML files don't typically have those first four bytes as valid text so we 669 // try loading assuming YAML if we don't find these bytes. 670 // 671 // Only if we can't load either the binary or the YAML format will we yield an 672 // error. 673 StringRef Magic(MappedFile.data(), 4); 674 DataExtractor HeaderExtractor(Magic, true, 8); 675 uint32_t OffsetPtr = 0; 676 uint16_t Version = HeaderExtractor.getU16(&OffsetPtr); 677 uint16_t Type = HeaderExtractor.getU16(&OffsetPtr); 678 679 enum BinaryFormatType { NAIVE_FORMAT = 0, FLIGHT_DATA_RECORDER_FORMAT = 1 }; 680 681 Trace T; 682 switch (Type) { 683 case NAIVE_FORMAT: 684 if (Version == 1 || Version == 2) { 685 if (auto E = loadNaiveFormatLog(Data, T.FileHeader, T.Records)) 686 return std::move(E); 687 } else { 688 return make_error<StringError>( 689 Twine("Unsupported version for Basic/Naive Mode logging: ") + 690 Twine(Version), 691 std::make_error_code(std::errc::executable_format_error)); 692 } 693 break; 694 case FLIGHT_DATA_RECORDER_FORMAT: 695 if (Version == 1 || Version == 2) { 696 if (auto E = loadFDRLog(Data, T.FileHeader, T.Records)) 697 return std::move(E); 698 } else { 699 return make_error<StringError>( 700 Twine("Unsupported version for FDR Mode logging: ") + Twine(Version), 701 std::make_error_code(std::errc::executable_format_error)); 702 } 703 break; 704 default: 705 if (auto E = loadYAMLLog(Data, T.FileHeader, T.Records)) 706 return std::move(E); 707 } 708 709 if (Sort) 710 std::stable_sort(T.Records.begin(), T.Records.end(), 711 [&](const XRayRecord &L, const XRayRecord &R) { 712 return L.TSC < R.TSC; 713 }); 714 715 return std::move(T); 716 } 717