summaryrefslogtreecommitdiffstats
path: root/gnu/llvm/lib/XRay/Trace.cpp
diff options
context:
space:
mode:
authorpatrick <patrick@openbsd.org>2019-06-23 21:36:31 +0000
committerpatrick <patrick@openbsd.org>2019-06-23 21:36:31 +0000
commit23f101f37937a1bd4a29726cab2f76e0fb038b35 (patch)
treef7da7d6b32c2e07114da399150bfa88d72187012 /gnu/llvm/lib/XRay/Trace.cpp
parentsort previous; ok deraadt (diff)
downloadwireguard-openbsd-23f101f37937a1bd4a29726cab2f76e0fb038b35.tar.xz
wireguard-openbsd-23f101f37937a1bd4a29726cab2f76e0fb038b35.zip
Import LLVM 8.0.0 release including clang, lld and lldb.
Diffstat (limited to 'gnu/llvm/lib/XRay/Trace.cpp')
-rw-r--r--gnu/llvm/lib/XRay/Trace.cpp736
1 files changed, 221 insertions, 515 deletions
diff --git a/gnu/llvm/lib/XRay/Trace.cpp b/gnu/llvm/lib/XRay/Trace.cpp
index a8764b25483..4f28f3f754c 100644
--- a/gnu/llvm/lib/XRay/Trace.cpp
+++ b/gnu/llvm/lib/XRay/Trace.cpp
@@ -15,7 +15,16 @@
#include "llvm/Support/DataExtractor.h"
#include "llvm/Support/Error.h"
#include "llvm/Support/FileSystem.h"
+#include "llvm/XRay/BlockIndexer.h"
+#include "llvm/XRay/BlockVerifier.h"
+#include "llvm/XRay/FDRRecordConsumer.h"
+#include "llvm/XRay/FDRRecordProducer.h"
+#include "llvm/XRay/FDRRecords.h"
+#include "llvm/XRay/FDRTraceExpander.h"
+#include "llvm/XRay/FileHeaderReader.h"
#include "llvm/XRay/YAMLXRayRecord.h"
+#include <memory>
+#include <vector>
using namespace llvm;
using namespace llvm::xray;
@@ -25,38 +34,8 @@ namespace {
using XRayRecordStorage =
std::aligned_storage<sizeof(XRayRecord), alignof(XRayRecord)>::type;
-// Populates the FileHeader reference by reading the first 32 bytes of the file.
-Error readBinaryFormatHeader(StringRef Data, XRayFileHeader &FileHeader) {
- // FIXME: Maybe deduce whether the data is little or big-endian using some
- // magic bytes in the beginning of the file?
-
- // First 32 bytes of the file will always be the header. We assume a certain
- // format here:
- //
- // (2) uint16 : version
- // (2) uint16 : type
- // (4) uint32 : bitfield
- // (8) uint64 : cycle frequency
- // (16) - : padding
-
- DataExtractor HeaderExtractor(Data, true, 8);
- uint32_t OffsetPtr = 0;
- FileHeader.Version = HeaderExtractor.getU16(&OffsetPtr);
- FileHeader.Type = HeaderExtractor.getU16(&OffsetPtr);
- uint32_t Bitfield = HeaderExtractor.getU32(&OffsetPtr);
- FileHeader.ConstantTSC = Bitfield & 1uL;
- FileHeader.NonstopTSC = Bitfield & 1uL << 1;
- FileHeader.CycleFrequency = HeaderExtractor.getU64(&OffsetPtr);
- std::memcpy(&FileHeader.FreeFormData, Data.bytes_begin() + OffsetPtr, 16);
- if (FileHeader.Version != 1 && FileHeader.Version != 2 &&
- FileHeader.Version != 3)
- return make_error<StringError>(
- Twine("Unsupported XRay file version: ") + Twine(FileHeader.Version),
- std::make_error_code(std::errc::invalid_argument));
- return Error::success();
-}
-
-Error loadNaiveFormatLog(StringRef Data, XRayFileHeader &FileHeader,
+Error loadNaiveFormatLog(StringRef Data, bool IsLittleEndian,
+ XRayFileHeader &FileHeader,
std::vector<XRayRecord> &Records) {
if (Data.size() < 32)
return make_error<StringError>(
@@ -68,8 +47,12 @@ Error loadNaiveFormatLog(StringRef Data, XRayFileHeader &FileHeader,
"Invalid-sized XRay data.",
std::make_error_code(std::errc::invalid_argument));
- if (auto E = readBinaryFormatHeader(Data, FileHeader))
- return E;
+ DataExtractor Reader(Data, IsLittleEndian, 8);
+ uint32_t OffsetPtr = 0;
+ auto FileHeaderOrError = readBinaryFormatHeader(Reader, OffsetPtr);
+ if (!FileHeaderOrError)
+ return FileHeaderOrError.takeError();
+ FileHeader = std::move(FileHeaderOrError.get());
// Each record after the header will be 32 bytes, in the following format:
//
@@ -81,16 +64,38 @@ Error loadNaiveFormatLog(StringRef Data, XRayFileHeader &FileHeader,
// (4) uint32 : thread id
// (4) uint32 : process id
// (8) - : padding
- for (auto S = Data.drop_front(32); !S.empty(); S = S.drop_front(32)) {
- DataExtractor RecordExtractor(S, true, 8);
- uint32_t OffsetPtr = 0;
- switch (auto RecordType = RecordExtractor.getU16(&OffsetPtr)) {
+ while (Reader.isValidOffset(OffsetPtr)) {
+ if (!Reader.isValidOffsetForDataOfSize(OffsetPtr, 32))
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Not enough bytes to read a full record at offset %d.", OffsetPtr);
+ auto PreReadOffset = OffsetPtr;
+ auto RecordType = Reader.getU16(&OffsetPtr);
+ if (OffsetPtr == PreReadOffset)
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Failed reading record type at offset %d.", OffsetPtr);
+
+ switch (RecordType) {
case 0: { // Normal records.
Records.emplace_back();
auto &Record = Records.back();
Record.RecordType = RecordType;
- Record.CPU = RecordExtractor.getU8(&OffsetPtr);
- auto Type = RecordExtractor.getU8(&OffsetPtr);
+
+ PreReadOffset = OffsetPtr;
+ Record.CPU = Reader.getU8(&OffsetPtr);
+ if (OffsetPtr == PreReadOffset)
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Failed reading CPU field at offset %d.", OffsetPtr);
+
+ PreReadOffset = OffsetPtr;
+ auto Type = Reader.getU8(&OffsetPtr);
+ if (OffsetPtr == PreReadOffset)
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Failed reading record type field at offset %d.", OffsetPtr);
+
switch (Type) {
case 0:
Record.Type = RecordTypes::ENTER;
@@ -105,393 +110,96 @@ Error loadNaiveFormatLog(StringRef Data, XRayFileHeader &FileHeader,
Record.Type = RecordTypes::ENTER_ARG;
break;
default:
- return make_error<StringError>(
- Twine("Unknown record type '") + Twine(int{Type}) + "'",
- std::make_error_code(std::errc::executable_format_error));
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Unknown record type '%d' at offset %d.", Type, OffsetPtr);
}
- Record.FuncId = RecordExtractor.getSigned(&OffsetPtr, sizeof(int32_t));
- Record.TSC = RecordExtractor.getU64(&OffsetPtr);
- Record.TId = RecordExtractor.getU32(&OffsetPtr);
- Record.PId = RecordExtractor.getU32(&OffsetPtr);
+
+ PreReadOffset = OffsetPtr;
+ Record.FuncId = Reader.getSigned(&OffsetPtr, sizeof(int32_t));
+ if (OffsetPtr == PreReadOffset)
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Failed reading function id field at offset %d.", OffsetPtr);
+
+ PreReadOffset = OffsetPtr;
+ Record.TSC = Reader.getU64(&OffsetPtr);
+ if (OffsetPtr == PreReadOffset)
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Failed reading TSC field at offset %d.", OffsetPtr);
+
+ PreReadOffset = OffsetPtr;
+ Record.TId = Reader.getU32(&OffsetPtr);
+ if (OffsetPtr == PreReadOffset)
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Failed reading thread id field at offset %d.", OffsetPtr);
+
+ PreReadOffset = OffsetPtr;
+ Record.PId = Reader.getU32(&OffsetPtr);
+ if (OffsetPtr == PreReadOffset)
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Failed reading process id at offset %d.", OffsetPtr);
+
break;
}
case 1: { // Arg payload record.
auto &Record = Records.back();
- // Advance two bytes to avoid padding.
+
+ // We skip the next two bytes of the record, because we don't need the
+ // type and the CPU record for arg payloads.
OffsetPtr += 2;
- int32_t FuncId = RecordExtractor.getSigned(&OffsetPtr, sizeof(int32_t));
- auto TId = RecordExtractor.getU32(&OffsetPtr);
- auto PId = RecordExtractor.getU32(&OffsetPtr);
+ PreReadOffset = OffsetPtr;
+ int32_t FuncId = Reader.getSigned(&OffsetPtr, sizeof(int32_t));
+ if (OffsetPtr == PreReadOffset)
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Failed reading function id field at offset %d.", OffsetPtr);
+
+ PreReadOffset = OffsetPtr;
+ auto TId = Reader.getU32(&OffsetPtr);
+ if (OffsetPtr == PreReadOffset)
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Failed reading thread id field at offset %d.", OffsetPtr);
+
+ PreReadOffset = OffsetPtr;
+ auto PId = Reader.getU32(&OffsetPtr);
+ if (OffsetPtr == PreReadOffset)
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Failed reading process id field at offset %d.", OffsetPtr);
// Make a check for versions above 3 for the Pid field
if (Record.FuncId != FuncId || Record.TId != TId ||
(FileHeader.Version >= 3 ? Record.PId != PId : false))
- return make_error<StringError>(
- Twine("Corrupted log, found arg payload following non-matching "
- "function + thread record. Record for function ") +
- Twine(Record.FuncId) + " != " + Twine(FuncId) + "; offset: " +
- Twine(S.data() - Data.data()),
- std::make_error_code(std::errc::executable_format_error));
-
- auto Arg = RecordExtractor.getU64(&OffsetPtr);
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Corrupted log, found arg payload following non-matching "
+ "function+thread record. Record for function %d != %d at offset "
+ "%d",
+ Record.FuncId, FuncId, OffsetPtr);
+
+ PreReadOffset = OffsetPtr;
+ auto Arg = Reader.getU64(&OffsetPtr);
+ if (OffsetPtr == PreReadOffset)
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Failed reading argument payload at offset %d.", OffsetPtr);
+
Record.CallArgs.push_back(Arg);
break;
}
default:
- return make_error<StringError>(
- Twine("Unknown record type == ") + Twine(RecordType),
- std::make_error_code(std::errc::executable_format_error));
+ return createStringError(
+ std::make_error_code(std::errc::executable_format_error),
+ "Unknown record type '%d' at offset %d.", RecordType, OffsetPtr);
}
- }
- return Error::success();
-}
-
-/// When reading from a Flight Data Recorder mode log, metadata records are
-/// sparse compared to packed function records, so we must maintain state as we
-/// read through the sequence of entries. This allows the reader to denormalize
-/// the CPUId and Thread Id onto each Function Record and transform delta
-/// encoded TSC values into absolute encodings on each record.
-struct FDRState {
- uint16_t CPUId;
- uint16_t ThreadId;
- int32_t ProcessId;
- uint64_t BaseTSC;
-
- /// Encode some of the state transitions for the FDR log reader as explicit
- /// checks. These are expectations for the next Record in the stream.
- enum class Token {
- NEW_BUFFER_RECORD_OR_EOF,
- WALLCLOCK_RECORD,
- NEW_CPU_ID_RECORD,
- FUNCTION_SEQUENCE,
- SCAN_TO_END_OF_THREAD_BUF,
- CUSTOM_EVENT_DATA,
- CALL_ARGUMENT,
- BUFFER_EXTENTS,
- PID_RECORD,
- };
- Token Expects;
-
- // Each threads buffer may have trailing garbage to scan over, so we track our
- // progress.
- uint64_t CurrentBufferSize;
- uint64_t CurrentBufferConsumed;
-};
-
-const char *fdrStateToTwine(const FDRState::Token &state) {
- switch (state) {
- case FDRState::Token::NEW_BUFFER_RECORD_OR_EOF:
- return "NEW_BUFFER_RECORD_OR_EOF";
- case FDRState::Token::WALLCLOCK_RECORD:
- return "WALLCLOCK_RECORD";
- case FDRState::Token::NEW_CPU_ID_RECORD:
- return "NEW_CPU_ID_RECORD";
- case FDRState::Token::FUNCTION_SEQUENCE:
- return "FUNCTION_SEQUENCE";
- case FDRState::Token::SCAN_TO_END_OF_THREAD_BUF:
- return "SCAN_TO_END_OF_THREAD_BUF";
- case FDRState::Token::CUSTOM_EVENT_DATA:
- return "CUSTOM_EVENT_DATA";
- case FDRState::Token::CALL_ARGUMENT:
- return "CALL_ARGUMENT";
- case FDRState::Token::BUFFER_EXTENTS:
- return "BUFFER_EXTENTS";
- case FDRState::Token::PID_RECORD:
- return "PID_RECORD";
- }
- return "UNKNOWN";
-}
-
-/// State transition when a NewBufferRecord is encountered.
-Error processFDRNewBufferRecord(FDRState &State, uint8_t RecordFirstByte,
- DataExtractor &RecordExtractor) {
-
- if (State.Expects != FDRState::Token::NEW_BUFFER_RECORD_OR_EOF)
- return make_error<StringError>(
- Twine("Malformed log. Read New Buffer record kind out of sequence; "
- "expected: ") +
- fdrStateToTwine(State.Expects),
- std::make_error_code(std::errc::executable_format_error));
- uint32_t OffsetPtr = 1; // 1 byte into record.
- State.ThreadId = RecordExtractor.getU16(&OffsetPtr);
- State.Expects = FDRState::Token::WALLCLOCK_RECORD;
- return Error::success();
-}
-
-/// State transition when an EndOfBufferRecord is encountered.
-Error processFDREndOfBufferRecord(FDRState &State, uint8_t RecordFirstByte,
- DataExtractor &RecordExtractor) {
- if (State.Expects == FDRState::Token::NEW_BUFFER_RECORD_OR_EOF)
- return make_error<StringError>(
- Twine("Malformed log. Received EOB message without current buffer; "
- "expected: ") +
- fdrStateToTwine(State.Expects),
- std::make_error_code(std::errc::executable_format_error));
- State.Expects = FDRState::Token::SCAN_TO_END_OF_THREAD_BUF;
- return Error::success();
-}
-
-/// State transition when a NewCPUIdRecord is encountered.
-Error processFDRNewCPUIdRecord(FDRState &State, uint8_t RecordFirstByte,
- DataExtractor &RecordExtractor) {
- if (State.Expects != FDRState::Token::FUNCTION_SEQUENCE &&
- State.Expects != FDRState::Token::NEW_CPU_ID_RECORD)
- return make_error<StringError>(
- Twine("Malformed log. Read NewCPUId record kind out of sequence; "
- "expected: ") +
- fdrStateToTwine(State.Expects),
- std::make_error_code(std::errc::executable_format_error));
- uint32_t OffsetPtr = 1; // Read starting after the first byte.
- State.CPUId = RecordExtractor.getU16(&OffsetPtr);
- State.BaseTSC = RecordExtractor.getU64(&OffsetPtr);
- State.Expects = FDRState::Token::FUNCTION_SEQUENCE;
- return Error::success();
-}
-
-/// State transition when a TSCWrapRecord (overflow detection) is encountered.
-Error processFDRTSCWrapRecord(FDRState &State, uint8_t RecordFirstByte,
- DataExtractor &RecordExtractor) {
- if (State.Expects != FDRState::Token::FUNCTION_SEQUENCE)
- return make_error<StringError>(
- Twine("Malformed log. Read TSCWrap record kind out of sequence; "
- "expecting: ") +
- fdrStateToTwine(State.Expects),
- std::make_error_code(std::errc::executable_format_error));
- uint32_t OffsetPtr = 1; // Read starting after the first byte.
- State.BaseTSC = RecordExtractor.getU64(&OffsetPtr);
- return Error::success();
-}
-
-/// State transition when a WallTimeMarkerRecord is encountered.
-Error processFDRWallTimeRecord(FDRState &State, uint8_t RecordFirstByte,
- DataExtractor &RecordExtractor) {
- if (State.Expects != FDRState::Token::WALLCLOCK_RECORD)
- return make_error<StringError>(
- Twine("Malformed log. Read Wallclock record kind out of sequence; "
- "expecting: ") +
- fdrStateToTwine(State.Expects),
- std::make_error_code(std::errc::executable_format_error));
-
- // TODO: Someday, reconcile the TSC ticks to wall clock time for presentation
- // purposes. For now, we're ignoring these records.
- State.Expects = FDRState::Token::NEW_CPU_ID_RECORD;
- return Error::success();
-}
-
-/// State transition when a PidRecord is encountered.
-Error processFDRPidRecord(FDRState &State, uint8_t RecordFirstByte,
- DataExtractor &RecordExtractor) {
-
- if (State.Expects != FDRState::Token::PID_RECORD)
- return make_error<StringError>(
- Twine("Malformed log. Read Pid record kind out of sequence; "
- "expected: ") +
- fdrStateToTwine(State.Expects),
- std::make_error_code(std::errc::executable_format_error));
-
- uint32_t OffsetPtr = 1; // Read starting after the first byte.
- State.ProcessId = RecordExtractor.getU32(&OffsetPtr);
- State.Expects = FDRState::Token::NEW_CPU_ID_RECORD;
- return Error::success();
-}
-
-/// State transition when a CustomEventMarker is encountered.
-Error processCustomEventMarker(FDRState &State, uint8_t RecordFirstByte,
- DataExtractor &RecordExtractor,
- size_t &RecordSize) {
- // We can encounter a CustomEventMarker anywhere in the log, so we can handle
- // it regardless of the expectation. However, we do set the expectation to
- // read a set number of fixed bytes, as described in the metadata.
- uint32_t OffsetPtr = 1; // Read after the first byte.
- uint32_t DataSize = RecordExtractor.getU32(&OffsetPtr);
- uint64_t TSC = RecordExtractor.getU64(&OffsetPtr);
-
- // FIXME: Actually represent the record through the API. For now we only
- // skip through the data.
- (void)TSC;
- RecordSize = 16 + DataSize;
- return Error::success();
-}
-
-/// State transition when an BufferExtents record is encountered.
-Error processBufferExtents(FDRState &State, uint8_t RecordFirstByte,
- DataExtractor &RecordExtractor) {
- if (State.Expects != FDRState::Token::BUFFER_EXTENTS)
- return make_error<StringError>(
- Twine("Malformed log. Buffer Extents unexpected; expected: ") +
- fdrStateToTwine(State.Expects),
- std::make_error_code(std::errc::executable_format_error));
- uint32_t OffsetPtr = 1; // Read after the first byte.
- State.CurrentBufferSize = RecordExtractor.getU64(&OffsetPtr);
- State.Expects = FDRState::Token::NEW_BUFFER_RECORD_OR_EOF;
- return Error::success();
-}
-
-/// State transition when a CallArgumentRecord is encountered.
-Error processFDRCallArgumentRecord(FDRState &State, uint8_t RecordFirstByte,
- DataExtractor &RecordExtractor,
- std::vector<XRayRecord> &Records) {
- uint32_t OffsetPtr = 1; // Read starting after the first byte.
- auto &Enter = Records.back();
-
- if (Enter.Type != RecordTypes::ENTER)
- return make_error<StringError>(
- "CallArgument needs to be right after a function entry",
- std::make_error_code(std::errc::executable_format_error));
- Enter.Type = RecordTypes::ENTER_ARG;
- Enter.CallArgs.emplace_back(RecordExtractor.getU64(&OffsetPtr));
- return Error::success();
-}
-
-/// Advances the state machine for reading the FDR record type by reading one
-/// Metadata Record and updating the State appropriately based on the kind of
-/// record encountered. The RecordKind is encoded in the first byte of the
-/// Record, which the caller should pass in because they have already read it
-/// to determine that this is a metadata record as opposed to a function record.
-///
-/// Beginning with Version 2 of the FDR log, we do not depend on the size of the
-/// buffer, but rather use the extents to determine how far to read in the log
-/// for this particular buffer.
-///
-/// In Version 3, FDR log now includes a pid metadata record after
-/// WallTimeMarker
-Error processFDRMetadataRecord(FDRState &State, uint8_t RecordFirstByte,
- DataExtractor &RecordExtractor,
- size_t &RecordSize,
- std::vector<XRayRecord> &Records,
- uint16_t Version) {
- // The remaining 7 bits are the RecordKind enum.
- uint8_t RecordKind = RecordFirstByte >> 1;
- switch (RecordKind) {
- case 0: // NewBuffer
- if (auto E =
- processFDRNewBufferRecord(State, RecordFirstByte, RecordExtractor))
- return E;
- break;
- case 1: // EndOfBuffer
- if (Version >= 2)
- return make_error<StringError>(
- "Since Version 2 of FDR logging, we no longer support EOB records.",
- std::make_error_code(std::errc::executable_format_error));
- if (auto E = processFDREndOfBufferRecord(State, RecordFirstByte,
- RecordExtractor))
- return E;
- break;
- case 2: // NewCPUId
- if (auto E =
- processFDRNewCPUIdRecord(State, RecordFirstByte, RecordExtractor))
- return E;
- break;
- case 3: // TSCWrap
- if (auto E =
- processFDRTSCWrapRecord(State, RecordFirstByte, RecordExtractor))
- return E;
- break;
- case 4: // WallTimeMarker
- if (auto E =
- processFDRWallTimeRecord(State, RecordFirstByte, RecordExtractor))
- return E;
- // In Version 3 and and above, a PidRecord is expected after WallTimeRecord
- if (Version >= 3)
- State.Expects = FDRState::Token::PID_RECORD;
- break;
- case 5: // CustomEventMarker
- if (auto E = processCustomEventMarker(State, RecordFirstByte,
- RecordExtractor, RecordSize))
- return E;
- break;
- case 6: // CallArgument
- if (auto E = processFDRCallArgumentRecord(State, RecordFirstByte,
- RecordExtractor, Records))
- return E;
- break;
- case 7: // BufferExtents
- if (auto E = processBufferExtents(State, RecordFirstByte, RecordExtractor))
- return E;
- break;
- case 9: // Pid
- if (auto E = processFDRPidRecord(State, RecordFirstByte, RecordExtractor))
- return E;
- break;
- default:
- // Widen the record type to uint16_t to prevent conversion to char.
- return make_error<StringError>(
- Twine("Illegal metadata record type: ")
- .concat(Twine(static_cast<unsigned>(RecordKind))),
- std::make_error_code(std::errc::executable_format_error));
- }
- return Error::success();
-}
-
-/// Reads a function record from an FDR format log, appending a new XRayRecord
-/// to the vector being populated and updating the State with a new value
-/// reference value to interpret TSC deltas.
-///
-/// The XRayRecord constructed includes information from the function record
-/// processed here as well as Thread ID and CPU ID formerly extracted into
-/// State.
-Error processFDRFunctionRecord(FDRState &State, uint8_t RecordFirstByte,
- DataExtractor &RecordExtractor,
- std::vector<XRayRecord> &Records) {
- switch (State.Expects) {
- case FDRState::Token::NEW_BUFFER_RECORD_OR_EOF:
- return make_error<StringError>(
- "Malformed log. Received Function Record before new buffer setup.",
- std::make_error_code(std::errc::executable_format_error));
- case FDRState::Token::WALLCLOCK_RECORD:
- return make_error<StringError>(
- "Malformed log. Received Function Record when expecting wallclock.",
- std::make_error_code(std::errc::executable_format_error));
- case FDRState::Token::PID_RECORD:
- return make_error<StringError>(
- "Malformed log. Received Function Record when expecting pid.",
- std::make_error_code(std::errc::executable_format_error));
- case FDRState::Token::NEW_CPU_ID_RECORD:
- return make_error<StringError>(
- "Malformed log. Received Function Record before first CPU record.",
- std::make_error_code(std::errc::executable_format_error));
- default:
- Records.emplace_back();
- auto &Record = Records.back();
- Record.RecordType = 0; // Record is type NORMAL.
- // Strip off record type bit and use the next three bits.
- uint8_t RecordType = (RecordFirstByte >> 1) & 0x07;
- switch (RecordType) {
- case static_cast<uint8_t>(RecordTypes::ENTER):
- Record.Type = RecordTypes::ENTER;
- break;
- case static_cast<uint8_t>(RecordTypes::EXIT):
- Record.Type = RecordTypes::EXIT;
- break;
- case static_cast<uint8_t>(RecordTypes::TAIL_EXIT):
- Record.Type = RecordTypes::TAIL_EXIT;
- break;
- default:
- // Cast to an unsigned integer to not interpret the record type as a char.
- return make_error<StringError>(
- Twine("Illegal function record type: ")
- .concat(Twine(static_cast<unsigned>(RecordType))),
- std::make_error_code(std::errc::executable_format_error));
- }
- Record.CPU = State.CPUId;
- Record.TId = State.ThreadId;
- Record.PId = State.ProcessId;
- // Back up to read first 32 bits, including the 4 we pulled RecordType
- // and RecordKind out of. The remaining 28 are FunctionId.
- uint32_t OffsetPtr = 0;
- // Despite function Id being a signed int on XRayRecord,
- // when it is written to an FDR format, the top bits are truncated,
- // so it is effectively an unsigned value. When we shift off the
- // top four bits, we want the shift to be logical, so we read as
- // uint32_t.
- uint32_t FuncIdBitField = RecordExtractor.getU32(&OffsetPtr);
- Record.FuncId = FuncIdBitField >> 4;
- // FunctionRecords have a 32 bit delta from the previous absolute TSC
- // or TSC delta. If this would overflow, we should read a TSCWrap record
- // with an absolute TSC reading.
- uint64_t NewTSC = State.BaseTSC + RecordExtractor.getU32(&OffsetPtr);
- State.BaseTSC = NewTSC;
- Record.TSC = NewTSC;
+ // Advance the offset pointer enough bytes to align to 32-byte records for
+ // basic mode logs.
+ OffsetPtr += 8;
}
return Error::success();
}
@@ -539,112 +247,97 @@ Error processFDRFunctionRecord(FDRState &State, uint8_t RecordFirstByte,
/// ThreadBuffer: BufferExtents NewBuffer WallClockTime Pid NewCPUId
/// FunctionSequence
/// EOB: *deprecated*
-Error loadFDRLog(StringRef Data, XRayFileHeader &FileHeader,
- std::vector<XRayRecord> &Records) {
+///
+/// In Version 4, we make the following changes:
+///
+/// CustomEventRecord now includes the CPU data.
+///
+/// In Version 5, we make the following changes:
+///
+/// CustomEventRecord and TypedEventRecord now use TSC delta encoding similar to
+/// what FunctionRecord instances use, and we no longer need to include the CPU
+/// id in the CustomEventRecord.
+///
+Error loadFDRLog(StringRef Data, bool IsLittleEndian,
+ XRayFileHeader &FileHeader, std::vector<XRayRecord> &Records) {
+
if (Data.size() < 32)
- return make_error<StringError>(
- "Not enough bytes for an XRay log.",
- std::make_error_code(std::errc::invalid_argument));
+ return createStringError(std::make_error_code(std::errc::invalid_argument),
+ "Not enough bytes for an XRay FDR log.");
+ DataExtractor DE(Data, IsLittleEndian, 8);
- // For an FDR log, there are records sized 16 and 8 bytes.
- // There actually may be no records if no non-trivial functions are
- // instrumented.
- if (Data.size() % 8 != 0)
- return make_error<StringError>(
- "Invalid-sized XRay data.",
- std::make_error_code(std::errc::invalid_argument));
+ uint32_t OffsetPtr = 0;
+ auto FileHeaderOrError = readBinaryFormatHeader(DE, OffsetPtr);
+ if (!FileHeaderOrError)
+ return FileHeaderOrError.takeError();
+ FileHeader = std::move(FileHeaderOrError.get());
- if (auto E = readBinaryFormatHeader(Data, FileHeader))
- return E;
+ // First we load the records into memory.
+ std::vector<std::unique_ptr<Record>> FDRRecords;
- uint64_t BufferSize = 0;
{
- StringRef ExtraDataRef(FileHeader.FreeFormData, 16);
- DataExtractor ExtraDataExtractor(ExtraDataRef, true, 8);
- uint32_t ExtraDataOffset = 0;
- BufferSize = ExtraDataExtractor.getU64(&ExtraDataOffset);
+ FileBasedRecordProducer P(FileHeader, DE, OffsetPtr);
+ LogBuilderConsumer C(FDRRecords);
+ while (DE.isValidOffsetForDataOfSize(OffsetPtr, 1)) {
+ auto R = P.produce();
+ if (!R)
+ return R.takeError();
+ if (auto E = C.consume(std::move(R.get())))
+ return E;
+ }
}
- FDRState::Token InitialExpectation;
- switch (FileHeader.Version) {
- case 1:
- InitialExpectation = FDRState::Token::NEW_BUFFER_RECORD_OR_EOF;
- break;
- case 2:
- case 3:
- InitialExpectation = FDRState::Token::BUFFER_EXTENTS;
- break;
- default:
- return make_error<StringError>(
- Twine("Unsupported version '") + Twine(FileHeader.Version) + "'",
- std::make_error_code(std::errc::executable_format_error));
+ // Next we index the records into blocks.
+ BlockIndexer::Index Index;
+ {
+ BlockIndexer Indexer(Index);
+ for (auto &R : FDRRecords)
+ if (auto E = R->apply(Indexer))
+ return E;
+ if (auto E = Indexer.flush())
+ return E;
}
- FDRState State{0, 0, 0, 0, InitialExpectation, BufferSize, 0};
-
- // RecordSize will tell the loop how far to seek ahead based on the record
- // type that we have just read.
- size_t RecordSize = 0;
- for (auto S = Data.drop_front(32); !S.empty(); S = S.drop_front(RecordSize)) {
- DataExtractor RecordExtractor(S, true, 8);
- uint32_t OffsetPtr = 0;
- if (State.Expects == FDRState::Token::SCAN_TO_END_OF_THREAD_BUF) {
- RecordSize = State.CurrentBufferSize - State.CurrentBufferConsumed;
- if (S.size() < RecordSize) {
- return make_error<StringError>(
- Twine("Incomplete thread buffer. Expected at least ") +
- Twine(RecordSize) + " bytes but found " + Twine(S.size()),
- make_error_code(std::errc::invalid_argument));
+
+ // Then we verify the consistency of the blocks.
+ {
+ for (auto &PTB : Index) {
+ auto &Blocks = PTB.second;
+ for (auto &B : Blocks) {
+ BlockVerifier Verifier;
+ for (auto *R : B.Records)
+ if (auto E = R->apply(Verifier))
+ return E;
+ if (auto E = Verifier.verify())
+ return E;
}
- State.CurrentBufferConsumed = 0;
- State.Expects = FDRState::Token::NEW_BUFFER_RECORD_OR_EOF;
- continue;
- }
- uint8_t BitField = RecordExtractor.getU8(&OffsetPtr);
- bool isMetadataRecord = BitField & 0x01uL;
- bool isBufferExtents =
- (BitField >> 1) == 7; // BufferExtents record kind == 7
- if (isMetadataRecord) {
- RecordSize = 16;
- if (auto E =
- processFDRMetadataRecord(State, BitField, RecordExtractor,
- RecordSize, Records, FileHeader.Version))
- return E;
- } else { // Process Function Record
- RecordSize = 8;
- if (auto E = processFDRFunctionRecord(State, BitField, RecordExtractor,
- Records))
- return E;
}
+ }
- // The BufferExtents record is technically not part of the buffer, so we
- // don't count the size of that record against the buffer's actual size.
- if (!isBufferExtents)
- State.CurrentBufferConsumed += RecordSize;
- assert(State.CurrentBufferConsumed <= State.CurrentBufferSize);
- if ((FileHeader.Version == 2 || FileHeader.Version == 3) &&
- State.CurrentBufferSize == State.CurrentBufferConsumed) {
- // In Version 2 of the log, we don't need to scan to the end of the thread
- // buffer if we've already consumed all the bytes we need to.
- State.Expects = FDRState::Token::BUFFER_EXTENTS;
- State.CurrentBufferSize = BufferSize;
- State.CurrentBufferConsumed = 0;
+ // This is now the meat of the algorithm. Here we sort the blocks according to
+ // the Walltime record in each of the blocks for the same thread. This allows
+ // us to more consistently recreate the execution trace in temporal order.
+ // After the sort, we then reconstitute `Trace` records using a stateful
+ // visitor associated with a single process+thread pair.
+ {
+ for (auto &PTB : Index) {
+ auto &Blocks = PTB.second;
+ llvm::sort(Blocks, [](const BlockIndexer::Block &L,
+ const BlockIndexer::Block &R) {
+ return (L.WallclockTime->seconds() < R.WallclockTime->seconds() &&
+ L.WallclockTime->nanos() < R.WallclockTime->nanos());
+ });
+ auto Adder = [&](const XRayRecord &R) { Records.push_back(R); };
+ TraceExpander Expander(Adder, FileHeader.Version);
+ for (auto &B : Blocks) {
+ for (auto *R : B.Records)
+ if (auto E = R->apply(Expander))
+ return E;
+ }
+ if (auto E = Expander.flush())
+ return E;
}
}
- // Having iterated over everything we've been given, we've either consumed
- // everything and ended up in the end state, or were told to skip the rest.
- bool Finished = State.Expects == FDRState::Token::SCAN_TO_END_OF_THREAD_BUF &&
- State.CurrentBufferSize == State.CurrentBufferConsumed;
- if ((State.Expects != FDRState::Token::NEW_BUFFER_RECORD_OR_EOF &&
- State.Expects != FDRState::Token::BUFFER_EXTENTS) &&
- !Finished)
- return make_error<StringError>(
- Twine("Encountered EOF with unexpected state expectation ") +
- fdrStateToTwine(State.Expects) +
- ". Remaining expected bytes in thread buffer total " +
- Twine(State.CurrentBufferSize - State.CurrentBufferConsumed),
- std::make_error_code(std::errc::executable_format_error));
-
return Error::success();
}
@@ -670,8 +363,9 @@ Error loadYAMLLog(StringRef Data, XRayFileHeader &FileHeader,
Records.clear();
std::transform(Trace.Records.begin(), Trace.Records.end(),
std::back_inserter(Records), [&](const YAMLXRayRecord &R) {
- return XRayRecord{R.RecordType, R.CPU, R.Type, R.FuncId,
- R.TSC, R.TId, R.PId, R.CallArgs};
+ return XRayRecord{R.RecordType, R.CPU, R.Type,
+ R.FuncId, R.TSC, R.TId,
+ R.PId, R.CallArgs, R.Data};
});
return Error::success();
}
@@ -705,6 +399,17 @@ Expected<Trace> llvm::xray::loadTraceFile(StringRef Filename, bool Sort) {
}
auto Data = StringRef(MappedFile.data(), MappedFile.size());
+ // TODO: Lift the endianness and implementation selection here.
+ DataExtractor LittleEndianDE(Data, true, 8);
+ auto TraceOrError = loadTrace(LittleEndianDE, Sort);
+ if (!TraceOrError) {
+ DataExtractor BigEndianDE(Data, false, 8);
+ TraceOrError = loadTrace(BigEndianDE, Sort);
+ }
+ return TraceOrError;
+}
+
+Expected<Trace> llvm::xray::loadTrace(const DataExtractor &DE, bool Sort) {
// Attempt to detect the file type using file magic. We have a slight bias
// towards the binary format, and we do this by making sure that the first 4
// bytes of the binary file is some combination of the following byte
@@ -719,8 +424,7 @@ Expected<Trace> llvm::xray::loadTraceFile(StringRef Filename, bool Sort) {
//
// Only if we can't load either the binary or the YAML format will we yield an
// error.
- StringRef Magic(MappedFile.data(), 4);
- DataExtractor HeaderExtractor(Magic, true, 8);
+ DataExtractor HeaderExtractor(DE.getData(), DE.isLittleEndian(), 8);
uint32_t OffsetPtr = 0;
uint16_t Version = HeaderExtractor.getU16(&OffsetPtr);
uint16_t Type = HeaderExtractor.getU16(&OffsetPtr);
@@ -731,7 +435,8 @@ Expected<Trace> llvm::xray::loadTraceFile(StringRef Filename, bool Sort) {
switch (Type) {
case NAIVE_FORMAT:
if (Version == 1 || Version == 2 || Version == 3) {
- if (auto E = loadNaiveFormatLog(Data, T.FileHeader, T.Records))
+ if (auto E = loadNaiveFormatLog(DE.getData(), DE.isLittleEndian(),
+ T.FileHeader, T.Records))
return std::move(E);
} else {
return make_error<StringError>(
@@ -741,8 +446,9 @@ Expected<Trace> llvm::xray::loadTraceFile(StringRef Filename, bool Sort) {
}
break;
case FLIGHT_DATA_RECORDER_FORMAT:
- if (Version == 1 || Version == 2 || Version == 3) {
- if (auto E = loadFDRLog(Data, T.FileHeader, T.Records))
+ if (Version >= 1 && Version <= 5) {
+ if (auto E = loadFDRLog(DE.getData(), DE.isLittleEndian(), T.FileHeader,
+ T.Records))
return std::move(E);
} else {
return make_error<StringError>(
@@ -751,15 +457,15 @@ Expected<Trace> llvm::xray::loadTraceFile(StringRef Filename, bool Sort) {
}
break;
default:
- if (auto E = loadYAMLLog(Data, T.FileHeader, T.Records))
+ if (auto E = loadYAMLLog(DE.getData(), T.FileHeader, T.Records))
return std::move(E);
}
if (Sort)
std::stable_sort(T.Records.begin(), T.Records.end(),
- [&](const XRayRecord &L, const XRayRecord &R) {
- return L.TSC < R.TSC;
- });
+ [&](const XRayRecord &L, const XRayRecord &R) {
+ return L.TSC < R.TSC;
+ });
return std::move(T);
}