572 lines
16 KiB
C++
572 lines
16 KiB
C++
/*
|
|
* Copyright (C) 2015 The Android Open Source Project
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#ifndef SIMPLE_PERF_RECORD_H_
|
|
#define SIMPLE_PERF_RECORD_H_
|
|
|
|
#include <stdio.h>
|
|
#include <sys/types.h>
|
|
|
|
#include <memory>
|
|
#include <queue>
|
|
#include <string>
|
|
#include <vector>
|
|
|
|
#include <android-base/logging.h>
|
|
|
|
#include "build_id.h"
|
|
#include "perf_event.h"
|
|
|
|
// Record types defined in user space. Two ranges are declared here:
//  - values starting at PERF_RECORD_USER_DEFINED_TYPE_START (64);
//  - values starting at SIMPLE_PERF_RECORD_TYPE_START (32768), which are
//    simpleperf-defined records stored with a simpleperf_record_header.
enum user_record_type {
  // Start marker of the first range; PERF_RECORD_ATTR shares its value.
  PERF_RECORD_USER_DEFINED_TYPE_START = 64,
  PERF_RECORD_ATTR = 64,
  PERF_RECORD_EVENT_TYPE,
  PERF_RECORD_TRACING_DATA,
  PERF_RECORD_BUILD_ID,
  PERF_RECORD_FINISHED_ROUND,

  // Start marker of the simpleperf range. The enumerators below continue
  // from 32769.
  SIMPLE_PERF_RECORD_TYPE_START = 32768,
  SIMPLE_PERF_RECORD_KERNEL_SYMBOL,
  // TODO: remove DsoRecord and SymbolRecord.
  SIMPLE_PERF_RECORD_DSO,
  SIMPLE_PERF_RECORD_SYMBOL,
  SIMPLE_PERF_RECORD_SPLIT,
  SIMPLE_PERF_RECORD_SPLIT_END,
  SIMPLE_PERF_RECORD_EVENT_ID,
};
|
|
|
|
// perf_event_header uses u16 to store the record size. That is not enough
// for large records such as KERNEL_SYMBOL or TRACING_DATA, so simpleperf
// defined records (type >= SIMPLE_PERF_RECORD_TYPE_START) use this header
// instead. The 32-bit record size is split into two 16-bit halves.
struct simpleperf_record_header {
  uint32_t type;
  uint16_t size1;  // High 16 bits of the record size.
  uint16_t size0;  // Low 16 bits of the record size.
};
|
|
|
|
// RecordHeader reads and writes both header kinds through the same buffer
// and always advances by sizeof(perf_event_header), so the sizes must match.
static_assert(
    sizeof(simpleperf_record_header) == sizeof(perf_event_header),
    "simpleperf_record_header should have the same size as perf_event_header");
|
|
|
|
// Sample payload used as SampleRecord::ip_data (valid if PERF_SAMPLE_IP).
struct PerfSampleIpType {
  uint64_t ip;
};
|
|
|
|
// Sample payload used as tid_data in SampleRecord and SampleId
// (valid if PERF_SAMPLE_TID).
struct PerfSampleTidType {
  uint32_t pid;
  uint32_t tid;
};
|
|
|
|
// Sample payload used as time_data in SampleRecord and SampleId
// (valid if PERF_SAMPLE_TIME).
struct PerfSampleTimeType {
  uint64_t time;
};
|
|
|
|
// Sample payload used as SampleRecord::addr_data (valid if PERF_SAMPLE_ADDR).
struct PerfSampleAddrType {
  uint64_t addr;
};
|
|
|
|
// Sample payload used as id_data in SampleRecord and SampleId
// (valid if PERF_SAMPLE_ID).
struct PerfSampleIdType {
  uint64_t id;
};
|
|
|
|
// Sample payload used as stream_id_data in SampleRecord and SampleId
// (valid if PERF_SAMPLE_STREAM_ID).
struct PerfSampleStreamIdType {
  uint64_t stream_id;
};
|
|
|
|
// Sample payload used as cpu_data in SampleRecord and SampleId
// (valid if PERF_SAMPLE_CPU).
struct PerfSampleCpuType {
  uint32_t cpu;
  uint32_t res;  // NOTE(review): presumably a reserved field - confirm.
};
|
|
|
|
// Sample payload used as SampleRecord::period_data
// (valid if PERF_SAMPLE_PERIOD).
struct PerfSamplePeriodType {
  uint64_t period;
};
|
|
|
|
// Sample payload used as SampleRecord::callchain_data
// (valid if PERF_SAMPLE_CALLCHAIN).
struct PerfSampleCallChainType {
  uint64_t ip_nr;  // Presumably the number of entries reachable through ips.
  const uint64_t* ips;
};
|
|
|
|
// Sample payload used as SampleRecord::raw_data (valid if PERF_SAMPLE_RAW).
struct PerfSampleRawType {
  uint32_t size;  // Presumably the byte length of data.
  const char* data;
};
|
|
|
|
// One entry of the array referenced by PerfSampleBranchStackType::stack.
struct BranchStackItemType {
  uint64_t from;
  uint64_t to;
  uint64_t flags;
};
|
|
|
|
struct PerfSampleBranchStackType {
|
|
uint64_t stack_nr;
|
|
const BranchStackItemType* stack;
|
|
};
|
|
|
|
// Sample payload used as SampleRecord::regs_user_data
// (valid if PERF_SAMPLE_REGS_USER).
struct PerfSampleRegsUserType {
  uint64_t abi;
  uint64_t reg_mask;
  uint64_t reg_nr;  // Presumably the number of values reachable through regs.
  const uint64_t* regs;
};
|
|
|
|
// Sample payload used as SampleRecord::stack_user_data
// (valid if PERF_SAMPLE_STACK_USER).
struct PerfSampleStackUserType {
  uint64_t size;
  const char* data;
  // May be 0; SampleRecord::GetValidStackSize() then falls back to size.
  uint64_t dyn_size;
};
|
|
|
|
struct RecordHeader {
|
|
public:
|
|
uint32_t type;
|
|
uint16_t misc;
|
|
uint32_t size;
|
|
|
|
RecordHeader() : type(0), misc(0), size(0) {}
|
|
|
|
explicit RecordHeader(const char* p) {
|
|
auto pheader = reinterpret_cast<const perf_event_header*>(p);
|
|
if (pheader->type < SIMPLE_PERF_RECORD_TYPE_START) {
|
|
type = pheader->type;
|
|
misc = pheader->misc;
|
|
size = pheader->size;
|
|
} else {
|
|
auto sheader = reinterpret_cast<const simpleperf_record_header*>(p);
|
|
type = sheader->type;
|
|
misc = 0;
|
|
size = (sheader->size1 << 16) | sheader->size0;
|
|
}
|
|
}
|
|
|
|
void MoveToBinaryFormat(char*& p) const {
|
|
if (type < SIMPLE_PERF_RECORD_TYPE_START) {
|
|
auto pheader = reinterpret_cast<perf_event_header*>(p);
|
|
pheader->type = type;
|
|
pheader->misc = misc;
|
|
CHECK_LT(size, 1u << 16);
|
|
pheader->size = static_cast<uint16_t>(size);
|
|
} else {
|
|
auto sheader = reinterpret_cast<simpleperf_record_header*>(p);
|
|
sheader->type = type;
|
|
CHECK_EQ(misc, 0u);
|
|
sheader->size1 = size >> 16;
|
|
sheader->size0 = size & 0xffff;
|
|
}
|
|
p += sizeof(perf_event_header);
|
|
}
|
|
};
|
|
|
|
// SampleId is optional at the end of a record in binary format. Its content is
|
|
// determined by sample_id_all and sample_type in perf_event_attr. To avoid the
|
|
// complexity of referring to perf_event_attr each time, we copy sample_id_all
|
|
// and sample_type inside the SampleId structure.
|
|
struct SampleId {
|
|
bool sample_id_all;
|
|
uint64_t sample_type;
|
|
|
|
PerfSampleTidType tid_data; // Valid if sample_id_all && PERF_SAMPLE_TID.
|
|
PerfSampleTimeType time_data; // Valid if sample_id_all && PERF_SAMPLE_TIME.
|
|
PerfSampleIdType id_data; // Valid if sample_id_all && PERF_SAMPLE_ID.
|
|
PerfSampleStreamIdType
|
|
stream_id_data; // Valid if sample_id_all && PERF_SAMPLE_STREAM_ID.
|
|
PerfSampleCpuType cpu_data; // Valid if sample_id_all && PERF_SAMPLE_CPU.
|
|
|
|
SampleId();
|
|
|
|
// Create the content of sample_id. It depends on the attr we use.
|
|
size_t CreateContent(const perf_event_attr& attr, uint64_t event_id);
|
|
|
|
// Parse sample_id from binary format in the buffer pointed by p.
|
|
void ReadFromBinaryFormat(const perf_event_attr& attr, const char* p,
|
|
const char* end);
|
|
|
|
// Write the binary format of sample_id to the buffer pointed by p.
|
|
void WriteToBinaryFormat(char*& p) const;
|
|
void Dump(size_t indent) const;
|
|
size_t Size() const;
|
|
};
|
|
|
|
// Usually one record contains the following three parts in order in binary
|
|
// format:
|
|
// RecordHeader (at the head of a record, containing type and size info)
|
|
// data depends on the record type
|
|
// SampleId (optional part at the end of a record)
|
|
// We hold the common parts (RecordHeader and SampleId) in the base class
|
|
// Record, and hold the type specific data part in classes derived from Record.
|
|
struct Record {
|
|
RecordHeader header;
|
|
SampleId sample_id;
|
|
|
|
Record() : binary_(nullptr), own_binary_(false) {}
|
|
explicit Record(const char* p) : header(p), binary_(p), own_binary_(false) {}
|
|
Record(Record&& other);
|
|
|
|
virtual ~Record() {
|
|
if (own_binary_) {
|
|
delete[] binary_;
|
|
}
|
|
}
|
|
|
|
void OwnBinary() { own_binary_ = true; }
|
|
|
|
uint32_t type() const { return header.type; }
|
|
|
|
uint16_t misc() const { return header.misc; }
|
|
|
|
uint32_t size() const { return header.size; }
|
|
|
|
static uint32_t header_size() { return sizeof(perf_event_header); }
|
|
|
|
bool InKernel() const {
|
|
return (header.misc & PERF_RECORD_MISC_CPUMODE_MASK) ==
|
|
PERF_RECORD_MISC_KERNEL;
|
|
}
|
|
|
|
void SetTypeAndMisc(uint32_t type, uint16_t misc) {
|
|
header.type = type;
|
|
header.misc = misc;
|
|
}
|
|
|
|
void SetSize(uint32_t size) { header.size = size; }
|
|
|
|
void Dump(size_t indent = 0) const;
|
|
|
|
const char* Binary() const { return binary_; }
|
|
|
|
virtual uint64_t Timestamp() const;
|
|
virtual uint32_t Cpu() const;
|
|
virtual uint64_t Id() const;
|
|
|
|
protected:
|
|
void UpdateBinary(const char* new_binary);
|
|
virtual void DumpData(size_t) const = 0;
|
|
|
|
const char* binary_;
|
|
bool own_binary_;
|
|
|
|
DISALLOW_COPY_AND_ASSIGN(Record);
|
|
};
|
|
|
|
struct MmapRecord : public Record {
|
|
struct MmapRecordDataType {
|
|
uint32_t pid, tid;
|
|
uint64_t addr;
|
|
uint64_t len;
|
|
uint64_t pgoff;
|
|
};
|
|
const MmapRecordDataType* data;
|
|
const char* filename;
|
|
|
|
MmapRecord(const perf_event_attr& attr, const char* p);
|
|
|
|
MmapRecord(const perf_event_attr& attr, bool in_kernel, uint32_t pid,
|
|
uint32_t tid, uint64_t addr, uint64_t len, uint64_t pgoff,
|
|
const std::string& filename, uint64_t event_id, uint64_t time = 0);
|
|
|
|
void SetDataAndFilename(const MmapRecordDataType& data,
|
|
const std::string& filename);
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
struct Mmap2Record : public Record {
|
|
struct Mmap2RecordDataType {
|
|
uint32_t pid, tid;
|
|
uint64_t addr;
|
|
uint64_t len;
|
|
uint64_t pgoff;
|
|
uint32_t maj;
|
|
uint32_t min;
|
|
uint64_t ino;
|
|
uint64_t ino_generation;
|
|
uint32_t prot, flags;
|
|
};
|
|
const Mmap2RecordDataType* data;
|
|
const char* filename;
|
|
|
|
Mmap2Record(const perf_event_attr& attr, const char* p);
|
|
|
|
void SetDataAndFilename(const Mmap2RecordDataType& data,
|
|
const std::string& filename);
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
struct CommRecord : public Record {
|
|
struct CommRecordDataType {
|
|
uint32_t pid, tid;
|
|
};
|
|
const CommRecordDataType* data;
|
|
const char* comm;
|
|
|
|
CommRecord(const perf_event_attr& attr, const char* p);
|
|
|
|
CommRecord(const perf_event_attr& attr, uint32_t pid, uint32_t tid,
|
|
const std::string& comm, uint64_t event_id, uint64_t time);
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
struct ExitOrForkRecord : public Record {
|
|
struct ExitOrForkRecordDataType {
|
|
uint32_t pid, ppid;
|
|
uint32_t tid, ptid;
|
|
uint64_t time;
|
|
};
|
|
const ExitOrForkRecordDataType* data;
|
|
|
|
ExitOrForkRecord(const perf_event_attr& attr, const char* p);
|
|
|
|
ExitOrForkRecord() : data(nullptr) {}
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
struct ExitRecord : public ExitOrForkRecord {
|
|
ExitRecord(const perf_event_attr& attr, const char* p)
|
|
: ExitOrForkRecord(attr, p) {}
|
|
};
|
|
|
|
struct ForkRecord : public ExitOrForkRecord {
|
|
ForkRecord(const perf_event_attr& attr, const char* p)
|
|
: ExitOrForkRecord(attr, p) {}
|
|
|
|
ForkRecord(const perf_event_attr& attr, uint32_t pid, uint32_t tid,
|
|
uint32_t ppid, uint32_t ptid, uint64_t event_id);
|
|
};
|
|
|
|
struct LostRecord : public Record {
|
|
uint64_t id;
|
|
uint64_t lost;
|
|
|
|
LostRecord(const perf_event_attr& attr, const char* p);
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
struct SampleRecord : public Record {
|
|
uint64_t sample_type; // sample_type is a bit mask determining which fields
|
|
// below are valid.
|
|
|
|
PerfSampleIpType ip_data; // Valid if PERF_SAMPLE_IP.
|
|
PerfSampleTidType tid_data; // Valid if PERF_SAMPLE_TID.
|
|
PerfSampleTimeType time_data; // Valid if PERF_SAMPLE_TIME.
|
|
PerfSampleAddrType addr_data; // Valid if PERF_SAMPLE_ADDR.
|
|
PerfSampleIdType id_data; // Valid if PERF_SAMPLE_ID.
|
|
PerfSampleStreamIdType stream_id_data; // Valid if PERF_SAMPLE_STREAM_ID.
|
|
PerfSampleCpuType cpu_data; // Valid if PERF_SAMPLE_CPU.
|
|
PerfSamplePeriodType period_data; // Valid if PERF_SAMPLE_PERIOD.
|
|
|
|
PerfSampleCallChainType callchain_data; // Valid if PERF_SAMPLE_CALLCHAIN.
|
|
PerfSampleRawType raw_data; // Valid if PERF_SAMPLE_RAW.
|
|
PerfSampleBranchStackType
|
|
branch_stack_data; // Valid if PERF_SAMPLE_BRANCH_STACK.
|
|
PerfSampleRegsUserType regs_user_data; // Valid if PERF_SAMPLE_REGS_USER.
|
|
PerfSampleStackUserType stack_user_data; // Valid if PERF_SAMPLE_STACK_USER.
|
|
|
|
SampleRecord(const perf_event_attr& attr, const char* p);
|
|
SampleRecord(const perf_event_attr& attr, uint64_t id, uint64_t ip,
|
|
uint32_t pid, uint32_t tid, uint64_t time, uint32_t cpu,
|
|
uint64_t period, const std::vector<uint64_t>& ips);
|
|
|
|
void ReplaceRegAndStackWithCallChain(const std::vector<uint64_t>& ips);
|
|
uint64_t Timestamp() const override;
|
|
uint32_t Cpu() const override;
|
|
uint64_t Id() const override;
|
|
|
|
uint64_t GetValidStackSize() const {
|
|
// If stack_user_data.dyn_size == 0, it may be because the kernel misses
|
|
// the patch to update dyn_size, like in N9 (See b/22612370). So assume
|
|
// all stack data is valid if dyn_size == 0.
|
|
if (stack_user_data.dyn_size == 0) {
|
|
return stack_user_data.size;
|
|
}
|
|
return stack_user_data.dyn_size;
|
|
}
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
// BuildIdRecord is defined in user-space, stored in BuildId feature section in
|
|
// record file.
|
|
struct BuildIdRecord : public Record {
|
|
uint32_t pid;
|
|
BuildId build_id;
|
|
const char* filename;
|
|
|
|
explicit BuildIdRecord(const char* p);
|
|
|
|
BuildIdRecord(bool in_kernel, pid_t pid, const BuildId& build_id,
|
|
const std::string& filename);
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
struct KernelSymbolRecord : public Record {
|
|
uint32_t kallsyms_size;
|
|
const char* kallsyms;
|
|
|
|
explicit KernelSymbolRecord(const char* p);
|
|
|
|
explicit KernelSymbolRecord(const std::string& kallsyms);
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
struct DsoRecord : public Record {
|
|
uint64_t dso_type;
|
|
uint64_t dso_id;
|
|
uint64_t min_vaddr;
|
|
const char* dso_name;
|
|
|
|
explicit DsoRecord(const char* p);
|
|
|
|
DsoRecord(uint64_t dso_type, uint64_t dso_id, const std::string& dso_name,
|
|
uint64_t min_vaddr);
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
struct SymbolRecord : public Record {
|
|
uint64_t addr;
|
|
uint64_t len;
|
|
uint64_t dso_id;
|
|
const char* name;
|
|
|
|
explicit SymbolRecord(const char* p);
|
|
|
|
SymbolRecord(uint64_t addr, uint64_t len, const std::string& name,
|
|
uint64_t dso_id);
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
struct TracingDataRecord : public Record {
|
|
uint32_t data_size;
|
|
const char* data;
|
|
|
|
explicit TracingDataRecord(const char* p);
|
|
|
|
explicit TracingDataRecord(const std::vector<char>& tracing_data);
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
struct EventIdRecord : public Record {
|
|
uint64_t count;
|
|
struct EventIdData {
|
|
uint64_t attr_id;
|
|
uint64_t event_id;
|
|
} const* data;
|
|
|
|
explicit EventIdRecord(const char* p);
|
|
|
|
explicit EventIdRecord(const std::vector<uint64_t>& data);
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
// UnknownRecord is used for unknown record types, it makes sure all unknown
|
|
// records are not changed when modifying perf.data.
|
|
struct UnknownRecord : public Record {
|
|
const char* data;
|
|
|
|
explicit UnknownRecord(const char* p);
|
|
|
|
protected:
|
|
void DumpData(size_t indent) const override;
|
|
};
|
|
|
|
// Read record from the buffer pointed by [p]. But the record doesn't own
|
|
// the buffer.
|
|
std::unique_ptr<Record> ReadRecordFromBuffer(const perf_event_attr& attr,
|
|
uint32_t type, const char* p);
|
|
|
|
// Read record from the buffer pointed by [p]. And the record owns the buffer.
|
|
std::unique_ptr<Record> ReadRecordFromOwnedBuffer(const perf_event_attr& attr,
|
|
uint32_t type, const char* p);
|
|
|
|
// Read records from the buffer pointed by [buf]. None of the records own
|
|
// the buffer.
|
|
std::vector<std::unique_ptr<Record>> ReadRecordsFromBuffer(
|
|
const perf_event_attr& attr, const char* buf, size_t buf_size);
|
|
|
|
// Read one record from the buffer pointed by [p]. But the record doesn't
|
|
// own the buffer.
|
|
std::unique_ptr<Record> ReadRecordFromBuffer(const perf_event_attr& attr,
|
|
const char* p);
|
|
|
|
// RecordCache is a cache used when receiving records from the kernel.
|
|
// It sorts received records based on type and timestamp, and pops records
|
|
// in sorted order. Records from the kernel need to be sorted because
|
|
// records may come from different cpus at the same time, and it is affected
|
|
// by the order in which we collect records from different cpus.
|
|
// RecordCache pushes records and pops sorted record online. It uses two checks
|
|
// to help ensure that records are popped in order. Each time we pop a record A,
|
|
// it is the earliest record among all records in the cache. In addition, we
|
|
// have checks for min_cache_size and min_time_diff. For min_cache_size check,
|
|
// we check if the cache size >= min_cache_size, which is based on the
|
|
// assumption that if we have received (min_cache_size - 1) records after
|
|
// record A, we are not likely to receive a record earlier than A. For
|
|
// min_time_diff check, we check if record A is generated min_time_diff ns
|
|
// earlier than the latest record, which is based on the assumption that if we
|
|
// have received a record for time t, we are not likely to receive a record for
|
|
// time (t - min_time_diff) or earlier.
|
|
class RecordCache {
|
|
public:
|
|
explicit RecordCache(bool has_timestamp, size_t min_cache_size = 1000u,
|
|
uint64_t min_time_diff_in_ns = 1000000u);
|
|
~RecordCache();
|
|
void Push(std::unique_ptr<Record> record);
|
|
void Push(std::vector<std::unique_ptr<Record>> records);
|
|
std::unique_ptr<Record> Pop();
|
|
std::vector<std::unique_ptr<Record>> PopAll();
|
|
std::unique_ptr<Record> ForcedPop();
|
|
|
|
private:
|
|
struct RecordWithSeq {
|
|
uint32_t seq;
|
|
Record* record;
|
|
|
|
RecordWithSeq(uint32_t seq, Record* record) : seq(seq), record(record) {}
|
|
bool IsHappensBefore(const RecordWithSeq& other) const;
|
|
};
|
|
|
|
struct RecordComparator {
|
|
bool operator()(const RecordWithSeq& r1, const RecordWithSeq& r2);
|
|
};
|
|
|
|
bool has_timestamp_;
|
|
size_t min_cache_size_;
|
|
uint64_t min_time_diff_in_ns_;
|
|
uint64_t last_time_;
|
|
uint32_t cur_seq_;
|
|
std::priority_queue<RecordWithSeq, std::vector<RecordWithSeq>,
|
|
RecordComparator> queue_;
|
|
};
|
|
|
|
#endif // SIMPLE_PERF_RECORD_H_
|