mirror of
https://mirrors.bfsu.edu.cn/git/linux.git
synced 2024-12-15 15:04:27 +08:00
a7fe9a443b
If virtual timestamps are detected, set the sample time field accordingly; otherwise warn the user that the samples will not include accurate time data. | Test notes (FEAT_TRF platform) | | $ ./perf record -e cs_etm//u -a -- sleep 4 | $ ./perf script --fields +time | perf 422 [000] 163.375100: 1 branches:uH: 0 [unknown] ([unknown]) | perf 422 [000] 163.375100: 1 branches:uH: ffffb8009544 ioctl+0x14 (/lib/aarch64-linux-gnu/libc-2.27.so) | perf 422 [000] 163.375100: 1 branches:uH: aaaaab6bebf4 perf_evsel__run_ioctl+0x90 (/home/german/linux/tools/perf/perf) | [...] | perf 422 [000] 167.393100: 1 branches:uH: aaaaab6bda00 __xyarray__entry+0x74 (/home/german/linux/tools/perf/perf) | perf 422 [000] 167.393099: 1 branches:uH: aaaaab6bda0c __xyarray__entry+0x80 (/home/german/linux/tools/perf/perf) | perf 422 [000] 167.393099: 1 branches:uH: ffffb8009538 ioctl+0x8 (/lib/aarch64-linux-gnu/libc-2.27.so) | | The time from the first sample to the last sample is 4 seconds. Now that times are converted to nanoseconds, also try to estimate the timestamps more accurately by dividing by some fixed value for instructions per ns. This prevents long ranges from being estimated further in the past than would be realistic.
Signed-off-by: German Gomez <german.gomez@arm.com> Acked-by: Suzuki Poulouse <suzuki.poulose@arm.com> Tested-by: Tanmay Jagdale <tanmay@marvell.com> Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com> Cc: Bharat Bhushan <bbhushan2@marvell.com> Cc: George Cherian <gcherian@marvell.com> Cc: Ingo Molnar <mingo@redhat.com> Cc: Jiri Olsa <jolsa@kernel.org> Cc: John Garry <john.g.garry@oracle.com> Cc: Leo Yan <leo.yan@linaro.org> Cc: Linu Cherian <lcherian@marvell.com> Cc: Mark Rutland <mark.rutland@arm.com> Cc: Mathieu Poirier <mathieu.poirier@linaro.org> Cc: Mike Leach <mike.leach@linaro.org> Cc: Namhyung Kim <namhyung@kernel.org> Cc: Peter Zijlstra <peterz@infradead.org> Cc: Sunil Kovvuri Goutham <sgoutham@marvell.com> Cc: Will Deacon <will@kernel.org> Cc: coresight@lists.linaro.org Cc: linux-arm-kernel@lists.infradead.org Link: https://lore.kernel.org/r/20230120143702.4035046-8-james.clark@arm.com Signed-off-by: James Clark <james.clark@arm.com> Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
246 lines
6.6 KiB
C
246 lines
6.6 KiB
C
/* SPDX-License-Identifier: GPL-2.0 */
|
|
/*
|
|
* Copyright(C) 2015 Linaro Limited. All rights reserved.
|
|
* Author: Mathieu Poirier <mathieu.poirier@linaro.org>
|
|
*/
|
|
|
|
#ifndef INCLUDE__UTIL_PERF_CS_ETM_H__
|
|
#define INCLUDE__UTIL_PERF_CS_ETM_H__
|
|
|
|
#include "debug.h"
|
|
#include "util/event.h"
|
|
#include <linux/bits.h>
|
|
|
|
struct perf_session;
|
|
|
|
/*
 * Versioning header in case things need to change in the future. That way
 * decoding of old snapshots is still possible.
 *
 * CS_HEADER_VERSION_MAX is the number of entries; CS_ETM_HEADER_SIZE
 * multiplies it by sizeof(u64).
 */
enum {
	/* Starting with 0x0 */
	CS_HEADER_VERSION,
	/* PMU->type (32 bit), total # of CPUs (32 bit) */
	CS_PMU_TYPE_CPUS,
	CS_ETM_SNAPSHOT,
	CS_HEADER_VERSION_MAX,
};
|
|
|
|
/*
 * Update the version for new format.
 *
 * New version 1 format adds a param count to the per cpu metadata.
 * This allows easy adding of new metadata parameters.
 * Requires that new params are always added after the current ones.
 * Also allows a client reader to handle file versions that are different by
 * checking the number of params in the file vs the number expected.
 */
#define CS_HEADER_CURRENT_VERSION	1
|
|
|
|
/*
 * Beginning of header common to both ETMv3 and V4.
 *
 * CS_ETM_COMMON_BLK_MAX_V1 is the first index after the common block; the
 * ETMv3, ETMv4 and ETE metadata enums start numbering from it.
 */
enum {
	CS_ETM_MAGIC,
	CS_ETM_CPU,
	/* Number of trace config params in following ETM specific block */
	CS_ETM_NR_TRC_PARAMS,
	CS_ETM_COMMON_BLK_MAX_V1,
};
|
|
|
|
/* ETMv3/PTM metadata */
|
|
enum {
|
|
/* Dynamic, configurable parameters */
|
|
CS_ETM_ETMCR = CS_ETM_COMMON_BLK_MAX_V1,
|
|
CS_ETM_ETMTRACEIDR,
|
|
/* RO, taken from sysFS */
|
|
CS_ETM_ETMCCER,
|
|
CS_ETM_ETMIDR,
|
|
CS_ETM_PRIV_MAX,
|
|
};
|
|
|
|
/*
 * Define fixed version 0 length - allow new format reader to read old files.
 * Counts the entries from CS_ETM_ETMCR up to and including CS_ETM_ETMIDR.
 */
#define CS_ETM_NR_TRC_PARAMS_V0	(CS_ETM_ETMIDR - CS_ETM_ETMCR + 1)
|
|
|
|
/* ETMv4 metadata */
|
|
enum {
|
|
/* Dynamic, configurable parameters */
|
|
CS_ETMV4_TRCCONFIGR = CS_ETM_COMMON_BLK_MAX_V1,
|
|
CS_ETMV4_TRCTRACEIDR,
|
|
/* RO, taken from sysFS */
|
|
CS_ETMV4_TRCIDR0,
|
|
CS_ETMV4_TRCIDR1,
|
|
CS_ETMV4_TRCIDR2,
|
|
CS_ETMV4_TRCIDR8,
|
|
CS_ETMV4_TRCAUTHSTATUS,
|
|
CS_ETMV4_TS_SOURCE,
|
|
CS_ETMV4_PRIV_MAX,
|
|
};
|
|
|
|
/*
 * Define fixed version 0 length - allow new format reader to read old files.
 * Counts the entries from CS_ETMV4_TRCCONFIGR up to and including
 * CS_ETMV4_TRCAUTHSTATUS.
 */
#define CS_ETMV4_NR_TRC_PARAMS_V0	(CS_ETMV4_TRCAUTHSTATUS - CS_ETMV4_TRCCONFIGR + 1)
|
|
|
|
/*
|
|
* ETE metadata is ETMv4 plus TRCDEVARCH register and doesn't support header V0 since it was
|
|
* added in header V1
|
|
*/
|
|
enum {
|
|
/* Dynamic, configurable parameters */
|
|
CS_ETE_TRCCONFIGR = CS_ETM_COMMON_BLK_MAX_V1,
|
|
CS_ETE_TRCTRACEIDR,
|
|
/* RO, taken from sysFS */
|
|
CS_ETE_TRCIDR0,
|
|
CS_ETE_TRCIDR1,
|
|
CS_ETE_TRCIDR2,
|
|
CS_ETE_TRCIDR8,
|
|
CS_ETE_TRCAUTHSTATUS,
|
|
CS_ETE_TRCDEVARCH,
|
|
CS_ETE_TS_SOURCE,
|
|
CS_ETE_PRIV_MAX
|
|
};
|
|
|
|
/*
 * ETMv3 exception encoding number:
 * See Embedded Trace Macrocell specification (ARM IHI 0014Q)
 * table 7-12 Encoding of Exception[3:0] for non-ARMv7-M processors.
 *
 * Values 6 and 7 have no enumerator here.
 */
enum {
	CS_ETMV3_EXC_NONE		= 0,
	CS_ETMV3_EXC_DEBUG_HALT		= 1,
	CS_ETMV3_EXC_SMC		= 2,
	CS_ETMV3_EXC_HYP		= 3,
	CS_ETMV3_EXC_ASYNC_DATA_ABORT	= 4,
	CS_ETMV3_EXC_JAZELLE_THUMBEE	= 5,
	CS_ETMV3_EXC_PE_RESET		= 8,
	CS_ETMV3_EXC_UNDEFINED_INSTR	= 9,
	CS_ETMV3_EXC_SVC		= 10,
	CS_ETMV3_EXC_PREFETCH_ABORT	= 11,
	CS_ETMV3_EXC_DATA_FAULT		= 12,
	CS_ETMV3_EXC_GENERIC		= 13,
	CS_ETMV3_EXC_IRQ		= 14,
	CS_ETMV3_EXC_FIQ		= 15,
};
|
|
|
|
/*
 * ETMv4 exception encoding number:
 * See ARM Embedded Trace Macrocell Architecture Specification (ARM IHI 0064D)
 * table 6-12 Possible values for the TYPE field in an Exception instruction
 * trace packet, for ARMv7-A/R and ARMv8-A/R PEs.
 *
 * Only the values listed below have an enumerator; the numbering is sparse.
 */
enum {
	CS_ETMV4_EXC_RESET		= 0,
	CS_ETMV4_EXC_DEBUG_HALT		= 1,
	CS_ETMV4_EXC_CALL		= 2,
	CS_ETMV4_EXC_TRAP		= 3,
	CS_ETMV4_EXC_SYSTEM_ERROR	= 4,
	CS_ETMV4_EXC_INST_DEBUG		= 6,
	CS_ETMV4_EXC_DATA_DEBUG		= 7,
	CS_ETMV4_EXC_ALIGNMENT		= 10,
	CS_ETMV4_EXC_INST_FAULT		= 11,
	CS_ETMV4_EXC_DATA_FAULT		= 12,
	CS_ETMV4_EXC_IRQ		= 14,
	CS_ETMV4_EXC_FIQ		= 15,
	CS_ETMV4_EXC_END		= 31,
};
|
|
|
|
/* Kind of a struct cs_etm_packet, stored in its sample_type field. */
enum cs_etm_sample_type {
	CS_ETM_EMPTY,
	CS_ETM_RANGE,
	CS_ETM_DISCONTINUITY,
	CS_ETM_EXCEPTION,
	CS_ETM_EXCEPTION_RET,
};
|
|
|
|
/* Instruction set recorded in the isa field of a struct cs_etm_packet. */
enum cs_etm_isa {
	CS_ETM_ISA_UNKNOWN,
	CS_ETM_ISA_A64,
	CS_ETM_ISA_A32,
	CS_ETM_ISA_T32,
};
|
|
|
|
struct cs_etm_queue;
|
|
|
|
struct cs_etm_packet {
|
|
enum cs_etm_sample_type sample_type;
|
|
enum cs_etm_isa isa;
|
|
u64 start_addr;
|
|
u64 end_addr;
|
|
u32 instr_count;
|
|
u32 last_instr_type;
|
|
u32 last_instr_subtype;
|
|
u32 flags;
|
|
u32 exception_number;
|
|
u8 last_instr_cond;
|
|
u8 last_instr_taken_branch;
|
|
u8 last_instr_size;
|
|
u8 trace_chan_id;
|
|
int cpu;
|
|
};
|
|
|
|
/* Number of struct cs_etm_packet slots in a cs_etm_packet_queue's packet_buffer. */
#define CS_ETM_PACKET_MAX_BUFFER 1024
|
|
|
|
/*
 * When working with per-thread scenarios the process under trace can
 * be scheduled on any CPU and as such, more than one traceID may be
 * associated with the same process. Since a traceID of '0' is illegal
 * as per the CoreSight architecture, use that specific value to
 * identify the queue where all packets (with any traceID) are
 * aggregated.
 */
#define CS_ETM_PER_THREAD_TRACEID	0
|
|
|
|
struct cs_etm_packet_queue {
|
|
u32 packet_count;
|
|
u32 head;
|
|
u32 tail;
|
|
u32 instr_count;
|
|
u64 cs_timestamp; /* Timestamp from trace data, converted to ns if possible */
|
|
u64 next_cs_timestamp;
|
|
struct cs_etm_packet packet_buffer[CS_ETM_PACKET_MAX_BUFFER];
|
|
};
|
|
|
|
/*
 * Convert a count of kibibytes / mebibytes to bytes.
 *
 * The argument is evaluated exactly once and the result has the type the
 * usual arithmetic conversions give for (x) * 1024, so an int argument
 * yields an int result.
 */
#define KiB(x)	((x) * 1024)
#define MiB(x)	((x) * 1024 * 1024)
|
|
|
|
#define CS_ETM_INVAL_ADDR 0xdeadbeefdeadbeefUL
|
|
|
|
/*
 * Extract the bit field [msb:lsb] (both inclusive) from val and shift it
 * down so that bit lsb of val becomes bit 0 of the result.
 *
 * Every argument is parenthesized so that expression arguments such as
 * BMVAL(a | b, 4, 7) are masked as a whole. Note that lsb is evaluated
 * twice, so it must not have side effects.
 */
#define BMVAL(val, lsb, msb)	(((val) & GENMASK((msb), (lsb))) >> (lsb))
|
|
|
|
/* Size in bytes of CS_HEADER_VERSION_MAX entries of sizeof(u64) each. */
#define CS_ETM_HEADER_SIZE (CS_HEADER_VERSION_MAX * sizeof(u64))
|
|
|
|
/*
 * Magic numbers, one per supported trace flavour (ETMv3, ETMv4, ETE).
 * Each is a single byte value (0x30, 0x40, 0x50) repeated eight times.
 */
#define __perf_cs_etmv3_magic	0x3030303030303030ULL
#define __perf_cs_etmv4_magic	0x4040404040404040ULL
#define __perf_cs_ete_magic	0x5050505050505050ULL
|
|
/*
 * Size in bytes of the per-flavour metadata: the matching *_PRIV_MAX entry
 * count multiplied by sizeof(u64).
 */
#define CS_ETMV3_PRIV_SIZE	(CS_ETM_PRIV_MAX * sizeof(u64))
#define CS_ETMV4_PRIV_SIZE	(CS_ETMV4_PRIV_MAX * sizeof(u64))
#define CS_ETE_PRIV_SIZE	(CS_ETE_PRIV_MAX * sizeof(u64))
|
|
|
|
/*
 * Combined size in bytes of the 'type' and 'reserved__' members of
 * struct perf_record_auxtrace_info. The null-pointer cast is only used
 * inside sizeof and is never dereferenced.
 */
#define INFO_HEADER_SIZE (sizeof(((struct perf_record_auxtrace_info *)0)->type) + \
			  sizeof(((struct perf_record_auxtrace_info *)0)->reserved__))
|
|
|
|
/*
 * Declared regardless of HAVE_CSTRACE_SUPPORT, unlike the helpers that
 * follow in this header.
 * NOTE(review): return convention is not visible here; the sibling
 * cs_etm__process_auxtrace_info_full() stub returns -1 on failure.
 */
int cs_etm__process_auxtrace_info(union perf_event *event,
				  struct perf_session *session);
|
|
|
|
#ifdef HAVE_CSTRACE_SUPPORT
|
|
int cs_etm__get_cpu(u8 trace_chan_id, int *cpu);
|
|
int cs_etm__get_pid_fmt(u8 trace_chan_id, u64 *pid_fmt);
|
|
int cs_etm__etmq_set_tid(struct cs_etm_queue *etmq,
|
|
pid_t tid, u8 trace_chan_id);
|
|
bool cs_etm__etmq_is_timeless(struct cs_etm_queue *etmq);
|
|
void cs_etm__etmq_set_traceid_queue_timestamp(struct cs_etm_queue *etmq,
|
|
u8 trace_chan_id);
|
|
struct cs_etm_packet_queue
|
|
*cs_etm__etmq_get_packet_queue(struct cs_etm_queue *etmq, u8 trace_chan_id);
|
|
int cs_etm__process_auxtrace_info_full(union perf_event *event __maybe_unused,
|
|
struct perf_session *session __maybe_unused);
|
|
u64 cs_etm__convert_sample_time(struct cs_etm_queue *etmq, u64 cs_timestamp);
|
|
#else
|
|
static inline int
|
|
cs_etm__process_auxtrace_info_full(union perf_event *event __maybe_unused,
|
|
struct perf_session *session __maybe_unused)
|
|
{
|
|
pr_err("\nCS ETM Trace: OpenCSD is not linked in, please recompile with CORESIGHT=1\n");
|
|
return -1;
|
|
}
|
|
#endif
|
|
|
|
#endif
|