XMM registers can be collected on Icelake and later platforms. Add specific arch__intr_reg_mask(), which creating an event to check if the kernel and hardware can collect XMM registers. Test on Skylake which doesn't support XMM registers collection. There is nothing changed. #perf record -I? available registers: AX BX CX DX SI DI BP SP IP FLAGS CS SS R8 R9 R10 R11 R12 R13 R14 R15 Usage: perf record [<options>] [<command>] or: perf record [<options>] -- <command> [<options>] -I, --intr-regs[=<any register>] sample selected machine registers on interrupt, use '-I?' to list register names #perf record -I [ perf record: Woken up 1 times to write data ] [ perf record: Captured and wrote 0.905 MB perf.data (2520 samples) ] #perf evlist -v cycles: size: 112, { sample_period, sample_freq }: 4000, sample_type: IP|TID|TIME|CPU|PERIOD|REGS_INTR, read_format: ID, disabled: 1, inherit: 1, mmap: 1, comm: 1, freq: 1, task: 1, precise_ip: 3, sample_id_all: 1, exclude_guest: 1, mmap2: 1, comm_exec: 1, ksymbol: 1, bpf_event: 1, sample_regs_intr: 0xff0fff Test on Icelake which support XMM registers collection. #perf record -I? available registers: AX BX CX DX SI DI BP SP IP FLAGS CS SS R8 R9 R10 R11 R12 R13 R14 R15 XMM0 XMM1 XMM2 XMM3 XMM4 XMM5 XMM6 XMM7 XMM8 XMM9 XMM10 XMM11 XMM12 XMM13 XMM14 XMM15 Usage: perf record [<options>] [<command>] or: perf record [<options>] -- <command> [<options>] -I, --intr-regs[=<any register>] sample selected machine registers on interrupt, use '-I?' to list register names #perf record -I [ perf record: Woken up 1 times to write data ] [ perf record: Captured and wrote 0.800 MB perf.data (318 samples) ] #perf evlist -v cycles: size: 112, { sample_period, sample_freq }: 4000, sample_type: IP|TID|TIME|CPU|PERIOD|REGS_INTR, read_format: ID, disabled: 1, inherit: 1, mmap: 1, comm: 1, freq: 1, task: 1, precise_ip: 3, sample_id_all: 1, exclude_guest: 1, mmap2: 1, comm_exec: 1, ksymbol: 1, bpf_event: 1, sample_regs_intr: 0xffffffff00ff0fff Committer notes: Don't set attr.sample_period as a named struct init, as it is part of an unnamed union in 'struct perf_event_attr', and doing so breaks the build on older gcc versions, such as: gcc version 4.1.2 20080704 (Red Hat 4.1.2-55) gcc version 4.4.7 20120313 (Red Hat 4.4.7-23) (GCC) arch/x86/util/perf_regs.c: In function 'arch__intr_reg_mask': arch/x86/util/perf_regs.c:279: error: unknown field 'sample_period' specified in initializer cc1: warnings being treated as errors arch/x86/util/perf_regs.c:279: warning: missing braces around initializer arch/x86/util/perf_regs.c:279: warning: (near initialization for 'attr.<anonymous>') Signed-off-by: Kan Liang <kan.liang@linux.intel.com> [ Only on a lenovo t480s, a skylake machine, where the XMM registers didn't show up in -I?/--user-regs=? as expected ] Tested-by: Arnaldo Carvalho de Melo <acme@redhat.com> Cc: Andi Kleen <ak@linux.intel.com> Cc: Jiri Olsa <jolsa@kernel.org> Link: http://lkml.kernel.org/r/1557865174-56264-3-git-send-email-kan.liang@linux.intel.com Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
110 lines
2.2 KiB
C
110 lines
2.2 KiB
C
/* SPDX-License-Identifier: GPL-2.0 */
|
|
#ifndef ARCH_PERF_REGS_H
|
|
#define ARCH_PERF_REGS_H
|
|
|
|
#include <stdlib.h>
|
|
#include <linux/types.h>
|
|
#include <asm/perf_regs.h>
|
|
|
|
void perf_regs_load(u64 *regs);
|
|
|
|
#define PERF_REGS_MAX PERF_REG_X86_XMM_MAX
|
|
#define PERF_XMM_REGS_MASK (~((1ULL << PERF_REG_X86_XMM0) - 1))
|
|
#ifndef HAVE_ARCH_X86_64_SUPPORT
|
|
#define PERF_REGS_MASK ((1ULL << PERF_REG_X86_32_MAX) - 1)
|
|
#define PERF_SAMPLE_REGS_ABI PERF_SAMPLE_REGS_ABI_32
|
|
#else
|
|
#define REG_NOSUPPORT ((1ULL << PERF_REG_X86_DS) | \
|
|
(1ULL << PERF_REG_X86_ES) | \
|
|
(1ULL << PERF_REG_X86_FS) | \
|
|
(1ULL << PERF_REG_X86_GS))
|
|
#define PERF_REGS_MASK (((1ULL << PERF_REG_X86_64_MAX) - 1) & ~REG_NOSUPPORT)
|
|
#define PERF_SAMPLE_REGS_ABI PERF_SAMPLE_REGS_ABI_64
|
|
#endif
|
|
#define PERF_REG_IP PERF_REG_X86_IP
|
|
#define PERF_REG_SP PERF_REG_X86_SP
|
|
|
|
static inline const char *perf_reg_name(int id)
|
|
{
|
|
switch (id) {
|
|
case PERF_REG_X86_AX:
|
|
return "AX";
|
|
case PERF_REG_X86_BX:
|
|
return "BX";
|
|
case PERF_REG_X86_CX:
|
|
return "CX";
|
|
case PERF_REG_X86_DX:
|
|
return "DX";
|
|
case PERF_REG_X86_SI:
|
|
return "SI";
|
|
case PERF_REG_X86_DI:
|
|
return "DI";
|
|
case PERF_REG_X86_BP:
|
|
return "BP";
|
|
case PERF_REG_X86_SP:
|
|
return "SP";
|
|
case PERF_REG_X86_IP:
|
|
return "IP";
|
|
case PERF_REG_X86_FLAGS:
|
|
return "FLAGS";
|
|
case PERF_REG_X86_CS:
|
|
return "CS";
|
|
case PERF_REG_X86_SS:
|
|
return "SS";
|
|
case PERF_REG_X86_DS:
|
|
return "DS";
|
|
case PERF_REG_X86_ES:
|
|
return "ES";
|
|
case PERF_REG_X86_FS:
|
|
return "FS";
|
|
case PERF_REG_X86_GS:
|
|
return "GS";
|
|
#ifdef HAVE_ARCH_X86_64_SUPPORT
|
|
case PERF_REG_X86_R8:
|
|
return "R8";
|
|
case PERF_REG_X86_R9:
|
|
return "R9";
|
|
case PERF_REG_X86_R10:
|
|
return "R10";
|
|
case PERF_REG_X86_R11:
|
|
return "R11";
|
|
case PERF_REG_X86_R12:
|
|
return "R12";
|
|
case PERF_REG_X86_R13:
|
|
return "R13";
|
|
case PERF_REG_X86_R14:
|
|
return "R14";
|
|
case PERF_REG_X86_R15:
|
|
return "R15";
|
|
#endif /* HAVE_ARCH_X86_64_SUPPORT */
|
|
|
|
#define XMM(x) \
|
|
case PERF_REG_X86_XMM ## x: \
|
|
case PERF_REG_X86_XMM ## x + 1: \
|
|
return "XMM" #x;
|
|
XMM(0)
|
|
XMM(1)
|
|
XMM(2)
|
|
XMM(3)
|
|
XMM(4)
|
|
XMM(5)
|
|
XMM(6)
|
|
XMM(7)
|
|
XMM(8)
|
|
XMM(9)
|
|
XMM(10)
|
|
XMM(11)
|
|
XMM(12)
|
|
XMM(13)
|
|
XMM(14)
|
|
XMM(15)
|
|
#undef XMM
|
|
default:
|
|
return NULL;
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
#endif /* ARCH_PERF_REGS_H */
|