9d6a1df9b2
Scanning all PMUs is expensive as all PMUs sysfs entries are loaded, benchmarking shows more than 4x the cost: ``` $ perf bench internals pmu-scan -i 1000 Computing performance of sysfs PMU event scan for 1000 times Average core PMU scanning took: 989.231 usec (+- 1.535 usec) Average PMU scanning took: 4309.425 usec (+- 74.322 usec) ``` Add new perf_pmus__scan_core routine that scans just core PMUs. Replace perf_pmus__scan calls with perf_pmus__scan_core when non-core PMUs are being ignored. Reviewed-by: Kan Liang <kan.liang@linux.intel.com> Signed-off-by: Ian Rogers <irogers@google.com> Cc: Adrian Hunter <adrian.hunter@intel.com> Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com> Cc: Ali Saidi <alisaidi@amazon.com> Cc: Athira Rajeev <atrajeev@linux.vnet.ibm.com> Cc: Dmitrii Dolgov <9erthalion6@gmail.com> Cc: Huacai Chen <chenhuacai@kernel.org> Cc: Ingo Molnar <mingo@redhat.com> Cc: James Clark <james.clark@arm.com> Cc: Jing Zhang <renyu.zj@linux.alibaba.com> Cc: Jiri Olsa <jolsa@kernel.org> Cc: John Garry <john.g.garry@oracle.com> Cc: Kajol Jain <kjain@linux.ibm.com> Cc: Kang Minchul <tegongkang@gmail.com> Cc: Leo Yan <leo.yan@linaro.org> Cc: Madhavan Srinivasan <maddy@linux.ibm.com> Cc: Mark Rutland <mark.rutland@arm.com> Cc: Mike Leach <mike.leach@linaro.org> Cc: Ming Wang <wangming01@loongson.cn> Cc: Namhyung Kim <namhyung@kernel.org> Cc: Peter Zijlstra <peterz@infradead.org> Cc: Ravi Bangoria <ravi.bangoria@amd.com> Cc: Rob Herring <robh@kernel.org> Cc: Sandipan Das <sandipan.das@amd.com> Cc: Sean Christopherson <seanjc@google.com> Cc: Suzuki Poulouse <suzuki.poulose@arm.com> Cc: Thomas Richter <tmricht@linux.ibm.com> Cc: Will Deacon <will@kernel.org> Cc: Xing Zhengjun <zhengjun.xing@linux.intel.com> Cc: coresight@lists.linaro.org Cc: linux-arm-kernel@lists.infradead.org Link: https://lore.kernel.org/r/20230527072210.2900565-30-irogers@google.com Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
1044 lines
26 KiB
C
1044 lines
26 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
#include "math.h"
|
|
#include "parse-events.h"
|
|
#include "pmu.h"
|
|
#include "pmus.h"
|
|
#include "tests.h"
|
|
#include <errno.h>
|
|
#include <stdio.h>
|
|
#include <linux/kernel.h>
|
|
#include <linux/zalloc.h>
|
|
#include "debug.h"
|
|
#include "../pmu-events/pmu-events.h"
|
|
#include <perf/evlist.h>
|
|
#include "util/evlist.h"
|
|
#include "util/expr.h"
|
|
#include "util/hashmap.h"
|
|
#include "util/parse-events.h"
|
|
#include "metricgroup.h"
|
|
#include "stat.h"
|
|
|
|
struct perf_pmu_test_event {
|
|
/* used for matching against events from generated pmu-events.c */
|
|
struct pmu_event event;
|
|
|
|
/* used for matching against event aliases */
|
|
/* extra events for aliases */
|
|
const char *alias_str;
|
|
|
|
/*
|
|
* Note: For when PublicDescription does not exist in the JSON, we
|
|
* will have no long_desc in pmu_event.long_desc, but long_desc may
|
|
* be set in the alias.
|
|
*/
|
|
const char *alias_long_desc;
|
|
|
|
/* PMU which we should match against */
|
|
const char *matching_pmu;
|
|
};
|
|
|
|
struct perf_pmu_test_pmu {
|
|
struct perf_pmu pmu;
|
|
struct perf_pmu_test_event const *aliases[10];
|
|
};
|
|
|
|
static const struct perf_pmu_test_event bp_l1_btb_correct = {
|
|
.event = {
|
|
.name = "bp_l1_btb_correct",
|
|
.event = "event=0x8a",
|
|
.desc = "L1 BTB Correction",
|
|
.topic = "branch",
|
|
},
|
|
.alias_str = "event=0x8a",
|
|
.alias_long_desc = "L1 BTB Correction",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event bp_l2_btb_correct = {
|
|
.event = {
|
|
.name = "bp_l2_btb_correct",
|
|
.event = "event=0x8b",
|
|
.desc = "L2 BTB Correction",
|
|
.topic = "branch",
|
|
},
|
|
.alias_str = "event=0x8b",
|
|
.alias_long_desc = "L2 BTB Correction",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event segment_reg_loads_any = {
|
|
.event = {
|
|
.name = "segment_reg_loads.any",
|
|
.event = "event=0x6,period=200000,umask=0x80",
|
|
.desc = "Number of segment register loads",
|
|
.topic = "other",
|
|
},
|
|
.alias_str = "event=0x6,period=0x30d40,umask=0x80",
|
|
.alias_long_desc = "Number of segment register loads",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event dispatch_blocked_any = {
|
|
.event = {
|
|
.name = "dispatch_blocked.any",
|
|
.event = "event=0x9,period=200000,umask=0x20",
|
|
.desc = "Memory cluster signals to block micro-op dispatch for any reason",
|
|
.topic = "other",
|
|
},
|
|
.alias_str = "event=0x9,period=0x30d40,umask=0x20",
|
|
.alias_long_desc = "Memory cluster signals to block micro-op dispatch for any reason",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event eist_trans = {
|
|
.event = {
|
|
.name = "eist_trans",
|
|
.event = "event=0x3a,period=200000,umask=0x0",
|
|
.desc = "Number of Enhanced Intel SpeedStep(R) Technology (EIST) transitions",
|
|
.topic = "other",
|
|
},
|
|
.alias_str = "event=0x3a,period=0x30d40,umask=0",
|
|
.alias_long_desc = "Number of Enhanced Intel SpeedStep(R) Technology (EIST) transitions",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event l3_cache_rd = {
|
|
.event = {
|
|
.name = "l3_cache_rd",
|
|
.event = "event=0x40",
|
|
.desc = "L3 cache access, read",
|
|
.long_desc = "Attributable Level 3 cache access, read",
|
|
.topic = "cache",
|
|
},
|
|
.alias_str = "event=0x40",
|
|
.alias_long_desc = "Attributable Level 3 cache access, read",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event *core_events[] = {
|
|
&bp_l1_btb_correct,
|
|
&bp_l2_btb_correct,
|
|
&segment_reg_loads_any,
|
|
&dispatch_blocked_any,
|
|
&eist_trans,
|
|
&l3_cache_rd,
|
|
NULL
|
|
};
|
|
|
|
static const struct perf_pmu_test_event uncore_hisi_ddrc_flux_wcmd = {
|
|
.event = {
|
|
.name = "uncore_hisi_ddrc.flux_wcmd",
|
|
.event = "event=0x2",
|
|
.desc = "DDRC write commands. Unit: hisi_sccl,ddrc ",
|
|
.topic = "uncore",
|
|
.long_desc = "DDRC write commands",
|
|
.pmu = "hisi_sccl,ddrc",
|
|
},
|
|
.alias_str = "event=0x2",
|
|
.alias_long_desc = "DDRC write commands",
|
|
.matching_pmu = "hisi_sccl1_ddrc2",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event unc_cbo_xsnp_response_miss_eviction = {
|
|
.event = {
|
|
.name = "unc_cbo_xsnp_response.miss_eviction",
|
|
.event = "event=0x22,umask=0x81",
|
|
.desc = "A cross-core snoop resulted from L3 Eviction which misses in some processor core. Unit: uncore_cbox ",
|
|
.topic = "uncore",
|
|
.long_desc = "A cross-core snoop resulted from L3 Eviction which misses in some processor core",
|
|
.pmu = "uncore_cbox",
|
|
},
|
|
.alias_str = "event=0x22,umask=0x81",
|
|
.alias_long_desc = "A cross-core snoop resulted from L3 Eviction which misses in some processor core",
|
|
.matching_pmu = "uncore_cbox_0",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event uncore_hyphen = {
|
|
.event = {
|
|
.name = "event-hyphen",
|
|
.event = "event=0xe0,umask=0x00",
|
|
.desc = "UNC_CBO_HYPHEN. Unit: uncore_cbox ",
|
|
.topic = "uncore",
|
|
.long_desc = "UNC_CBO_HYPHEN",
|
|
.pmu = "uncore_cbox",
|
|
},
|
|
.alias_str = "event=0xe0,umask=0",
|
|
.alias_long_desc = "UNC_CBO_HYPHEN",
|
|
.matching_pmu = "uncore_cbox_0",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event uncore_two_hyph = {
|
|
.event = {
|
|
.name = "event-two-hyph",
|
|
.event = "event=0xc0,umask=0x00",
|
|
.desc = "UNC_CBO_TWO_HYPH. Unit: uncore_cbox ",
|
|
.topic = "uncore",
|
|
.long_desc = "UNC_CBO_TWO_HYPH",
|
|
.pmu = "uncore_cbox",
|
|
},
|
|
.alias_str = "event=0xc0,umask=0",
|
|
.alias_long_desc = "UNC_CBO_TWO_HYPH",
|
|
.matching_pmu = "uncore_cbox_0",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event uncore_hisi_l3c_rd_hit_cpipe = {
|
|
.event = {
|
|
.name = "uncore_hisi_l3c.rd_hit_cpipe",
|
|
.event = "event=0x7",
|
|
.desc = "Total read hits. Unit: hisi_sccl,l3c ",
|
|
.topic = "uncore",
|
|
.long_desc = "Total read hits",
|
|
.pmu = "hisi_sccl,l3c",
|
|
},
|
|
.alias_str = "event=0x7",
|
|
.alias_long_desc = "Total read hits",
|
|
.matching_pmu = "hisi_sccl3_l3c7",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event uncore_imc_free_running_cache_miss = {
|
|
.event = {
|
|
.name = "uncore_imc_free_running.cache_miss",
|
|
.event = "event=0x12",
|
|
.desc = "Total cache misses. Unit: uncore_imc_free_running ",
|
|
.topic = "uncore",
|
|
.long_desc = "Total cache misses",
|
|
.pmu = "uncore_imc_free_running",
|
|
},
|
|
.alias_str = "event=0x12",
|
|
.alias_long_desc = "Total cache misses",
|
|
.matching_pmu = "uncore_imc_free_running_0",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event uncore_imc_cache_hits = {
|
|
.event = {
|
|
.name = "uncore_imc.cache_hits",
|
|
.event = "event=0x34",
|
|
.desc = "Total cache hits. Unit: uncore_imc ",
|
|
.topic = "uncore",
|
|
.long_desc = "Total cache hits",
|
|
.pmu = "uncore_imc",
|
|
},
|
|
.alias_str = "event=0x34",
|
|
.alias_long_desc = "Total cache hits",
|
|
.matching_pmu = "uncore_imc_0",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event *uncore_events[] = {
|
|
&uncore_hisi_ddrc_flux_wcmd,
|
|
&unc_cbo_xsnp_response_miss_eviction,
|
|
&uncore_hyphen,
|
|
&uncore_two_hyph,
|
|
&uncore_hisi_l3c_rd_hit_cpipe,
|
|
&uncore_imc_free_running_cache_miss,
|
|
&uncore_imc_cache_hits,
|
|
NULL
|
|
};
|
|
|
|
static const struct perf_pmu_test_event sys_ddr_pmu_write_cycles = {
|
|
.event = {
|
|
.name = "sys_ddr_pmu.write_cycles",
|
|
.event = "event=0x2b",
|
|
.desc = "ddr write-cycles event. Unit: uncore_sys_ddr_pmu ",
|
|
.topic = "uncore",
|
|
.pmu = "uncore_sys_ddr_pmu",
|
|
.compat = "v8",
|
|
},
|
|
.alias_str = "event=0x2b",
|
|
.alias_long_desc = "ddr write-cycles event. Unit: uncore_sys_ddr_pmu ",
|
|
.matching_pmu = "uncore_sys_ddr_pmu",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event sys_ccn_pmu_read_cycles = {
|
|
.event = {
|
|
.name = "sys_ccn_pmu.read_cycles",
|
|
.event = "config=0x2c",
|
|
.desc = "ccn read-cycles event. Unit: uncore_sys_ccn_pmu ",
|
|
.topic = "uncore",
|
|
.pmu = "uncore_sys_ccn_pmu",
|
|
.compat = "0x01",
|
|
},
|
|
.alias_str = "config=0x2c",
|
|
.alias_long_desc = "ccn read-cycles event. Unit: uncore_sys_ccn_pmu ",
|
|
.matching_pmu = "uncore_sys_ccn_pmu",
|
|
};
|
|
|
|
static const struct perf_pmu_test_event *sys_events[] = {
|
|
&sys_ddr_pmu_write_cycles,
|
|
&sys_ccn_pmu_read_cycles,
|
|
NULL
|
|
};
|
|
|
|
static bool is_same(const char *reference, const char *test)
|
|
{
|
|
if (!reference && !test)
|
|
return true;
|
|
|
|
if (reference && !test)
|
|
return false;
|
|
|
|
if (!reference && test)
|
|
return false;
|
|
|
|
return !strcmp(reference, test);
|
|
}
|
|
|
|
static int compare_pmu_events(const struct pmu_event *e1, const struct pmu_event *e2)
|
|
{
|
|
if (!is_same(e1->name, e2->name)) {
|
|
pr_debug2("testing event e1 %s: mismatched name string, %s vs %s\n",
|
|
e1->name, e1->name, e2->name);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(e1->compat, e2->compat)) {
|
|
pr_debug2("testing event e1 %s: mismatched compat string, %s vs %s\n",
|
|
e1->name, e1->compat, e2->compat);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(e1->event, e2->event)) {
|
|
pr_debug2("testing event e1 %s: mismatched event, %s vs %s\n",
|
|
e1->name, e1->event, e2->event);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(e1->desc, e2->desc)) {
|
|
pr_debug2("testing event e1 %s: mismatched desc, %s vs %s\n",
|
|
e1->name, e1->desc, e2->desc);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(e1->topic, e2->topic)) {
|
|
pr_debug2("testing event e1 %s: mismatched topic, %s vs %s\n",
|
|
e1->name, e1->topic, e2->topic);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(e1->long_desc, e2->long_desc)) {
|
|
pr_debug2("testing event e1 %s: mismatched long_desc, %s vs %s\n",
|
|
e1->name, e1->long_desc, e2->long_desc);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(e1->pmu, e2->pmu)) {
|
|
pr_debug2("testing event e1 %s: mismatched pmu string, %s vs %s\n",
|
|
e1->name, e1->pmu, e2->pmu);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(e1->unit, e2->unit)) {
|
|
pr_debug2("testing event e1 %s: mismatched unit, %s vs %s\n",
|
|
e1->name, e1->unit, e2->unit);
|
|
return -1;
|
|
}
|
|
|
|
if (e1->perpkg != e2->perpkg) {
|
|
pr_debug2("testing event e1 %s: mismatched perpkg, %d vs %d\n",
|
|
e1->name, e1->perpkg, e2->perpkg);
|
|
return -1;
|
|
}
|
|
|
|
if (e1->deprecated != e2->deprecated) {
|
|
pr_debug2("testing event e1 %s: mismatched deprecated, %d vs %d\n",
|
|
e1->name, e1->deprecated, e2->deprecated);
|
|
return -1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int compare_alias_to_test_event(struct perf_pmu_alias *alias,
|
|
struct perf_pmu_test_event const *test_event,
|
|
char const *pmu_name)
|
|
{
|
|
struct pmu_event const *event = &test_event->event;
|
|
|
|
/* An alias was found, ensure everything is in order */
|
|
if (!is_same(alias->name, event->name)) {
|
|
pr_debug("testing aliases PMU %s: mismatched name, %s vs %s\n",
|
|
pmu_name, alias->name, event->name);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(alias->desc, event->desc)) {
|
|
pr_debug("testing aliases PMU %s: mismatched desc, %s vs %s\n",
|
|
pmu_name, alias->desc, event->desc);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(alias->long_desc, test_event->alias_long_desc)) {
|
|
pr_debug("testing aliases PMU %s: mismatched long_desc, %s vs %s\n",
|
|
pmu_name, alias->long_desc,
|
|
test_event->alias_long_desc);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(alias->topic, event->topic)) {
|
|
pr_debug("testing aliases PMU %s: mismatched topic, %s vs %s\n",
|
|
pmu_name, alias->topic, event->topic);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(alias->str, test_event->alias_str)) {
|
|
pr_debug("testing aliases PMU %s: mismatched str, %s vs %s\n",
|
|
pmu_name, alias->str, test_event->alias_str);
|
|
return -1;
|
|
}
|
|
|
|
if (!is_same(alias->long_desc, test_event->alias_long_desc)) {
|
|
pr_debug("testing aliases PMU %s: mismatched long desc, %s vs %s\n",
|
|
pmu_name, alias->str, test_event->alias_long_desc);
|
|
return -1;
|
|
}
|
|
|
|
|
|
if (!is_same(alias->pmu_name, test_event->event.pmu)) {
|
|
pr_debug("testing aliases PMU %s: mismatched pmu_name, %s vs %s\n",
|
|
pmu_name, alias->pmu_name, test_event->event.pmu);
|
|
return -1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int test__pmu_event_table_core_callback(const struct pmu_event *pe,
|
|
const struct pmu_events_table *table __maybe_unused,
|
|
void *data)
|
|
{
|
|
int *map_events = data;
|
|
struct perf_pmu_test_event const **test_event_table;
|
|
bool found = false;
|
|
|
|
if (pe->pmu)
|
|
test_event_table = &uncore_events[0];
|
|
else
|
|
test_event_table = &core_events[0];
|
|
|
|
for (; *test_event_table; test_event_table++) {
|
|
struct perf_pmu_test_event const *test_event = *test_event_table;
|
|
struct pmu_event const *event = &test_event->event;
|
|
|
|
if (strcmp(pe->name, event->name))
|
|
continue;
|
|
found = true;
|
|
(*map_events)++;
|
|
|
|
if (compare_pmu_events(pe, event))
|
|
return -1;
|
|
|
|
pr_debug("testing event table %s: pass\n", pe->name);
|
|
}
|
|
if (!found) {
|
|
pr_err("testing event table: could not find event %s\n", pe->name);
|
|
return -1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static int test__pmu_event_table_sys_callback(const struct pmu_event *pe,
|
|
const struct pmu_events_table *table __maybe_unused,
|
|
void *data)
|
|
{
|
|
int *map_events = data;
|
|
struct perf_pmu_test_event const **test_event_table;
|
|
bool found = false;
|
|
|
|
test_event_table = &sys_events[0];
|
|
|
|
for (; *test_event_table; test_event_table++) {
|
|
struct perf_pmu_test_event const *test_event = *test_event_table;
|
|
struct pmu_event const *event = &test_event->event;
|
|
|
|
if (strcmp(pe->name, event->name))
|
|
continue;
|
|
found = true;
|
|
(*map_events)++;
|
|
|
|
if (compare_pmu_events(pe, event))
|
|
return TEST_FAIL;
|
|
|
|
pr_debug("testing sys event table %s: pass\n", pe->name);
|
|
}
|
|
if (!found) {
|
|
pr_debug("testing sys event table: could not find event %s\n", pe->name);
|
|
return TEST_FAIL;
|
|
}
|
|
return TEST_OK;
|
|
}
|
|
|
|
/* Verify generated events from pmu-events.c are as expected */
|
|
static int test__pmu_event_table(struct test_suite *test __maybe_unused,
|
|
int subtest __maybe_unused)
|
|
{
|
|
const struct pmu_events_table *sys_event_table =
|
|
find_sys_events_table("pmu_events__test_soc_sys");
|
|
const struct pmu_events_table *table = find_core_events_table("testarch", "testcpu");
|
|
int map_events = 0, expected_events, err;
|
|
|
|
/* ignore 3x sentinels */
|
|
expected_events = ARRAY_SIZE(core_events) +
|
|
ARRAY_SIZE(uncore_events) +
|
|
ARRAY_SIZE(sys_events) - 3;
|
|
|
|
if (!table || !sys_event_table)
|
|
return -1;
|
|
|
|
err = pmu_events_table_for_each_event(table, test__pmu_event_table_core_callback,
|
|
&map_events);
|
|
if (err)
|
|
return err;
|
|
|
|
err = pmu_events_table_for_each_event(sys_event_table, test__pmu_event_table_sys_callback,
|
|
&map_events);
|
|
if (err)
|
|
return err;
|
|
|
|
if (map_events != expected_events) {
|
|
pr_err("testing event table: found %d, but expected %d\n",
|
|
map_events, expected_events);
|
|
return TEST_FAIL;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static struct perf_pmu_alias *find_alias(const char *test_event, struct list_head *aliases)
|
|
{
|
|
struct perf_pmu_alias *alias;
|
|
|
|
list_for_each_entry(alias, aliases, list)
|
|
if (!strcmp(test_event, alias->name))
|
|
return alias;
|
|
|
|
return NULL;
|
|
}
|
|
|
|
/* Verify aliases are as expected */
|
|
static int __test_core_pmu_event_aliases(char *pmu_name, int *count)
|
|
{
|
|
struct perf_pmu_test_event const **test_event_table;
|
|
struct perf_pmu *pmu;
|
|
LIST_HEAD(aliases);
|
|
int res = 0;
|
|
const struct pmu_events_table *table = find_core_events_table("testarch", "testcpu");
|
|
struct perf_pmu_alias *a, *tmp;
|
|
|
|
if (!table)
|
|
return -1;
|
|
|
|
test_event_table = &core_events[0];
|
|
|
|
pmu = zalloc(sizeof(*pmu));
|
|
if (!pmu)
|
|
return -1;
|
|
|
|
pmu->name = pmu_name;
|
|
|
|
pmu_add_cpu_aliases_table(&aliases, pmu, table);
|
|
|
|
for (; *test_event_table; test_event_table++) {
|
|
struct perf_pmu_test_event const *test_event = *test_event_table;
|
|
struct pmu_event const *event = &test_event->event;
|
|
struct perf_pmu_alias *alias = find_alias(event->name, &aliases);
|
|
|
|
if (!alias) {
|
|
pr_debug("testing aliases core PMU %s: no alias, alias_table->name=%s\n",
|
|
pmu_name, event->name);
|
|
res = -1;
|
|
break;
|
|
}
|
|
|
|
if (compare_alias_to_test_event(alias, test_event, pmu_name)) {
|
|
res = -1;
|
|
break;
|
|
}
|
|
|
|
(*count)++;
|
|
pr_debug2("testing aliases core PMU %s: matched event %s\n",
|
|
pmu_name, alias->name);
|
|
}
|
|
|
|
list_for_each_entry_safe(a, tmp, &aliases, list) {
|
|
list_del(&a->list);
|
|
perf_pmu_free_alias(a);
|
|
}
|
|
free(pmu);
|
|
return res;
|
|
}
|
|
|
|
static int __test_uncore_pmu_event_aliases(struct perf_pmu_test_pmu *test_pmu)
|
|
{
|
|
int alias_count = 0, to_match_count = 0, matched_count = 0;
|
|
struct perf_pmu_test_event const **table;
|
|
struct perf_pmu *pmu = &test_pmu->pmu;
|
|
const char *pmu_name = pmu->name;
|
|
struct perf_pmu_alias *a, *tmp, *alias;
|
|
const struct pmu_events_table *events_table;
|
|
LIST_HEAD(aliases);
|
|
int res = 0;
|
|
|
|
events_table = find_core_events_table("testarch", "testcpu");
|
|
if (!events_table)
|
|
return -1;
|
|
pmu_add_cpu_aliases_table(&aliases, pmu, events_table);
|
|
pmu_add_sys_aliases(&aliases, pmu);
|
|
|
|
/* Count how many aliases we generated */
|
|
list_for_each_entry(alias, &aliases, list)
|
|
alias_count++;
|
|
|
|
/* Count how many aliases we expect from the known table */
|
|
for (table = &test_pmu->aliases[0]; *table; table++)
|
|
to_match_count++;
|
|
|
|
if (alias_count != to_match_count) {
|
|
pr_debug("testing aliases uncore PMU %s: mismatch expected aliases (%d) vs found (%d)\n",
|
|
pmu_name, to_match_count, alias_count);
|
|
res = -1;
|
|
goto out;
|
|
}
|
|
|
|
list_for_each_entry(alias, &aliases, list) {
|
|
bool matched = false;
|
|
|
|
for (table = &test_pmu->aliases[0]; *table; table++) {
|
|
struct perf_pmu_test_event const *test_event = *table;
|
|
struct pmu_event const *event = &test_event->event;
|
|
|
|
if (!strcmp(event->name, alias->name)) {
|
|
if (compare_alias_to_test_event(alias,
|
|
test_event,
|
|
pmu_name)) {
|
|
continue;
|
|
}
|
|
matched = true;
|
|
matched_count++;
|
|
}
|
|
}
|
|
|
|
if (matched == false) {
|
|
pr_debug("testing aliases uncore PMU %s: could not match alias %s\n",
|
|
pmu_name, alias->name);
|
|
res = -1;
|
|
goto out;
|
|
}
|
|
}
|
|
|
|
if (alias_count != matched_count) {
|
|
pr_debug("testing aliases uncore PMU %s: mismatch found aliases (%d) vs matched (%d)\n",
|
|
pmu_name, matched_count, alias_count);
|
|
res = -1;
|
|
}
|
|
|
|
out:
|
|
list_for_each_entry_safe(a, tmp, &aliases, list) {
|
|
list_del(&a->list);
|
|
perf_pmu_free_alias(a);
|
|
}
|
|
return res;
|
|
}
|
|
|
|
static struct perf_pmu_test_pmu test_pmus[] = {
|
|
{
|
|
.pmu = {
|
|
.name = (char *)"hisi_sccl1_ddrc2",
|
|
.is_uncore = 1,
|
|
},
|
|
.aliases = {
|
|
&uncore_hisi_ddrc_flux_wcmd,
|
|
},
|
|
},
|
|
{
|
|
.pmu = {
|
|
.name = (char *)"uncore_cbox_0",
|
|
.is_uncore = 1,
|
|
},
|
|
.aliases = {
|
|
&unc_cbo_xsnp_response_miss_eviction,
|
|
&uncore_hyphen,
|
|
&uncore_two_hyph,
|
|
},
|
|
},
|
|
{
|
|
.pmu = {
|
|
.name = (char *)"hisi_sccl3_l3c7",
|
|
.is_uncore = 1,
|
|
},
|
|
.aliases = {
|
|
&uncore_hisi_l3c_rd_hit_cpipe,
|
|
},
|
|
},
|
|
{
|
|
.pmu = {
|
|
.name = (char *)"uncore_imc_free_running_0",
|
|
.is_uncore = 1,
|
|
},
|
|
.aliases = {
|
|
&uncore_imc_free_running_cache_miss,
|
|
},
|
|
},
|
|
{
|
|
.pmu = {
|
|
.name = (char *)"uncore_imc_0",
|
|
.is_uncore = 1,
|
|
},
|
|
.aliases = {
|
|
&uncore_imc_cache_hits,
|
|
},
|
|
},
|
|
{
|
|
.pmu = {
|
|
.name = (char *)"uncore_sys_ddr_pmu0",
|
|
.is_uncore = 1,
|
|
.id = (char *)"v8",
|
|
},
|
|
.aliases = {
|
|
&sys_ddr_pmu_write_cycles,
|
|
},
|
|
},
|
|
{
|
|
.pmu = {
|
|
.name = (char *)"uncore_sys_ccn_pmu4",
|
|
.is_uncore = 1,
|
|
.id = (char *)"0x01",
|
|
},
|
|
.aliases = {
|
|
&sys_ccn_pmu_read_cycles,
|
|
},
|
|
},
|
|
};
|
|
|
|
/* Test that aliases generated are as expected */
|
|
static int test__aliases(struct test_suite *test __maybe_unused,
|
|
int subtest __maybe_unused)
|
|
{
|
|
struct perf_pmu *pmu = NULL;
|
|
unsigned long i;
|
|
|
|
while ((pmu = perf_pmus__scan_core(pmu)) != NULL) {
|
|
int count = 0;
|
|
|
|
if (list_empty(&pmu->format)) {
|
|
pr_debug2("skipping testing core PMU %s\n", pmu->name);
|
|
continue;
|
|
}
|
|
|
|
if (__test_core_pmu_event_aliases(pmu->name, &count)) {
|
|
pr_debug("testing core PMU %s aliases: failed\n", pmu->name);
|
|
return -1;
|
|
}
|
|
|
|
if (count == 0) {
|
|
pr_debug("testing core PMU %s aliases: no events to match\n",
|
|
pmu->name);
|
|
return -1;
|
|
}
|
|
|
|
pr_debug("testing core PMU %s aliases: pass\n", pmu->name);
|
|
}
|
|
|
|
for (i = 0; i < ARRAY_SIZE(test_pmus); i++) {
|
|
int res = __test_uncore_pmu_event_aliases(&test_pmus[i]);
|
|
|
|
if (res)
|
|
return res;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static bool is_number(const char *str)
|
|
{
|
|
char *end_ptr;
|
|
double v;
|
|
|
|
errno = 0;
|
|
v = strtod(str, &end_ptr);
|
|
(void)v; // We're not interested in this value, only if it is valid
|
|
return errno == 0 && end_ptr != str;
|
|
}
|
|
|
|
static int check_parse_id(const char *id, struct parse_events_error *error,
|
|
struct perf_pmu *fake_pmu)
|
|
{
|
|
struct evlist *evlist;
|
|
int ret;
|
|
char *dup, *cur;
|
|
|
|
/* Numbers are always valid. */
|
|
if (is_number(id))
|
|
return 0;
|
|
|
|
evlist = evlist__new();
|
|
if (!evlist)
|
|
return -ENOMEM;
|
|
|
|
dup = strdup(id);
|
|
if (!dup)
|
|
return -ENOMEM;
|
|
|
|
for (cur = strchr(dup, '@') ; cur; cur = strchr(++cur, '@'))
|
|
*cur = '/';
|
|
|
|
ret = __parse_events(evlist, dup, /*pmu_filter=*/NULL, error, fake_pmu,
|
|
/*warn_if_reordered=*/true);
|
|
free(dup);
|
|
|
|
evlist__delete(evlist);
|
|
return ret;
|
|
}
|
|
|
|
static int check_parse_fake(const char *id)
|
|
{
|
|
struct parse_events_error error;
|
|
int ret;
|
|
|
|
parse_events_error__init(&error);
|
|
ret = check_parse_id(id, &error, &perf_pmu__fake);
|
|
parse_events_error__exit(&error);
|
|
return ret;
|
|
}
|
|
|
|
struct metric {
|
|
struct list_head list;
|
|
struct metric_ref metric_ref;
|
|
};
|
|
|
|
static int test__parsing_callback(const struct pmu_metric *pm,
|
|
const struct pmu_metrics_table *table,
|
|
void *data)
|
|
{
|
|
int *failures = data;
|
|
int k;
|
|
struct evlist *evlist;
|
|
struct perf_cpu_map *cpus;
|
|
struct evsel *evsel;
|
|
struct rblist metric_events = {
|
|
.nr_entries = 0,
|
|
};
|
|
int err = 0;
|
|
|
|
if (!pm->metric_expr)
|
|
return 0;
|
|
|
|
pr_debug("Found metric '%s'\n", pm->metric_name);
|
|
(*failures)++;
|
|
|
|
/*
|
|
* We need to prepare evlist for stat mode running on CPU 0
|
|
* because that's where all the stats are going to be created.
|
|
*/
|
|
evlist = evlist__new();
|
|
if (!evlist)
|
|
return -ENOMEM;
|
|
|
|
cpus = perf_cpu_map__new("0");
|
|
if (!cpus) {
|
|
evlist__delete(evlist);
|
|
return -ENOMEM;
|
|
}
|
|
|
|
perf_evlist__set_maps(&evlist->core, cpus, NULL);
|
|
|
|
err = metricgroup__parse_groups_test(evlist, table, pm->metric_name, &metric_events);
|
|
if (err) {
|
|
if (!strcmp(pm->metric_name, "M1") || !strcmp(pm->metric_name, "M2") ||
|
|
!strcmp(pm->metric_name, "M3")) {
|
|
(*failures)--;
|
|
pr_debug("Expected broken metric %s skipping\n", pm->metric_name);
|
|
err = 0;
|
|
}
|
|
goto out_err;
|
|
}
|
|
|
|
err = evlist__alloc_stats(/*config=*/NULL, evlist, /*alloc_raw=*/false);
|
|
if (err)
|
|
goto out_err;
|
|
/*
|
|
* Add all ids with a made up value. The value may trigger divide by
|
|
* zero when subtracted and so try to make them unique.
|
|
*/
|
|
k = 1;
|
|
evlist__alloc_aggr_stats(evlist, 1);
|
|
evlist__for_each_entry(evlist, evsel) {
|
|
evsel->stats->aggr->counts.val = k;
|
|
if (evsel__name_is(evsel, "duration_time"))
|
|
update_stats(&walltime_nsecs_stats, k);
|
|
k++;
|
|
}
|
|
evlist__for_each_entry(evlist, evsel) {
|
|
struct metric_event *me = metricgroup__lookup(&metric_events, evsel, false);
|
|
|
|
if (me != NULL) {
|
|
struct metric_expr *mexp;
|
|
|
|
list_for_each_entry (mexp, &me->head, nd) {
|
|
if (strcmp(mexp->metric_name, pm->metric_name))
|
|
continue;
|
|
pr_debug("Result %f\n", test_generic_metric(mexp, 0));
|
|
err = 0;
|
|
(*failures)--;
|
|
goto out_err;
|
|
}
|
|
}
|
|
}
|
|
pr_debug("Didn't find parsed metric %s", pm->metric_name);
|
|
err = 1;
|
|
out_err:
|
|
if (err)
|
|
pr_debug("Broken metric %s\n", pm->metric_name);
|
|
|
|
/* ... cleanup. */
|
|
metricgroup__rblist_exit(&metric_events);
|
|
evlist__free_stats(evlist);
|
|
perf_cpu_map__put(cpus);
|
|
evlist__delete(evlist);
|
|
return err;
|
|
}
|
|
|
|
static int test__parsing(struct test_suite *test __maybe_unused,
|
|
int subtest __maybe_unused)
|
|
{
|
|
int failures = 0;
|
|
|
|
pmu_for_each_core_metric(test__parsing_callback, &failures);
|
|
pmu_for_each_sys_metric(test__parsing_callback, &failures);
|
|
|
|
return failures == 0 ? TEST_OK : TEST_FAIL;
|
|
}
|
|
|
|
struct test_metric {
|
|
const char *str;
|
|
};
|
|
|
|
static struct test_metric metrics[] = {
|
|
{ "(unc_p_power_state_occupancy.cores_c0 / unc_p_clockticks) * 100." },
|
|
{ "imx8_ddr0@read\\-cycles@ * 4 * 4", },
|
|
{ "imx8_ddr0@axid\\-read\\,axi_mask\\=0xffff\\,axi_id\\=0x0000@ * 4", },
|
|
{ "(cstate_pkg@c2\\-residency@ / msr@tsc@) * 100", },
|
|
{ "(imx8_ddr0@read\\-cycles@ + imx8_ddr0@write\\-cycles@)", },
|
|
};
|
|
|
|
static int metric_parse_fake(const char *metric_name, const char *str)
|
|
{
|
|
struct expr_parse_ctx *ctx;
|
|
struct hashmap_entry *cur;
|
|
double result;
|
|
int ret = -1;
|
|
size_t bkt;
|
|
int i;
|
|
|
|
pr_debug("parsing '%s': '%s'\n", metric_name, str);
|
|
|
|
ctx = expr__ctx_new();
|
|
if (!ctx) {
|
|
pr_debug("expr__ctx_new failed");
|
|
return TEST_FAIL;
|
|
}
|
|
ctx->sctx.is_test = true;
|
|
if (expr__find_ids(str, NULL, ctx) < 0) {
|
|
pr_err("expr__find_ids failed\n");
|
|
return -1;
|
|
}
|
|
|
|
/*
|
|
* Add all ids with a made up value. The value may
|
|
* trigger divide by zero when subtracted and so try to
|
|
* make them unique.
|
|
*/
|
|
i = 1;
|
|
hashmap__for_each_entry(ctx->ids, cur, bkt)
|
|
expr__add_id_val(ctx, strdup(cur->pkey), i++);
|
|
|
|
hashmap__for_each_entry(ctx->ids, cur, bkt) {
|
|
if (check_parse_fake(cur->pkey)) {
|
|
pr_err("check_parse_fake failed\n");
|
|
goto out;
|
|
}
|
|
}
|
|
|
|
ret = 0;
|
|
if (expr__parse(&result, ctx, str)) {
|
|
/*
|
|
* Parsing failed, make numbers go from large to small which can
|
|
* resolve divide by zero issues.
|
|
*/
|
|
i = 1024;
|
|
hashmap__for_each_entry(ctx->ids, cur, bkt)
|
|
expr__add_id_val(ctx, strdup(cur->pkey), i--);
|
|
if (expr__parse(&result, ctx, str)) {
|
|
pr_err("expr__parse failed for %s\n", metric_name);
|
|
/* The following have hard to avoid divide by zero. */
|
|
if (!strcmp(metric_name, "tma_clears_resteers") ||
|
|
!strcmp(metric_name, "tma_mispredicts_resteers"))
|
|
ret = 0;
|
|
else
|
|
ret = -1;
|
|
}
|
|
}
|
|
|
|
out:
|
|
expr__ctx_free(ctx);
|
|
return ret;
|
|
}
|
|
|
|
static int test__parsing_fake_callback(const struct pmu_metric *pm,
|
|
const struct pmu_metrics_table *table __maybe_unused,
|
|
void *data __maybe_unused)
|
|
{
|
|
return metric_parse_fake(pm->metric_name, pm->metric_expr);
|
|
}
|
|
|
|
/*
|
|
* Parse all the metrics for current architecture,
|
|
* or all defined cpus via the 'fake_pmu'
|
|
* in parse_events.
|
|
*/
|
|
static int test__parsing_fake(struct test_suite *test __maybe_unused,
|
|
int subtest __maybe_unused)
|
|
{
|
|
int err = 0;
|
|
|
|
for (size_t i = 0; i < ARRAY_SIZE(metrics); i++) {
|
|
err = metric_parse_fake("", metrics[i].str);
|
|
if (err)
|
|
return err;
|
|
}
|
|
|
|
err = pmu_for_each_core_metric(test__parsing_fake_callback, NULL);
|
|
if (err)
|
|
return err;
|
|
|
|
return pmu_for_each_sys_metric(test__parsing_fake_callback, NULL);
|
|
}
|
|
|
|
static int test__parsing_threshold_callback(const struct pmu_metric *pm,
|
|
const struct pmu_metrics_table *table __maybe_unused,
|
|
void *data __maybe_unused)
|
|
{
|
|
if (!pm->metric_threshold)
|
|
return 0;
|
|
return metric_parse_fake(pm->metric_name, pm->metric_threshold);
|
|
}
|
|
|
|
static int test__parsing_threshold(struct test_suite *test __maybe_unused,
|
|
int subtest __maybe_unused)
|
|
{
|
|
int err = 0;
|
|
|
|
err = pmu_for_each_core_metric(test__parsing_threshold_callback, NULL);
|
|
if (err)
|
|
return err;
|
|
|
|
return pmu_for_each_sys_metric(test__parsing_threshold_callback, NULL);
|
|
}
|
|
|
|
static struct test_case pmu_events_tests[] = {
|
|
TEST_CASE("PMU event table sanity", pmu_event_table),
|
|
TEST_CASE("PMU event map aliases", aliases),
|
|
TEST_CASE_REASON("Parsing of PMU event table metrics", parsing,
|
|
"some metrics failed"),
|
|
TEST_CASE("Parsing of PMU event table metrics with fake PMUs", parsing_fake),
|
|
TEST_CASE("Parsing of metric thresholds with fake PMUs", parsing_threshold),
|
|
{ .name = NULL, }
|
|
};
|
|
|
|
struct test_suite suite__pmu_events = {
|
|
.desc = "PMU events",
|
|
.test_cases = pmu_events_tests,
|
|
};
|