perf/core improvements and fixes:
User visible: - The default for callchains is back to 'callee' when --children is not used, (Namhyung Kim) - Move the 'use_offset' option to the right place where the annotate code expects it to be to be able to properly handle it (Namhyung Kim) - Don't die when an unknown 'annotate' option is found in the perf config file (usually ~/.perfconfig), just warn the user (Arnaldo Carvalho de Melo) Infrastructure: - Support %ps/%pS in libtraceevent (Scott Wood) Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com> -----BEGIN PGP SIGNATURE----- Version: GnuPG v1 iQIcBAABAgAGBQJWKVS9AAoJENZQFvNTUqpAUnIP/1vQdPG9mr3RsCsHysuBxITf VTqIVrnGEGLIhTH31eSrVEPcEprTWFrMoh8SRfmqD+BGrqMqt6IvngvFqCaRDQ/i uVzmViJiLQp0v9i9J9z4ByxaN3xyRSfoIoTxpxUTnk20SZ7JtlNy/1aUqJTYFhau bEZjrpB0vDcEcGANp4V76fvCZC9X5BuS+PI+95qgptJ22kIJEL+cnayiudTfhbhS HSpBKWpXLGkp1ohB/+fq+pt3AenXPvjO7M2M3lERb9PpWF4bS384JYDpcpitxPQJ PZWZiGhaGSJ7rDaODj11Zt9bRbK3QOCejwXTbDyq3teocmTV6FqnTXKe66tIQFjV oapu3tbUuaRVUt1uo8BkHK78nnI2vxvYW/qcFYQqmjotA0WBSff30RRTrhuo4vpZ xixBrsu22tNk9F7yyl5o69am1IDr3onduFEYr8Jcpt1BYOnoRJa2/FSveLBqK64Z 2kN2/Ws7i2J4ux5LwU+qEz/NFu/+2SgQz+GF0DBRm63bnePOs216mKM3cdYerbtO yiEdpmoanDRUpxfMcXtgxlrEfcnZCfUPyPlaBO446/kX/ghLx6gOQZqkFUc2C0Dw zIXDjL1iOmIEmTai+pwxAFvkHYBS5arBHC0T+lEupTrFEen97xIhZ6J1Af/8vV50 F+VEpKqlD4jgZQQOL10e =yDyE -----END PGP SIGNATURE----- Merge tag 'perf-core-for-mingo' of git://git.kernel.org/pub/scm/linux/kernel/git/acme/linux into perf/core Pull perf/core improvements and fixes from Arnaldo Carvalho de Melo: User visible changes: - The default for callchains is back to 'callee' when --children is not used. (Namhyung Kim) - Move the 'use_offset' option to the right place where the annotate code expects it to be to be able to properly handle it. (Namhyung Kim) - Don't die when an unknown 'annotate' option is found in the perf config file (usually ~/.perfconfig), just warn the user. (Arnaldo Carvalho de Melo) Infrastructure changes: - Support %ps/%pS in libtraceevent. (Scott Wood) Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com> Signed-off-by: Ingo Molnar <mingo@kernel.org>
This commit is contained in:
commit
80fcd45ee0
@ -4905,8 +4905,8 @@ static void pretty_print(struct trace_seq *s, void *data, int size, struct event
|
||||
else
|
||||
ls = 2;
|
||||
|
||||
if (*(ptr+1) == 'F' ||
|
||||
*(ptr+1) == 'f') {
|
||||
if (*(ptr+1) == 'F' || *(ptr+1) == 'f' ||
|
||||
*(ptr+1) == 'S' || *(ptr+1) == 's') {
|
||||
ptr++;
|
||||
show_func = *ptr;
|
||||
} else if (*(ptr+1) == 'M' || *(ptr+1) == 'm') {
|
||||
|
@ -144,7 +144,7 @@ OPTIONS
|
||||
|
||||
--call-graph::
|
||||
Setup and enable call-graph (stack chain/backtrace) recording,
|
||||
implies -g.
|
||||
implies -g. Default is "fp".
|
||||
|
||||
Allows specifying "fp" (frame pointer) or "dwarf"
|
||||
(DWARF's CFI - Call Frame Information) or "lbr"
|
||||
@ -154,13 +154,18 @@ OPTIONS
|
||||
In some systems, where binaries are build with gcc
|
||||
--fomit-frame-pointer, using the "fp" method will produce bogus
|
||||
call graphs, using "dwarf", if available (perf tools linked to
|
||||
the libunwind library) should be used instead.
|
||||
the libunwind or libdw library) should be used instead.
|
||||
Using the "lbr" method doesn't require any compiler options. It
|
||||
will produce call graphs from the hardware LBR registers. The
|
||||
main limition is that it is only available on new Intel
|
||||
platforms, such as Haswell. It can only get user call chain. It
|
||||
doesn't work with branch stack sampling at the same time.
|
||||
|
||||
When "dwarf" recording is used, perf also records (user) stack dump
|
||||
when sampled. Default size of the stack dump is 8192 (bytes).
|
||||
User can change the size by passing the size after comma like
|
||||
"--call-graph dwarf,4096".
|
||||
|
||||
-q::
|
||||
--quiet::
|
||||
Don't print any message, useful for scripting.
|
||||
|
@ -169,30 +169,40 @@ OPTIONS
|
||||
--dump-raw-trace::
|
||||
Dump raw trace in ASCII.
|
||||
|
||||
-g [type,min[,limit],order[,key][,branch]]::
|
||||
--call-graph::
|
||||
Display call chains using type, min percent threshold, optional print
|
||||
limit and order.
|
||||
type can be either:
|
||||
-g::
|
||||
--call-graph=<print_type,threshold[,print_limit],order,sort_key,branch>::
|
||||
Display call chains using type, min percent threshold, print limit,
|
||||
call order, sort key and branch. Note that ordering of parameters is not
|
||||
fixed so any parement can be given in an arbitraty order. One exception
|
||||
is the print_limit which should be preceded by threshold.
|
||||
|
||||
print_type can be either:
|
||||
- flat: single column, linear exposure of call chains.
|
||||
- graph: use a graph tree, displaying absolute overhead rates.
|
||||
- graph: use a graph tree, displaying absolute overhead rates. (default)
|
||||
- fractal: like graph, but displays relative rates. Each branch of
|
||||
the tree is considered as a new profiled object. +
|
||||
the tree is considered as a new profiled object.
|
||||
- none: disable call chain display.
|
||||
|
||||
threshold is a percentage value which specifies a minimum percent to be
|
||||
included in the output call graph. Default is 0.5 (%).
|
||||
|
||||
print_limit is only applied when stdio interface is used. It's to limit
|
||||
number of call graph entries in a single hist entry. Note that it needs
|
||||
to be given after threshold (but not necessarily consecutive).
|
||||
Default is 0 (unlimited).
|
||||
|
||||
order can be either:
|
||||
- callee: callee based call graph.
|
||||
- caller: inverted caller based call graph.
|
||||
Default is 'caller' when --children is used, otherwise 'callee'.
|
||||
|
||||
key can be:
|
||||
- function: compare on functions
|
||||
sort_key can be:
|
||||
- function: compare on functions (default)
|
||||
- address: compare on individual code addresses
|
||||
|
||||
branch can be:
|
||||
- branch: include last branch information in callgraph
|
||||
when available. Usually more convenient to use --branch-history
|
||||
for this.
|
||||
|
||||
Default: graph,0.5,caller
|
||||
- branch: include last branch information in callgraph when available.
|
||||
Usually more convenient to use --branch-history for this.
|
||||
|
||||
--children::
|
||||
Accumulate callchain of children to parent entry so that then can
|
||||
|
@ -160,9 +160,10 @@ Default is to monitor all CPUS.
|
||||
-g::
|
||||
Enables call-graph (stack chain/backtrace) recording.
|
||||
|
||||
--call-graph::
|
||||
--call-graph [mode,type,min[,limit],order[,key][,branch]]::
|
||||
Setup and enable call-graph (stack chain/backtrace) recording,
|
||||
implies -g.
|
||||
implies -g. See `--call-graph` section in perf-record and
|
||||
perf-report man pages for details.
|
||||
|
||||
--children::
|
||||
Accumulate callchain of children to parent entry so that then can
|
||||
|
@ -1010,13 +1010,8 @@ static struct record record = {
|
||||
},
|
||||
};
|
||||
|
||||
#define CALLCHAIN_HELP "setup and enables call-graph (stack chain/backtrace) recording: "
|
||||
|
||||
#ifdef HAVE_DWARF_UNWIND_SUPPORT
|
||||
const char record_callchain_help[] = CALLCHAIN_HELP "fp dwarf lbr";
|
||||
#else
|
||||
const char record_callchain_help[] = CALLCHAIN_HELP "fp lbr";
|
||||
#endif
|
||||
const char record_callchain_help[] = CALLCHAIN_RECORD_HELP
|
||||
"\n\t\t\t\tDefault: fp";
|
||||
|
||||
/*
|
||||
* XXX Will stay a global variable till we fix builtin-script.c to stop messing
|
||||
@ -1064,7 +1059,7 @@ struct option __record_options[] = {
|
||||
NULL, "enables call-graph recording" ,
|
||||
&record_callchain_opt),
|
||||
OPT_CALLBACK(0, "call-graph", &record.opts,
|
||||
"mode[,dump_size]", record_callchain_help,
|
||||
"record_mode[,record_size]", record_callchain_help,
|
||||
&record_parse_callchain_opt),
|
||||
OPT_INCR('v', "verbose", &verbose,
|
||||
"be more verbose (show counter open errors, etc)"),
|
||||
|
@ -625,6 +625,12 @@ parse_percent_limit(const struct option *opt, const char *str,
|
||||
return 0;
|
||||
}
|
||||
|
||||
#define CALLCHAIN_DEFAULT_OPT "graph,0.5,caller,function"
|
||||
|
||||
const char report_callchain_help[] = "Display call graph (stack chain/backtrace):\n\n"
|
||||
CALLCHAIN_REPORT_HELP
|
||||
"\n\t\t\t\tDefault: " CALLCHAIN_DEFAULT_OPT;
|
||||
|
||||
int cmd_report(int argc, const char **argv, const char *prefix __maybe_unused)
|
||||
{
|
||||
struct perf_session *session;
|
||||
@ -633,7 +639,7 @@ int cmd_report(int argc, const char **argv, const char *prefix __maybe_unused)
|
||||
bool has_br_stack = false;
|
||||
int branch_mode = -1;
|
||||
bool branch_call_mode = false;
|
||||
char callchain_default_opt[] = "graph,0.5,caller";
|
||||
char callchain_default_opt[] = CALLCHAIN_DEFAULT_OPT;
|
||||
const char * const report_usage[] = {
|
||||
"perf report [<options>]",
|
||||
NULL
|
||||
@ -699,9 +705,10 @@ int cmd_report(int argc, const char **argv, const char *prefix __maybe_unused)
|
||||
"regex filter to identify parent, see: '--sort parent'"),
|
||||
OPT_BOOLEAN('x', "exclude-other", &symbol_conf.exclude_other,
|
||||
"Only display entries with parent-match"),
|
||||
OPT_CALLBACK_DEFAULT('g', "call-graph", &report, "output_type,min_percent[,print_limit],call_order[,branch]",
|
||||
"Display callchains using output_type (graph, flat, fractal, or none) , min percent threshold, optional print limit, callchain order, key (function or address), add branches. "
|
||||
"Default: graph,0.5,caller", &report_parse_callchain_opt, callchain_default_opt),
|
||||
OPT_CALLBACK_DEFAULT('g', "call-graph", &report,
|
||||
"print_type,threshold[,print_limit],order,sort_key[,branch]",
|
||||
report_callchain_help, &report_parse_callchain_opt,
|
||||
callchain_default_opt),
|
||||
OPT_BOOLEAN(0, "children", &symbol_conf.cumulate_callchain,
|
||||
"Accumulate callchains of children and show total overhead as well"),
|
||||
OPT_INTEGER(0, "max-stack", &report.max_stack,
|
||||
@ -808,6 +815,8 @@ int cmd_report(int argc, const char **argv, const char *prefix __maybe_unused)
|
||||
|
||||
if (report.inverted_callchain)
|
||||
callchain_param.order = ORDER_CALLER;
|
||||
if (symbol_conf.cumulate_callchain && !callchain_param.order_set)
|
||||
callchain_param.order = ORDER_CALLER;
|
||||
|
||||
if (itrace_synth_opts.callchain &&
|
||||
(int)itrace_synth_opts.callchain_sz > report.max_stack)
|
||||
|
@ -1053,8 +1053,22 @@ callchain_opt(const struct option *opt, const char *arg, int unset)
|
||||
static int
|
||||
parse_callchain_opt(const struct option *opt, const char *arg, int unset)
|
||||
{
|
||||
symbol_conf.use_callchain = true;
|
||||
return record_parse_callchain_opt(opt, arg, unset);
|
||||
struct record_opts *record = (struct record_opts *)opt->value;
|
||||
|
||||
record->callgraph_set = true;
|
||||
callchain_param.enabled = !unset;
|
||||
callchain_param.record_mode = CALLCHAIN_FP;
|
||||
|
||||
/*
|
||||
* --no-call-graph
|
||||
*/
|
||||
if (unset) {
|
||||
symbol_conf.use_callchain = false;
|
||||
callchain_param.record_mode = CALLCHAIN_NONE;
|
||||
return 0;
|
||||
}
|
||||
|
||||
return parse_callchain_top_opt(arg);
|
||||
}
|
||||
|
||||
static int perf_top_config(const char *var, const char *value, void *cb)
|
||||
@ -1079,6 +1093,9 @@ parse_percent_limit(const struct option *opt, const char *arg,
|
||||
return 0;
|
||||
}
|
||||
|
||||
const char top_callchain_help[] = CALLCHAIN_RECORD_HELP CALLCHAIN_REPORT_HELP
|
||||
"\n\t\t\t\tDefault: fp,graph,0.5,caller,function";
|
||||
|
||||
int cmd_top(int argc, const char **argv, const char *prefix __maybe_unused)
|
||||
{
|
||||
char errbuf[BUFSIZ];
|
||||
@ -1154,11 +1171,11 @@ int cmd_top(int argc, const char **argv, const char *prefix __maybe_unused)
|
||||
OPT_BOOLEAN('n', "show-nr-samples", &symbol_conf.show_nr_samples,
|
||||
"Show a column with the number of samples"),
|
||||
OPT_CALLBACK_NOOPT('g', NULL, &top.record_opts,
|
||||
NULL, "enables call-graph recording",
|
||||
NULL, "enables call-graph recording and display",
|
||||
&callchain_opt),
|
||||
OPT_CALLBACK(0, "call-graph", &top.record_opts,
|
||||
"mode[,dump_size]", record_callchain_help,
|
||||
&parse_callchain_opt),
|
||||
"record_mode[,record_size],print_type,threshold[,print_limit],order,sort_key[,branch]",
|
||||
top_callchain_help, &parse_callchain_opt),
|
||||
OPT_BOOLEAN(0, "children", &symbol_conf.cumulate_callchain,
|
||||
"Accumulate callchains of children and show total overhead as well"),
|
||||
OPT_INTEGER(0, "max-stack", &top.max_stack,
|
||||
@ -1288,6 +1305,9 @@ int cmd_top(int argc, const char **argv, const char *prefix __maybe_unused)
|
||||
perf_hpp__cancel_cumulate();
|
||||
}
|
||||
|
||||
if (symbol_conf.cumulate_callchain && !callchain_param.order_set)
|
||||
callchain_param.order = ORDER_CALLER;
|
||||
|
||||
symbol_conf.priv_size = sizeof(struct annotation);
|
||||
|
||||
symbol_conf.try_vmlinux_path = (symbol_conf.vmlinux_name == NULL);
|
||||
|
@ -1125,8 +1125,8 @@ static struct annotate_config {
|
||||
ANNOTATE_CFG(jump_arrows),
|
||||
ANNOTATE_CFG(show_linenr),
|
||||
ANNOTATE_CFG(show_nr_jumps),
|
||||
ANNOTATE_CFG(use_offset),
|
||||
ANNOTATE_CFG(show_total_period),
|
||||
ANNOTATE_CFG(use_offset),
|
||||
};
|
||||
|
||||
#undef ANNOTATE_CFG
|
||||
@ -1152,9 +1152,9 @@ static int annotate__config(const char *var, const char *value,
|
||||
sizeof(struct annotate_config), annotate_config__cmp);
|
||||
|
||||
if (cfg == NULL)
|
||||
return -1;
|
||||
|
||||
*cfg->value = perf_config_bool(name, value);
|
||||
ui__warning("%s variable unknown, ignoring...", var);
|
||||
else
|
||||
*cfg->value = perf_config_bool(name, value);
|
||||
return 0;
|
||||
}
|
||||
|
||||
|
@ -141,10 +141,6 @@ int ui__init(void)
|
||||
|
||||
SLkp_define_keysym((char *)"^(kB)", SL_KEY_UNTAB);
|
||||
|
||||
ui_helpline__init();
|
||||
ui_browser__init();
|
||||
tui_progress__init();
|
||||
|
||||
signal(SIGSEGV, ui__signal_backtrace);
|
||||
signal(SIGFPE, ui__signal_backtrace);
|
||||
signal(SIGINT, ui__signal);
|
||||
@ -153,6 +149,10 @@ int ui__init(void)
|
||||
|
||||
perf_error__register(&perf_tui_eops);
|
||||
|
||||
ui_helpline__init();
|
||||
ui_browser__init();
|
||||
tui_progress__init();
|
||||
|
||||
hist_browser__init_hpp();
|
||||
out:
|
||||
return err;
|
||||
|
@ -51,10 +51,12 @@ static int parse_callchain_order(const char *value)
|
||||
{
|
||||
if (!strncmp(value, "caller", strlen(value))) {
|
||||
callchain_param.order = ORDER_CALLER;
|
||||
callchain_param.order_set = true;
|
||||
return 0;
|
||||
}
|
||||
if (!strncmp(value, "callee", strlen(value))) {
|
||||
callchain_param.order = ORDER_CALLEE;
|
||||
callchain_param.order_set = true;
|
||||
return 0;
|
||||
}
|
||||
return -1;
|
||||
@ -77,12 +79,14 @@ static int parse_callchain_sort_key(const char *value)
|
||||
return -1;
|
||||
}
|
||||
|
||||
int
|
||||
parse_callchain_report_opt(const char *arg)
|
||||
static int
|
||||
__parse_callchain_report_opt(const char *arg, bool allow_record_opt)
|
||||
{
|
||||
char *tok;
|
||||
char *endptr;
|
||||
bool minpcnt_set = false;
|
||||
bool record_opt_set = false;
|
||||
bool try_stack_size = false;
|
||||
|
||||
symbol_conf.use_callchain = true;
|
||||
|
||||
@ -100,6 +104,28 @@ parse_callchain_report_opt(const char *arg)
|
||||
!parse_callchain_order(tok) ||
|
||||
!parse_callchain_sort_key(tok)) {
|
||||
/* parsing ok - move on to the next */
|
||||
try_stack_size = false;
|
||||
goto next;
|
||||
} else if (allow_record_opt && !record_opt_set) {
|
||||
if (parse_callchain_record(tok, &callchain_param))
|
||||
goto try_numbers;
|
||||
|
||||
/* assume that number followed by 'dwarf' is stack size */
|
||||
if (callchain_param.record_mode == CALLCHAIN_DWARF)
|
||||
try_stack_size = true;
|
||||
|
||||
record_opt_set = true;
|
||||
goto next;
|
||||
}
|
||||
|
||||
try_numbers:
|
||||
if (try_stack_size) {
|
||||
unsigned long size = 0;
|
||||
|
||||
if (get_stack_size(tok, &size) < 0)
|
||||
return -1;
|
||||
callchain_param.dump_size = size;
|
||||
try_stack_size = false;
|
||||
} else if (!minpcnt_set) {
|
||||
/* try to get the min percent */
|
||||
callchain_param.min_percent = strtod(tok, &endptr);
|
||||
@ -112,7 +138,7 @@ parse_callchain_report_opt(const char *arg)
|
||||
if (tok == endptr)
|
||||
return -1;
|
||||
}
|
||||
|
||||
next:
|
||||
arg = NULL;
|
||||
}
|
||||
|
||||
@ -123,6 +149,16 @@ parse_callchain_report_opt(const char *arg)
|
||||
return 0;
|
||||
}
|
||||
|
||||
int parse_callchain_report_opt(const char *arg)
|
||||
{
|
||||
return __parse_callchain_report_opt(arg, false);
|
||||
}
|
||||
|
||||
int parse_callchain_top_opt(const char *arg)
|
||||
{
|
||||
return __parse_callchain_report_opt(arg, true);
|
||||
}
|
||||
|
||||
int perf_callchain_config(const char *var, const char *value)
|
||||
{
|
||||
char *endptr;
|
||||
|
@ -7,6 +7,30 @@
|
||||
#include "event.h"
|
||||
#include "symbol.h"
|
||||
|
||||
#define HELP_PAD "\t\t\t\t"
|
||||
|
||||
#define CALLCHAIN_HELP "setup and enables call-graph (stack chain/backtrace):\n\n"
|
||||
|
||||
#ifdef HAVE_DWARF_UNWIND_SUPPORT
|
||||
# define RECORD_MODE_HELP HELP_PAD "record_mode:\tcall graph recording mode (fp|dwarf|lbr)\n"
|
||||
#else
|
||||
# define RECORD_MODE_HELP HELP_PAD "record_mode:\tcall graph recording mode (fp|lbr)\n"
|
||||
#endif
|
||||
|
||||
#define RECORD_SIZE_HELP \
|
||||
HELP_PAD "record_size:\tif record_mode is 'dwarf', max size of stack recording (<bytes>)\n" \
|
||||
HELP_PAD "\t\tdefault: 8192 (bytes)\n"
|
||||
|
||||
#define CALLCHAIN_RECORD_HELP CALLCHAIN_HELP RECORD_MODE_HELP RECORD_SIZE_HELP
|
||||
|
||||
#define CALLCHAIN_REPORT_HELP \
|
||||
HELP_PAD "print_type:\tcall graph printing style (graph|flat|fractal|none)\n" \
|
||||
HELP_PAD "threshold:\tminimum call graph inclusion threshold (<percent>)\n" \
|
||||
HELP_PAD "print_limit:\tmaximum number of call graph entry (<number>)\n" \
|
||||
HELP_PAD "order:\t\tcall graph order (caller|callee)\n" \
|
||||
HELP_PAD "sort_key:\tcall graph sort key (function|address)\n" \
|
||||
HELP_PAD "branch:\t\tinclude last branch info to call graph (branch)\n"
|
||||
|
||||
enum perf_call_graph_mode {
|
||||
CALLCHAIN_NONE,
|
||||
CALLCHAIN_FP,
|
||||
@ -63,6 +87,7 @@ struct callchain_param {
|
||||
double min_percent;
|
||||
sort_chain_func_t sort;
|
||||
enum chain_order order;
|
||||
bool order_set;
|
||||
enum chain_key key;
|
||||
bool branch_callstack;
|
||||
};
|
||||
@ -180,6 +205,7 @@ extern const char record_callchain_help[];
|
||||
extern int parse_callchain_record(const char *arg, struct callchain_param *param);
|
||||
int parse_callchain_record_opt(const char *arg, struct callchain_param *param);
|
||||
int parse_callchain_report_opt(const char *arg);
|
||||
int parse_callchain_top_opt(const char *arg);
|
||||
int perf_callchain_config(const char *var, const char *value);
|
||||
|
||||
static inline void callchain_cursor_snapshot(struct callchain_cursor *dest,
|
||||
|
@ -19,7 +19,7 @@
|
||||
struct callchain_param callchain_param = {
|
||||
.mode = CHAIN_GRAPH_ABS,
|
||||
.min_percent = 0.5,
|
||||
.order = ORDER_CALLER,
|
||||
.order = ORDER_CALLEE,
|
||||
.key = CCKEY_FUNCTION
|
||||
};
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user