mirror of
https://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
synced 2026-01-12 01:20:14 +00:00
Save samples with deferred callchains in a separate list and deliver
them after merging the user callchains. If users don't want to merge
they can set tool->merge_deferred_callchains to false to prevent the
behavior.
With previous result, now perf script will show the merged callchains.
$ perf script
...
pwd 2312 121.163435: 249113 cpu/cycles/P:
ffffffff845b78d8 __build_id_parse.isra.0+0x218 ([kernel.kallsyms])
ffffffff83bb5bf6 perf_event_mmap+0x2e6 ([kernel.kallsyms])
ffffffff83c31959 mprotect_fixup+0x1e9 ([kernel.kallsyms])
ffffffff83c31dc5 do_mprotect_pkey+0x2b5 ([kernel.kallsyms])
ffffffff83c3206f __x64_sys_mprotect+0x1f ([kernel.kallsyms])
ffffffff845e6692 do_syscall_64+0x62 ([kernel.kallsyms])
ffffffff8360012f entry_SYSCALL_64_after_hwframe+0x76 ([kernel.kallsyms])
7f18fe337fa7 mprotect+0x7 (/lib/x86_64-linux-gnu/ld-linux-x86-64.so.2)
7f18fe330e0f _dl_sysdep_start+0x7f (/lib/x86_64-linux-gnu/ld-linux-x86-64.so.2)
7f18fe331448 _dl_start_user+0x0 (/lib/x86_64-linux-gnu/ld-linux-x86-64.so.2)
...
The old output can be get using --no-merge-callchain option.
Also perf report can get the user callchain entry at the end.
$ perf report --no-children --stdio -q -S __build_id_parse.isra.0
# symbol: __build_id_parse.isra.0
8.40% pwd [kernel.kallsyms]
|
---__build_id_parse.isra.0
perf_event_mmap
mprotect_fixup
do_mprotect_pkey
__x64_sys_mprotect
do_syscall_64
entry_SYSCALL_64_after_hwframe
mprotect
_dl_sysdep_start
_dl_start_user
Reviewed-by: Ian Rogers <irogers@google.com>
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
117 lines
2.8 KiB
C
117 lines
2.8 KiB
C
/* SPDX-License-Identifier: GPL-2.0 */
|
|
#ifndef __PERF_TOOL_H
|
|
#define __PERF_TOOL_H
|
|
|
|
#include <stdbool.h>
|
|
|
|
#include <linux/types.h>
|
|
|
|
struct perf_session;
|
|
union perf_event;
|
|
struct evlist;
|
|
struct evsel;
|
|
struct perf_sample;
|
|
struct perf_tool;
|
|
struct machine;
|
|
struct ordered_events;
|
|
|
|
typedef int (*event_sample)(const struct perf_tool *tool, union perf_event *event,
|
|
struct perf_sample *sample,
|
|
struct evsel *evsel, struct machine *machine);
|
|
|
|
typedef int (*event_op)(const struct perf_tool *tool, union perf_event *event,
|
|
struct perf_sample *sample, struct machine *machine);
|
|
|
|
typedef int (*event_attr_op)(const struct perf_tool *tool,
|
|
union perf_event *event,
|
|
struct evlist **pevlist);
|
|
|
|
typedef int (*event_op2)(const struct perf_tool *tool, struct perf_session *session,
|
|
union perf_event *event);
|
|
typedef s64 (*event_op3)(const struct perf_tool *tool, struct perf_session *session,
|
|
union perf_event *event);
|
|
typedef int (*event_op4)(const struct perf_tool *tool, struct perf_session *session,
|
|
union perf_event *event, u64 data, const char *str);
|
|
|
|
typedef int (*event_oe)(const struct perf_tool *tool, union perf_event *event,
|
|
struct ordered_events *oe);
|
|
|
|
enum show_feature_header {
|
|
SHOW_FEAT_NO_HEADER = 0,
|
|
SHOW_FEAT_HEADER,
|
|
SHOW_FEAT_HEADER_FULL_INFO,
|
|
};
|
|
|
|
struct perf_tool {
|
|
event_sample sample,
|
|
read,
|
|
callchain_deferred;
|
|
event_op mmap,
|
|
mmap2,
|
|
comm,
|
|
namespaces,
|
|
cgroup,
|
|
fork,
|
|
exit,
|
|
lost,
|
|
lost_samples,
|
|
aux,
|
|
itrace_start,
|
|
aux_output_hw_id,
|
|
context_switch,
|
|
throttle,
|
|
unthrottle,
|
|
ksymbol,
|
|
bpf,
|
|
text_poke;
|
|
|
|
event_attr_op attr;
|
|
event_attr_op event_update;
|
|
event_op2 tracing_data;
|
|
event_oe finished_round;
|
|
event_op2 build_id,
|
|
id_index,
|
|
auxtrace_info,
|
|
auxtrace_error,
|
|
time_conv,
|
|
thread_map,
|
|
cpu_map,
|
|
stat_config,
|
|
stat,
|
|
stat_round,
|
|
feature,
|
|
finished_init,
|
|
bpf_metadata;
|
|
event_op4 compressed;
|
|
event_op3 auxtrace;
|
|
bool ordered_events;
|
|
bool ordering_requires_timestamps;
|
|
bool namespace_events;
|
|
bool cgroup_events;
|
|
bool no_warn;
|
|
bool dont_split_sample_group;
|
|
bool merge_deferred_callchains;
|
|
enum show_feature_header show_feat_hdr;
|
|
};
|
|
|
|
void perf_tool__init(struct perf_tool *tool, bool ordered_events);
|
|
|
|
bool perf_tool__compressed_is_stub(const struct perf_tool *tool);
|
|
|
|
int process_event_sample_stub(const struct perf_tool *tool,
|
|
union perf_event *event,
|
|
struct perf_sample *sample,
|
|
struct evsel *evsel,
|
|
struct machine *machine);
|
|
|
|
struct delegate_tool {
|
|
/** @tool: The actual tool that calls the delegate. */
|
|
struct perf_tool tool;
|
|
/** @delegate: The tool that is delegated to. */
|
|
struct perf_tool *delegate;
|
|
};
|
|
|
|
void delegate_tool__init(struct delegate_tool *tool, struct perf_tool *delegate);
|
|
|
|
#endif /* __PERF_TOOL_H */
|