diff options
| author | Arnaldo Carvalho de Melo <acme@redhat.com> | 2016-05-12 12:06:21 -0400 |
|---|---|---|
| committer | Arnaldo Carvalho de Melo <acme@redhat.com> | 2016-05-16 22:11:53 -0400 |
| commit | c85b03349640b34f3545503c8429fc43005e9a92 (patch) | |
| tree | 4f226f1fa1c7b0399fba6986100418427e30870e /kernel | |
| parent | 3e4de4ec4cfea40994b47a79767610153edbf45b (diff) | |
perf core: Separate accounting of contexts and real addresses in a stack trace
The perf_sample->ip_callchain->nr value includes all the entries in the
ip_callchain->ip[] array, real addresses and PERF_CONTEXT_{KERNEL,USER,etc},
while what the user expects is that what is in the kernel.perf_event_max_stack
sysctl or in the upcoming per event perf_event_attr.sample_max_stack knob be
honoured in terms of IP addresses in the stack trace.
So allocate a bunch of extra entries for contexts, and do the accounting
via perf_callchain_entry_ctx struct members.
A new sysctl, kernel.perf_event_max_contexts_per_stack is also
introduced for investigating possible bugs in the callchain
implementation by some arch.
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Alexei Starovoitov <ast@kernel.org>
Cc: Brendan Gregg <brendan.d.gregg@gmail.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
Cc: He Kuang <hekuang@huawei.com>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Masami Hiramatsu <mhiramat@kernel.org>
Cc: Milian Wolff <milian.wolff@kdab.com>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Stephane Eranian <eranian@google.com>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Vince Weaver <vincent.weaver@maine.edu>
Cc: Wang Nan <wangnan0@huawei.com>
Cc: Zefan Li <lizefan@huawei.com>
Link: http://lkml.kernel.org/n/tip-3b4wnqk340c4sg4gwkfdi9yk@git.kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Diffstat (limited to 'kernel')
| -rw-r--r-- | kernel/events/callchain.c | 10 | ||||
| -rw-r--r-- | kernel/sysctl.c | 9 |
2 files changed, 18 insertions, 1 deletions
diff --git a/kernel/events/callchain.c b/kernel/events/callchain.c index ca645736a983..179ef4640964 100644 --- a/kernel/events/callchain.c +++ b/kernel/events/callchain.c | |||
| @@ -19,11 +19,13 @@ struct callchain_cpus_entries { | |||
| 19 | }; | 19 | }; |
| 20 | 20 | ||
| 21 | int sysctl_perf_event_max_stack __read_mostly = PERF_MAX_STACK_DEPTH; | 21 | int sysctl_perf_event_max_stack __read_mostly = PERF_MAX_STACK_DEPTH; |
| 22 | int sysctl_perf_event_max_contexts_per_stack __read_mostly = PERF_MAX_CONTEXTS_PER_STACK; | ||
| 22 | 23 | ||
| 23 | static inline size_t perf_callchain_entry__sizeof(void) | 24 | static inline size_t perf_callchain_entry__sizeof(void) |
| 24 | { | 25 | { |
| 25 | return (sizeof(struct perf_callchain_entry) + | 26 | return (sizeof(struct perf_callchain_entry) + |
| 26 | sizeof(__u64) * sysctl_perf_event_max_stack); | 27 | sizeof(__u64) * (sysctl_perf_event_max_stack + |
| 28 | sysctl_perf_event_max_contexts_per_stack)); | ||
| 27 | } | 29 | } |
| 28 | 30 | ||
| 29 | static DEFINE_PER_CPU(int, callchain_recursion[PERF_NR_CONTEXTS]); | 31 | static DEFINE_PER_CPU(int, callchain_recursion[PERF_NR_CONTEXTS]); |
| @@ -197,6 +199,8 @@ get_perf_callchain(struct pt_regs *regs, u32 init_nr, bool kernel, bool user, | |||
| 197 | ctx.entry = entry; | 199 | ctx.entry = entry; |
| 198 | ctx.max_stack = max_stack; | 200 | ctx.max_stack = max_stack; |
| 199 | ctx.nr = entry->nr = init_nr; | 201 | ctx.nr = entry->nr = init_nr; |
| 202 | ctx.contexts = 0; | ||
| 203 | ctx.contexts_maxed = false; | ||
| 200 | 204 | ||
| 201 | if (kernel && !user_mode(regs)) { | 205 | if (kernel && !user_mode(regs)) { |
| 202 | if (add_mark) | 206 | if (add_mark) |
| @@ -228,6 +232,10 @@ exit_put: | |||
| 228 | return entry; | 232 | return entry; |
| 229 | } | 233 | } |
| 230 | 234 | ||
| 235 | /* | ||
| 236 | * Used for sysctl_perf_event_max_stack and | ||
| 237 | * sysctl_perf_event_max_contexts_per_stack. | ||
| 238 | */ | ||
| 231 | int perf_event_max_stack_handler(struct ctl_table *table, int write, | 239 | int perf_event_max_stack_handler(struct ctl_table *table, int write, |
| 232 | void __user *buffer, size_t *lenp, loff_t *ppos) | 240 | void __user *buffer, size_t *lenp, loff_t *ppos) |
| 233 | { | 241 | { |
diff --git a/kernel/sysctl.c b/kernel/sysctl.c index 0ec6907a16b3..bec4c11c47d6 100644 --- a/kernel/sysctl.c +++ b/kernel/sysctl.c | |||
| @@ -1156,6 +1156,15 @@ static struct ctl_table kern_table[] = { | |||
| 1156 | .extra1 = &zero, | 1156 | .extra1 = &zero, |
| 1157 | .extra2 = &six_hundred_forty_kb, | 1157 | .extra2 = &six_hundred_forty_kb, |
| 1158 | }, | 1158 | }, |
| 1159 | { | ||
| 1160 | .procname = "perf_event_max_contexts_per_stack", | ||
| 1161 | .data = &sysctl_perf_event_max_contexts_per_stack, | ||
| 1162 | .maxlen = sizeof(sysctl_perf_event_max_contexts_per_stack), | ||
| 1163 | .mode = 0644, | ||
| 1164 | .proc_handler = perf_event_max_stack_handler, | ||
| 1165 | .extra1 = &zero, | ||
| 1166 | .extra2 = &one_thousand, | ||
| 1167 | }, | ||
| 1159 | #endif | 1168 | #endif |
| 1160 | #ifdef CONFIG_KMEMCHECK | 1169 | #ifdef CONFIG_KMEMCHECK |
| 1161 | { | 1170 | { |
