aboutsummaryrefslogtreecommitdiffstats
path: root/include
diff options
context:
space:
mode:
author: Adrian Hunter <adrian.hunter@intel.com> 2014-05-28 04:45:04 -0400
committer: Ingo Molnar <mingo@kernel.org> 2014-06-06 01:56:22 -0400
commit: 82b897782d10fcc4930c9d4a15b175348fdd2871 (patch)
tree: 82bc0bb22ef1379b901d4fce582584b6776a91ea /include
parent: ec00010972a0971b2c1da4fbe4e5c7d8ed1ecb05 (diff)
perf: Differentiate exec() and non-exec() comm events
perf tools like 'perf report' can aggregate samples by comm strings, which generally works. However, there are other potential use-cases. For example, to pair up 'calls' with 'returns' accurately (from branch events like Intel BTS) it is necessary to identify whether the process has exec'd. Although a comm event is generated when an 'exec' happens, it is also generated whenever the comm string is changed on a whim (e.g. by prctl PR_SET_NAME). This patch adds a flag to the comm event to differentiate one case from the other.

In order to determine whether the kernel supports the new flag, a selection bit named 'comm_exec' is added to struct perf_event_attr. The bit does nothing but will cause perf_event_open() to fail if the bit is set on kernels that do not have it defined.

Signed-off-by: Adrian Hunter <adrian.hunter@intel.com>
Signed-off-by: Peter Zijlstra <peterz@infradead.org>
Link: http://lkml.kernel.org/r/537D9EBE.7030806@intel.com
Cc: Paul Mackerras <paulus@samba.org>
Cc: Dave Jones <davej@redhat.com>
Cc: Arnaldo Carvalho de Melo <acme@kernel.org>
Cc: David Ahern <dsahern@gmail.com>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Alexander Viro <viro@zeniv.linux.org.uk>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: linux-fsdevel@vger.kernel.org
Cc: linux-kernel@vger.kernel.org
Signed-off-by: Ingo Molnar <mingo@kernel.org>
Diffstat (limited to 'include')
-rw-r--r-- include/linux/perf_event.h | 4
-rw-r--r-- include/linux/sched.h | 6
-rw-r--r-- include/uapi/linux/perf_event.h | 9
3 files changed, 14 insertions, 5 deletions
diff --git a/include/linux/perf_event.h b/include/linux/perf_event.h
index b4c1d4685bf0..707617a8c0f6 100644
--- a/include/linux/perf_event.h
+++ b/include/linux/perf_event.h
@@ -707,7 +707,7 @@ extern int perf_register_guest_info_callbacks(struct perf_guest_info_callbacks *
707extern int perf_unregister_guest_info_callbacks(struct perf_guest_info_callbacks *callbacks); 707extern int perf_unregister_guest_info_callbacks(struct perf_guest_info_callbacks *callbacks);
708 708
709extern void perf_event_exec(void); 709extern void perf_event_exec(void);
710extern void perf_event_comm(struct task_struct *tsk); 710extern void perf_event_comm(struct task_struct *tsk, bool exec);
711extern void perf_event_fork(struct task_struct *tsk); 711extern void perf_event_fork(struct task_struct *tsk);
712 712
713/* Callchains */ 713/* Callchains */
@@ -815,7 +815,7 @@ static inline int perf_unregister_guest_info_callbacks
815 815
816static inline void perf_event_mmap(struct vm_area_struct *vma) { } 816static inline void perf_event_mmap(struct vm_area_struct *vma) { }
817static inline void perf_event_exec(void) { } 817static inline void perf_event_exec(void) { }
818static inline void perf_event_comm(struct task_struct *tsk) { } 818static inline void perf_event_comm(struct task_struct *tsk, bool exec) { }
819static inline void perf_event_fork(struct task_struct *tsk) { } 819static inline void perf_event_fork(struct task_struct *tsk) { }
820static inline void perf_event_init(void) { } 820static inline void perf_event_init(void) { }
821static inline int perf_swevent_get_recursion_context(void) { return -1; } 821static inline int perf_swevent_get_recursion_context(void) { return -1; }
diff --git a/include/linux/sched.h b/include/linux/sched.h
index 221b2bde3723..ad86e1d7dbc2 100644
--- a/include/linux/sched.h
+++ b/include/linux/sched.h
@@ -2379,7 +2379,11 @@ extern long do_fork(unsigned long, unsigned long, unsigned long, int __user *, i
2379struct task_struct *fork_idle(int); 2379struct task_struct *fork_idle(int);
2380extern pid_t kernel_thread(int (*fn)(void *), void *arg, unsigned long flags); 2380extern pid_t kernel_thread(int (*fn)(void *), void *arg, unsigned long flags);
2381 2381
2382extern void set_task_comm(struct task_struct *tsk, const char *from); 2382extern void __set_task_comm(struct task_struct *tsk, const char *from, bool exec);
2383static inline void set_task_comm(struct task_struct *tsk, const char *from)
2384{
2385 __set_task_comm(tsk, from, false);
2386}
2383extern char *get_task_comm(char *to, struct task_struct *tsk); 2387extern char *get_task_comm(char *to, struct task_struct *tsk);
2384 2388
2385#ifdef CONFIG_SMP 2389#ifdef CONFIG_SMP
diff --git a/include/uapi/linux/perf_event.h b/include/uapi/linux/perf_event.h
index d9cd853818ad..5312fae47218 100644
--- a/include/uapi/linux/perf_event.h
+++ b/include/uapi/linux/perf_event.h
@@ -302,8 +302,8 @@ struct perf_event_attr {
302 exclude_callchain_kernel : 1, /* exclude kernel callchains */ 302 exclude_callchain_kernel : 1, /* exclude kernel callchains */
303 exclude_callchain_user : 1, /* exclude user callchains */ 303 exclude_callchain_user : 1, /* exclude user callchains */
304 mmap2 : 1, /* include mmap with inode data */ 304 mmap2 : 1, /* include mmap with inode data */
305 305 comm_exec : 1, /* flag comm events that are due to an exec */
306 __reserved_1 : 40; 306 __reserved_1 : 39;
307 307
308 union { 308 union {
309 __u32 wakeup_events; /* wakeup every n events */ 309 __u32 wakeup_events; /* wakeup every n events */
@@ -502,7 +502,12 @@ struct perf_event_mmap_page {
502#define PERF_RECORD_MISC_GUEST_KERNEL (4 << 0) 502#define PERF_RECORD_MISC_GUEST_KERNEL (4 << 0)
503#define PERF_RECORD_MISC_GUEST_USER (5 << 0) 503#define PERF_RECORD_MISC_GUEST_USER (5 << 0)
504 504
505/*
506 * PERF_RECORD_MISC_MMAP_DATA and PERF_RECORD_MISC_COMM_EXEC are used on
507 * different events so can reuse the same bit position.
508 */
505#define PERF_RECORD_MISC_MMAP_DATA (1 << 13) 509#define PERF_RECORD_MISC_MMAP_DATA (1 << 13)
510#define PERF_RECORD_MISC_COMM_EXEC (1 << 13)
506/* 511/*
507 * Indicates that the content of PERF_SAMPLE_IP points to 512 * Indicates that the content of PERF_SAMPLE_IP points to
508 * the actual instruction that triggered the event. See also 513 * the actual instruction that triggered the event. See also