diff options
207 files changed, 14649 insertions, 8110 deletions
diff --git a/Documentation/kprobes.txt b/Documentation/kprobes.txt index 2f9115c0ae62..61c291cddf18 100644 --- a/Documentation/kprobes.txt +++ b/Documentation/kprobes.txt | |||
@@ -165,8 +165,8 @@ the user entry_handler invocation is also skipped. | |||
165 | 165 | ||
166 | 1.4 How Does Jump Optimization Work? | 166 | 1.4 How Does Jump Optimization Work? |
167 | 167 | ||
168 | If you configured your kernel with CONFIG_OPTPROBES=y (currently | 168 | If your kernel is built with CONFIG_OPTPROBES=y (currently this flag |
169 | this option is supported on x86/x86-64, non-preemptive kernel) and | 169 | is automatically set 'y' on x86/x86-64, non-preemptive kernel) and |
170 | the "debug.kprobes_optimization" kernel parameter is set to 1 (see | 170 | the "debug.kprobes_optimization" kernel parameter is set to 1 (see |
171 | sysctl(8)), Kprobes tries to reduce probe-hit overhead by using a jump | 171 | sysctl(8)), Kprobes tries to reduce probe-hit overhead by using a jump |
172 | instruction instead of a breakpoint instruction at each probepoint. | 172 | instruction instead of a breakpoint instruction at each probepoint. |
@@ -271,8 +271,6 @@ tweak the kernel's execution path, you need to suppress optimization, | |||
271 | using one of the following techniques: | 271 | using one of the following techniques: |
272 | - Specify an empty function for the kprobe's post_handler or break_handler. | 272 | - Specify an empty function for the kprobe's post_handler or break_handler. |
273 | or | 273 | or |
274 | - Config CONFIG_OPTPROBES=n. | ||
275 | or | ||
276 | - Execute 'sysctl -w debug.kprobes_optimization=n' | 274 | - Execute 'sysctl -w debug.kprobes_optimization=n' |
277 | 275 | ||
278 | 2. Architectures Supported | 276 | 2. Architectures Supported |
@@ -307,10 +305,6 @@ it useful to "Compile the kernel with debug info" (CONFIG_DEBUG_INFO), | |||
307 | so you can use "objdump -d -l vmlinux" to see the source-to-object | 305 | so you can use "objdump -d -l vmlinux" to see the source-to-object |
308 | code mapping. | 306 | code mapping. |
309 | 307 | ||
310 | If you want to reduce probing overhead, set "Kprobes jump optimization | ||
311 | support" (CONFIG_OPTPROBES) to "y". You can find this option under the | ||
312 | "Kprobes" line. | ||
313 | |||
314 | 4. API Reference | 308 | 4. API Reference |
315 | 309 | ||
316 | The Kprobes API includes a "register" function and an "unregister" | 310 | The Kprobes API includes a "register" function and an "unregister" |
diff --git a/Documentation/trace/kprobetrace.txt b/Documentation/trace/kprobetrace.txt index a9100b28eb84..ec94748ae65b 100644 --- a/Documentation/trace/kprobetrace.txt +++ b/Documentation/trace/kprobetrace.txt | |||
@@ -40,7 +40,9 @@ Synopsis of kprobe_events | |||
40 | $stack : Fetch stack address. | 40 | $stack : Fetch stack address. |
41 | $retval : Fetch return value.(*) | 41 | $retval : Fetch return value.(*) |
42 | +|-offs(FETCHARG) : Fetch memory at FETCHARG +|- offs address.(**) | 42 | +|-offs(FETCHARG) : Fetch memory at FETCHARG +|- offs address.(**) |
43 | NAME=FETCHARG: Set NAME as the argument name of FETCHARG. | 43 | NAME=FETCHARG : Set NAME as the argument name of FETCHARG. |
44 | FETCHARG:TYPE : Set TYPE as the type of FETCHARG. Currently, basic types | ||
45 | (u8/u16/u32/u64/s8/s16/s32/s64) are supported. | ||
44 | 46 | ||
45 | (*) only for return probe. | 47 | (*) only for return probe. |
46 | (**) this is useful for fetching a field of data structures. | 48 | (**) this is useful for fetching a field of data structures. |
diff --git a/MAINTAINERS b/MAINTAINERS index 033161805587..28332e1b0863 100644 --- a/MAINTAINERS +++ b/MAINTAINERS | |||
@@ -4354,13 +4354,13 @@ M: Paul Mackerras <paulus@samba.org> | |||
4354 | M: Ingo Molnar <mingo@elte.hu> | 4354 | M: Ingo Molnar <mingo@elte.hu> |
4355 | M: Arnaldo Carvalho de Melo <acme@redhat.com> | 4355 | M: Arnaldo Carvalho de Melo <acme@redhat.com> |
4356 | S: Supported | 4356 | S: Supported |
4357 | F: kernel/perf_event.c | 4357 | F: kernel/perf_event*.c |
4358 | F: include/linux/perf_event.h | 4358 | F: include/linux/perf_event.h |
4359 | F: arch/*/kernel/perf_event.c | 4359 | F: arch/*/kernel/perf_event*.c |
4360 | F: arch/*/kernel/*/perf_event.c | 4360 | F: arch/*/kernel/*/perf_event*.c |
4361 | F: arch/*/kernel/*/*/perf_event.c | 4361 | F: arch/*/kernel/*/*/perf_event*.c |
4362 | F: arch/*/include/asm/perf_event.h | 4362 | F: arch/*/include/asm/perf_event.h |
4363 | F: arch/*/lib/perf_event.c | 4363 | F: arch/*/lib/perf_event*.c |
4364 | F: arch/*/kernel/perf_callchain.c | 4364 | F: arch/*/kernel/perf_callchain.c |
4365 | F: tools/perf/ | 4365 | F: tools/perf/ |
4366 | 4366 | ||
diff --git a/arch/Kconfig b/arch/Kconfig index e5eb1337a537..acda512da2e2 100644 --- a/arch/Kconfig +++ b/arch/Kconfig | |||
@@ -42,15 +42,10 @@ config KPROBES | |||
42 | If in doubt, say "N". | 42 | If in doubt, say "N". |
43 | 43 | ||
44 | config OPTPROBES | 44 | config OPTPROBES |
45 | bool "Kprobes jump optimization support (EXPERIMENTAL)" | 45 | def_bool y |
46 | default y | 46 | depends on KPROBES && HAVE_OPTPROBES |
47 | depends on KPROBES | ||
48 | depends on !PREEMPT | 47 | depends on !PREEMPT |
49 | depends on HAVE_OPTPROBES | ||
50 | select KALLSYMS_ALL | 48 | select KALLSYMS_ALL |
51 | help | ||
52 | This option will allow kprobes to optimize breakpoint to | ||
53 | a jump for reducing its overhead. | ||
54 | 49 | ||
55 | config HAVE_EFFICIENT_UNALIGNED_ACCESS | 50 | config HAVE_EFFICIENT_UNALIGNED_ACCESS |
56 | bool | 51 | bool |
@@ -142,6 +137,17 @@ config HAVE_HW_BREAKPOINT | |||
142 | bool | 137 | bool |
143 | depends on PERF_EVENTS | 138 | depends on PERF_EVENTS |
144 | 139 | ||
140 | config HAVE_MIXED_BREAKPOINTS_REGS | ||
141 | bool | ||
142 | depends on HAVE_HW_BREAKPOINT | ||
143 | help | ||
144 | Depending on the arch implementation of hardware breakpoints, | ||
145 | some of them have separate registers for data and instruction | ||
146 | breakpoints addresses, others have mixed registers to store | ||
147 | them but define the access type in a control register. | ||
148 | Select this option if your arch implements breakpoints under the | ||
149 | latter fashion. | ||
150 | |||
145 | config HAVE_USER_RETURN_NOTIFIER | 151 | config HAVE_USER_RETURN_NOTIFIER |
146 | bool | 152 | bool |
147 | 153 | ||
diff --git a/arch/powerpc/kernel/perf_event.c b/arch/powerpc/kernel/perf_event.c index 08460a2e9f41..43b83c35cf54 100644 --- a/arch/powerpc/kernel/perf_event.c +++ b/arch/powerpc/kernel/perf_event.c | |||
@@ -35,6 +35,9 @@ struct cpu_hw_events { | |||
35 | u64 alternatives[MAX_HWEVENTS][MAX_EVENT_ALTERNATIVES]; | 35 | u64 alternatives[MAX_HWEVENTS][MAX_EVENT_ALTERNATIVES]; |
36 | unsigned long amasks[MAX_HWEVENTS][MAX_EVENT_ALTERNATIVES]; | 36 | unsigned long amasks[MAX_HWEVENTS][MAX_EVENT_ALTERNATIVES]; |
37 | unsigned long avalues[MAX_HWEVENTS][MAX_EVENT_ALTERNATIVES]; | 37 | unsigned long avalues[MAX_HWEVENTS][MAX_EVENT_ALTERNATIVES]; |
38 | |||
39 | unsigned int group_flag; | ||
40 | int n_txn_start; | ||
38 | }; | 41 | }; |
39 | DEFINE_PER_CPU(struct cpu_hw_events, cpu_hw_events); | 42 | DEFINE_PER_CPU(struct cpu_hw_events, cpu_hw_events); |
40 | 43 | ||
@@ -718,66 +721,6 @@ static int collect_events(struct perf_event *group, int max_count, | |||
718 | return n; | 721 | return n; |
719 | } | 722 | } |
720 | 723 | ||
721 | static void event_sched_in(struct perf_event *event) | ||
722 | { | ||
723 | event->state = PERF_EVENT_STATE_ACTIVE; | ||
724 | event->oncpu = smp_processor_id(); | ||
725 | event->tstamp_running += event->ctx->time - event->tstamp_stopped; | ||
726 | if (is_software_event(event)) | ||
727 | event->pmu->enable(event); | ||
728 | } | ||
729 | |||
730 | /* | ||
731 | * Called to enable a whole group of events. | ||
732 | * Returns 1 if the group was enabled, or -EAGAIN if it could not be. | ||
733 | * Assumes the caller has disabled interrupts and has | ||
734 | * frozen the PMU with hw_perf_save_disable. | ||
735 | */ | ||
736 | int hw_perf_group_sched_in(struct perf_event *group_leader, | ||
737 | struct perf_cpu_context *cpuctx, | ||
738 | struct perf_event_context *ctx) | ||
739 | { | ||
740 | struct cpu_hw_events *cpuhw; | ||
741 | long i, n, n0; | ||
742 | struct perf_event *sub; | ||
743 | |||
744 | if (!ppmu) | ||
745 | return 0; | ||
746 | cpuhw = &__get_cpu_var(cpu_hw_events); | ||
747 | n0 = cpuhw->n_events; | ||
748 | n = collect_events(group_leader, ppmu->n_counter - n0, | ||
749 | &cpuhw->event[n0], &cpuhw->events[n0], | ||
750 | &cpuhw->flags[n0]); | ||
751 | if (n < 0) | ||
752 | return -EAGAIN; | ||
753 | if (check_excludes(cpuhw->event, cpuhw->flags, n0, n)) | ||
754 | return -EAGAIN; | ||
755 | i = power_check_constraints(cpuhw, cpuhw->events, cpuhw->flags, n + n0); | ||
756 | if (i < 0) | ||
757 | return -EAGAIN; | ||
758 | cpuhw->n_events = n0 + n; | ||
759 | cpuhw->n_added += n; | ||
760 | |||
761 | /* | ||
762 | * OK, this group can go on; update event states etc., | ||
763 | * and enable any software events | ||
764 | */ | ||
765 | for (i = n0; i < n0 + n; ++i) | ||
766 | cpuhw->event[i]->hw.config = cpuhw->events[i]; | ||
767 | cpuctx->active_oncpu += n; | ||
768 | n = 1; | ||
769 | event_sched_in(group_leader); | ||
770 | list_for_each_entry(sub, &group_leader->sibling_list, group_entry) { | ||
771 | if (sub->state != PERF_EVENT_STATE_OFF) { | ||
772 | event_sched_in(sub); | ||
773 | ++n; | ||
774 | } | ||
775 | } | ||
776 | ctx->nr_active += n; | ||
777 | |||
778 | return 1; | ||
779 | } | ||
780 | |||
781 | /* | 724 | /* |
782 | * Add a event to the PMU. | 725 | * Add a event to the PMU. |
783 | * If all events are not already frozen, then we disable and | 726 | * If all events are not already frozen, then we disable and |
@@ -805,12 +748,22 @@ static int power_pmu_enable(struct perf_event *event) | |||
805 | cpuhw->event[n0] = event; | 748 | cpuhw->event[n0] = event; |
806 | cpuhw->events[n0] = event->hw.config; | 749 | cpuhw->events[n0] = event->hw.config; |
807 | cpuhw->flags[n0] = event->hw.event_base; | 750 | cpuhw->flags[n0] = event->hw.event_base; |
751 | |||
752 | /* | ||
753 | * If group events scheduling transaction was started, | ||
754 | * skip the schedulability test here, it will be peformed | ||
755 | * at commit time(->commit_txn) as a whole | ||
756 | */ | ||
757 | if (cpuhw->group_flag & PERF_EVENT_TXN_STARTED) | ||
758 | goto nocheck; | ||
759 | |||
808 | if (check_excludes(cpuhw->event, cpuhw->flags, n0, 1)) | 760 | if (check_excludes(cpuhw->event, cpuhw->flags, n0, 1)) |
809 | goto out; | 761 | goto out; |
810 | if (power_check_constraints(cpuhw, cpuhw->events, cpuhw->flags, n0 + 1)) | 762 | if (power_check_constraints(cpuhw, cpuhw->events, cpuhw->flags, n0 + 1)) |
811 | goto out; | 763 | goto out; |
812 | |||
813 | event->hw.config = cpuhw->events[n0]; | 764 | event->hw.config = cpuhw->events[n0]; |
765 | |||
766 | nocheck: | ||
814 | ++cpuhw->n_events; | 767 | ++cpuhw->n_events; |
815 | ++cpuhw->n_added; | 768 | ++cpuhw->n_added; |
816 | 769 | ||
@@ -896,11 +849,65 @@ static void power_pmu_unthrottle(struct perf_event *event) | |||
896 | local_irq_restore(flags); | 849 | local_irq_restore(flags); |
897 | } | 850 | } |
898 | 851 | ||
852 | /* | ||
853 | * Start group events scheduling transaction | ||
854 | * Set the flag to make pmu::enable() not perform the | ||
855 | * schedulability test, it will be performed at commit time | ||
856 | */ | ||
857 | void power_pmu_start_txn(const struct pmu *pmu) | ||
858 | { | ||
859 | struct cpu_hw_events *cpuhw = &__get_cpu_var(cpu_hw_events); | ||
860 | |||
861 | cpuhw->group_flag |= PERF_EVENT_TXN_STARTED; | ||
862 | cpuhw->n_txn_start = cpuhw->n_events; | ||
863 | } | ||
864 | |||
865 | /* | ||
866 | * Stop group events scheduling transaction | ||
867 | * Clear the flag and pmu::enable() will perform the | ||
868 | * schedulability test. | ||
869 | */ | ||
870 | void power_pmu_cancel_txn(const struct pmu *pmu) | ||
871 | { | ||
872 | struct cpu_hw_events *cpuhw = &__get_cpu_var(cpu_hw_events); | ||
873 | |||
874 | cpuhw->group_flag &= ~PERF_EVENT_TXN_STARTED; | ||
875 | } | ||
876 | |||
877 | /* | ||
878 | * Commit group events scheduling transaction | ||
879 | * Perform the group schedulability test as a whole | ||
880 | * Return 0 if success | ||
881 | */ | ||
882 | int power_pmu_commit_txn(const struct pmu *pmu) | ||
883 | { | ||
884 | struct cpu_hw_events *cpuhw; | ||
885 | long i, n; | ||
886 | |||
887 | if (!ppmu) | ||
888 | return -EAGAIN; | ||
889 | cpuhw = &__get_cpu_var(cpu_hw_events); | ||
890 | n = cpuhw->n_events; | ||
891 | if (check_excludes(cpuhw->event, cpuhw->flags, 0, n)) | ||
892 | return -EAGAIN; | ||
893 | i = power_check_constraints(cpuhw, cpuhw->events, cpuhw->flags, n); | ||
894 | if (i < 0) | ||
895 | return -EAGAIN; | ||
896 | |||
897 | for (i = cpuhw->n_txn_start; i < n; ++i) | ||
898 | cpuhw->event[i]->hw.config = cpuhw->events[i]; | ||
899 | |||
900 | return 0; | ||
901 | } | ||
902 | |||
899 | struct pmu power_pmu = { | 903 | struct pmu power_pmu = { |
900 | .enable = power_pmu_enable, | 904 | .enable = power_pmu_enable, |
901 | .disable = power_pmu_disable, | 905 | .disable = power_pmu_disable, |
902 | .read = power_pmu_read, | 906 | .read = power_pmu_read, |
903 | .unthrottle = power_pmu_unthrottle, | 907 | .unthrottle = power_pmu_unthrottle, |
908 | .start_txn = power_pmu_start_txn, | ||
909 | .cancel_txn = power_pmu_cancel_txn, | ||
910 | .commit_txn = power_pmu_commit_txn, | ||
904 | }; | 911 | }; |
905 | 912 | ||
906 | /* | 913 | /* |
diff --git a/arch/sh/Kconfig b/arch/sh/Kconfig index 8d90564c2bcf..e6d8ab5cfa9d 100644 --- a/arch/sh/Kconfig +++ b/arch/sh/Kconfig | |||
@@ -44,6 +44,7 @@ config SUPERH32 | |||
44 | select HAVE_FUNCTION_GRAPH_TRACER | 44 | select HAVE_FUNCTION_GRAPH_TRACER |
45 | select HAVE_ARCH_KGDB | 45 | select HAVE_ARCH_KGDB |
46 | select HAVE_HW_BREAKPOINT | 46 | select HAVE_HW_BREAKPOINT |
47 | select HAVE_MIXED_BREAKPOINTS_REGS | ||
47 | select PERF_EVENTS if HAVE_HW_BREAKPOINT | 48 | select PERF_EVENTS if HAVE_HW_BREAKPOINT |
48 | select ARCH_HIBERNATION_POSSIBLE if MMU | 49 | select ARCH_HIBERNATION_POSSIBLE if MMU |
49 | 50 | ||
diff --git a/arch/sh/include/asm/hw_breakpoint.h b/arch/sh/include/asm/hw_breakpoint.h index 965dd780d51b..e14cad96798f 100644 --- a/arch/sh/include/asm/hw_breakpoint.h +++ b/arch/sh/include/asm/hw_breakpoint.h | |||
@@ -46,10 +46,14 @@ struct pmu; | |||
46 | /* Maximum number of UBC channels */ | 46 | /* Maximum number of UBC channels */ |
47 | #define HBP_NUM 2 | 47 | #define HBP_NUM 2 |
48 | 48 | ||
49 | static inline int hw_breakpoint_slots(int type) | ||
50 | { | ||
51 | return HBP_NUM; | ||
52 | } | ||
53 | |||
49 | /* arch/sh/kernel/hw_breakpoint.c */ | 54 | /* arch/sh/kernel/hw_breakpoint.c */ |
50 | extern int arch_check_va_in_userspace(unsigned long va, u16 hbp_len); | 55 | extern int arch_check_bp_in_kernelspace(struct perf_event *bp); |
51 | extern int arch_validate_hwbkpt_settings(struct perf_event *bp, | 56 | extern int arch_validate_hwbkpt_settings(struct perf_event *bp); |
52 | struct task_struct *tsk); | ||
53 | extern int hw_breakpoint_exceptions_notify(struct notifier_block *unused, | 57 | extern int hw_breakpoint_exceptions_notify(struct notifier_block *unused, |
54 | unsigned long val, void *data); | 58 | unsigned long val, void *data); |
55 | 59 | ||
diff --git a/arch/sh/kernel/hw_breakpoint.c b/arch/sh/kernel/hw_breakpoint.c index 675eea7785d9..1f2cf6229862 100644 --- a/arch/sh/kernel/hw_breakpoint.c +++ b/arch/sh/kernel/hw_breakpoint.c | |||
@@ -120,25 +120,16 @@ static int get_hbp_len(u16 hbp_len) | |||
120 | } | 120 | } |
121 | 121 | ||
122 | /* | 122 | /* |
123 | * Check for virtual address in user space. | ||
124 | */ | ||
125 | int arch_check_va_in_userspace(unsigned long va, u16 hbp_len) | ||
126 | { | ||
127 | unsigned int len; | ||
128 | |||
129 | len = get_hbp_len(hbp_len); | ||
130 | |||
131 | return (va <= TASK_SIZE - len); | ||
132 | } | ||
133 | |||
134 | /* | ||
135 | * Check for virtual address in kernel space. | 123 | * Check for virtual address in kernel space. |
136 | */ | 124 | */ |
137 | static int arch_check_va_in_kernelspace(unsigned long va, u8 hbp_len) | 125 | int arch_check_bp_in_kernelspace(struct perf_event *bp) |
138 | { | 126 | { |
139 | unsigned int len; | 127 | unsigned int len; |
128 | unsigned long va; | ||
129 | struct arch_hw_breakpoint *info = counter_arch_bp(bp); | ||
140 | 130 | ||
141 | len = get_hbp_len(hbp_len); | 131 | va = info->address; |
132 | len = get_hbp_len(info->len); | ||
142 | 133 | ||
143 | return (va >= TASK_SIZE) && ((va + len - 1) >= TASK_SIZE); | 134 | return (va >= TASK_SIZE) && ((va + len - 1) >= TASK_SIZE); |
144 | } | 135 | } |
@@ -226,8 +217,7 @@ static int arch_build_bp_info(struct perf_event *bp) | |||
226 | /* | 217 | /* |
227 | * Validate the arch-specific HW Breakpoint register settings | 218 | * Validate the arch-specific HW Breakpoint register settings |
228 | */ | 219 | */ |
229 | int arch_validate_hwbkpt_settings(struct perf_event *bp, | 220 | int arch_validate_hwbkpt_settings(struct perf_event *bp) |
230 | struct task_struct *tsk) | ||
231 | { | 221 | { |
232 | struct arch_hw_breakpoint *info = counter_arch_bp(bp); | 222 | struct arch_hw_breakpoint *info = counter_arch_bp(bp); |
233 | unsigned int align; | 223 | unsigned int align; |
@@ -270,15 +260,6 @@ int arch_validate_hwbkpt_settings(struct perf_event *bp, | |||
270 | if (info->address & align) | 260 | if (info->address & align) |
271 | return -EINVAL; | 261 | return -EINVAL; |
272 | 262 | ||
273 | /* Check that the virtual address is in the proper range */ | ||
274 | if (tsk) { | ||
275 | if (!arch_check_va_in_userspace(info->address, info->len)) | ||
276 | return -EFAULT; | ||
277 | } else { | ||
278 | if (!arch_check_va_in_kernelspace(info->address, info->len)) | ||
279 | return -EFAULT; | ||
280 | } | ||
281 | |||
282 | return 0; | 263 | return 0; |
283 | } | 264 | } |
284 | 265 | ||
@@ -363,8 +344,7 @@ static int __kprobes hw_breakpoint_handler(struct die_args *args) | |||
363 | perf_bp_event(bp, args->regs); | 344 | perf_bp_event(bp, args->regs); |
364 | 345 | ||
365 | /* Deliver the signal to userspace */ | 346 | /* Deliver the signal to userspace */ |
366 | if (arch_check_va_in_userspace(bp->attr.bp_addr, | 347 | if (!arch_check_bp_in_kernelspace(bp)) { |
367 | bp->attr.bp_len)) { | ||
368 | siginfo_t info; | 348 | siginfo_t info; |
369 | 349 | ||
370 | info.si_signo = args->signr; | 350 | info.si_signo = args->signr; |
diff --git a/arch/sh/kernel/ptrace_32.c b/arch/sh/kernel/ptrace_32.c index 7759a9a93211..d4104ce9fe53 100644 --- a/arch/sh/kernel/ptrace_32.c +++ b/arch/sh/kernel/ptrace_32.c | |||
@@ -85,7 +85,7 @@ static int set_single_step(struct task_struct *tsk, unsigned long addr) | |||
85 | 85 | ||
86 | bp = thread->ptrace_bps[0]; | 86 | bp = thread->ptrace_bps[0]; |
87 | if (!bp) { | 87 | if (!bp) { |
88 | hw_breakpoint_init(&attr); | 88 | ptrace_breakpoint_init(&attr); |
89 | 89 | ||
90 | attr.bp_addr = addr; | 90 | attr.bp_addr = addr; |
91 | attr.bp_len = HW_BREAKPOINT_LEN_2; | 91 | attr.bp_len = HW_BREAKPOINT_LEN_2; |
diff --git a/arch/x86/Kconfig b/arch/x86/Kconfig index 9458685902bd..01177dcbe261 100644 --- a/arch/x86/Kconfig +++ b/arch/x86/Kconfig | |||
@@ -53,11 +53,15 @@ config X86 | |||
53 | select HAVE_KERNEL_LZMA | 53 | select HAVE_KERNEL_LZMA |
54 | select HAVE_KERNEL_LZO | 54 | select HAVE_KERNEL_LZO |
55 | select HAVE_HW_BREAKPOINT | 55 | select HAVE_HW_BREAKPOINT |
56 | select HAVE_MIXED_BREAKPOINTS_REGS | ||
56 | select PERF_EVENTS | 57 | select PERF_EVENTS |
57 | select ANON_INODES | 58 | select ANON_INODES |
58 | select HAVE_ARCH_KMEMCHECK | 59 | select HAVE_ARCH_KMEMCHECK |
59 | select HAVE_USER_RETURN_NOTIFIER | 60 | select HAVE_USER_RETURN_NOTIFIER |
60 | 61 | ||
62 | config INSTRUCTION_DECODER | ||
63 | def_bool (KPROBES || PERF_EVENTS) | ||
64 | |||
61 | config OUTPUT_FORMAT | 65 | config OUTPUT_FORMAT |
62 | string | 66 | string |
63 | default "elf32-i386" if X86_32 | 67 | default "elf32-i386" if X86_32 |
diff --git a/arch/x86/Kconfig.cpu b/arch/x86/Kconfig.cpu index a19829374e6a..918fbb1855cc 100644 --- a/arch/x86/Kconfig.cpu +++ b/arch/x86/Kconfig.cpu | |||
@@ -502,23 +502,3 @@ config CPU_SUP_UMC_32 | |||
502 | CPU might render the kernel unbootable. | 502 | CPU might render the kernel unbootable. |
503 | 503 | ||
504 | If unsure, say N. | 504 | If unsure, say N. |
505 | |||
506 | config X86_DS | ||
507 | def_bool X86_PTRACE_BTS | ||
508 | depends on X86_DEBUGCTLMSR | ||
509 | select HAVE_HW_BRANCH_TRACER | ||
510 | |||
511 | config X86_PTRACE_BTS | ||
512 | bool "Branch Trace Store" | ||
513 | default y | ||
514 | depends on X86_DEBUGCTLMSR | ||
515 | depends on BROKEN | ||
516 | ---help--- | ||
517 | This adds a ptrace interface to the hardware's branch trace store. | ||
518 | |||
519 | Debuggers may use it to collect an execution trace of the debugged | ||
520 | application in order to answer the question 'how did I get here?'. | ||
521 | Debuggers may trace user mode as well as kernel mode. | ||
522 | |||
523 | Say Y unless there is no application development on this machine | ||
524 | and you want to save a small amount of code size. | ||
diff --git a/arch/x86/Kconfig.debug b/arch/x86/Kconfig.debug index bc01e3ebfeb2..bd58c8abbfbd 100644 --- a/arch/x86/Kconfig.debug +++ b/arch/x86/Kconfig.debug | |||
@@ -174,15 +174,6 @@ config IOMMU_LEAK | |||
174 | Add a simple leak tracer to the IOMMU code. This is useful when you | 174 | Add a simple leak tracer to the IOMMU code. This is useful when you |
175 | are debugging a buggy device driver that leaks IOMMU mappings. | 175 | are debugging a buggy device driver that leaks IOMMU mappings. |
176 | 176 | ||
177 | config X86_DS_SELFTEST | ||
178 | bool "DS selftest" | ||
179 | default y | ||
180 | depends on DEBUG_KERNEL | ||
181 | depends on X86_DS | ||
182 | ---help--- | ||
183 | Perform Debug Store selftests at boot time. | ||
184 | If in doubt, say "N". | ||
185 | |||
186 | config HAVE_MMIOTRACE_SUPPORT | 177 | config HAVE_MMIOTRACE_SUPPORT |
187 | def_bool y | 178 | def_bool y |
188 | 179 | ||
diff --git a/arch/x86/include/asm/apic.h b/arch/x86/include/asm/apic.h index b4ac2cdcb64f..1fa03e04ae44 100644 --- a/arch/x86/include/asm/apic.h +++ b/arch/x86/include/asm/apic.h | |||
@@ -373,6 +373,7 @@ extern atomic_t init_deasserted; | |||
373 | extern int wakeup_secondary_cpu_via_nmi(int apicid, unsigned long start_eip); | 373 | extern int wakeup_secondary_cpu_via_nmi(int apicid, unsigned long start_eip); |
374 | #endif | 374 | #endif |
375 | 375 | ||
376 | #ifdef CONFIG_X86_LOCAL_APIC | ||
376 | static inline u32 apic_read(u32 reg) | 377 | static inline u32 apic_read(u32 reg) |
377 | { | 378 | { |
378 | return apic->read(reg); | 379 | return apic->read(reg); |
@@ -403,10 +404,19 @@ static inline u32 safe_apic_wait_icr_idle(void) | |||
403 | return apic->safe_wait_icr_idle(); | 404 | return apic->safe_wait_icr_idle(); |
404 | } | 405 | } |
405 | 406 | ||
407 | #else /* CONFIG_X86_LOCAL_APIC */ | ||
408 | |||
409 | static inline u32 apic_read(u32 reg) { return 0; } | ||
410 | static inline void apic_write(u32 reg, u32 val) { } | ||
411 | static inline u64 apic_icr_read(void) { return 0; } | ||
412 | static inline void apic_icr_write(u32 low, u32 high) { } | ||
413 | static inline void apic_wait_icr_idle(void) { } | ||
414 | static inline u32 safe_apic_wait_icr_idle(void) { return 0; } | ||
415 | |||
416 | #endif /* CONFIG_X86_LOCAL_APIC */ | ||
406 | 417 | ||
407 | static inline void ack_APIC_irq(void) | 418 | static inline void ack_APIC_irq(void) |
408 | { | 419 | { |
409 | #ifdef CONFIG_X86_LOCAL_APIC | ||
410 | /* | 420 | /* |
411 | * ack_APIC_irq() actually gets compiled as a single instruction | 421 | * ack_APIC_irq() actually gets compiled as a single instruction |
412 | * ... yummie. | 422 | * ... yummie. |
@@ -414,7 +424,6 @@ static inline void ack_APIC_irq(void) | |||
414 | 424 | ||
415 | /* Docs say use 0 for future compatibility */ | 425 | /* Docs say use 0 for future compatibility */ |
416 | apic_write(APIC_EOI, 0); | 426 | apic_write(APIC_EOI, 0); |
417 | #endif | ||
418 | } | 427 | } |
419 | 428 | ||
420 | static inline unsigned default_get_apic_id(unsigned long x) | 429 | static inline unsigned default_get_apic_id(unsigned long x) |
diff --git a/arch/x86/include/asm/ds.h b/arch/x86/include/asm/ds.h deleted file mode 100644 index 70dac199b093..000000000000 --- a/arch/x86/include/asm/ds.h +++ /dev/null | |||
@@ -1,302 +0,0 @@ | |||
1 | /* | ||
2 | * Debug Store (DS) support | ||
3 | * | ||
4 | * This provides a low-level interface to the hardware's Debug Store | ||
5 | * feature that is used for branch trace store (BTS) and | ||
6 | * precise-event based sampling (PEBS). | ||
7 | * | ||
8 | * It manages: | ||
9 | * - DS and BTS hardware configuration | ||
10 | * - buffer overflow handling (to be done) | ||
11 | * - buffer access | ||
12 | * | ||
13 | * It does not do: | ||
14 | * - security checking (is the caller allowed to trace the task) | ||
15 | * - buffer allocation (memory accounting) | ||
16 | * | ||
17 | * | ||
18 | * Copyright (C) 2007-2009 Intel Corporation. | ||
19 | * Markus Metzger <markus.t.metzger@intel.com>, 2007-2009 | ||
20 | */ | ||
21 | |||
22 | #ifndef _ASM_X86_DS_H | ||
23 | #define _ASM_X86_DS_H | ||
24 | |||
25 | |||
26 | #include <linux/types.h> | ||
27 | #include <linux/init.h> | ||
28 | #include <linux/err.h> | ||
29 | |||
30 | |||
31 | #ifdef CONFIG_X86_DS | ||
32 | |||
33 | struct task_struct; | ||
34 | struct ds_context; | ||
35 | struct ds_tracer; | ||
36 | struct bts_tracer; | ||
37 | struct pebs_tracer; | ||
38 | |||
39 | typedef void (*bts_ovfl_callback_t)(struct bts_tracer *); | ||
40 | typedef void (*pebs_ovfl_callback_t)(struct pebs_tracer *); | ||
41 | |||
42 | |||
43 | /* | ||
44 | * A list of features plus corresponding macros to talk about them in | ||
45 | * the ds_request function's flags parameter. | ||
46 | * | ||
47 | * We use the enum to index an array of corresponding control bits; | ||
48 | * we use the macro to index a flags bit-vector. | ||
49 | */ | ||
50 | enum ds_feature { | ||
51 | dsf_bts = 0, | ||
52 | dsf_bts_kernel, | ||
53 | #define BTS_KERNEL (1 << dsf_bts_kernel) | ||
54 | /* trace kernel-mode branches */ | ||
55 | |||
56 | dsf_bts_user, | ||
57 | #define BTS_USER (1 << dsf_bts_user) | ||
58 | /* trace user-mode branches */ | ||
59 | |||
60 | dsf_bts_overflow, | ||
61 | dsf_bts_max, | ||
62 | dsf_pebs = dsf_bts_max, | ||
63 | |||
64 | dsf_pebs_max, | ||
65 | dsf_ctl_max = dsf_pebs_max, | ||
66 | dsf_bts_timestamps = dsf_ctl_max, | ||
67 | #define BTS_TIMESTAMPS (1 << dsf_bts_timestamps) | ||
68 | /* add timestamps into BTS trace */ | ||
69 | |||
70 | #define BTS_USER_FLAGS (BTS_KERNEL | BTS_USER | BTS_TIMESTAMPS) | ||
71 | }; | ||
72 | |||
73 | |||
74 | /* | ||
75 | * Request BTS or PEBS | ||
76 | * | ||
77 | * Due to alignement constraints, the actual buffer may be slightly | ||
78 | * smaller than the requested or provided buffer. | ||
79 | * | ||
80 | * Returns a pointer to a tracer structure on success, or | ||
81 | * ERR_PTR(errcode) on failure. | ||
82 | * | ||
83 | * The interrupt threshold is independent from the overflow callback | ||
84 | * to allow users to use their own overflow interrupt handling mechanism. | ||
85 | * | ||
86 | * The function might sleep. | ||
87 | * | ||
88 | * task: the task to request recording for | ||
89 | * cpu: the cpu to request recording for | ||
90 | * base: the base pointer for the (non-pageable) buffer; | ||
91 | * size: the size of the provided buffer in bytes | ||
92 | * ovfl: pointer to a function to be called on buffer overflow; | ||
93 | * NULL if cyclic buffer requested | ||
94 | * th: the interrupt threshold in records from the end of the buffer; | ||
95 | * -1 if no interrupt threshold is requested. | ||
96 | * flags: a bit-mask of the above flags | ||
97 | */ | ||
98 | extern struct bts_tracer *ds_request_bts_task(struct task_struct *task, | ||
99 | void *base, size_t size, | ||
100 | bts_ovfl_callback_t ovfl, | ||
101 | size_t th, unsigned int flags); | ||
102 | extern struct bts_tracer *ds_request_bts_cpu(int cpu, void *base, size_t size, | ||
103 | bts_ovfl_callback_t ovfl, | ||
104 | size_t th, unsigned int flags); | ||
105 | extern struct pebs_tracer *ds_request_pebs_task(struct task_struct *task, | ||
106 | void *base, size_t size, | ||
107 | pebs_ovfl_callback_t ovfl, | ||
108 | size_t th, unsigned int flags); | ||
109 | extern struct pebs_tracer *ds_request_pebs_cpu(int cpu, | ||
110 | void *base, size_t size, | ||
111 | pebs_ovfl_callback_t ovfl, | ||
112 | size_t th, unsigned int flags); | ||
113 | |||
114 | /* | ||
115 | * Release BTS or PEBS resources | ||
116 | * Suspend and resume BTS or PEBS tracing | ||
117 | * | ||
118 | * Must be called with irq's enabled. | ||
119 | * | ||
120 | * tracer: the tracer handle returned from ds_request_~() | ||
121 | */ | ||
122 | extern void ds_release_bts(struct bts_tracer *tracer); | ||
123 | extern void ds_suspend_bts(struct bts_tracer *tracer); | ||
124 | extern void ds_resume_bts(struct bts_tracer *tracer); | ||
125 | extern void ds_release_pebs(struct pebs_tracer *tracer); | ||
126 | extern void ds_suspend_pebs(struct pebs_tracer *tracer); | ||
127 | extern void ds_resume_pebs(struct pebs_tracer *tracer); | ||
128 | |||
129 | /* | ||
130 | * Release BTS or PEBS resources | ||
131 | * Suspend and resume BTS or PEBS tracing | ||
132 | * | ||
133 | * Cpu tracers must call this on the traced cpu. | ||
134 | * Task tracers must call ds_release_~_noirq() for themselves. | ||
135 | * | ||
136 | * May be called with irq's disabled. | ||
137 | * | ||
138 | * Returns 0 if successful; | ||
139 | * -EPERM if the cpu tracer does not trace the current cpu. | ||
140 | * -EPERM if the task tracer does not trace itself. | ||
141 | * | ||
142 | * tracer: the tracer handle returned from ds_request_~() | ||
143 | */ | ||
144 | extern int ds_release_bts_noirq(struct bts_tracer *tracer); | ||
145 | extern int ds_suspend_bts_noirq(struct bts_tracer *tracer); | ||
146 | extern int ds_resume_bts_noirq(struct bts_tracer *tracer); | ||
147 | extern int ds_release_pebs_noirq(struct pebs_tracer *tracer); | ||
148 | extern int ds_suspend_pebs_noirq(struct pebs_tracer *tracer); | ||
149 | extern int ds_resume_pebs_noirq(struct pebs_tracer *tracer); | ||
150 | |||
151 | |||
152 | /* | ||
153 | * The raw DS buffer state as it is used for BTS and PEBS recording. | ||
154 | * | ||
155 | * This is the low-level, arch-dependent interface for working | ||
156 | * directly on the raw trace data. | ||
157 | */ | ||
158 | struct ds_trace { | ||
159 | /* the number of bts/pebs records */ | ||
160 | size_t n; | ||
161 | /* the size of a bts/pebs record in bytes */ | ||
162 | size_t size; | ||
163 | /* pointers into the raw buffer: | ||
164 | - to the first entry */ | ||
165 | void *begin; | ||
166 | /* - one beyond the last entry */ | ||
167 | void *end; | ||
168 | /* - one beyond the newest entry */ | ||
169 | void *top; | ||
170 | /* - the interrupt threshold */ | ||
171 | void *ith; | ||
172 | /* flags given on ds_request() */ | ||
173 | unsigned int flags; | ||
174 | }; | ||
175 | |||
176 | /* | ||
177 | * An arch-independent view on branch trace data. | ||
178 | */ | ||
179 | enum bts_qualifier { | ||
180 | bts_invalid, | ||
181 | #define BTS_INVALID bts_invalid | ||
182 | |||
183 | bts_branch, | ||
184 | #define BTS_BRANCH bts_branch | ||
185 | |||
186 | bts_task_arrives, | ||
187 | #define BTS_TASK_ARRIVES bts_task_arrives | ||
188 | |||
189 | bts_task_departs, | ||
190 | #define BTS_TASK_DEPARTS bts_task_departs | ||
191 | |||
192 | bts_qual_bit_size = 4, | ||
193 | bts_qual_max = (1 << bts_qual_bit_size), | ||
194 | }; | ||
195 | |||
196 | struct bts_struct { | ||
197 | __u64 qualifier; | ||
198 | union { | ||
199 | /* BTS_BRANCH */ | ||
200 | struct { | ||
201 | __u64 from; | ||
202 | __u64 to; | ||
203 | } lbr; | ||
204 | /* BTS_TASK_ARRIVES or BTS_TASK_DEPARTS */ | ||
205 | struct { | ||
206 | __u64 clock; | ||
207 | pid_t pid; | ||
208 | } event; | ||
209 | } variant; | ||
210 | }; | ||
211 | |||
212 | |||
213 | /* | ||
214 | * The BTS state. | ||
215 | * | ||
216 | * This gives access to the raw DS state and adds functions to provide | ||
217 | * an arch-independent view of the BTS data. | ||
218 | */ | ||
219 | struct bts_trace { | ||
220 | struct ds_trace ds; | ||
221 | |||
222 | int (*read)(struct bts_tracer *tracer, const void *at, | ||
223 | struct bts_struct *out); | ||
224 | int (*write)(struct bts_tracer *tracer, const struct bts_struct *in); | ||
225 | }; | ||
226 | |||
227 | |||
228 | /* | ||
229 | * The PEBS state. | ||
230 | * | ||
231 | * This gives access to the raw DS state and the PEBS-specific counter | ||
232 | * reset value. | ||
233 | */ | ||
234 | struct pebs_trace { | ||
235 | struct ds_trace ds; | ||
236 | |||
237 | /* the number of valid counters in the below array */ | ||
238 | unsigned int counters; | ||
239 | |||
240 | #define MAX_PEBS_COUNTERS 4 | ||
241 | /* the counter reset value */ | ||
242 | unsigned long long counter_reset[MAX_PEBS_COUNTERS]; | ||
243 | }; | ||
244 | |||
245 | |||
246 | /* | ||
247 | * Read the BTS or PEBS trace. | ||
248 | * | ||
249 | * Returns a view on the trace collected for the parameter tracer. | ||
250 | * | ||
251 | * The view remains valid as long as the traced task is not running or | ||
252 | * the tracer is suspended. | ||
253 | * Writes into the trace buffer are not reflected. | ||
254 | * | ||
255 | * tracer: the tracer handle returned from ds_request_~() | ||
256 | */ | ||
257 | extern const struct bts_trace *ds_read_bts(struct bts_tracer *tracer); | ||
258 | extern const struct pebs_trace *ds_read_pebs(struct pebs_tracer *tracer); | ||
259 | |||
260 | |||
261 | /* | ||
262 | * Reset the write pointer of the BTS/PEBS buffer. | ||
263 | * | ||
264 | * Returns 0 on success; -Eerrno on error | ||
265 | * | ||
266 | * tracer: the tracer handle returned from ds_request_~() | ||
267 | */ | ||
268 | extern int ds_reset_bts(struct bts_tracer *tracer); | ||
269 | extern int ds_reset_pebs(struct pebs_tracer *tracer); | ||
270 | |||
271 | /* | ||
272 | * Set the PEBS counter reset value. | ||
273 | * | ||
274 | * Returns 0 on success; -Eerrno on error | ||
275 | * | ||
276 | * tracer: the tracer handle returned from ds_request_pebs() | ||
277 | * counter: the index of the counter | ||
278 | * value: the new counter reset value | ||
279 | */ | ||
280 | extern int ds_set_pebs_reset(struct pebs_tracer *tracer, | ||
281 | unsigned int counter, u64 value); | ||
282 | |||
283 | /* | ||
284 | * Initialization | ||
285 | */ | ||
286 | struct cpuinfo_x86; | ||
287 | extern void __cpuinit ds_init_intel(struct cpuinfo_x86 *); | ||
288 | |||
289 | /* | ||
290 | * Context switch work | ||
291 | */ | ||
292 | extern void ds_switch_to(struct task_struct *prev, struct task_struct *next); | ||
293 | |||
294 | #else /* CONFIG_X86_DS */ | ||
295 | |||
296 | struct cpuinfo_x86; | ||
297 | static inline void __cpuinit ds_init_intel(struct cpuinfo_x86 *ignored) {} | ||
298 | static inline void ds_switch_to(struct task_struct *prev, | ||
299 | struct task_struct *next) {} | ||
300 | |||
301 | #endif /* CONFIG_X86_DS */ | ||
302 | #endif /* _ASM_X86_DS_H */ | ||
diff --git a/arch/x86/include/asm/hw_breakpoint.h b/arch/x86/include/asm/hw_breakpoint.h index 2a1bd8f4f23a..942255310e6a 100644 --- a/arch/x86/include/asm/hw_breakpoint.h +++ b/arch/x86/include/asm/hw_breakpoint.h | |||
@@ -41,12 +41,16 @@ struct arch_hw_breakpoint { | |||
41 | /* Total number of available HW breakpoint registers */ | 41 | /* Total number of available HW breakpoint registers */ |
42 | #define HBP_NUM 4 | 42 | #define HBP_NUM 4 |
43 | 43 | ||
44 | static inline int hw_breakpoint_slots(int type) | ||
45 | { | ||
46 | return HBP_NUM; | ||
47 | } | ||
48 | |||
44 | struct perf_event; | 49 | struct perf_event; |
45 | struct pmu; | 50 | struct pmu; |
46 | 51 | ||
47 | extern int arch_check_va_in_userspace(unsigned long va, u8 hbp_len); | 52 | extern int arch_check_bp_in_kernelspace(struct perf_event *bp); |
48 | extern int arch_validate_hwbkpt_settings(struct perf_event *bp, | 53 | extern int arch_validate_hwbkpt_settings(struct perf_event *bp); |
49 | struct task_struct *tsk); | ||
50 | extern int hw_breakpoint_exceptions_notify(struct notifier_block *unused, | 54 | extern int hw_breakpoint_exceptions_notify(struct notifier_block *unused, |
51 | unsigned long val, void *data); | 55 | unsigned long val, void *data); |
52 | 56 | ||
diff --git a/arch/x86/include/asm/insn.h b/arch/x86/include/asm/insn.h index 96c2e0ad04ca..88c765e16410 100644 --- a/arch/x86/include/asm/insn.h +++ b/arch/x86/include/asm/insn.h | |||
@@ -68,6 +68,8 @@ struct insn { | |||
68 | const insn_byte_t *next_byte; | 68 | const insn_byte_t *next_byte; |
69 | }; | 69 | }; |
70 | 70 | ||
71 | #define MAX_INSN_SIZE 16 | ||
72 | |||
71 | #define X86_MODRM_MOD(modrm) (((modrm) & 0xc0) >> 6) | 73 | #define X86_MODRM_MOD(modrm) (((modrm) & 0xc0) >> 6) |
72 | #define X86_MODRM_REG(modrm) (((modrm) & 0x38) >> 3) | 74 | #define X86_MODRM_REG(modrm) (((modrm) & 0x38) >> 3) |
73 | #define X86_MODRM_RM(modrm) ((modrm) & 0x07) | 75 | #define X86_MODRM_RM(modrm) ((modrm) & 0x07) |
diff --git a/arch/x86/include/asm/kprobes.h b/arch/x86/include/asm/kprobes.h index 4ffa345a8ccb..547882539157 100644 --- a/arch/x86/include/asm/kprobes.h +++ b/arch/x86/include/asm/kprobes.h | |||
@@ -24,6 +24,7 @@ | |||
24 | #include <linux/types.h> | 24 | #include <linux/types.h> |
25 | #include <linux/ptrace.h> | 25 | #include <linux/ptrace.h> |
26 | #include <linux/percpu.h> | 26 | #include <linux/percpu.h> |
27 | #include <asm/insn.h> | ||
27 | 28 | ||
28 | #define __ARCH_WANT_KPROBES_INSN_SLOT | 29 | #define __ARCH_WANT_KPROBES_INSN_SLOT |
29 | 30 | ||
@@ -36,7 +37,6 @@ typedef u8 kprobe_opcode_t; | |||
36 | #define RELATIVEJUMP_SIZE 5 | 37 | #define RELATIVEJUMP_SIZE 5 |
37 | #define RELATIVECALL_OPCODE 0xe8 | 38 | #define RELATIVECALL_OPCODE 0xe8 |
38 | #define RELATIVE_ADDR_SIZE 4 | 39 | #define RELATIVE_ADDR_SIZE 4 |
39 | #define MAX_INSN_SIZE 16 | ||
40 | #define MAX_STACK_SIZE 64 | 40 | #define MAX_STACK_SIZE 64 |
41 | #define MIN_STACK_SIZE(ADDR) \ | 41 | #define MIN_STACK_SIZE(ADDR) \ |
42 | (((MAX_STACK_SIZE) < (((unsigned long)current_thread_info()) + \ | 42 | (((MAX_STACK_SIZE) < (((unsigned long)current_thread_info()) + \ |
diff --git a/arch/x86/include/asm/msr-index.h b/arch/x86/include/asm/msr-index.h index 4604e6a54d36..bc473acfa7f9 100644 --- a/arch/x86/include/asm/msr-index.h +++ b/arch/x86/include/asm/msr-index.h | |||
@@ -71,11 +71,14 @@ | |||
71 | #define MSR_IA32_LASTINTTOIP 0x000001de | 71 | #define MSR_IA32_LASTINTTOIP 0x000001de |
72 | 72 | ||
73 | /* DEBUGCTLMSR bits (others vary by model): */ | 73 | /* DEBUGCTLMSR bits (others vary by model): */ |
74 | #define _DEBUGCTLMSR_LBR 0 /* last branch recording */ | 74 | #define DEBUGCTLMSR_LBR (1UL << 0) /* last branch recording */ |
75 | #define _DEBUGCTLMSR_BTF 1 /* single-step on branches */ | 75 | #define DEBUGCTLMSR_BTF (1UL << 1) /* single-step on branches */ |
76 | 76 | #define DEBUGCTLMSR_TR (1UL << 6) | |
77 | #define DEBUGCTLMSR_LBR (1UL << _DEBUGCTLMSR_LBR) | 77 | #define DEBUGCTLMSR_BTS (1UL << 7) |
78 | #define DEBUGCTLMSR_BTF (1UL << _DEBUGCTLMSR_BTF) | 78 | #define DEBUGCTLMSR_BTINT (1UL << 8) |
79 | #define DEBUGCTLMSR_BTS_OFF_OS (1UL << 9) | ||
80 | #define DEBUGCTLMSR_BTS_OFF_USR (1UL << 10) | ||
81 | #define DEBUGCTLMSR_FREEZE_LBRS_ON_PMI (1UL << 11) | ||
79 | 82 | ||
80 | #define MSR_IA32_MC0_CTL 0x00000400 | 83 | #define MSR_IA32_MC0_CTL 0x00000400 |
81 | #define MSR_IA32_MC0_STATUS 0x00000401 | 84 | #define MSR_IA32_MC0_STATUS 0x00000401 |
@@ -359,6 +362,8 @@ | |||
359 | #define MSR_P4_U2L_ESCR0 0x000003b0 | 362 | #define MSR_P4_U2L_ESCR0 0x000003b0 |
360 | #define MSR_P4_U2L_ESCR1 0x000003b1 | 363 | #define MSR_P4_U2L_ESCR1 0x000003b1 |
361 | 364 | ||
365 | #define MSR_P4_PEBS_MATRIX_VERT 0x000003f2 | ||
366 | |||
362 | /* Intel Core-based CPU performance counters */ | 367 | /* Intel Core-based CPU performance counters */ |
363 | #define MSR_CORE_PERF_FIXED_CTR0 0x00000309 | 368 | #define MSR_CORE_PERF_FIXED_CTR0 0x00000309 |
364 | #define MSR_CORE_PERF_FIXED_CTR1 0x0000030a | 369 | #define MSR_CORE_PERF_FIXED_CTR1 0x0000030a |
diff --git a/arch/x86/include/asm/perf_event.h b/arch/x86/include/asm/perf_event.h index db6109a885a7..254883d0c7e0 100644 --- a/arch/x86/include/asm/perf_event.h +++ b/arch/x86/include/asm/perf_event.h | |||
@@ -5,7 +5,7 @@ | |||
5 | * Performance event hw details: | 5 | * Performance event hw details: |
6 | */ | 6 | */ |
7 | 7 | ||
8 | #define X86_PMC_MAX_GENERIC 8 | 8 | #define X86_PMC_MAX_GENERIC 32 |
9 | #define X86_PMC_MAX_FIXED 3 | 9 | #define X86_PMC_MAX_FIXED 3 |
10 | 10 | ||
11 | #define X86_PMC_IDX_GENERIC 0 | 11 | #define X86_PMC_IDX_GENERIC 0 |
@@ -18,39 +18,31 @@ | |||
18 | #define MSR_ARCH_PERFMON_EVENTSEL0 0x186 | 18 | #define MSR_ARCH_PERFMON_EVENTSEL0 0x186 |
19 | #define MSR_ARCH_PERFMON_EVENTSEL1 0x187 | 19 | #define MSR_ARCH_PERFMON_EVENTSEL1 0x187 |
20 | 20 | ||
21 | #define ARCH_PERFMON_EVENTSEL_ENABLE (1 << 22) | 21 | #define ARCH_PERFMON_EVENTSEL_EVENT 0x000000FFULL |
22 | #define ARCH_PERFMON_EVENTSEL_ANY (1 << 21) | 22 | #define ARCH_PERFMON_EVENTSEL_UMASK 0x0000FF00ULL |
23 | #define ARCH_PERFMON_EVENTSEL_INT (1 << 20) | 23 | #define ARCH_PERFMON_EVENTSEL_USR (1ULL << 16) |
24 | #define ARCH_PERFMON_EVENTSEL_OS (1 << 17) | 24 | #define ARCH_PERFMON_EVENTSEL_OS (1ULL << 17) |
25 | #define ARCH_PERFMON_EVENTSEL_USR (1 << 16) | 25 | #define ARCH_PERFMON_EVENTSEL_EDGE (1ULL << 18) |
26 | 26 | #define ARCH_PERFMON_EVENTSEL_INT (1ULL << 20) | |
27 | /* | 27 | #define ARCH_PERFMON_EVENTSEL_ANY (1ULL << 21) |
28 | * Includes eventsel and unit mask as well: | 28 | #define ARCH_PERFMON_EVENTSEL_ENABLE (1ULL << 22) |
29 | */ | 29 | #define ARCH_PERFMON_EVENTSEL_INV (1ULL << 23) |
30 | 30 | #define ARCH_PERFMON_EVENTSEL_CMASK 0xFF000000ULL | |
31 | 31 | ||
32 | #define INTEL_ARCH_EVTSEL_MASK 0x000000FFULL | 32 | #define AMD64_EVENTSEL_EVENT \ |
33 | #define INTEL_ARCH_UNIT_MASK 0x0000FF00ULL | 33 | (ARCH_PERFMON_EVENTSEL_EVENT | (0x0FULL << 32)) |
34 | #define INTEL_ARCH_EDGE_MASK 0x00040000ULL | 34 | #define INTEL_ARCH_EVENT_MASK \ |
35 | #define INTEL_ARCH_INV_MASK 0x00800000ULL | 35 | (ARCH_PERFMON_EVENTSEL_UMASK | ARCH_PERFMON_EVENTSEL_EVENT) |
36 | #define INTEL_ARCH_CNT_MASK 0xFF000000ULL | 36 | |
37 | #define INTEL_ARCH_EVENT_MASK (INTEL_ARCH_UNIT_MASK|INTEL_ARCH_EVTSEL_MASK) | 37 | #define X86_RAW_EVENT_MASK \ |
38 | 38 | (ARCH_PERFMON_EVENTSEL_EVENT | \ | |
39 | /* | 39 | ARCH_PERFMON_EVENTSEL_UMASK | \ |
40 | * filter mask to validate fixed counter events. | 40 | ARCH_PERFMON_EVENTSEL_EDGE | \ |
41 | * the following filters disqualify for fixed counters: | 41 | ARCH_PERFMON_EVENTSEL_INV | \ |
42 | * - inv | 42 | ARCH_PERFMON_EVENTSEL_CMASK) |
43 | * - edge | 43 | #define AMD64_RAW_EVENT_MASK \ |
44 | * - cnt-mask | 44 | (X86_RAW_EVENT_MASK | \ |
45 | * The other filters are supported by fixed counters. | 45 | AMD64_EVENTSEL_EVENT) |
46 | * The any-thread option is supported starting with v3. | ||
47 | */ | ||
48 | #define INTEL_ARCH_FIXED_MASK \ | ||
49 | (INTEL_ARCH_CNT_MASK| \ | ||
50 | INTEL_ARCH_INV_MASK| \ | ||
51 | INTEL_ARCH_EDGE_MASK|\ | ||
52 | INTEL_ARCH_UNIT_MASK|\ | ||
53 | INTEL_ARCH_EVENT_MASK) | ||
54 | 46 | ||
55 | #define ARCH_PERFMON_UNHALTED_CORE_CYCLES_SEL 0x3c | 47 | #define ARCH_PERFMON_UNHALTED_CORE_CYCLES_SEL 0x3c |
56 | #define ARCH_PERFMON_UNHALTED_CORE_CYCLES_UMASK (0x00 << 8) | 48 | #define ARCH_PERFMON_UNHALTED_CORE_CYCLES_UMASK (0x00 << 8) |
@@ -67,7 +59,7 @@ | |||
67 | union cpuid10_eax { | 59 | union cpuid10_eax { |
68 | struct { | 60 | struct { |
69 | unsigned int version_id:8; | 61 | unsigned int version_id:8; |
70 | unsigned int num_events:8; | 62 | unsigned int num_counters:8; |
71 | unsigned int bit_width:8; | 63 | unsigned int bit_width:8; |
72 | unsigned int mask_length:8; | 64 | unsigned int mask_length:8; |
73 | } split; | 65 | } split; |
@@ -76,7 +68,7 @@ union cpuid10_eax { | |||
76 | 68 | ||
77 | union cpuid10_edx { | 69 | union cpuid10_edx { |
78 | struct { | 70 | struct { |
79 | unsigned int num_events_fixed:4; | 71 | unsigned int num_counters_fixed:4; |
80 | unsigned int reserved:28; | 72 | unsigned int reserved:28; |
81 | } split; | 73 | } split; |
82 | unsigned int full; | 74 | unsigned int full; |
@@ -136,6 +128,18 @@ extern void perf_events_lapic_init(void); | |||
136 | 128 | ||
137 | #define PERF_EVENT_INDEX_OFFSET 0 | 129 | #define PERF_EVENT_INDEX_OFFSET 0 |
138 | 130 | ||
131 | /* | ||
132 | * Abuse bit 3 of the cpu eflags register to indicate proper PEBS IP fixups. | ||
133 | * This flag is otherwise unused and ABI specified to be 0, so nobody should | ||
134 | * care what we do with it. | ||
135 | */ | ||
136 | #define PERF_EFLAGS_EXACT (1UL << 3) | ||
137 | |||
138 | struct pt_regs; | ||
139 | extern unsigned long perf_instruction_pointer(struct pt_regs *regs); | ||
140 | extern unsigned long perf_misc_flags(struct pt_regs *regs); | ||
141 | #define perf_misc_flags(regs) perf_misc_flags(regs) | ||
142 | |||
139 | #else | 143 | #else |
140 | static inline void init_hw_perf_events(void) { } | 144 | static inline void init_hw_perf_events(void) { } |
141 | static inline void perf_events_lapic_init(void) { } | 145 | static inline void perf_events_lapic_init(void) { } |
diff --git a/arch/x86/include/asm/perf_event_p4.h b/arch/x86/include/asm/perf_event_p4.h new file mode 100644 index 000000000000..b05400a542ff --- /dev/null +++ b/arch/x86/include/asm/perf_event_p4.h | |||
@@ -0,0 +1,794 @@ | |||
1 | /* | ||
2 | * Netburst Perfomance Events (P4, old Xeon) | ||
3 | */ | ||
4 | |||
5 | #ifndef PERF_EVENT_P4_H | ||
6 | #define PERF_EVENT_P4_H | ||
7 | |||
8 | #include <linux/cpu.h> | ||
9 | #include <linux/bitops.h> | ||
10 | |||
11 | /* | ||
12 | * NetBurst has perfomance MSRs shared between | ||
13 | * threads if HT is turned on, ie for both logical | ||
14 | * processors (mem: in turn in Atom with HT support | ||
15 | * perf-MSRs are not shared and every thread has its | ||
16 | * own perf-MSRs set) | ||
17 | */ | ||
18 | #define ARCH_P4_TOTAL_ESCR (46) | ||
19 | #define ARCH_P4_RESERVED_ESCR (2) /* IQ_ESCR(0,1) not always present */ | ||
20 | #define ARCH_P4_MAX_ESCR (ARCH_P4_TOTAL_ESCR - ARCH_P4_RESERVED_ESCR) | ||
21 | #define ARCH_P4_MAX_CCCR (18) | ||
22 | #define ARCH_P4_MAX_COUNTER (ARCH_P4_MAX_CCCR / 2) | ||
23 | |||
24 | #define P4_ESCR_EVENT_MASK 0x7e000000U | ||
25 | #define P4_ESCR_EVENT_SHIFT 25 | ||
26 | #define P4_ESCR_EVENTMASK_MASK 0x01fffe00U | ||
27 | #define P4_ESCR_EVENTMASK_SHIFT 9 | ||
28 | #define P4_ESCR_TAG_MASK 0x000001e0U | ||
29 | #define P4_ESCR_TAG_SHIFT 5 | ||
30 | #define P4_ESCR_TAG_ENABLE 0x00000010U | ||
31 | #define P4_ESCR_T0_OS 0x00000008U | ||
32 | #define P4_ESCR_T0_USR 0x00000004U | ||
33 | #define P4_ESCR_T1_OS 0x00000002U | ||
34 | #define P4_ESCR_T1_USR 0x00000001U | ||
35 | |||
36 | #define P4_ESCR_EVENT(v) ((v) << P4_ESCR_EVENT_SHIFT) | ||
37 | #define P4_ESCR_EMASK(v) ((v) << P4_ESCR_EVENTMASK_SHIFT) | ||
38 | #define P4_ESCR_TAG(v) ((v) << P4_ESCR_TAG_SHIFT) | ||
39 | |||
40 | /* Non HT mask */ | ||
41 | #define P4_ESCR_MASK \ | ||
42 | (P4_ESCR_EVENT_MASK | \ | ||
43 | P4_ESCR_EVENTMASK_MASK | \ | ||
44 | P4_ESCR_TAG_MASK | \ | ||
45 | P4_ESCR_TAG_ENABLE | \ | ||
46 | P4_ESCR_T0_OS | \ | ||
47 | P4_ESCR_T0_USR) | ||
48 | |||
49 | /* HT mask */ | ||
50 | #define P4_ESCR_MASK_HT \ | ||
51 | (P4_ESCR_MASK | P4_ESCR_T1_OS | P4_ESCR_T1_USR) | ||
52 | |||
53 | #define P4_CCCR_OVF 0x80000000U | ||
54 | #define P4_CCCR_CASCADE 0x40000000U | ||
55 | #define P4_CCCR_OVF_PMI_T0 0x04000000U | ||
56 | #define P4_CCCR_OVF_PMI_T1 0x08000000U | ||
57 | #define P4_CCCR_FORCE_OVF 0x02000000U | ||
58 | #define P4_CCCR_EDGE 0x01000000U | ||
59 | #define P4_CCCR_THRESHOLD_MASK 0x00f00000U | ||
60 | #define P4_CCCR_THRESHOLD_SHIFT 20 | ||
61 | #define P4_CCCR_COMPLEMENT 0x00080000U | ||
62 | #define P4_CCCR_COMPARE 0x00040000U | ||
63 | #define P4_CCCR_ESCR_SELECT_MASK 0x0000e000U | ||
64 | #define P4_CCCR_ESCR_SELECT_SHIFT 13 | ||
65 | #define P4_CCCR_ENABLE 0x00001000U | ||
66 | #define P4_CCCR_THREAD_SINGLE 0x00010000U | ||
67 | #define P4_CCCR_THREAD_BOTH 0x00020000U | ||
68 | #define P4_CCCR_THREAD_ANY 0x00030000U | ||
69 | #define P4_CCCR_RESERVED 0x00000fffU | ||
70 | |||
71 | #define P4_CCCR_THRESHOLD(v) ((v) << P4_CCCR_THRESHOLD_SHIFT) | ||
72 | #define P4_CCCR_ESEL(v) ((v) << P4_CCCR_ESCR_SELECT_SHIFT) | ||
73 | |||
74 | /* Custom bits in reerved CCCR area */ | ||
75 | #define P4_CCCR_CACHE_OPS_MASK 0x0000003fU | ||
76 | |||
77 | |||
78 | /* Non HT mask */ | ||
79 | #define P4_CCCR_MASK \ | ||
80 | (P4_CCCR_OVF | \ | ||
81 | P4_CCCR_CASCADE | \ | ||
82 | P4_CCCR_OVF_PMI_T0 | \ | ||
83 | P4_CCCR_FORCE_OVF | \ | ||
84 | P4_CCCR_EDGE | \ | ||
85 | P4_CCCR_THRESHOLD_MASK | \ | ||
86 | P4_CCCR_COMPLEMENT | \ | ||
87 | P4_CCCR_COMPARE | \ | ||
88 | P4_CCCR_ESCR_SELECT_MASK | \ | ||
89 | P4_CCCR_ENABLE) | ||
90 | |||
91 | /* HT mask */ | ||
92 | #define P4_CCCR_MASK_HT (P4_CCCR_MASK | P4_CCCR_THREAD_ANY) | ||
93 | |||
94 | #define P4_GEN_ESCR_EMASK(class, name, bit) \ | ||
95 | class##__##name = ((1 << bit) << P4_ESCR_EVENTMASK_SHIFT) | ||
96 | #define P4_ESCR_EMASK_BIT(class, name) class##__##name | ||
97 | |||
98 | /* | ||
99 | * config field is 64bit width and consists of | ||
100 | * HT << 63 | ESCR << 32 | CCCR | ||
101 | * where HT is HyperThreading bit (since ESCR | ||
102 | * has it reserved we may use it for own purpose) | ||
103 | * | ||
104 | * note that this is NOT the addresses of respective | ||
105 | * ESCR and CCCR but rather an only packed value should | ||
106 | * be unpacked and written to a proper addresses | ||
107 | * | ||
108 | * the base idea is to pack as much info as | ||
109 | * possible | ||
110 | */ | ||
111 | #define p4_config_pack_escr(v) (((u64)(v)) << 32) | ||
112 | #define p4_config_pack_cccr(v) (((u64)(v)) & 0xffffffffULL) | ||
113 | #define p4_config_unpack_escr(v) (((u64)(v)) >> 32) | ||
114 | #define p4_config_unpack_cccr(v) (((u64)(v)) & 0xffffffffULL) | ||
115 | |||
116 | #define p4_config_unpack_emask(v) \ | ||
117 | ({ \ | ||
118 | u32 t = p4_config_unpack_escr((v)); \ | ||
119 | t = t & P4_ESCR_EVENTMASK_MASK; \ | ||
120 | t = t >> P4_ESCR_EVENTMASK_SHIFT; \ | ||
121 | t; \ | ||
122 | }) | ||
123 | |||
124 | #define p4_config_unpack_event(v) \ | ||
125 | ({ \ | ||
126 | u32 t = p4_config_unpack_escr((v)); \ | ||
127 | t = t & P4_ESCR_EVENT_MASK; \ | ||
128 | t = t >> P4_ESCR_EVENT_SHIFT; \ | ||
129 | t; \ | ||
130 | }) | ||
131 | |||
132 | #define p4_config_unpack_cache_event(v) (((u64)(v)) & P4_CCCR_CACHE_OPS_MASK) | ||
133 | |||
134 | #define P4_CONFIG_HT_SHIFT 63 | ||
135 | #define P4_CONFIG_HT (1ULL << P4_CONFIG_HT_SHIFT) | ||
136 | |||
137 | static inline bool p4_is_event_cascaded(u64 config) | ||
138 | { | ||
139 | u32 cccr = p4_config_unpack_cccr(config); | ||
140 | return !!(cccr & P4_CCCR_CASCADE); | ||
141 | } | ||
142 | |||
143 | static inline int p4_ht_config_thread(u64 config) | ||
144 | { | ||
145 | return !!(config & P4_CONFIG_HT); | ||
146 | } | ||
147 | |||
148 | static inline u64 p4_set_ht_bit(u64 config) | ||
149 | { | ||
150 | return config | P4_CONFIG_HT; | ||
151 | } | ||
152 | |||
153 | static inline u64 p4_clear_ht_bit(u64 config) | ||
154 | { | ||
155 | return config & ~P4_CONFIG_HT; | ||
156 | } | ||
157 | |||
158 | static inline int p4_ht_active(void) | ||
159 | { | ||
160 | #ifdef CONFIG_SMP | ||
161 | return smp_num_siblings > 1; | ||
162 | #endif | ||
163 | return 0; | ||
164 | } | ||
165 | |||
166 | static inline int p4_ht_thread(int cpu) | ||
167 | { | ||
168 | #ifdef CONFIG_SMP | ||
169 | if (smp_num_siblings == 2) | ||
170 | return cpu != cpumask_first(__get_cpu_var(cpu_sibling_map)); | ||
171 | #endif | ||
172 | return 0; | ||
173 | } | ||
174 | |||
175 | static inline int p4_should_swap_ts(u64 config, int cpu) | ||
176 | { | ||
177 | return p4_ht_config_thread(config) ^ p4_ht_thread(cpu); | ||
178 | } | ||
179 | |||
180 | static inline u32 p4_default_cccr_conf(int cpu) | ||
181 | { | ||
182 | /* | ||
183 | * Note that P4_CCCR_THREAD_ANY is "required" on | ||
184 | * non-HT machines (on HT machines we count TS events | ||
185 | * regardless the state of second logical processor | ||
186 | */ | ||
187 | u32 cccr = P4_CCCR_THREAD_ANY; | ||
188 | |||
189 | if (!p4_ht_thread(cpu)) | ||
190 | cccr |= P4_CCCR_OVF_PMI_T0; | ||
191 | else | ||
192 | cccr |= P4_CCCR_OVF_PMI_T1; | ||
193 | |||
194 | return cccr; | ||
195 | } | ||
196 | |||
197 | static inline u32 p4_default_escr_conf(int cpu, int exclude_os, int exclude_usr) | ||
198 | { | ||
199 | u32 escr = 0; | ||
200 | |||
201 | if (!p4_ht_thread(cpu)) { | ||
202 | if (!exclude_os) | ||
203 | escr |= P4_ESCR_T0_OS; | ||
204 | if (!exclude_usr) | ||
205 | escr |= P4_ESCR_T0_USR; | ||
206 | } else { | ||
207 | if (!exclude_os) | ||
208 | escr |= P4_ESCR_T1_OS; | ||
209 | if (!exclude_usr) | ||
210 | escr |= P4_ESCR_T1_USR; | ||
211 | } | ||
212 | |||
213 | return escr; | ||
214 | } | ||
215 | |||
216 | enum P4_EVENTS { | ||
217 | P4_EVENT_TC_DELIVER_MODE, | ||
218 | P4_EVENT_BPU_FETCH_REQUEST, | ||
219 | P4_EVENT_ITLB_REFERENCE, | ||
220 | P4_EVENT_MEMORY_CANCEL, | ||
221 | P4_EVENT_MEMORY_COMPLETE, | ||
222 | P4_EVENT_LOAD_PORT_REPLAY, | ||
223 | P4_EVENT_STORE_PORT_REPLAY, | ||
224 | P4_EVENT_MOB_LOAD_REPLAY, | ||
225 | P4_EVENT_PAGE_WALK_TYPE, | ||
226 | P4_EVENT_BSQ_CACHE_REFERENCE, | ||
227 | P4_EVENT_IOQ_ALLOCATION, | ||
228 | P4_EVENT_IOQ_ACTIVE_ENTRIES, | ||
229 | P4_EVENT_FSB_DATA_ACTIVITY, | ||
230 | P4_EVENT_BSQ_ALLOCATION, | ||
231 | P4_EVENT_BSQ_ACTIVE_ENTRIES, | ||
232 | P4_EVENT_SSE_INPUT_ASSIST, | ||
233 | P4_EVENT_PACKED_SP_UOP, | ||
234 | P4_EVENT_PACKED_DP_UOP, | ||
235 | P4_EVENT_SCALAR_SP_UOP, | ||
236 | P4_EVENT_SCALAR_DP_UOP, | ||
237 | P4_EVENT_64BIT_MMX_UOP, | ||
238 | P4_EVENT_128BIT_MMX_UOP, | ||
239 | P4_EVENT_X87_FP_UOP, | ||
240 | P4_EVENT_TC_MISC, | ||
241 | P4_EVENT_GLOBAL_POWER_EVENTS, | ||
242 | P4_EVENT_TC_MS_XFER, | ||
243 | P4_EVENT_UOP_QUEUE_WRITES, | ||
244 | P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, | ||
245 | P4_EVENT_RETIRED_BRANCH_TYPE, | ||
246 | P4_EVENT_RESOURCE_STALL, | ||
247 | P4_EVENT_WC_BUFFER, | ||
248 | P4_EVENT_B2B_CYCLES, | ||
249 | P4_EVENT_BNR, | ||
250 | P4_EVENT_SNOOP, | ||
251 | P4_EVENT_RESPONSE, | ||
252 | P4_EVENT_FRONT_END_EVENT, | ||
253 | P4_EVENT_EXECUTION_EVENT, | ||
254 | P4_EVENT_REPLAY_EVENT, | ||
255 | P4_EVENT_INSTR_RETIRED, | ||
256 | P4_EVENT_UOPS_RETIRED, | ||
257 | P4_EVENT_UOP_TYPE, | ||
258 | P4_EVENT_BRANCH_RETIRED, | ||
259 | P4_EVENT_MISPRED_BRANCH_RETIRED, | ||
260 | P4_EVENT_X87_ASSIST, | ||
261 | P4_EVENT_MACHINE_CLEAR, | ||
262 | P4_EVENT_INSTR_COMPLETED, | ||
263 | }; | ||
264 | |||
265 | #define P4_OPCODE(event) event##_OPCODE | ||
266 | #define P4_OPCODE_ESEL(opcode) ((opcode & 0x00ff) >> 0) | ||
267 | #define P4_OPCODE_EVNT(opcode) ((opcode & 0xff00) >> 8) | ||
268 | #define P4_OPCODE_PACK(event, sel) (((event) << 8) | sel) | ||
269 | |||
270 | /* | ||
271 | * Comments below the event represent ESCR restriction | ||
272 | * for this event and counter index per ESCR | ||
273 | * | ||
274 | * MSR_P4_IQ_ESCR0 and MSR_P4_IQ_ESCR1 are available only on early | ||
275 | * processor builds (family 0FH, models 01H-02H). These MSRs | ||
276 | * are not available on later versions, so that we don't use | ||
277 | * them completely | ||
278 | * | ||
279 | * Also note that CCCR1 do not have P4_CCCR_ENABLE bit properly | ||
280 | * working so that we should not use this CCCR and respective | ||
281 | * counter as result | ||
282 | */ | ||
283 | enum P4_EVENT_OPCODES { | ||
284 | P4_OPCODE(P4_EVENT_TC_DELIVER_MODE) = P4_OPCODE_PACK(0x01, 0x01), | ||
285 | /* | ||
286 | * MSR_P4_TC_ESCR0: 4, 5 | ||
287 | * MSR_P4_TC_ESCR1: 6, 7 | ||
288 | */ | ||
289 | |||
290 | P4_OPCODE(P4_EVENT_BPU_FETCH_REQUEST) = P4_OPCODE_PACK(0x03, 0x00), | ||
291 | /* | ||
292 | * MSR_P4_BPU_ESCR0: 0, 1 | ||
293 | * MSR_P4_BPU_ESCR1: 2, 3 | ||
294 | */ | ||
295 | |||
296 | P4_OPCODE(P4_EVENT_ITLB_REFERENCE) = P4_OPCODE_PACK(0x18, 0x03), | ||
297 | /* | ||
298 | * MSR_P4_ITLB_ESCR0: 0, 1 | ||
299 | * MSR_P4_ITLB_ESCR1: 2, 3 | ||
300 | */ | ||
301 | |||
302 | P4_OPCODE(P4_EVENT_MEMORY_CANCEL) = P4_OPCODE_PACK(0x02, 0x05), | ||
303 | /* | ||
304 | * MSR_P4_DAC_ESCR0: 8, 9 | ||
305 | * MSR_P4_DAC_ESCR1: 10, 11 | ||
306 | */ | ||
307 | |||
308 | P4_OPCODE(P4_EVENT_MEMORY_COMPLETE) = P4_OPCODE_PACK(0x08, 0x02), | ||
309 | /* | ||
310 | * MSR_P4_SAAT_ESCR0: 8, 9 | ||
311 | * MSR_P4_SAAT_ESCR1: 10, 11 | ||
312 | */ | ||
313 | |||
314 | P4_OPCODE(P4_EVENT_LOAD_PORT_REPLAY) = P4_OPCODE_PACK(0x04, 0x02), | ||
315 | /* | ||
316 | * MSR_P4_SAAT_ESCR0: 8, 9 | ||
317 | * MSR_P4_SAAT_ESCR1: 10, 11 | ||
318 | */ | ||
319 | |||
320 | P4_OPCODE(P4_EVENT_STORE_PORT_REPLAY) = P4_OPCODE_PACK(0x05, 0x02), | ||
321 | /* | ||
322 | * MSR_P4_SAAT_ESCR0: 8, 9 | ||
323 | * MSR_P4_SAAT_ESCR1: 10, 11 | ||
324 | */ | ||
325 | |||
326 | P4_OPCODE(P4_EVENT_MOB_LOAD_REPLAY) = P4_OPCODE_PACK(0x03, 0x02), | ||
327 | /* | ||
328 | * MSR_P4_MOB_ESCR0: 0, 1 | ||
329 | * MSR_P4_MOB_ESCR1: 2, 3 | ||
330 | */ | ||
331 | |||
332 | P4_OPCODE(P4_EVENT_PAGE_WALK_TYPE) = P4_OPCODE_PACK(0x01, 0x04), | ||
333 | /* | ||
334 | * MSR_P4_PMH_ESCR0: 0, 1 | ||
335 | * MSR_P4_PMH_ESCR1: 2, 3 | ||
336 | */ | ||
337 | |||
338 | P4_OPCODE(P4_EVENT_BSQ_CACHE_REFERENCE) = P4_OPCODE_PACK(0x0c, 0x07), | ||
339 | /* | ||
340 | * MSR_P4_BSU_ESCR0: 0, 1 | ||
341 | * MSR_P4_BSU_ESCR1: 2, 3 | ||
342 | */ | ||
343 | |||
344 | P4_OPCODE(P4_EVENT_IOQ_ALLOCATION) = P4_OPCODE_PACK(0x03, 0x06), | ||
345 | /* | ||
346 | * MSR_P4_FSB_ESCR0: 0, 1 | ||
347 | * MSR_P4_FSB_ESCR1: 2, 3 | ||
348 | */ | ||
349 | |||
350 | P4_OPCODE(P4_EVENT_IOQ_ACTIVE_ENTRIES) = P4_OPCODE_PACK(0x1a, 0x06), | ||
351 | /* | ||
352 | * MSR_P4_FSB_ESCR1: 2, 3 | ||
353 | */ | ||
354 | |||
355 | P4_OPCODE(P4_EVENT_FSB_DATA_ACTIVITY) = P4_OPCODE_PACK(0x17, 0x06), | ||
356 | /* | ||
357 | * MSR_P4_FSB_ESCR0: 0, 1 | ||
358 | * MSR_P4_FSB_ESCR1: 2, 3 | ||
359 | */ | ||
360 | |||
361 | P4_OPCODE(P4_EVENT_BSQ_ALLOCATION) = P4_OPCODE_PACK(0x05, 0x07), | ||
362 | /* | ||
363 | * MSR_P4_BSU_ESCR0: 0, 1 | ||
364 | */ | ||
365 | |||
366 | P4_OPCODE(P4_EVENT_BSQ_ACTIVE_ENTRIES) = P4_OPCODE_PACK(0x06, 0x07), | ||
367 | /* | ||
368 | * NOTE: no ESCR name in docs, it's guessed | ||
369 | * MSR_P4_BSU_ESCR1: 2, 3 | ||
370 | */ | ||
371 | |||
372 | P4_OPCODE(P4_EVENT_SSE_INPUT_ASSIST) = P4_OPCODE_PACK(0x34, 0x01), | ||
373 | /* | ||
374 | * MSR_P4_FIRM_ESCR0: 8, 9 | ||
375 | * MSR_P4_FIRM_ESCR1: 10, 11 | ||
376 | */ | ||
377 | |||
378 | P4_OPCODE(P4_EVENT_PACKED_SP_UOP) = P4_OPCODE_PACK(0x08, 0x01), | ||
379 | /* | ||
380 | * MSR_P4_FIRM_ESCR0: 8, 9 | ||
381 | * MSR_P4_FIRM_ESCR1: 10, 11 | ||
382 | */ | ||
383 | |||
384 | P4_OPCODE(P4_EVENT_PACKED_DP_UOP) = P4_OPCODE_PACK(0x0c, 0x01), | ||
385 | /* | ||
386 | * MSR_P4_FIRM_ESCR0: 8, 9 | ||
387 | * MSR_P4_FIRM_ESCR1: 10, 11 | ||
388 | */ | ||
389 | |||
390 | P4_OPCODE(P4_EVENT_SCALAR_SP_UOP) = P4_OPCODE_PACK(0x0a, 0x01), | ||
391 | /* | ||
392 | * MSR_P4_FIRM_ESCR0: 8, 9 | ||
393 | * MSR_P4_FIRM_ESCR1: 10, 11 | ||
394 | */ | ||
395 | |||
396 | P4_OPCODE(P4_EVENT_SCALAR_DP_UOP) = P4_OPCODE_PACK(0x0e, 0x01), | ||
397 | /* | ||
398 | * MSR_P4_FIRM_ESCR0: 8, 9 | ||
399 | * MSR_P4_FIRM_ESCR1: 10, 11 | ||
400 | */ | ||
401 | |||
402 | P4_OPCODE(P4_EVENT_64BIT_MMX_UOP) = P4_OPCODE_PACK(0x02, 0x01), | ||
403 | /* | ||
404 | * MSR_P4_FIRM_ESCR0: 8, 9 | ||
405 | * MSR_P4_FIRM_ESCR1: 10, 11 | ||
406 | */ | ||
407 | |||
408 | P4_OPCODE(P4_EVENT_128BIT_MMX_UOP) = P4_OPCODE_PACK(0x1a, 0x01), | ||
409 | /* | ||
410 | * MSR_P4_FIRM_ESCR0: 8, 9 | ||
411 | * MSR_P4_FIRM_ESCR1: 10, 11 | ||
412 | */ | ||
413 | |||
414 | P4_OPCODE(P4_EVENT_X87_FP_UOP) = P4_OPCODE_PACK(0x04, 0x01), | ||
415 | /* | ||
416 | * MSR_P4_FIRM_ESCR0: 8, 9 | ||
417 | * MSR_P4_FIRM_ESCR1: 10, 11 | ||
418 | */ | ||
419 | |||
420 | P4_OPCODE(P4_EVENT_TC_MISC) = P4_OPCODE_PACK(0x06, 0x01), | ||
421 | /* | ||
422 | * MSR_P4_TC_ESCR0: 4, 5 | ||
423 | * MSR_P4_TC_ESCR1: 6, 7 | ||
424 | */ | ||
425 | |||
426 | P4_OPCODE(P4_EVENT_GLOBAL_POWER_EVENTS) = P4_OPCODE_PACK(0x13, 0x06), | ||
427 | /* | ||
428 | * MSR_P4_FSB_ESCR0: 0, 1 | ||
429 | * MSR_P4_FSB_ESCR1: 2, 3 | ||
430 | */ | ||
431 | |||
432 | P4_OPCODE(P4_EVENT_TC_MS_XFER) = P4_OPCODE_PACK(0x05, 0x00), | ||
433 | /* | ||
434 | * MSR_P4_MS_ESCR0: 4, 5 | ||
435 | * MSR_P4_MS_ESCR1: 6, 7 | ||
436 | */ | ||
437 | |||
438 | P4_OPCODE(P4_EVENT_UOP_QUEUE_WRITES) = P4_OPCODE_PACK(0x09, 0x00), | ||
439 | /* | ||
440 | * MSR_P4_MS_ESCR0: 4, 5 | ||
441 | * MSR_P4_MS_ESCR1: 6, 7 | ||
442 | */ | ||
443 | |||
444 | P4_OPCODE(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE) = P4_OPCODE_PACK(0x05, 0x02), | ||
445 | /* | ||
446 | * MSR_P4_TBPU_ESCR0: 4, 5 | ||
447 | * MSR_P4_TBPU_ESCR1: 6, 7 | ||
448 | */ | ||
449 | |||
450 | P4_OPCODE(P4_EVENT_RETIRED_BRANCH_TYPE) = P4_OPCODE_PACK(0x04, 0x02), | ||
451 | /* | ||
452 | * MSR_P4_TBPU_ESCR0: 4, 5 | ||
453 | * MSR_P4_TBPU_ESCR1: 6, 7 | ||
454 | */ | ||
455 | |||
456 | P4_OPCODE(P4_EVENT_RESOURCE_STALL) = P4_OPCODE_PACK(0x01, 0x01), | ||
457 | /* | ||
458 | * MSR_P4_ALF_ESCR0: 12, 13, 16 | ||
459 | * MSR_P4_ALF_ESCR1: 14, 15, 17 | ||
460 | */ | ||
461 | |||
462 | P4_OPCODE(P4_EVENT_WC_BUFFER) = P4_OPCODE_PACK(0x05, 0x05), | ||
463 | /* | ||
464 | * MSR_P4_DAC_ESCR0: 8, 9 | ||
465 | * MSR_P4_DAC_ESCR1: 10, 11 | ||
466 | */ | ||
467 | |||
468 | P4_OPCODE(P4_EVENT_B2B_CYCLES) = P4_OPCODE_PACK(0x16, 0x03), | ||
469 | /* | ||
470 | * MSR_P4_FSB_ESCR0: 0, 1 | ||
471 | * MSR_P4_FSB_ESCR1: 2, 3 | ||
472 | */ | ||
473 | |||
474 | P4_OPCODE(P4_EVENT_BNR) = P4_OPCODE_PACK(0x08, 0x03), | ||
475 | /* | ||
476 | * MSR_P4_FSB_ESCR0: 0, 1 | ||
477 | * MSR_P4_FSB_ESCR1: 2, 3 | ||
478 | */ | ||
479 | |||
480 | P4_OPCODE(P4_EVENT_SNOOP) = P4_OPCODE_PACK(0x06, 0x03), | ||
481 | /* | ||
482 | * MSR_P4_FSB_ESCR0: 0, 1 | ||
483 | * MSR_P4_FSB_ESCR1: 2, 3 | ||
484 | */ | ||
485 | |||
486 | P4_OPCODE(P4_EVENT_RESPONSE) = P4_OPCODE_PACK(0x04, 0x03), | ||
487 | /* | ||
488 | * MSR_P4_FSB_ESCR0: 0, 1 | ||
489 | * MSR_P4_FSB_ESCR1: 2, 3 | ||
490 | */ | ||
491 | |||
492 | P4_OPCODE(P4_EVENT_FRONT_END_EVENT) = P4_OPCODE_PACK(0x08, 0x05), | ||
493 | /* | ||
494 | * MSR_P4_CRU_ESCR2: 12, 13, 16 | ||
495 | * MSR_P4_CRU_ESCR3: 14, 15, 17 | ||
496 | */ | ||
497 | |||
498 | P4_OPCODE(P4_EVENT_EXECUTION_EVENT) = P4_OPCODE_PACK(0x0c, 0x05), | ||
499 | /* | ||
500 | * MSR_P4_CRU_ESCR2: 12, 13, 16 | ||
501 | * MSR_P4_CRU_ESCR3: 14, 15, 17 | ||
502 | */ | ||
503 | |||
504 | P4_OPCODE(P4_EVENT_REPLAY_EVENT) = P4_OPCODE_PACK(0x09, 0x05), | ||
505 | /* | ||
506 | * MSR_P4_CRU_ESCR2: 12, 13, 16 | ||
507 | * MSR_P4_CRU_ESCR3: 14, 15, 17 | ||
508 | */ | ||
509 | |||
510 | P4_OPCODE(P4_EVENT_INSTR_RETIRED) = P4_OPCODE_PACK(0x02, 0x04), | ||
511 | /* | ||
512 | * MSR_P4_CRU_ESCR0: 12, 13, 16 | ||
513 | * MSR_P4_CRU_ESCR1: 14, 15, 17 | ||
514 | */ | ||
515 | |||
516 | P4_OPCODE(P4_EVENT_UOPS_RETIRED) = P4_OPCODE_PACK(0x01, 0x04), | ||
517 | /* | ||
518 | * MSR_P4_CRU_ESCR0: 12, 13, 16 | ||
519 | * MSR_P4_CRU_ESCR1: 14, 15, 17 | ||
520 | */ | ||
521 | |||
522 | P4_OPCODE(P4_EVENT_UOP_TYPE) = P4_OPCODE_PACK(0x02, 0x02), | ||
523 | /* | ||
524 | * MSR_P4_RAT_ESCR0: 12, 13, 16 | ||
525 | * MSR_P4_RAT_ESCR1: 14, 15, 17 | ||
526 | */ | ||
527 | |||
528 | P4_OPCODE(P4_EVENT_BRANCH_RETIRED) = P4_OPCODE_PACK(0x06, 0x05), | ||
529 | /* | ||
530 | * MSR_P4_CRU_ESCR2: 12, 13, 16 | ||
531 | * MSR_P4_CRU_ESCR3: 14, 15, 17 | ||
532 | */ | ||
533 | |||
534 | P4_OPCODE(P4_EVENT_MISPRED_BRANCH_RETIRED) = P4_OPCODE_PACK(0x03, 0x04), | ||
535 | /* | ||
536 | * MSR_P4_CRU_ESCR0: 12, 13, 16 | ||
537 | * MSR_P4_CRU_ESCR1: 14, 15, 17 | ||
538 | */ | ||
539 | |||
540 | P4_OPCODE(P4_EVENT_X87_ASSIST) = P4_OPCODE_PACK(0x03, 0x05), | ||
541 | /* | ||
542 | * MSR_P4_CRU_ESCR2: 12, 13, 16 | ||
543 | * MSR_P4_CRU_ESCR3: 14, 15, 17 | ||
544 | */ | ||
545 | |||
546 | P4_OPCODE(P4_EVENT_MACHINE_CLEAR) = P4_OPCODE_PACK(0x02, 0x05), | ||
547 | /* | ||
548 | * MSR_P4_CRU_ESCR2: 12, 13, 16 | ||
549 | * MSR_P4_CRU_ESCR3: 14, 15, 17 | ||
550 | */ | ||
551 | |||
552 | P4_OPCODE(P4_EVENT_INSTR_COMPLETED) = P4_OPCODE_PACK(0x07, 0x04), | ||
553 | /* | ||
554 | * MSR_P4_CRU_ESCR0: 12, 13, 16 | ||
555 | * MSR_P4_CRU_ESCR1: 14, 15, 17 | ||
556 | */ | ||
557 | }; | ||
558 | |||
559 | /* | ||
560 | * a caller should use P4_ESCR_EMASK_NAME helper to | ||
561 | * pick the EventMask needed, for example | ||
562 | * | ||
563 | * P4_ESCR_EMASK_NAME(P4_EVENT_TC_DELIVER_MODE, DD) | ||
564 | */ | ||
565 | enum P4_ESCR_EMASKS { | ||
566 | P4_GEN_ESCR_EMASK(P4_EVENT_TC_DELIVER_MODE, DD, 0), | ||
567 | P4_GEN_ESCR_EMASK(P4_EVENT_TC_DELIVER_MODE, DB, 1), | ||
568 | P4_GEN_ESCR_EMASK(P4_EVENT_TC_DELIVER_MODE, DI, 2), | ||
569 | P4_GEN_ESCR_EMASK(P4_EVENT_TC_DELIVER_MODE, BD, 3), | ||
570 | P4_GEN_ESCR_EMASK(P4_EVENT_TC_DELIVER_MODE, BB, 4), | ||
571 | P4_GEN_ESCR_EMASK(P4_EVENT_TC_DELIVER_MODE, BI, 5), | ||
572 | P4_GEN_ESCR_EMASK(P4_EVENT_TC_DELIVER_MODE, ID, 6), | ||
573 | |||
574 | P4_GEN_ESCR_EMASK(P4_EVENT_BPU_FETCH_REQUEST, TCMISS, 0), | ||
575 | |||
576 | P4_GEN_ESCR_EMASK(P4_EVENT_ITLB_REFERENCE, HIT, 0), | ||
577 | P4_GEN_ESCR_EMASK(P4_EVENT_ITLB_REFERENCE, MISS, 1), | ||
578 | P4_GEN_ESCR_EMASK(P4_EVENT_ITLB_REFERENCE, HIT_UK, 2), | ||
579 | |||
580 | P4_GEN_ESCR_EMASK(P4_EVENT_MEMORY_CANCEL, ST_RB_FULL, 2), | ||
581 | P4_GEN_ESCR_EMASK(P4_EVENT_MEMORY_CANCEL, 64K_CONF, 3), | ||
582 | |||
583 | P4_GEN_ESCR_EMASK(P4_EVENT_MEMORY_COMPLETE, LSC, 0), | ||
584 | P4_GEN_ESCR_EMASK(P4_EVENT_MEMORY_COMPLETE, SSC, 1), | ||
585 | |||
586 | P4_GEN_ESCR_EMASK(P4_EVENT_LOAD_PORT_REPLAY, SPLIT_LD, 1), | ||
587 | |||
588 | P4_GEN_ESCR_EMASK(P4_EVENT_STORE_PORT_REPLAY, SPLIT_ST, 1), | ||
589 | |||
590 | P4_GEN_ESCR_EMASK(P4_EVENT_MOB_LOAD_REPLAY, NO_STA, 1), | ||
591 | P4_GEN_ESCR_EMASK(P4_EVENT_MOB_LOAD_REPLAY, NO_STD, 3), | ||
592 | P4_GEN_ESCR_EMASK(P4_EVENT_MOB_LOAD_REPLAY, PARTIAL_DATA, 4), | ||
593 | P4_GEN_ESCR_EMASK(P4_EVENT_MOB_LOAD_REPLAY, UNALGN_ADDR, 5), | ||
594 | |||
595 | P4_GEN_ESCR_EMASK(P4_EVENT_PAGE_WALK_TYPE, DTMISS, 0), | ||
596 | P4_GEN_ESCR_EMASK(P4_EVENT_PAGE_WALK_TYPE, ITMISS, 1), | ||
597 | |||
598 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITS, 0), | ||
599 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITE, 1), | ||
600 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITM, 2), | ||
601 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITS, 3), | ||
602 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITE, 4), | ||
603 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITM, 5), | ||
604 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_MISS, 8), | ||
605 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_MISS, 9), | ||
606 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_CACHE_REFERENCE, WR_2ndL_MISS, 10), | ||
607 | |||
608 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ALLOCATION, DEFAULT, 0), | ||
609 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ALLOCATION, ALL_READ, 5), | ||
610 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ALLOCATION, ALL_WRITE, 6), | ||
611 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ALLOCATION, MEM_UC, 7), | ||
612 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ALLOCATION, MEM_WC, 8), | ||
613 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ALLOCATION, MEM_WT, 9), | ||
614 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ALLOCATION, MEM_WP, 10), | ||
615 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ALLOCATION, MEM_WB, 11), | ||
616 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ALLOCATION, OWN, 13), | ||
617 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ALLOCATION, OTHER, 14), | ||
618 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ALLOCATION, PREFETCH, 15), | ||
619 | |||
620 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ACTIVE_ENTRIES, DEFAULT, 0), | ||
621 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ACTIVE_ENTRIES, ALL_READ, 5), | ||
622 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ACTIVE_ENTRIES, ALL_WRITE, 6), | ||
623 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_UC, 7), | ||
624 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WC, 8), | ||
625 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WT, 9), | ||
626 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WP, 10), | ||
627 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ACTIVE_ENTRIES, MEM_WB, 11), | ||
628 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ACTIVE_ENTRIES, OWN, 13), | ||
629 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ACTIVE_ENTRIES, OTHER, 14), | ||
630 | P4_GEN_ESCR_EMASK(P4_EVENT_IOQ_ACTIVE_ENTRIES, PREFETCH, 15), | ||
631 | |||
632 | P4_GEN_ESCR_EMASK(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_DRV, 0), | ||
633 | P4_GEN_ESCR_EMASK(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_OWN, 1), | ||
634 | P4_GEN_ESCR_EMASK(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_OTHER, 2), | ||
635 | P4_GEN_ESCR_EMASK(P4_EVENT_FSB_DATA_ACTIVITY, DBSY_DRV, 3), | ||
636 | P4_GEN_ESCR_EMASK(P4_EVENT_FSB_DATA_ACTIVITY, DBSY_OWN, 4), | ||
637 | P4_GEN_ESCR_EMASK(P4_EVENT_FSB_DATA_ACTIVITY, DBSY_OTHER, 5), | ||
638 | |||
639 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, REQ_TYPE0, 0), | ||
640 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, REQ_TYPE1, 1), | ||
641 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, REQ_LEN0, 2), | ||
642 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, REQ_LEN1, 3), | ||
643 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, REQ_IO_TYPE, 5), | ||
644 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, REQ_LOCK_TYPE, 6), | ||
645 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, REQ_CACHE_TYPE, 7), | ||
646 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, REQ_SPLIT_TYPE, 8), | ||
647 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, REQ_DEM_TYPE, 9), | ||
648 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, REQ_ORD_TYPE, 10), | ||
649 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, MEM_TYPE0, 11), | ||
650 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, MEM_TYPE1, 12), | ||
651 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ALLOCATION, MEM_TYPE2, 13), | ||
652 | |||
653 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_TYPE0, 0), | ||
654 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_TYPE1, 1), | ||
655 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_LEN0, 2), | ||
656 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_LEN1, 3), | ||
657 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_IO_TYPE, 5), | ||
658 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_LOCK_TYPE, 6), | ||
659 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_CACHE_TYPE, 7), | ||
660 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_SPLIT_TYPE, 8), | ||
661 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_DEM_TYPE, 9), | ||
662 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, REQ_ORD_TYPE, 10), | ||
663 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, MEM_TYPE0, 11), | ||
664 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, MEM_TYPE1, 12), | ||
665 | P4_GEN_ESCR_EMASK(P4_EVENT_BSQ_ACTIVE_ENTRIES, MEM_TYPE2, 13), | ||
666 | |||
667 | P4_GEN_ESCR_EMASK(P4_EVENT_SSE_INPUT_ASSIST, ALL, 15), | ||
668 | |||
669 | P4_GEN_ESCR_EMASK(P4_EVENT_PACKED_SP_UOP, ALL, 15), | ||
670 | |||
671 | P4_GEN_ESCR_EMASK(P4_EVENT_PACKED_DP_UOP, ALL, 15), | ||
672 | |||
673 | P4_GEN_ESCR_EMASK(P4_EVENT_SCALAR_SP_UOP, ALL, 15), | ||
674 | |||
675 | P4_GEN_ESCR_EMASK(P4_EVENT_SCALAR_DP_UOP, ALL, 15), | ||
676 | |||
677 | P4_GEN_ESCR_EMASK(P4_EVENT_64BIT_MMX_UOP, ALL, 15), | ||
678 | |||
679 | P4_GEN_ESCR_EMASK(P4_EVENT_128BIT_MMX_UOP, ALL, 15), | ||
680 | |||
681 | P4_GEN_ESCR_EMASK(P4_EVENT_X87_FP_UOP, ALL, 15), | ||
682 | |||
683 | P4_GEN_ESCR_EMASK(P4_EVENT_TC_MISC, FLUSH, 4), | ||
684 | |||
685 | P4_GEN_ESCR_EMASK(P4_EVENT_GLOBAL_POWER_EVENTS, RUNNING, 0), | ||
686 | |||
687 | P4_GEN_ESCR_EMASK(P4_EVENT_TC_MS_XFER, CISC, 0), | ||
688 | |||
689 | P4_GEN_ESCR_EMASK(P4_EVENT_UOP_QUEUE_WRITES, FROM_TC_BUILD, 0), | ||
690 | P4_GEN_ESCR_EMASK(P4_EVENT_UOP_QUEUE_WRITES, FROM_TC_DELIVER, 1), | ||
691 | P4_GEN_ESCR_EMASK(P4_EVENT_UOP_QUEUE_WRITES, FROM_ROM, 2), | ||
692 | |||
693 | P4_GEN_ESCR_EMASK(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, CONDITIONAL, 1), | ||
694 | P4_GEN_ESCR_EMASK(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, CALL, 2), | ||
695 | P4_GEN_ESCR_EMASK(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, RETURN, 3), | ||
696 | P4_GEN_ESCR_EMASK(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE, INDIRECT, 4), | ||
697 | |||
698 | P4_GEN_ESCR_EMASK(P4_EVENT_RETIRED_BRANCH_TYPE, CONDITIONAL, 1), | ||
699 | P4_GEN_ESCR_EMASK(P4_EVENT_RETIRED_BRANCH_TYPE, CALL, 2), | ||
700 | P4_GEN_ESCR_EMASK(P4_EVENT_RETIRED_BRANCH_TYPE, RETURN, 3), | ||
701 | P4_GEN_ESCR_EMASK(P4_EVENT_RETIRED_BRANCH_TYPE, INDIRECT, 4), | ||
702 | |||
703 | P4_GEN_ESCR_EMASK(P4_EVENT_RESOURCE_STALL, SBFULL, 5), | ||
704 | |||
705 | P4_GEN_ESCR_EMASK(P4_EVENT_WC_BUFFER, WCB_EVICTS, 0), | ||
706 | P4_GEN_ESCR_EMASK(P4_EVENT_WC_BUFFER, WCB_FULL_EVICTS, 1), | ||
707 | |||
708 | P4_GEN_ESCR_EMASK(P4_EVENT_FRONT_END_EVENT, NBOGUS, 0), | ||
709 | P4_GEN_ESCR_EMASK(P4_EVENT_FRONT_END_EVENT, BOGUS, 1), | ||
710 | |||
711 | P4_GEN_ESCR_EMASK(P4_EVENT_EXECUTION_EVENT, NBOGUS0, 0), | ||
712 | P4_GEN_ESCR_EMASK(P4_EVENT_EXECUTION_EVENT, NBOGUS1, 1), | ||
713 | P4_GEN_ESCR_EMASK(P4_EVENT_EXECUTION_EVENT, NBOGUS2, 2), | ||
714 | P4_GEN_ESCR_EMASK(P4_EVENT_EXECUTION_EVENT, NBOGUS3, 3), | ||
715 | P4_GEN_ESCR_EMASK(P4_EVENT_EXECUTION_EVENT, BOGUS0, 4), | ||
716 | P4_GEN_ESCR_EMASK(P4_EVENT_EXECUTION_EVENT, BOGUS1, 5), | ||
717 | P4_GEN_ESCR_EMASK(P4_EVENT_EXECUTION_EVENT, BOGUS2, 6), | ||
718 | P4_GEN_ESCR_EMASK(P4_EVENT_EXECUTION_EVENT, BOGUS3, 7), | ||
719 | |||
720 | P4_GEN_ESCR_EMASK(P4_EVENT_REPLAY_EVENT, NBOGUS, 0), | ||
721 | P4_GEN_ESCR_EMASK(P4_EVENT_REPLAY_EVENT, BOGUS, 1), | ||
722 | |||
723 | P4_GEN_ESCR_EMASK(P4_EVENT_INSTR_RETIRED, NBOGUSNTAG, 0), | ||
724 | P4_GEN_ESCR_EMASK(P4_EVENT_INSTR_RETIRED, NBOGUSTAG, 1), | ||
725 | P4_GEN_ESCR_EMASK(P4_EVENT_INSTR_RETIRED, BOGUSNTAG, 2), | ||
726 | P4_GEN_ESCR_EMASK(P4_EVENT_INSTR_RETIRED, BOGUSTAG, 3), | ||
727 | |||
728 | P4_GEN_ESCR_EMASK(P4_EVENT_UOPS_RETIRED, NBOGUS, 0), | ||
729 | P4_GEN_ESCR_EMASK(P4_EVENT_UOPS_RETIRED, BOGUS, 1), | ||
730 | |||
731 | P4_GEN_ESCR_EMASK(P4_EVENT_UOP_TYPE, TAGLOADS, 1), | ||
732 | P4_GEN_ESCR_EMASK(P4_EVENT_UOP_TYPE, TAGSTORES, 2), | ||
733 | |||
734 | P4_GEN_ESCR_EMASK(P4_EVENT_BRANCH_RETIRED, MMNP, 0), | ||
735 | P4_GEN_ESCR_EMASK(P4_EVENT_BRANCH_RETIRED, MMNM, 1), | ||
736 | P4_GEN_ESCR_EMASK(P4_EVENT_BRANCH_RETIRED, MMTP, 2), | ||
737 | P4_GEN_ESCR_EMASK(P4_EVENT_BRANCH_RETIRED, MMTM, 3), | ||
738 | |||
739 | P4_GEN_ESCR_EMASK(P4_EVENT_MISPRED_BRANCH_RETIRED, NBOGUS, 0), | ||
740 | |||
741 | P4_GEN_ESCR_EMASK(P4_EVENT_X87_ASSIST, FPSU, 0), | ||
742 | P4_GEN_ESCR_EMASK(P4_EVENT_X87_ASSIST, FPSO, 1), | ||
743 | P4_GEN_ESCR_EMASK(P4_EVENT_X87_ASSIST, POAO, 2), | ||
744 | P4_GEN_ESCR_EMASK(P4_EVENT_X87_ASSIST, POAU, 3), | ||
745 | P4_GEN_ESCR_EMASK(P4_EVENT_X87_ASSIST, PREA, 4), | ||
746 | |||
747 | P4_GEN_ESCR_EMASK(P4_EVENT_MACHINE_CLEAR, CLEAR, 0), | ||
748 | P4_GEN_ESCR_EMASK(P4_EVENT_MACHINE_CLEAR, MOCLEAR, 1), | ||
749 | P4_GEN_ESCR_EMASK(P4_EVENT_MACHINE_CLEAR, SMCLEAR, 2), | ||
750 | |||
751 | P4_GEN_ESCR_EMASK(P4_EVENT_INSTR_COMPLETED, NBOGUS, 0), | ||
752 | P4_GEN_ESCR_EMASK(P4_EVENT_INSTR_COMPLETED, BOGUS, 1), | ||
753 | }; | ||
754 | |||
755 | /* P4 PEBS: stale for a while */ | ||
756 | #define P4_PEBS_METRIC_MASK 0x00001fffU | ||
757 | #define P4_PEBS_UOB_TAG 0x01000000U | ||
758 | #define P4_PEBS_ENABLE 0x02000000U | ||
759 | |||
760 | /* Replay metrics for MSR_IA32_PEBS_ENABLE and MSR_P4_PEBS_MATRIX_VERT */ | ||
761 | #define P4_PEBS__1stl_cache_load_miss_retired 0x3000001 | ||
762 | #define P4_PEBS__2ndl_cache_load_miss_retired 0x3000002 | ||
763 | #define P4_PEBS__dtlb_load_miss_retired 0x3000004 | ||
764 | #define P4_PEBS__dtlb_store_miss_retired 0x3000004 | ||
765 | #define P4_PEBS__dtlb_all_miss_retired 0x3000004 | ||
766 | #define P4_PEBS__tagged_mispred_branch 0x3018000 | ||
767 | #define P4_PEBS__mob_load_replay_retired 0x3000200 | ||
768 | #define P4_PEBS__split_load_retired 0x3000400 | ||
769 | #define P4_PEBS__split_store_retired 0x3000400 | ||
770 | |||
771 | #define P4_VERT__1stl_cache_load_miss_retired 0x0000001 | ||
772 | #define P4_VERT__2ndl_cache_load_miss_retired 0x0000001 | ||
773 | #define P4_VERT__dtlb_load_miss_retired 0x0000001 | ||
774 | #define P4_VERT__dtlb_store_miss_retired 0x0000002 | ||
775 | #define P4_VERT__dtlb_all_miss_retired 0x0000003 | ||
776 | #define P4_VERT__tagged_mispred_branch 0x0000010 | ||
777 | #define P4_VERT__mob_load_replay_retired 0x0000001 | ||
778 | #define P4_VERT__split_load_retired 0x0000001 | ||
779 | #define P4_VERT__split_store_retired 0x0000002 | ||
780 | |||
781 | enum P4_CACHE_EVENTS { | ||
782 | P4_CACHE__NONE, | ||
783 | |||
784 | P4_CACHE__1stl_cache_load_miss_retired, | ||
785 | P4_CACHE__2ndl_cache_load_miss_retired, | ||
786 | P4_CACHE__dtlb_load_miss_retired, | ||
787 | P4_CACHE__dtlb_store_miss_retired, | ||
788 | P4_CACHE__itlb_reference_hit, | ||
789 | P4_CACHE__itlb_reference_miss, | ||
790 | |||
791 | P4_CACHE__MAX | ||
792 | }; | ||
793 | |||
794 | #endif /* PERF_EVENT_P4_H */ | ||
diff --git a/arch/x86/include/asm/processor.h b/arch/x86/include/asm/processor.h index b753ea59703a..32428b410b55 100644 --- a/arch/x86/include/asm/processor.h +++ b/arch/x86/include/asm/processor.h | |||
@@ -21,7 +21,6 @@ struct mm_struct; | |||
21 | #include <asm/msr.h> | 21 | #include <asm/msr.h> |
22 | #include <asm/desc_defs.h> | 22 | #include <asm/desc_defs.h> |
23 | #include <asm/nops.h> | 23 | #include <asm/nops.h> |
24 | #include <asm/ds.h> | ||
25 | 24 | ||
26 | #include <linux/personality.h> | 25 | #include <linux/personality.h> |
27 | #include <linux/cpumask.h> | 26 | #include <linux/cpumask.h> |
@@ -29,6 +28,7 @@ struct mm_struct; | |||
29 | #include <linux/threads.h> | 28 | #include <linux/threads.h> |
30 | #include <linux/math64.h> | 29 | #include <linux/math64.h> |
31 | #include <linux/init.h> | 30 | #include <linux/init.h> |
31 | #include <linux/err.h> | ||
32 | 32 | ||
33 | #define HBP_NUM 4 | 33 | #define HBP_NUM 4 |
34 | /* | 34 | /* |
@@ -473,10 +473,6 @@ struct thread_struct { | |||
473 | unsigned long iopl; | 473 | unsigned long iopl; |
474 | /* Max allowed port in the bitmap, in bytes: */ | 474 | /* Max allowed port in the bitmap, in bytes: */ |
475 | unsigned io_bitmap_max; | 475 | unsigned io_bitmap_max; |
476 | /* MSR_IA32_DEBUGCTLMSR value to switch in if TIF_DEBUGCTLMSR is set. */ | ||
477 | unsigned long debugctlmsr; | ||
478 | /* Debug Store context; see asm/ds.h */ | ||
479 | struct ds_context *ds_ctx; | ||
480 | }; | 476 | }; |
481 | 477 | ||
482 | static inline unsigned long native_get_debugreg(int regno) | 478 | static inline unsigned long native_get_debugreg(int regno) |
@@ -803,7 +799,7 @@ extern void cpu_init(void); | |||
803 | 799 | ||
804 | static inline unsigned long get_debugctlmsr(void) | 800 | static inline unsigned long get_debugctlmsr(void) |
805 | { | 801 | { |
806 | unsigned long debugctlmsr = 0; | 802 | unsigned long debugctlmsr = 0; |
807 | 803 | ||
808 | #ifndef CONFIG_X86_DEBUGCTLMSR | 804 | #ifndef CONFIG_X86_DEBUGCTLMSR |
809 | if (boot_cpu_data.x86 < 6) | 805 | if (boot_cpu_data.x86 < 6) |
@@ -811,21 +807,6 @@ static inline unsigned long get_debugctlmsr(void) | |||
811 | #endif | 807 | #endif |
812 | rdmsrl(MSR_IA32_DEBUGCTLMSR, debugctlmsr); | 808 | rdmsrl(MSR_IA32_DEBUGCTLMSR, debugctlmsr); |
813 | 809 | ||
814 | return debugctlmsr; | ||
815 | } | ||
816 | |||
817 | static inline unsigned long get_debugctlmsr_on_cpu(int cpu) | ||
818 | { | ||
819 | u64 debugctlmsr = 0; | ||
820 | u32 val1, val2; | ||
821 | |||
822 | #ifndef CONFIG_X86_DEBUGCTLMSR | ||
823 | if (boot_cpu_data.x86 < 6) | ||
824 | return 0; | ||
825 | #endif | ||
826 | rdmsr_on_cpu(cpu, MSR_IA32_DEBUGCTLMSR, &val1, &val2); | ||
827 | debugctlmsr = val1 | ((u64)val2 << 32); | ||
828 | |||
829 | return debugctlmsr; | 810 | return debugctlmsr; |
830 | } | 811 | } |
831 | 812 | ||
@@ -838,18 +819,6 @@ static inline void update_debugctlmsr(unsigned long debugctlmsr) | |||
838 | wrmsrl(MSR_IA32_DEBUGCTLMSR, debugctlmsr); | 819 | wrmsrl(MSR_IA32_DEBUGCTLMSR, debugctlmsr); |
839 | } | 820 | } |
840 | 821 | ||
841 | static inline void update_debugctlmsr_on_cpu(int cpu, | ||
842 | unsigned long debugctlmsr) | ||
843 | { | ||
844 | #ifndef CONFIG_X86_DEBUGCTLMSR | ||
845 | if (boot_cpu_data.x86 < 6) | ||
846 | return; | ||
847 | #endif | ||
848 | wrmsr_on_cpu(cpu, MSR_IA32_DEBUGCTLMSR, | ||
849 | (u32)((u64)debugctlmsr), | ||
850 | (u32)((u64)debugctlmsr >> 32)); | ||
851 | } | ||
852 | |||
853 | /* | 822 | /* |
854 | * from system description table in BIOS. Mostly for MCA use, but | 823 | * from system description table in BIOS. Mostly for MCA use, but |
855 | * others may find it useful: | 824 | * others may find it useful: |
diff --git a/arch/x86/include/asm/ptrace-abi.h b/arch/x86/include/asm/ptrace-abi.h index 86723035a515..52b098a6eebb 100644 --- a/arch/x86/include/asm/ptrace-abi.h +++ b/arch/x86/include/asm/ptrace-abi.h | |||
@@ -82,61 +82,6 @@ | |||
82 | 82 | ||
83 | #ifndef __ASSEMBLY__ | 83 | #ifndef __ASSEMBLY__ |
84 | #include <linux/types.h> | 84 | #include <linux/types.h> |
85 | 85 | #endif | |
86 | /* configuration/status structure used in PTRACE_BTS_CONFIG and | ||
87 | PTRACE_BTS_STATUS commands. | ||
88 | */ | ||
89 | struct ptrace_bts_config { | ||
90 | /* requested or actual size of BTS buffer in bytes */ | ||
91 | __u32 size; | ||
92 | /* bitmask of below flags */ | ||
93 | __u32 flags; | ||
94 | /* buffer overflow signal */ | ||
95 | __u32 signal; | ||
96 | /* actual size of bts_struct in bytes */ | ||
97 | __u32 bts_size; | ||
98 | }; | ||
99 | #endif /* __ASSEMBLY__ */ | ||
100 | |||
101 | #define PTRACE_BTS_O_TRACE 0x1 /* branch trace */ | ||
102 | #define PTRACE_BTS_O_SCHED 0x2 /* scheduling events w/ jiffies */ | ||
103 | #define PTRACE_BTS_O_SIGNAL 0x4 /* send SIG<signal> on buffer overflow | ||
104 | instead of wrapping around */ | ||
105 | #define PTRACE_BTS_O_ALLOC 0x8 /* (re)allocate buffer */ | ||
106 | |||
107 | #define PTRACE_BTS_CONFIG 40 | ||
108 | /* Configure branch trace recording. | ||
109 | ADDR points to a struct ptrace_bts_config. | ||
110 | DATA gives the size of that buffer. | ||
111 | A new buffer is allocated, if requested in the flags. | ||
112 | An overflow signal may only be requested for new buffers. | ||
113 | Returns the number of bytes read. | ||
114 | */ | ||
115 | #define PTRACE_BTS_STATUS 41 | ||
116 | /* Return the current configuration in a struct ptrace_bts_config | ||
117 | pointed to by ADDR; DATA gives the size of that buffer. | ||
118 | Returns the number of bytes written. | ||
119 | */ | ||
120 | #define PTRACE_BTS_SIZE 42 | ||
121 | /* Return the number of available BTS records for draining. | ||
122 | DATA and ADDR are ignored. | ||
123 | */ | ||
124 | #define PTRACE_BTS_GET 43 | ||
125 | /* Get a single BTS record. | ||
126 | DATA defines the index into the BTS array, where 0 is the newest | ||
127 | entry, and higher indices refer to older entries. | ||
128 | ADDR is pointing to struct bts_struct (see asm/ds.h). | ||
129 | */ | ||
130 | #define PTRACE_BTS_CLEAR 44 | ||
131 | /* Clear the BTS buffer. | ||
132 | DATA and ADDR are ignored. | ||
133 | */ | ||
134 | #define PTRACE_BTS_DRAIN 45 | ||
135 | /* Read all available BTS records and clear the buffer. | ||
136 | ADDR points to an array of struct bts_struct. | ||
137 | DATA gives the size of that buffer. | ||
138 | BTS records are read from oldest to newest. | ||
139 | Returns number of BTS records drained. | ||
140 | */ | ||
141 | 86 | ||
142 | #endif /* _ASM_X86_PTRACE_ABI_H */ | 87 | #endif /* _ASM_X86_PTRACE_ABI_H */ |
diff --git a/arch/x86/include/asm/ptrace.h b/arch/x86/include/asm/ptrace.h index 69a686a7dff0..78cd1ea94500 100644 --- a/arch/x86/include/asm/ptrace.h +++ b/arch/x86/include/asm/ptrace.h | |||
@@ -289,12 +289,6 @@ extern int do_get_thread_area(struct task_struct *p, int idx, | |||
289 | extern int do_set_thread_area(struct task_struct *p, int idx, | 289 | extern int do_set_thread_area(struct task_struct *p, int idx, |
290 | struct user_desc __user *info, int can_allocate); | 290 | struct user_desc __user *info, int can_allocate); |
291 | 291 | ||
292 | #ifdef CONFIG_X86_PTRACE_BTS | ||
293 | extern void ptrace_bts_untrace(struct task_struct *tsk); | ||
294 | |||
295 | #define arch_ptrace_untrace(tsk) ptrace_bts_untrace(tsk) | ||
296 | #endif /* CONFIG_X86_PTRACE_BTS */ | ||
297 | |||
298 | #endif /* __KERNEL__ */ | 292 | #endif /* __KERNEL__ */ |
299 | 293 | ||
300 | #endif /* !__ASSEMBLY__ */ | 294 | #endif /* !__ASSEMBLY__ */ |
diff --git a/arch/x86/include/asm/thread_info.h b/arch/x86/include/asm/thread_info.h index e0d28901e969..d017ed5502e2 100644 --- a/arch/x86/include/asm/thread_info.h +++ b/arch/x86/include/asm/thread_info.h | |||
@@ -92,8 +92,7 @@ struct thread_info { | |||
92 | #define TIF_IO_BITMAP 22 /* uses I/O bitmap */ | 92 | #define TIF_IO_BITMAP 22 /* uses I/O bitmap */ |
93 | #define TIF_FREEZE 23 /* is freezing for suspend */ | 93 | #define TIF_FREEZE 23 /* is freezing for suspend */ |
94 | #define TIF_FORCED_TF 24 /* true if TF in eflags artificially */ | 94 | #define TIF_FORCED_TF 24 /* true if TF in eflags artificially */ |
95 | #define TIF_DEBUGCTLMSR 25 /* uses thread_struct.debugctlmsr */ | 95 | #define TIF_BLOCKSTEP 25 /* set when we want DEBUGCTLMSR_BTF */ |
96 | #define TIF_DS_AREA_MSR 26 /* uses thread_struct.ds_area_msr */ | ||
97 | #define TIF_LAZY_MMU_UPDATES 27 /* task is updating the mmu lazily */ | 96 | #define TIF_LAZY_MMU_UPDATES 27 /* task is updating the mmu lazily */ |
98 | #define TIF_SYSCALL_TRACEPOINT 28 /* syscall tracepoint instrumentation */ | 97 | #define TIF_SYSCALL_TRACEPOINT 28 /* syscall tracepoint instrumentation */ |
99 | 98 | ||
@@ -115,8 +114,7 @@ struct thread_info { | |||
115 | #define _TIF_IO_BITMAP (1 << TIF_IO_BITMAP) | 114 | #define _TIF_IO_BITMAP (1 << TIF_IO_BITMAP) |
116 | #define _TIF_FREEZE (1 << TIF_FREEZE) | 115 | #define _TIF_FREEZE (1 << TIF_FREEZE) |
117 | #define _TIF_FORCED_TF (1 << TIF_FORCED_TF) | 116 | #define _TIF_FORCED_TF (1 << TIF_FORCED_TF) |
118 | #define _TIF_DEBUGCTLMSR (1 << TIF_DEBUGCTLMSR) | 117 | #define _TIF_BLOCKSTEP (1 << TIF_BLOCKSTEP) |
119 | #define _TIF_DS_AREA_MSR (1 << TIF_DS_AREA_MSR) | ||
120 | #define _TIF_LAZY_MMU_UPDATES (1 << TIF_LAZY_MMU_UPDATES) | 118 | #define _TIF_LAZY_MMU_UPDATES (1 << TIF_LAZY_MMU_UPDATES) |
121 | #define _TIF_SYSCALL_TRACEPOINT (1 << TIF_SYSCALL_TRACEPOINT) | 119 | #define _TIF_SYSCALL_TRACEPOINT (1 << TIF_SYSCALL_TRACEPOINT) |
122 | 120 | ||
@@ -147,7 +145,7 @@ struct thread_info { | |||
147 | 145 | ||
148 | /* flags to check in __switch_to() */ | 146 | /* flags to check in __switch_to() */ |
149 | #define _TIF_WORK_CTXSW \ | 147 | #define _TIF_WORK_CTXSW \ |
150 | (_TIF_IO_BITMAP|_TIF_DEBUGCTLMSR|_TIF_DS_AREA_MSR|_TIF_NOTSC) | 148 | (_TIF_IO_BITMAP|_TIF_NOTSC|_TIF_BLOCKSTEP) |
151 | 149 | ||
152 | #define _TIF_WORK_CTXSW_PREV (_TIF_WORK_CTXSW|_TIF_USER_RETURN_NOTIFY) | 150 | #define _TIF_WORK_CTXSW_PREV (_TIF_WORK_CTXSW|_TIF_USER_RETURN_NOTIFY) |
153 | #define _TIF_WORK_CTXSW_NEXT (_TIF_WORK_CTXSW|_TIF_DEBUG) | 151 | #define _TIF_WORK_CTXSW_NEXT (_TIF_WORK_CTXSW|_TIF_DEBUG) |
diff --git a/arch/x86/kernel/Makefile b/arch/x86/kernel/Makefile index 4c58352209e0..e77b22083721 100644 --- a/arch/x86/kernel/Makefile +++ b/arch/x86/kernel/Makefile | |||
@@ -47,8 +47,6 @@ obj-$(CONFIG_X86_TRAMPOLINE) += trampoline.o | |||
47 | obj-y += process.o | 47 | obj-y += process.o |
48 | obj-y += i387.o xsave.o | 48 | obj-y += i387.o xsave.o |
49 | obj-y += ptrace.o | 49 | obj-y += ptrace.o |
50 | obj-$(CONFIG_X86_DS) += ds.o | ||
51 | obj-$(CONFIG_X86_DS_SELFTEST) += ds_selftest.o | ||
52 | obj-$(CONFIG_X86_32) += tls.o | 50 | obj-$(CONFIG_X86_32) += tls.o |
53 | obj-$(CONFIG_IA32_EMULATION) += tls.o | 51 | obj-$(CONFIG_IA32_EMULATION) += tls.o |
54 | obj-y += step.o | 52 | obj-y += step.o |
diff --git a/arch/x86/kernel/cpu/intel.c b/arch/x86/kernel/cpu/intel.c index 1366c7cfd483..f5e5390d3459 100644 --- a/arch/x86/kernel/cpu/intel.c +++ b/arch/x86/kernel/cpu/intel.c | |||
@@ -12,7 +12,6 @@ | |||
12 | #include <asm/processor.h> | 12 | #include <asm/processor.h> |
13 | #include <asm/pgtable.h> | 13 | #include <asm/pgtable.h> |
14 | #include <asm/msr.h> | 14 | #include <asm/msr.h> |
15 | #include <asm/ds.h> | ||
16 | #include <asm/bugs.h> | 15 | #include <asm/bugs.h> |
17 | #include <asm/cpu.h> | 16 | #include <asm/cpu.h> |
18 | 17 | ||
@@ -388,7 +387,6 @@ static void __cpuinit init_intel(struct cpuinfo_x86 *c) | |||
388 | set_cpu_cap(c, X86_FEATURE_BTS); | 387 | set_cpu_cap(c, X86_FEATURE_BTS); |
389 | if (!(l1 & (1<<12))) | 388 | if (!(l1 & (1<<12))) |
390 | set_cpu_cap(c, X86_FEATURE_PEBS); | 389 | set_cpu_cap(c, X86_FEATURE_PEBS); |
391 | ds_init_intel(c); | ||
392 | } | 390 | } |
393 | 391 | ||
394 | if (c->x86 == 6 && c->x86_model == 29 && cpu_has_clflush) | 392 | if (c->x86 == 6 && c->x86_model == 29 && cpu_has_clflush) |
diff --git a/arch/x86/kernel/cpu/perf_event.c b/arch/x86/kernel/cpu/perf_event.c index db5bdc8addf8..fd4db0db3708 100644 --- a/arch/x86/kernel/cpu/perf_event.c +++ b/arch/x86/kernel/cpu/perf_event.c | |||
@@ -31,46 +31,51 @@ | |||
31 | #include <asm/nmi.h> | 31 | #include <asm/nmi.h> |
32 | #include <asm/compat.h> | 32 | #include <asm/compat.h> |
33 | 33 | ||
34 | static u64 perf_event_mask __read_mostly; | 34 | #if 0 |
35 | #undef wrmsrl | ||
36 | #define wrmsrl(msr, val) \ | ||
37 | do { \ | ||
38 | trace_printk("wrmsrl(%lx, %lx)\n", (unsigned long)(msr),\ | ||
39 | (unsigned long)(val)); \ | ||
40 | native_write_msr((msr), (u32)((u64)(val)), \ | ||
41 | (u32)((u64)(val) >> 32)); \ | ||
42 | } while (0) | ||
43 | #endif | ||
35 | 44 | ||
36 | /* The maximal number of PEBS events: */ | 45 | /* |
37 | #define MAX_PEBS_EVENTS 4 | 46 | * best effort, GUP based copy_from_user() that assumes IRQ or NMI context |
47 | */ | ||
48 | static unsigned long | ||
49 | copy_from_user_nmi(void *to, const void __user *from, unsigned long n) | ||
50 | { | ||
51 | unsigned long offset, addr = (unsigned long)from; | ||
52 | int type = in_nmi() ? KM_NMI : KM_IRQ0; | ||
53 | unsigned long size, len = 0; | ||
54 | struct page *page; | ||
55 | void *map; | ||
56 | int ret; | ||
38 | 57 | ||
39 | /* The size of a BTS record in bytes: */ | 58 | do { |
40 | #define BTS_RECORD_SIZE 24 | 59 | ret = __get_user_pages_fast(addr, 1, 0, &page); |
60 | if (!ret) | ||
61 | break; | ||
41 | 62 | ||
42 | /* The size of a per-cpu BTS buffer in bytes: */ | 63 | offset = addr & (PAGE_SIZE - 1); |
43 | #define BTS_BUFFER_SIZE (BTS_RECORD_SIZE * 2048) | 64 | size = min(PAGE_SIZE - offset, n - len); |
44 | 65 | ||
45 | /* The BTS overflow threshold in bytes from the end of the buffer: */ | 66 | map = kmap_atomic(page, type); |
46 | #define BTS_OVFL_TH (BTS_RECORD_SIZE * 128) | 67 | memcpy(to, map+offset, size); |
68 | kunmap_atomic(map, type); | ||
69 | put_page(page); | ||
47 | 70 | ||
71 | len += size; | ||
72 | to += size; | ||
73 | addr += size; | ||
48 | 74 | ||
49 | /* | 75 | } while (len < n); |
50 | * Bits in the debugctlmsr controlling branch tracing. | ||
51 | */ | ||
52 | #define X86_DEBUGCTL_TR (1 << 6) | ||
53 | #define X86_DEBUGCTL_BTS (1 << 7) | ||
54 | #define X86_DEBUGCTL_BTINT (1 << 8) | ||
55 | #define X86_DEBUGCTL_BTS_OFF_OS (1 << 9) | ||
56 | #define X86_DEBUGCTL_BTS_OFF_USR (1 << 10) | ||
57 | 76 | ||
58 | /* | 77 | return len; |
59 | * A debug store configuration. | 78 | } |
60 | * | ||
61 | * We only support architectures that use 64bit fields. | ||
62 | */ | ||
63 | struct debug_store { | ||
64 | u64 bts_buffer_base; | ||
65 | u64 bts_index; | ||
66 | u64 bts_absolute_maximum; | ||
67 | u64 bts_interrupt_threshold; | ||
68 | u64 pebs_buffer_base; | ||
69 | u64 pebs_index; | ||
70 | u64 pebs_absolute_maximum; | ||
71 | u64 pebs_interrupt_threshold; | ||
72 | u64 pebs_event_reset[MAX_PEBS_EVENTS]; | ||
73 | }; | ||
74 | 79 | ||
75 | struct event_constraint { | 80 | struct event_constraint { |
76 | union { | 81 | union { |
@@ -89,18 +94,41 @@ struct amd_nb { | |||
89 | struct event_constraint event_constraints[X86_PMC_IDX_MAX]; | 94 | struct event_constraint event_constraints[X86_PMC_IDX_MAX]; |
90 | }; | 95 | }; |
91 | 96 | ||
97 | #define MAX_LBR_ENTRIES 16 | ||
98 | |||
92 | struct cpu_hw_events { | 99 | struct cpu_hw_events { |
100 | /* | ||
101 | * Generic x86 PMC bits | ||
102 | */ | ||
93 | struct perf_event *events[X86_PMC_IDX_MAX]; /* in counter order */ | 103 | struct perf_event *events[X86_PMC_IDX_MAX]; /* in counter order */ |
94 | unsigned long active_mask[BITS_TO_LONGS(X86_PMC_IDX_MAX)]; | 104 | unsigned long active_mask[BITS_TO_LONGS(X86_PMC_IDX_MAX)]; |
95 | unsigned long interrupts; | ||
96 | int enabled; | 105 | int enabled; |
97 | struct debug_store *ds; | ||
98 | 106 | ||
99 | int n_events; | 107 | int n_events; |
100 | int n_added; | 108 | int n_added; |
101 | int assign[X86_PMC_IDX_MAX]; /* event to counter assignment */ | 109 | int assign[X86_PMC_IDX_MAX]; /* event to counter assignment */ |
102 | u64 tags[X86_PMC_IDX_MAX]; | 110 | u64 tags[X86_PMC_IDX_MAX]; |
103 | struct perf_event *event_list[X86_PMC_IDX_MAX]; /* in enabled order */ | 111 | struct perf_event *event_list[X86_PMC_IDX_MAX]; /* in enabled order */ |
112 | |||
113 | unsigned int group_flag; | ||
114 | |||
115 | /* | ||
116 | * Intel DebugStore bits | ||
117 | */ | ||
118 | struct debug_store *ds; | ||
119 | u64 pebs_enabled; | ||
120 | |||
121 | /* | ||
122 | * Intel LBR bits | ||
123 | */ | ||
124 | int lbr_users; | ||
125 | void *lbr_context; | ||
126 | struct perf_branch_stack lbr_stack; | ||
127 | struct perf_branch_entry lbr_entries[MAX_LBR_ENTRIES]; | ||
128 | |||
129 | /* | ||
130 | * AMD specific bits | ||
131 | */ | ||
104 | struct amd_nb *amd_nb; | 132 | struct amd_nb *amd_nb; |
105 | }; | 133 | }; |
106 | 134 | ||
@@ -114,44 +142,75 @@ struct cpu_hw_events { | |||
114 | #define EVENT_CONSTRAINT(c, n, m) \ | 142 | #define EVENT_CONSTRAINT(c, n, m) \ |
115 | __EVENT_CONSTRAINT(c, n, m, HWEIGHT(n)) | 143 | __EVENT_CONSTRAINT(c, n, m, HWEIGHT(n)) |
116 | 144 | ||
145 | /* | ||
146 | * Constraint on the Event code. | ||
147 | */ | ||
117 | #define INTEL_EVENT_CONSTRAINT(c, n) \ | 148 | #define INTEL_EVENT_CONSTRAINT(c, n) \ |
118 | EVENT_CONSTRAINT(c, n, INTEL_ARCH_EVTSEL_MASK) | 149 | EVENT_CONSTRAINT(c, n, ARCH_PERFMON_EVENTSEL_EVENT) |
119 | 150 | ||
151 | /* | ||
152 | * Constraint on the Event code + UMask + fixed-mask | ||
153 | * | ||
154 | * filter mask to validate fixed counter events. | ||
155 | * the following filters disqualify for fixed counters: | ||
156 | * - inv | ||
157 | * - edge | ||
158 | * - cnt-mask | ||
159 | * The other filters are supported by fixed counters. | ||
160 | * The any-thread option is supported starting with v3. | ||
161 | */ | ||
120 | #define FIXED_EVENT_CONSTRAINT(c, n) \ | 162 | #define FIXED_EVENT_CONSTRAINT(c, n) \ |
121 | EVENT_CONSTRAINT(c, (1ULL << (32+n)), INTEL_ARCH_FIXED_MASK) | 163 | EVENT_CONSTRAINT(c, (1ULL << (32+n)), X86_RAW_EVENT_MASK) |
164 | |||
165 | /* | ||
166 | * Constraint on the Event code + UMask | ||
167 | */ | ||
168 | #define PEBS_EVENT_CONSTRAINT(c, n) \ | ||
169 | EVENT_CONSTRAINT(c, n, INTEL_ARCH_EVENT_MASK) | ||
122 | 170 | ||
123 | #define EVENT_CONSTRAINT_END \ | 171 | #define EVENT_CONSTRAINT_END \ |
124 | EVENT_CONSTRAINT(0, 0, 0) | 172 | EVENT_CONSTRAINT(0, 0, 0) |
125 | 173 | ||
126 | #define for_each_event_constraint(e, c) \ | 174 | #define for_each_event_constraint(e, c) \ |
127 | for ((e) = (c); (e)->cmask; (e)++) | 175 | for ((e) = (c); (e)->weight; (e)++) |
176 | |||
177 | union perf_capabilities { | ||
178 | struct { | ||
179 | u64 lbr_format : 6; | ||
180 | u64 pebs_trap : 1; | ||
181 | u64 pebs_arch_reg : 1; | ||
182 | u64 pebs_format : 4; | ||
183 | u64 smm_freeze : 1; | ||
184 | }; | ||
185 | u64 capabilities; | ||
186 | }; | ||
128 | 187 | ||
129 | /* | 188 | /* |
130 | * struct x86_pmu - generic x86 pmu | 189 | * struct x86_pmu - generic x86 pmu |
131 | */ | 190 | */ |
132 | struct x86_pmu { | 191 | struct x86_pmu { |
192 | /* | ||
193 | * Generic x86 PMC bits | ||
194 | */ | ||
133 | const char *name; | 195 | const char *name; |
134 | int version; | 196 | int version; |
135 | int (*handle_irq)(struct pt_regs *); | 197 | int (*handle_irq)(struct pt_regs *); |
136 | void (*disable_all)(void); | 198 | void (*disable_all)(void); |
137 | void (*enable_all)(void); | 199 | void (*enable_all)(int added); |
138 | void (*enable)(struct perf_event *); | 200 | void (*enable)(struct perf_event *); |
139 | void (*disable)(struct perf_event *); | 201 | void (*disable)(struct perf_event *); |
202 | int (*hw_config)(struct perf_event *event); | ||
203 | int (*schedule_events)(struct cpu_hw_events *cpuc, int n, int *assign); | ||
140 | unsigned eventsel; | 204 | unsigned eventsel; |
141 | unsigned perfctr; | 205 | unsigned perfctr; |
142 | u64 (*event_map)(int); | 206 | u64 (*event_map)(int); |
143 | u64 (*raw_event)(u64); | ||
144 | int max_events; | 207 | int max_events; |
145 | int num_events; | 208 | int num_counters; |
146 | int num_events_fixed; | 209 | int num_counters_fixed; |
147 | int event_bits; | 210 | int cntval_bits; |
148 | u64 event_mask; | 211 | u64 cntval_mask; |
149 | int apic; | 212 | int apic; |
150 | u64 max_period; | 213 | u64 max_period; |
151 | u64 intel_ctrl; | ||
152 | void (*enable_bts)(u64 config); | ||
153 | void (*disable_bts)(void); | ||
154 | |||
155 | struct event_constraint * | 214 | struct event_constraint * |
156 | (*get_event_constraints)(struct cpu_hw_events *cpuc, | 215 | (*get_event_constraints)(struct cpu_hw_events *cpuc, |
157 | struct perf_event *event); | 216 | struct perf_event *event); |
@@ -159,11 +218,32 @@ struct x86_pmu { | |||
159 | void (*put_event_constraints)(struct cpu_hw_events *cpuc, | 218 | void (*put_event_constraints)(struct cpu_hw_events *cpuc, |
160 | struct perf_event *event); | 219 | struct perf_event *event); |
161 | struct event_constraint *event_constraints; | 220 | struct event_constraint *event_constraints; |
221 | void (*quirks)(void); | ||
162 | 222 | ||
163 | int (*cpu_prepare)(int cpu); | 223 | int (*cpu_prepare)(int cpu); |
164 | void (*cpu_starting)(int cpu); | 224 | void (*cpu_starting)(int cpu); |
165 | void (*cpu_dying)(int cpu); | 225 | void (*cpu_dying)(int cpu); |
166 | void (*cpu_dead)(int cpu); | 226 | void (*cpu_dead)(int cpu); |
227 | |||
228 | /* | ||
229 | * Intel Arch Perfmon v2+ | ||
230 | */ | ||
231 | u64 intel_ctrl; | ||
232 | union perf_capabilities intel_cap; | ||
233 | |||
234 | /* | ||
235 | * Intel DebugStore bits | ||
236 | */ | ||
237 | int bts, pebs; | ||
238 | int pebs_record_size; | ||
239 | void (*drain_pebs)(struct pt_regs *regs); | ||
240 | struct event_constraint *pebs_constraints; | ||
241 | |||
242 | /* | ||
243 | * Intel LBR | ||
244 | */ | ||
245 | unsigned long lbr_tos, lbr_from, lbr_to; /* MSR base regs */ | ||
246 | int lbr_nr; /* hardware stack size */ | ||
167 | }; | 247 | }; |
168 | 248 | ||
169 | static struct x86_pmu x86_pmu __read_mostly; | 249 | static struct x86_pmu x86_pmu __read_mostly; |
@@ -198,7 +278,7 @@ static u64 | |||
198 | x86_perf_event_update(struct perf_event *event) | 278 | x86_perf_event_update(struct perf_event *event) |
199 | { | 279 | { |
200 | struct hw_perf_event *hwc = &event->hw; | 280 | struct hw_perf_event *hwc = &event->hw; |
201 | int shift = 64 - x86_pmu.event_bits; | 281 | int shift = 64 - x86_pmu.cntval_bits; |
202 | u64 prev_raw_count, new_raw_count; | 282 | u64 prev_raw_count, new_raw_count; |
203 | int idx = hwc->idx; | 283 | int idx = hwc->idx; |
204 | s64 delta; | 284 | s64 delta; |
@@ -241,33 +321,32 @@ again: | |||
241 | static atomic_t active_events; | 321 | static atomic_t active_events; |
242 | static DEFINE_MUTEX(pmc_reserve_mutex); | 322 | static DEFINE_MUTEX(pmc_reserve_mutex); |
243 | 323 | ||
324 | #ifdef CONFIG_X86_LOCAL_APIC | ||
325 | |||
244 | static bool reserve_pmc_hardware(void) | 326 | static bool reserve_pmc_hardware(void) |
245 | { | 327 | { |
246 | #ifdef CONFIG_X86_LOCAL_APIC | ||
247 | int i; | 328 | int i; |
248 | 329 | ||
249 | if (nmi_watchdog == NMI_LOCAL_APIC) | 330 | if (nmi_watchdog == NMI_LOCAL_APIC) |
250 | disable_lapic_nmi_watchdog(); | 331 | disable_lapic_nmi_watchdog(); |
251 | 332 | ||
252 | for (i = 0; i < x86_pmu.num_events; i++) { | 333 | for (i = 0; i < x86_pmu.num_counters; i++) { |
253 | if (!reserve_perfctr_nmi(x86_pmu.perfctr + i)) | 334 | if (!reserve_perfctr_nmi(x86_pmu.perfctr + i)) |
254 | goto perfctr_fail; | 335 | goto perfctr_fail; |
255 | } | 336 | } |
256 | 337 | ||
257 | for (i = 0; i < x86_pmu.num_events; i++) { | 338 | for (i = 0; i < x86_pmu.num_counters; i++) { |
258 | if (!reserve_evntsel_nmi(x86_pmu.eventsel + i)) | 339 | if (!reserve_evntsel_nmi(x86_pmu.eventsel + i)) |
259 | goto eventsel_fail; | 340 | goto eventsel_fail; |
260 | } | 341 | } |
261 | #endif | ||
262 | 342 | ||
263 | return true; | 343 | return true; |
264 | 344 | ||
265 | #ifdef CONFIG_X86_LOCAL_APIC | ||
266 | eventsel_fail: | 345 | eventsel_fail: |
267 | for (i--; i >= 0; i--) | 346 | for (i--; i >= 0; i--) |
268 | release_evntsel_nmi(x86_pmu.eventsel + i); | 347 | release_evntsel_nmi(x86_pmu.eventsel + i); |
269 | 348 | ||
270 | i = x86_pmu.num_events; | 349 | i = x86_pmu.num_counters; |
271 | 350 | ||
272 | perfctr_fail: | 351 | perfctr_fail: |
273 | for (i--; i >= 0; i--) | 352 | for (i--; i >= 0; i--) |
@@ -277,128 +356,36 @@ perfctr_fail: | |||
277 | enable_lapic_nmi_watchdog(); | 356 | enable_lapic_nmi_watchdog(); |
278 | 357 | ||
279 | return false; | 358 | return false; |
280 | #endif | ||
281 | } | 359 | } |
282 | 360 | ||
283 | static void release_pmc_hardware(void) | 361 | static void release_pmc_hardware(void) |
284 | { | 362 | { |
285 | #ifdef CONFIG_X86_LOCAL_APIC | ||
286 | int i; | 363 | int i; |
287 | 364 | ||
288 | for (i = 0; i < x86_pmu.num_events; i++) { | 365 | for (i = 0; i < x86_pmu.num_counters; i++) { |
289 | release_perfctr_nmi(x86_pmu.perfctr + i); | 366 | release_perfctr_nmi(x86_pmu.perfctr + i); |
290 | release_evntsel_nmi(x86_pmu.eventsel + i); | 367 | release_evntsel_nmi(x86_pmu.eventsel + i); |
291 | } | 368 | } |
292 | 369 | ||
293 | if (nmi_watchdog == NMI_LOCAL_APIC) | 370 | if (nmi_watchdog == NMI_LOCAL_APIC) |
294 | enable_lapic_nmi_watchdog(); | 371 | enable_lapic_nmi_watchdog(); |
295 | #endif | ||
296 | } | ||
297 | |||
298 | static inline bool bts_available(void) | ||
299 | { | ||
300 | return x86_pmu.enable_bts != NULL; | ||
301 | } | 372 | } |
302 | 373 | ||
303 | static void init_debug_store_on_cpu(int cpu) | 374 | #else |
304 | { | ||
305 | struct debug_store *ds = per_cpu(cpu_hw_events, cpu).ds; | ||
306 | |||
307 | if (!ds) | ||
308 | return; | ||
309 | |||
310 | wrmsr_on_cpu(cpu, MSR_IA32_DS_AREA, | ||
311 | (u32)((u64)(unsigned long)ds), | ||
312 | (u32)((u64)(unsigned long)ds >> 32)); | ||
313 | } | ||
314 | |||
315 | static void fini_debug_store_on_cpu(int cpu) | ||
316 | { | ||
317 | if (!per_cpu(cpu_hw_events, cpu).ds) | ||
318 | return; | ||
319 | |||
320 | wrmsr_on_cpu(cpu, MSR_IA32_DS_AREA, 0, 0); | ||
321 | } | ||
322 | |||
323 | static void release_bts_hardware(void) | ||
324 | { | ||
325 | int cpu; | ||
326 | |||
327 | if (!bts_available()) | ||
328 | return; | ||
329 | |||
330 | get_online_cpus(); | ||
331 | |||
332 | for_each_online_cpu(cpu) | ||
333 | fini_debug_store_on_cpu(cpu); | ||
334 | |||
335 | for_each_possible_cpu(cpu) { | ||
336 | struct debug_store *ds = per_cpu(cpu_hw_events, cpu).ds; | ||
337 | |||
338 | if (!ds) | ||
339 | continue; | ||
340 | |||
341 | per_cpu(cpu_hw_events, cpu).ds = NULL; | ||
342 | |||
343 | kfree((void *)(unsigned long)ds->bts_buffer_base); | ||
344 | kfree(ds); | ||
345 | } | ||
346 | |||
347 | put_online_cpus(); | ||
348 | } | ||
349 | |||
350 | static int reserve_bts_hardware(void) | ||
351 | { | ||
352 | int cpu, err = 0; | ||
353 | |||
354 | if (!bts_available()) | ||
355 | return 0; | ||
356 | |||
357 | get_online_cpus(); | ||
358 | |||
359 | for_each_possible_cpu(cpu) { | ||
360 | struct debug_store *ds; | ||
361 | void *buffer; | ||
362 | |||
363 | err = -ENOMEM; | ||
364 | buffer = kzalloc(BTS_BUFFER_SIZE, GFP_KERNEL); | ||
365 | if (unlikely(!buffer)) | ||
366 | break; | ||
367 | |||
368 | ds = kzalloc(sizeof(*ds), GFP_KERNEL); | ||
369 | if (unlikely(!ds)) { | ||
370 | kfree(buffer); | ||
371 | break; | ||
372 | } | ||
373 | |||
374 | ds->bts_buffer_base = (u64)(unsigned long)buffer; | ||
375 | ds->bts_index = ds->bts_buffer_base; | ||
376 | ds->bts_absolute_maximum = | ||
377 | ds->bts_buffer_base + BTS_BUFFER_SIZE; | ||
378 | ds->bts_interrupt_threshold = | ||
379 | ds->bts_absolute_maximum - BTS_OVFL_TH; | ||
380 | |||
381 | per_cpu(cpu_hw_events, cpu).ds = ds; | ||
382 | err = 0; | ||
383 | } | ||
384 | 375 | ||
385 | if (err) | 376 | static bool reserve_pmc_hardware(void) { return true; } |
386 | release_bts_hardware(); | 377 | static void release_pmc_hardware(void) {} |
387 | else { | ||
388 | for_each_online_cpu(cpu) | ||
389 | init_debug_store_on_cpu(cpu); | ||
390 | } | ||
391 | 378 | ||
392 | put_online_cpus(); | 379 | #endif |
393 | 380 | ||
394 | return err; | 381 | static int reserve_ds_buffers(void); |
395 | } | 382 | static void release_ds_buffers(void); |
396 | 383 | ||
397 | static void hw_perf_event_destroy(struct perf_event *event) | 384 | static void hw_perf_event_destroy(struct perf_event *event) |
398 | { | 385 | { |
399 | if (atomic_dec_and_mutex_lock(&active_events, &pmc_reserve_mutex)) { | 386 | if (atomic_dec_and_mutex_lock(&active_events, &pmc_reserve_mutex)) { |
400 | release_pmc_hardware(); | 387 | release_pmc_hardware(); |
401 | release_bts_hardware(); | 388 | release_ds_buffers(); |
402 | mutex_unlock(&pmc_reserve_mutex); | 389 | mutex_unlock(&pmc_reserve_mutex); |
403 | } | 390 | } |
404 | } | 391 | } |
@@ -441,54 +428,11 @@ set_ext_hw_attr(struct hw_perf_event *hwc, struct perf_event_attr *attr) | |||
441 | return 0; | 428 | return 0; |
442 | } | 429 | } |
443 | 430 | ||
444 | /* | 431 | static int x86_setup_perfctr(struct perf_event *event) |
445 | * Setup the hardware configuration for a given attr_type | ||
446 | */ | ||
447 | static int __hw_perf_event_init(struct perf_event *event) | ||
448 | { | 432 | { |
449 | struct perf_event_attr *attr = &event->attr; | 433 | struct perf_event_attr *attr = &event->attr; |
450 | struct hw_perf_event *hwc = &event->hw; | 434 | struct hw_perf_event *hwc = &event->hw; |
451 | u64 config; | 435 | u64 config; |
452 | int err; | ||
453 | |||
454 | if (!x86_pmu_initialized()) | ||
455 | return -ENODEV; | ||
456 | |||
457 | err = 0; | ||
458 | if (!atomic_inc_not_zero(&active_events)) { | ||
459 | mutex_lock(&pmc_reserve_mutex); | ||
460 | if (atomic_read(&active_events) == 0) { | ||
461 | if (!reserve_pmc_hardware()) | ||
462 | err = -EBUSY; | ||
463 | else | ||
464 | err = reserve_bts_hardware(); | ||
465 | } | ||
466 | if (!err) | ||
467 | atomic_inc(&active_events); | ||
468 | mutex_unlock(&pmc_reserve_mutex); | ||
469 | } | ||
470 | if (err) | ||
471 | return err; | ||
472 | |||
473 | event->destroy = hw_perf_event_destroy; | ||
474 | |||
475 | /* | ||
476 | * Generate PMC IRQs: | ||
477 | * (keep 'enabled' bit clear for now) | ||
478 | */ | ||
479 | hwc->config = ARCH_PERFMON_EVENTSEL_INT; | ||
480 | |||
481 | hwc->idx = -1; | ||
482 | hwc->last_cpu = -1; | ||
483 | hwc->last_tag = ~0ULL; | ||
484 | |||
485 | /* | ||
486 | * Count user and OS events unless requested not to. | ||
487 | */ | ||
488 | if (!attr->exclude_user) | ||
489 | hwc->config |= ARCH_PERFMON_EVENTSEL_USR; | ||
490 | if (!attr->exclude_kernel) | ||
491 | hwc->config |= ARCH_PERFMON_EVENTSEL_OS; | ||
492 | 436 | ||
493 | if (!hwc->sample_period) { | 437 | if (!hwc->sample_period) { |
494 | hwc->sample_period = x86_pmu.max_period; | 438 | hwc->sample_period = x86_pmu.max_period; |
@@ -505,16 +449,8 @@ static int __hw_perf_event_init(struct perf_event *event) | |||
505 | return -EOPNOTSUPP; | 449 | return -EOPNOTSUPP; |
506 | } | 450 | } |
507 | 451 | ||
508 | /* | 452 | if (attr->type == PERF_TYPE_RAW) |
509 | * Raw hw_event type provide the config in the hw_event structure | ||
510 | */ | ||
511 | if (attr->type == PERF_TYPE_RAW) { | ||
512 | hwc->config |= x86_pmu.raw_event(attr->config); | ||
513 | if ((hwc->config & ARCH_PERFMON_EVENTSEL_ANY) && | ||
514 | perf_paranoid_cpu() && !capable(CAP_SYS_ADMIN)) | ||
515 | return -EACCES; | ||
516 | return 0; | 453 | return 0; |
517 | } | ||
518 | 454 | ||
519 | if (attr->type == PERF_TYPE_HW_CACHE) | 455 | if (attr->type == PERF_TYPE_HW_CACHE) |
520 | return set_ext_hw_attr(hwc, attr); | 456 | return set_ext_hw_attr(hwc, attr); |
@@ -539,11 +475,11 @@ static int __hw_perf_event_init(struct perf_event *event) | |||
539 | if ((attr->config == PERF_COUNT_HW_BRANCH_INSTRUCTIONS) && | 475 | if ((attr->config == PERF_COUNT_HW_BRANCH_INSTRUCTIONS) && |
540 | (hwc->sample_period == 1)) { | 476 | (hwc->sample_period == 1)) { |
541 | /* BTS is not supported by this architecture. */ | 477 | /* BTS is not supported by this architecture. */ |
542 | if (!bts_available()) | 478 | if (!x86_pmu.bts) |
543 | return -EOPNOTSUPP; | 479 | return -EOPNOTSUPP; |
544 | 480 | ||
545 | /* BTS is currently only allowed for user-mode. */ | 481 | /* BTS is currently only allowed for user-mode. */ |
546 | if (hwc->config & ARCH_PERFMON_EVENTSEL_OS) | 482 | if (!attr->exclude_kernel) |
547 | return -EOPNOTSUPP; | 483 | return -EOPNOTSUPP; |
548 | } | 484 | } |
549 | 485 | ||
@@ -552,12 +488,87 @@ static int __hw_perf_event_init(struct perf_event *event) | |||
552 | return 0; | 488 | return 0; |
553 | } | 489 | } |
554 | 490 | ||
491 | static int x86_pmu_hw_config(struct perf_event *event) | ||
492 | { | ||
493 | if (event->attr.precise_ip) { | ||
494 | int precise = 0; | ||
495 | |||
496 | /* Support for constant skid */ | ||
497 | if (x86_pmu.pebs) | ||
498 | precise++; | ||
499 | |||
500 | /* Support for IP fixup */ | ||
501 | if (x86_pmu.lbr_nr) | ||
502 | precise++; | ||
503 | |||
504 | if (event->attr.precise_ip > precise) | ||
505 | return -EOPNOTSUPP; | ||
506 | } | ||
507 | |||
508 | /* | ||
509 | * Generate PMC IRQs: | ||
510 | * (keep 'enabled' bit clear for now) | ||
511 | */ | ||
512 | event->hw.config = ARCH_PERFMON_EVENTSEL_INT; | ||
513 | |||
514 | /* | ||
515 | * Count user and OS events unless requested not to | ||
516 | */ | ||
517 | if (!event->attr.exclude_user) | ||
518 | event->hw.config |= ARCH_PERFMON_EVENTSEL_USR; | ||
519 | if (!event->attr.exclude_kernel) | ||
520 | event->hw.config |= ARCH_PERFMON_EVENTSEL_OS; | ||
521 | |||
522 | if (event->attr.type == PERF_TYPE_RAW) | ||
523 | event->hw.config |= event->attr.config & X86_RAW_EVENT_MASK; | ||
524 | |||
525 | return x86_setup_perfctr(event); | ||
526 | } | ||
527 | |||
528 | /* | ||
529 | * Setup the hardware configuration for a given attr_type | ||
530 | */ | ||
531 | static int __hw_perf_event_init(struct perf_event *event) | ||
532 | { | ||
533 | int err; | ||
534 | |||
535 | if (!x86_pmu_initialized()) | ||
536 | return -ENODEV; | ||
537 | |||
538 | err = 0; | ||
539 | if (!atomic_inc_not_zero(&active_events)) { | ||
540 | mutex_lock(&pmc_reserve_mutex); | ||
541 | if (atomic_read(&active_events) == 0) { | ||
542 | if (!reserve_pmc_hardware()) | ||
543 | err = -EBUSY; | ||
544 | else { | ||
545 | err = reserve_ds_buffers(); | ||
546 | if (err) | ||
547 | release_pmc_hardware(); | ||
548 | } | ||
549 | } | ||
550 | if (!err) | ||
551 | atomic_inc(&active_events); | ||
552 | mutex_unlock(&pmc_reserve_mutex); | ||
553 | } | ||
554 | if (err) | ||
555 | return err; | ||
556 | |||
557 | event->destroy = hw_perf_event_destroy; | ||
558 | |||
559 | event->hw.idx = -1; | ||
560 | event->hw.last_cpu = -1; | ||
561 | event->hw.last_tag = ~0ULL; | ||
562 | |||
563 | return x86_pmu.hw_config(event); | ||
564 | } | ||
565 | |||
555 | static void x86_pmu_disable_all(void) | 566 | static void x86_pmu_disable_all(void) |
556 | { | 567 | { |
557 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | 568 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); |
558 | int idx; | 569 | int idx; |
559 | 570 | ||
560 | for (idx = 0; idx < x86_pmu.num_events; idx++) { | 571 | for (idx = 0; idx < x86_pmu.num_counters; idx++) { |
561 | u64 val; | 572 | u64 val; |
562 | 573 | ||
563 | if (!test_bit(idx, cpuc->active_mask)) | 574 | if (!test_bit(idx, cpuc->active_mask)) |
@@ -587,12 +598,12 @@ void hw_perf_disable(void) | |||
587 | x86_pmu.disable_all(); | 598 | x86_pmu.disable_all(); |
588 | } | 599 | } |
589 | 600 | ||
590 | static void x86_pmu_enable_all(void) | 601 | static void x86_pmu_enable_all(int added) |
591 | { | 602 | { |
592 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | 603 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); |
593 | int idx; | 604 | int idx; |
594 | 605 | ||
595 | for (idx = 0; idx < x86_pmu.num_events; idx++) { | 606 | for (idx = 0; idx < x86_pmu.num_counters; idx++) { |
596 | struct perf_event *event = cpuc->events[idx]; | 607 | struct perf_event *event = cpuc->events[idx]; |
597 | u64 val; | 608 | u64 val; |
598 | 609 | ||
@@ -667,14 +678,14 @@ static int x86_schedule_events(struct cpu_hw_events *cpuc, int n, int *assign) | |||
667 | * assign events to counters starting with most | 678 | * assign events to counters starting with most |
668 | * constrained events. | 679 | * constrained events. |
669 | */ | 680 | */ |
670 | wmax = x86_pmu.num_events; | 681 | wmax = x86_pmu.num_counters; |
671 | 682 | ||
672 | /* | 683 | /* |
673 | * when fixed event counters are present, | 684 | * when fixed event counters are present, |
674 | * wmax is incremented by 1 to account | 685 | * wmax is incremented by 1 to account |
675 | * for one more choice | 686 | * for one more choice |
676 | */ | 687 | */ |
677 | if (x86_pmu.num_events_fixed) | 688 | if (x86_pmu.num_counters_fixed) |
678 | wmax++; | 689 | wmax++; |
679 | 690 | ||
680 | for (w = 1, num = n; num && w <= wmax; w++) { | 691 | for (w = 1, num = n; num && w <= wmax; w++) { |
@@ -724,7 +735,7 @@ static int collect_events(struct cpu_hw_events *cpuc, struct perf_event *leader, | |||
724 | struct perf_event *event; | 735 | struct perf_event *event; |
725 | int n, max_count; | 736 | int n, max_count; |
726 | 737 | ||
727 | max_count = x86_pmu.num_events + x86_pmu.num_events_fixed; | 738 | max_count = x86_pmu.num_counters + x86_pmu.num_counters_fixed; |
728 | 739 | ||
729 | /* current number of events already accepted */ | 740 | /* current number of events already accepted */ |
730 | n = cpuc->n_events; | 741 | n = cpuc->n_events; |
@@ -795,7 +806,7 @@ void hw_perf_enable(void) | |||
795 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | 806 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); |
796 | struct perf_event *event; | 807 | struct perf_event *event; |
797 | struct hw_perf_event *hwc; | 808 | struct hw_perf_event *hwc; |
798 | int i; | 809 | int i, added = cpuc->n_added; |
799 | 810 | ||
800 | if (!x86_pmu_initialized()) | 811 | if (!x86_pmu_initialized()) |
801 | return; | 812 | return; |
@@ -847,19 +858,20 @@ void hw_perf_enable(void) | |||
847 | cpuc->enabled = 1; | 858 | cpuc->enabled = 1; |
848 | barrier(); | 859 | barrier(); |
849 | 860 | ||
850 | x86_pmu.enable_all(); | 861 | x86_pmu.enable_all(added); |
851 | } | 862 | } |
852 | 863 | ||
853 | static inline void __x86_pmu_enable_event(struct hw_perf_event *hwc) | 864 | static inline void __x86_pmu_enable_event(struct hw_perf_event *hwc, |
865 | u64 enable_mask) | ||
854 | { | 866 | { |
855 | (void)checking_wrmsrl(hwc->config_base + hwc->idx, | 867 | wrmsrl(hwc->config_base + hwc->idx, hwc->config | enable_mask); |
856 | hwc->config | ARCH_PERFMON_EVENTSEL_ENABLE); | ||
857 | } | 868 | } |
858 | 869 | ||
859 | static inline void x86_pmu_disable_event(struct perf_event *event) | 870 | static inline void x86_pmu_disable_event(struct perf_event *event) |
860 | { | 871 | { |
861 | struct hw_perf_event *hwc = &event->hw; | 872 | struct hw_perf_event *hwc = &event->hw; |
862 | (void)checking_wrmsrl(hwc->config_base + hwc->idx, hwc->config); | 873 | |
874 | wrmsrl(hwc->config_base + hwc->idx, hwc->config); | ||
863 | } | 875 | } |
864 | 876 | ||
865 | static DEFINE_PER_CPU(u64 [X86_PMC_IDX_MAX], pmc_prev_left); | 877 | static DEFINE_PER_CPU(u64 [X86_PMC_IDX_MAX], pmc_prev_left); |
@@ -874,7 +886,7 @@ x86_perf_event_set_period(struct perf_event *event) | |||
874 | struct hw_perf_event *hwc = &event->hw; | 886 | struct hw_perf_event *hwc = &event->hw; |
875 | s64 left = atomic64_read(&hwc->period_left); | 887 | s64 left = atomic64_read(&hwc->period_left); |
876 | s64 period = hwc->sample_period; | 888 | s64 period = hwc->sample_period; |
877 | int err, ret = 0, idx = hwc->idx; | 889 | int ret = 0, idx = hwc->idx; |
878 | 890 | ||
879 | if (idx == X86_PMC_IDX_FIXED_BTS) | 891 | if (idx == X86_PMC_IDX_FIXED_BTS) |
880 | return 0; | 892 | return 0; |
@@ -912,8 +924,8 @@ x86_perf_event_set_period(struct perf_event *event) | |||
912 | */ | 924 | */ |
913 | atomic64_set(&hwc->prev_count, (u64)-left); | 925 | atomic64_set(&hwc->prev_count, (u64)-left); |
914 | 926 | ||
915 | err = checking_wrmsrl(hwc->event_base + idx, | 927 | wrmsrl(hwc->event_base + idx, |
916 | (u64)(-left) & x86_pmu.event_mask); | 928 | (u64)(-left) & x86_pmu.cntval_mask); |
917 | 929 | ||
918 | perf_event_update_userpage(event); | 930 | perf_event_update_userpage(event); |
919 | 931 | ||
@@ -924,7 +936,8 @@ static void x86_pmu_enable_event(struct perf_event *event) | |||
924 | { | 936 | { |
925 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | 937 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); |
926 | if (cpuc->enabled) | 938 | if (cpuc->enabled) |
927 | __x86_pmu_enable_event(&event->hw); | 939 | __x86_pmu_enable_event(&event->hw, |
940 | ARCH_PERFMON_EVENTSEL_ENABLE); | ||
928 | } | 941 | } |
929 | 942 | ||
930 | /* | 943 | /* |
@@ -950,7 +963,15 @@ static int x86_pmu_enable(struct perf_event *event) | |||
950 | if (n < 0) | 963 | if (n < 0) |
951 | return n; | 964 | return n; |
952 | 965 | ||
953 | ret = x86_schedule_events(cpuc, n, assign); | 966 | /* |
967 | * If group events scheduling transaction was started, | ||
968 | * skip the schedulability test here, it will be peformed | ||
969 | * at commit time(->commit_txn) as a whole | ||
970 | */ | ||
971 | if (cpuc->group_flag & PERF_EVENT_TXN_STARTED) | ||
972 | goto out; | ||
973 | |||
974 | ret = x86_pmu.schedule_events(cpuc, n, assign); | ||
954 | if (ret) | 975 | if (ret) |
955 | return ret; | 976 | return ret; |
956 | /* | 977 | /* |
@@ -959,6 +980,7 @@ static int x86_pmu_enable(struct perf_event *event) | |||
959 | */ | 980 | */ |
960 | memcpy(cpuc->assign, assign, n*sizeof(int)); | 981 | memcpy(cpuc->assign, assign, n*sizeof(int)); |
961 | 982 | ||
983 | out: | ||
962 | cpuc->n_events = n; | 984 | cpuc->n_events = n; |
963 | cpuc->n_added += n - n0; | 985 | cpuc->n_added += n - n0; |
964 | 986 | ||
@@ -991,11 +1013,12 @@ static void x86_pmu_unthrottle(struct perf_event *event) | |||
991 | void perf_event_print_debug(void) | 1013 | void perf_event_print_debug(void) |
992 | { | 1014 | { |
993 | u64 ctrl, status, overflow, pmc_ctrl, pmc_count, prev_left, fixed; | 1015 | u64 ctrl, status, overflow, pmc_ctrl, pmc_count, prev_left, fixed; |
1016 | u64 pebs; | ||
994 | struct cpu_hw_events *cpuc; | 1017 | struct cpu_hw_events *cpuc; |
995 | unsigned long flags; | 1018 | unsigned long flags; |
996 | int cpu, idx; | 1019 | int cpu, idx; |
997 | 1020 | ||
998 | if (!x86_pmu.num_events) | 1021 | if (!x86_pmu.num_counters) |
999 | return; | 1022 | return; |
1000 | 1023 | ||
1001 | local_irq_save(flags); | 1024 | local_irq_save(flags); |
@@ -1008,16 +1031,18 @@ void perf_event_print_debug(void) | |||
1008 | rdmsrl(MSR_CORE_PERF_GLOBAL_STATUS, status); | 1031 | rdmsrl(MSR_CORE_PERF_GLOBAL_STATUS, status); |
1009 | rdmsrl(MSR_CORE_PERF_GLOBAL_OVF_CTRL, overflow); | 1032 | rdmsrl(MSR_CORE_PERF_GLOBAL_OVF_CTRL, overflow); |
1010 | rdmsrl(MSR_ARCH_PERFMON_FIXED_CTR_CTRL, fixed); | 1033 | rdmsrl(MSR_ARCH_PERFMON_FIXED_CTR_CTRL, fixed); |
1034 | rdmsrl(MSR_IA32_PEBS_ENABLE, pebs); | ||
1011 | 1035 | ||
1012 | pr_info("\n"); | 1036 | pr_info("\n"); |
1013 | pr_info("CPU#%d: ctrl: %016llx\n", cpu, ctrl); | 1037 | pr_info("CPU#%d: ctrl: %016llx\n", cpu, ctrl); |
1014 | pr_info("CPU#%d: status: %016llx\n", cpu, status); | 1038 | pr_info("CPU#%d: status: %016llx\n", cpu, status); |
1015 | pr_info("CPU#%d: overflow: %016llx\n", cpu, overflow); | 1039 | pr_info("CPU#%d: overflow: %016llx\n", cpu, overflow); |
1016 | pr_info("CPU#%d: fixed: %016llx\n", cpu, fixed); | 1040 | pr_info("CPU#%d: fixed: %016llx\n", cpu, fixed); |
1041 | pr_info("CPU#%d: pebs: %016llx\n", cpu, pebs); | ||
1017 | } | 1042 | } |
1018 | pr_info("CPU#%d: active: %016llx\n", cpu, *(u64 *)cpuc->active_mask); | 1043 | pr_info("CPU#%d: active: %016llx\n", cpu, *(u64 *)cpuc->active_mask); |
1019 | 1044 | ||
1020 | for (idx = 0; idx < x86_pmu.num_events; idx++) { | 1045 | for (idx = 0; idx < x86_pmu.num_counters; idx++) { |
1021 | rdmsrl(x86_pmu.eventsel + idx, pmc_ctrl); | 1046 | rdmsrl(x86_pmu.eventsel + idx, pmc_ctrl); |
1022 | rdmsrl(x86_pmu.perfctr + idx, pmc_count); | 1047 | rdmsrl(x86_pmu.perfctr + idx, pmc_count); |
1023 | 1048 | ||
@@ -1030,7 +1055,7 @@ void perf_event_print_debug(void) | |||
1030 | pr_info("CPU#%d: gen-PMC%d left: %016llx\n", | 1055 | pr_info("CPU#%d: gen-PMC%d left: %016llx\n", |
1031 | cpu, idx, prev_left); | 1056 | cpu, idx, prev_left); |
1032 | } | 1057 | } |
1033 | for (idx = 0; idx < x86_pmu.num_events_fixed; idx++) { | 1058 | for (idx = 0; idx < x86_pmu.num_counters_fixed; idx++) { |
1034 | rdmsrl(MSR_ARCH_PERFMON_FIXED_CTR0 + idx, pmc_count); | 1059 | rdmsrl(MSR_ARCH_PERFMON_FIXED_CTR0 + idx, pmc_count); |
1035 | 1060 | ||
1036 | pr_info("CPU#%d: fixed-PMC%d count: %016llx\n", | 1061 | pr_info("CPU#%d: fixed-PMC%d count: %016llx\n", |
@@ -1095,7 +1120,7 @@ static int x86_pmu_handle_irq(struct pt_regs *regs) | |||
1095 | 1120 | ||
1096 | cpuc = &__get_cpu_var(cpu_hw_events); | 1121 | cpuc = &__get_cpu_var(cpu_hw_events); |
1097 | 1122 | ||
1098 | for (idx = 0; idx < x86_pmu.num_events; idx++) { | 1123 | for (idx = 0; idx < x86_pmu.num_counters; idx++) { |
1099 | if (!test_bit(idx, cpuc->active_mask)) | 1124 | if (!test_bit(idx, cpuc->active_mask)) |
1100 | continue; | 1125 | continue; |
1101 | 1126 | ||
@@ -1103,7 +1128,7 @@ static int x86_pmu_handle_irq(struct pt_regs *regs) | |||
1103 | hwc = &event->hw; | 1128 | hwc = &event->hw; |
1104 | 1129 | ||
1105 | val = x86_perf_event_update(event); | 1130 | val = x86_perf_event_update(event); |
1106 | if (val & (1ULL << (x86_pmu.event_bits - 1))) | 1131 | if (val & (1ULL << (x86_pmu.cntval_bits - 1))) |
1107 | continue; | 1132 | continue; |
1108 | 1133 | ||
1109 | /* | 1134 | /* |
@@ -1146,7 +1171,6 @@ void set_perf_event_pending(void) | |||
1146 | 1171 | ||
1147 | void perf_events_lapic_init(void) | 1172 | void perf_events_lapic_init(void) |
1148 | { | 1173 | { |
1149 | #ifdef CONFIG_X86_LOCAL_APIC | ||
1150 | if (!x86_pmu.apic || !x86_pmu_initialized()) | 1174 | if (!x86_pmu.apic || !x86_pmu_initialized()) |
1151 | return; | 1175 | return; |
1152 | 1176 | ||
@@ -1154,7 +1178,6 @@ void perf_events_lapic_init(void) | |||
1154 | * Always use NMI for PMU | 1178 | * Always use NMI for PMU |
1155 | */ | 1179 | */ |
1156 | apic_write(APIC_LVTPC, APIC_DM_NMI); | 1180 | apic_write(APIC_LVTPC, APIC_DM_NMI); |
1157 | #endif | ||
1158 | } | 1181 | } |
1159 | 1182 | ||
1160 | static int __kprobes | 1183 | static int __kprobes |
@@ -1178,9 +1201,7 @@ perf_event_nmi_handler(struct notifier_block *self, | |||
1178 | 1201 | ||
1179 | regs = args->regs; | 1202 | regs = args->regs; |
1180 | 1203 | ||
1181 | #ifdef CONFIG_X86_LOCAL_APIC | ||
1182 | apic_write(APIC_LVTPC, APIC_DM_NMI); | 1204 | apic_write(APIC_LVTPC, APIC_DM_NMI); |
1183 | #endif | ||
1184 | /* | 1205 | /* |
1185 | * Can't rely on the handled return value to say it was our NMI, two | 1206 | * Can't rely on the handled return value to say it was our NMI, two |
1186 | * events could trigger 'simultaneously' raising two back-to-back NMIs. | 1207 | * events could trigger 'simultaneously' raising two back-to-back NMIs. |
@@ -1217,118 +1238,11 @@ x86_get_event_constraints(struct cpu_hw_events *cpuc, struct perf_event *event) | |||
1217 | return &unconstrained; | 1238 | return &unconstrained; |
1218 | } | 1239 | } |
1219 | 1240 | ||
1220 | static int x86_event_sched_in(struct perf_event *event, | ||
1221 | struct perf_cpu_context *cpuctx) | ||
1222 | { | ||
1223 | int ret = 0; | ||
1224 | |||
1225 | event->state = PERF_EVENT_STATE_ACTIVE; | ||
1226 | event->oncpu = smp_processor_id(); | ||
1227 | event->tstamp_running += event->ctx->time - event->tstamp_stopped; | ||
1228 | |||
1229 | if (!is_x86_event(event)) | ||
1230 | ret = event->pmu->enable(event); | ||
1231 | |||
1232 | if (!ret && !is_software_event(event)) | ||
1233 | cpuctx->active_oncpu++; | ||
1234 | |||
1235 | if (!ret && event->attr.exclusive) | ||
1236 | cpuctx->exclusive = 1; | ||
1237 | |||
1238 | return ret; | ||
1239 | } | ||
1240 | |||
1241 | static void x86_event_sched_out(struct perf_event *event, | ||
1242 | struct perf_cpu_context *cpuctx) | ||
1243 | { | ||
1244 | event->state = PERF_EVENT_STATE_INACTIVE; | ||
1245 | event->oncpu = -1; | ||
1246 | |||
1247 | if (!is_x86_event(event)) | ||
1248 | event->pmu->disable(event); | ||
1249 | |||
1250 | event->tstamp_running -= event->ctx->time - event->tstamp_stopped; | ||
1251 | |||
1252 | if (!is_software_event(event)) | ||
1253 | cpuctx->active_oncpu--; | ||
1254 | |||
1255 | if (event->attr.exclusive || !cpuctx->active_oncpu) | ||
1256 | cpuctx->exclusive = 0; | ||
1257 | } | ||
1258 | |||
1259 | /* | ||
1260 | * Called to enable a whole group of events. | ||
1261 | * Returns 1 if the group was enabled, or -EAGAIN if it could not be. | ||
1262 | * Assumes the caller has disabled interrupts and has | ||
1263 | * frozen the PMU with hw_perf_save_disable. | ||
1264 | * | ||
1265 | * called with PMU disabled. If successful and return value 1, | ||
1266 | * then guaranteed to call perf_enable() and hw_perf_enable() | ||
1267 | */ | ||
1268 | int hw_perf_group_sched_in(struct perf_event *leader, | ||
1269 | struct perf_cpu_context *cpuctx, | ||
1270 | struct perf_event_context *ctx) | ||
1271 | { | ||
1272 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
1273 | struct perf_event *sub; | ||
1274 | int assign[X86_PMC_IDX_MAX]; | ||
1275 | int n0, n1, ret; | ||
1276 | |||
1277 | /* n0 = total number of events */ | ||
1278 | n0 = collect_events(cpuc, leader, true); | ||
1279 | if (n0 < 0) | ||
1280 | return n0; | ||
1281 | |||
1282 | ret = x86_schedule_events(cpuc, n0, assign); | ||
1283 | if (ret) | ||
1284 | return ret; | ||
1285 | |||
1286 | ret = x86_event_sched_in(leader, cpuctx); | ||
1287 | if (ret) | ||
1288 | return ret; | ||
1289 | |||
1290 | n1 = 1; | ||
1291 | list_for_each_entry(sub, &leader->sibling_list, group_entry) { | ||
1292 | if (sub->state > PERF_EVENT_STATE_OFF) { | ||
1293 | ret = x86_event_sched_in(sub, cpuctx); | ||
1294 | if (ret) | ||
1295 | goto undo; | ||
1296 | ++n1; | ||
1297 | } | ||
1298 | } | ||
1299 | /* | ||
1300 | * copy new assignment, now we know it is possible | ||
1301 | * will be used by hw_perf_enable() | ||
1302 | */ | ||
1303 | memcpy(cpuc->assign, assign, n0*sizeof(int)); | ||
1304 | |||
1305 | cpuc->n_events = n0; | ||
1306 | cpuc->n_added += n1; | ||
1307 | ctx->nr_active += n1; | ||
1308 | |||
1309 | /* | ||
1310 | * 1 means successful and events are active | ||
1311 | * This is not quite true because we defer | ||
1312 | * actual activation until hw_perf_enable() but | ||
1313 | * this way we* ensure caller won't try to enable | ||
1314 | * individual events | ||
1315 | */ | ||
1316 | return 1; | ||
1317 | undo: | ||
1318 | x86_event_sched_out(leader, cpuctx); | ||
1319 | n0 = 1; | ||
1320 | list_for_each_entry(sub, &leader->sibling_list, group_entry) { | ||
1321 | if (sub->state == PERF_EVENT_STATE_ACTIVE) { | ||
1322 | x86_event_sched_out(sub, cpuctx); | ||
1323 | if (++n0 == n1) | ||
1324 | break; | ||
1325 | } | ||
1326 | } | ||
1327 | return ret; | ||
1328 | } | ||
1329 | |||
1330 | #include "perf_event_amd.c" | 1241 | #include "perf_event_amd.c" |
1331 | #include "perf_event_p6.c" | 1242 | #include "perf_event_p6.c" |
1243 | #include "perf_event_p4.c" | ||
1244 | #include "perf_event_intel_lbr.c" | ||
1245 | #include "perf_event_intel_ds.c" | ||
1332 | #include "perf_event_intel.c" | 1246 | #include "perf_event_intel.c" |
1333 | 1247 | ||
1334 | static int __cpuinit | 1248 | static int __cpuinit |
@@ -1402,48 +1316,50 @@ void __init init_hw_perf_events(void) | |||
1402 | 1316 | ||
1403 | pr_cont("%s PMU driver.\n", x86_pmu.name); | 1317 | pr_cont("%s PMU driver.\n", x86_pmu.name); |
1404 | 1318 | ||
1405 | if (x86_pmu.num_events > X86_PMC_MAX_GENERIC) { | 1319 | if (x86_pmu.quirks) |
1320 | x86_pmu.quirks(); | ||
1321 | |||
1322 | if (x86_pmu.num_counters > X86_PMC_MAX_GENERIC) { | ||
1406 | WARN(1, KERN_ERR "hw perf events %d > max(%d), clipping!", | 1323 | WARN(1, KERN_ERR "hw perf events %d > max(%d), clipping!", |
1407 | x86_pmu.num_events, X86_PMC_MAX_GENERIC); | 1324 | x86_pmu.num_counters, X86_PMC_MAX_GENERIC); |
1408 | x86_pmu.num_events = X86_PMC_MAX_GENERIC; | 1325 | x86_pmu.num_counters = X86_PMC_MAX_GENERIC; |
1409 | } | 1326 | } |
1410 | perf_event_mask = (1 << x86_pmu.num_events) - 1; | 1327 | x86_pmu.intel_ctrl = (1 << x86_pmu.num_counters) - 1; |
1411 | perf_max_events = x86_pmu.num_events; | 1328 | perf_max_events = x86_pmu.num_counters; |
1412 | 1329 | ||
1413 | if (x86_pmu.num_events_fixed > X86_PMC_MAX_FIXED) { | 1330 | if (x86_pmu.num_counters_fixed > X86_PMC_MAX_FIXED) { |
1414 | WARN(1, KERN_ERR "hw perf events fixed %d > max(%d), clipping!", | 1331 | WARN(1, KERN_ERR "hw perf events fixed %d > max(%d), clipping!", |
1415 | x86_pmu.num_events_fixed, X86_PMC_MAX_FIXED); | 1332 | x86_pmu.num_counters_fixed, X86_PMC_MAX_FIXED); |
1416 | x86_pmu.num_events_fixed = X86_PMC_MAX_FIXED; | 1333 | x86_pmu.num_counters_fixed = X86_PMC_MAX_FIXED; |
1417 | } | 1334 | } |
1418 | 1335 | ||
1419 | perf_event_mask |= | 1336 | x86_pmu.intel_ctrl |= |
1420 | ((1LL << x86_pmu.num_events_fixed)-1) << X86_PMC_IDX_FIXED; | 1337 | ((1LL << x86_pmu.num_counters_fixed)-1) << X86_PMC_IDX_FIXED; |
1421 | x86_pmu.intel_ctrl = perf_event_mask; | ||
1422 | 1338 | ||
1423 | perf_events_lapic_init(); | 1339 | perf_events_lapic_init(); |
1424 | register_die_notifier(&perf_event_nmi_notifier); | 1340 | register_die_notifier(&perf_event_nmi_notifier); |
1425 | 1341 | ||
1426 | unconstrained = (struct event_constraint) | 1342 | unconstrained = (struct event_constraint) |
1427 | __EVENT_CONSTRAINT(0, (1ULL << x86_pmu.num_events) - 1, | 1343 | __EVENT_CONSTRAINT(0, (1ULL << x86_pmu.num_counters) - 1, |
1428 | 0, x86_pmu.num_events); | 1344 | 0, x86_pmu.num_counters); |
1429 | 1345 | ||
1430 | if (x86_pmu.event_constraints) { | 1346 | if (x86_pmu.event_constraints) { |
1431 | for_each_event_constraint(c, x86_pmu.event_constraints) { | 1347 | for_each_event_constraint(c, x86_pmu.event_constraints) { |
1432 | if (c->cmask != INTEL_ARCH_FIXED_MASK) | 1348 | if (c->cmask != X86_RAW_EVENT_MASK) |
1433 | continue; | 1349 | continue; |
1434 | 1350 | ||
1435 | c->idxmsk64 |= (1ULL << x86_pmu.num_events) - 1; | 1351 | c->idxmsk64 |= (1ULL << x86_pmu.num_counters) - 1; |
1436 | c->weight += x86_pmu.num_events; | 1352 | c->weight += x86_pmu.num_counters; |
1437 | } | 1353 | } |
1438 | } | 1354 | } |
1439 | 1355 | ||
1440 | pr_info("... version: %d\n", x86_pmu.version); | 1356 | pr_info("... version: %d\n", x86_pmu.version); |
1441 | pr_info("... bit width: %d\n", x86_pmu.event_bits); | 1357 | pr_info("... bit width: %d\n", x86_pmu.cntval_bits); |
1442 | pr_info("... generic registers: %d\n", x86_pmu.num_events); | 1358 | pr_info("... generic registers: %d\n", x86_pmu.num_counters); |
1443 | pr_info("... value mask: %016Lx\n", x86_pmu.event_mask); | 1359 | pr_info("... value mask: %016Lx\n", x86_pmu.cntval_mask); |
1444 | pr_info("... max period: %016Lx\n", x86_pmu.max_period); | 1360 | pr_info("... max period: %016Lx\n", x86_pmu.max_period); |
1445 | pr_info("... fixed-purpose events: %d\n", x86_pmu.num_events_fixed); | 1361 | pr_info("... fixed-purpose events: %d\n", x86_pmu.num_counters_fixed); |
1446 | pr_info("... event mask: %016Lx\n", perf_event_mask); | 1362 | pr_info("... event mask: %016Lx\n", x86_pmu.intel_ctrl); |
1447 | 1363 | ||
1448 | perf_cpu_notifier(x86_pmu_notifier); | 1364 | perf_cpu_notifier(x86_pmu_notifier); |
1449 | } | 1365 | } |
@@ -1453,6 +1369,59 @@ static inline void x86_pmu_read(struct perf_event *event) | |||
1453 | x86_perf_event_update(event); | 1369 | x86_perf_event_update(event); |
1454 | } | 1370 | } |
1455 | 1371 | ||
1372 | /* | ||
1373 | * Start group events scheduling transaction | ||
1374 | * Set the flag to make pmu::enable() not perform the | ||
1375 | * schedulability test, it will be performed at commit time | ||
1376 | */ | ||
1377 | static void x86_pmu_start_txn(const struct pmu *pmu) | ||
1378 | { | ||
1379 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
1380 | |||
1381 | cpuc->group_flag |= PERF_EVENT_TXN_STARTED; | ||
1382 | } | ||
1383 | |||
1384 | /* | ||
1385 | * Stop group events scheduling transaction | ||
1386 | * Clear the flag and pmu::enable() will perform the | ||
1387 | * schedulability test. | ||
1388 | */ | ||
1389 | static void x86_pmu_cancel_txn(const struct pmu *pmu) | ||
1390 | { | ||
1391 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
1392 | |||
1393 | cpuc->group_flag &= ~PERF_EVENT_TXN_STARTED; | ||
1394 | } | ||
1395 | |||
1396 | /* | ||
1397 | * Commit group events scheduling transaction | ||
1398 | * Perform the group schedulability test as a whole | ||
1399 | * Return 0 if success | ||
1400 | */ | ||
1401 | static int x86_pmu_commit_txn(const struct pmu *pmu) | ||
1402 | { | ||
1403 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
1404 | int assign[X86_PMC_IDX_MAX]; | ||
1405 | int n, ret; | ||
1406 | |||
1407 | n = cpuc->n_events; | ||
1408 | |||
1409 | if (!x86_pmu_initialized()) | ||
1410 | return -EAGAIN; | ||
1411 | |||
1412 | ret = x86_pmu.schedule_events(cpuc, n, assign); | ||
1413 | if (ret) | ||
1414 | return ret; | ||
1415 | |||
1416 | /* | ||
1417 | * copy new assignment, now we know it is possible | ||
1418 | * will be used by hw_perf_enable() | ||
1419 | */ | ||
1420 | memcpy(cpuc->assign, assign, n*sizeof(int)); | ||
1421 | |||
1422 | return 0; | ||
1423 | } | ||
1424 | |||
1456 | static const struct pmu pmu = { | 1425 | static const struct pmu pmu = { |
1457 | .enable = x86_pmu_enable, | 1426 | .enable = x86_pmu_enable, |
1458 | .disable = x86_pmu_disable, | 1427 | .disable = x86_pmu_disable, |
@@ -1460,9 +1429,38 @@ static const struct pmu pmu = { | |||
1460 | .stop = x86_pmu_stop, | 1429 | .stop = x86_pmu_stop, |
1461 | .read = x86_pmu_read, | 1430 | .read = x86_pmu_read, |
1462 | .unthrottle = x86_pmu_unthrottle, | 1431 | .unthrottle = x86_pmu_unthrottle, |
1432 | .start_txn = x86_pmu_start_txn, | ||
1433 | .cancel_txn = x86_pmu_cancel_txn, | ||
1434 | .commit_txn = x86_pmu_commit_txn, | ||
1463 | }; | 1435 | }; |
1464 | 1436 | ||
1465 | /* | 1437 | /* |
1438 | * validate that we can schedule this event | ||
1439 | */ | ||
1440 | static int validate_event(struct perf_event *event) | ||
1441 | { | ||
1442 | struct cpu_hw_events *fake_cpuc; | ||
1443 | struct event_constraint *c; | ||
1444 | int ret = 0; | ||
1445 | |||
1446 | fake_cpuc = kmalloc(sizeof(*fake_cpuc), GFP_KERNEL | __GFP_ZERO); | ||
1447 | if (!fake_cpuc) | ||
1448 | return -ENOMEM; | ||
1449 | |||
1450 | c = x86_pmu.get_event_constraints(fake_cpuc, event); | ||
1451 | |||
1452 | if (!c || !c->weight) | ||
1453 | ret = -ENOSPC; | ||
1454 | |||
1455 | if (x86_pmu.put_event_constraints) | ||
1456 | x86_pmu.put_event_constraints(fake_cpuc, event); | ||
1457 | |||
1458 | kfree(fake_cpuc); | ||
1459 | |||
1460 | return ret; | ||
1461 | } | ||
1462 | |||
1463 | /* | ||
1466 | * validate a single event group | 1464 | * validate a single event group |
1467 | * | 1465 | * |
1468 | * validation include: | 1466 | * validation include: |
@@ -1502,7 +1500,7 @@ static int validate_group(struct perf_event *event) | |||
1502 | 1500 | ||
1503 | fake_cpuc->n_events = n; | 1501 | fake_cpuc->n_events = n; |
1504 | 1502 | ||
1505 | ret = x86_schedule_events(fake_cpuc, n, NULL); | 1503 | ret = x86_pmu.schedule_events(fake_cpuc, n, NULL); |
1506 | 1504 | ||
1507 | out_free: | 1505 | out_free: |
1508 | kfree(fake_cpuc); | 1506 | kfree(fake_cpuc); |
@@ -1527,6 +1525,8 @@ const struct pmu *hw_perf_event_init(struct perf_event *event) | |||
1527 | 1525 | ||
1528 | if (event->group_leader != event) | 1526 | if (event->group_leader != event) |
1529 | err = validate_group(event); | 1527 | err = validate_group(event); |
1528 | else | ||
1529 | err = validate_event(event); | ||
1530 | 1530 | ||
1531 | event->pmu = tmp; | 1531 | event->pmu = tmp; |
1532 | } | 1532 | } |
@@ -1574,8 +1574,7 @@ static void backtrace_address(void *data, unsigned long addr, int reliable) | |||
1574 | { | 1574 | { |
1575 | struct perf_callchain_entry *entry = data; | 1575 | struct perf_callchain_entry *entry = data; |
1576 | 1576 | ||
1577 | if (reliable) | 1577 | callchain_store(entry, addr); |
1578 | callchain_store(entry, addr); | ||
1579 | } | 1578 | } |
1580 | 1579 | ||
1581 | static const struct stacktrace_ops backtrace_ops = { | 1580 | static const struct stacktrace_ops backtrace_ops = { |
@@ -1597,41 +1596,6 @@ perf_callchain_kernel(struct pt_regs *regs, struct perf_callchain_entry *entry) | |||
1597 | dump_trace(NULL, regs, NULL, regs->bp, &backtrace_ops, entry); | 1596 | dump_trace(NULL, regs, NULL, regs->bp, &backtrace_ops, entry); |
1598 | } | 1597 | } |
1599 | 1598 | ||
1600 | /* | ||
1601 | * best effort, GUP based copy_from_user() that assumes IRQ or NMI context | ||
1602 | */ | ||
1603 | static unsigned long | ||
1604 | copy_from_user_nmi(void *to, const void __user *from, unsigned long n) | ||
1605 | { | ||
1606 | unsigned long offset, addr = (unsigned long)from; | ||
1607 | int type = in_nmi() ? KM_NMI : KM_IRQ0; | ||
1608 | unsigned long size, len = 0; | ||
1609 | struct page *page; | ||
1610 | void *map; | ||
1611 | int ret; | ||
1612 | |||
1613 | do { | ||
1614 | ret = __get_user_pages_fast(addr, 1, 0, &page); | ||
1615 | if (!ret) | ||
1616 | break; | ||
1617 | |||
1618 | offset = addr & (PAGE_SIZE - 1); | ||
1619 | size = min(PAGE_SIZE - offset, n - len); | ||
1620 | |||
1621 | map = kmap_atomic(page, type); | ||
1622 | memcpy(to, map+offset, size); | ||
1623 | kunmap_atomic(map, type); | ||
1624 | put_page(page); | ||
1625 | |||
1626 | len += size; | ||
1627 | to += size; | ||
1628 | addr += size; | ||
1629 | |||
1630 | } while (len < n); | ||
1631 | |||
1632 | return len; | ||
1633 | } | ||
1634 | |||
1635 | #ifdef CONFIG_COMPAT | 1599 | #ifdef CONFIG_COMPAT |
1636 | static inline int | 1600 | static inline int |
1637 | perf_callchain_user32(struct pt_regs *regs, struct perf_callchain_entry *entry) | 1601 | perf_callchain_user32(struct pt_regs *regs, struct perf_callchain_entry *entry) |
@@ -1727,6 +1691,11 @@ struct perf_callchain_entry *perf_callchain(struct pt_regs *regs) | |||
1727 | { | 1691 | { |
1728 | struct perf_callchain_entry *entry; | 1692 | struct perf_callchain_entry *entry; |
1729 | 1693 | ||
1694 | if (perf_guest_cbs && perf_guest_cbs->is_in_guest()) { | ||
1695 | /* TODO: We don't support guest os callchain now */ | ||
1696 | return NULL; | ||
1697 | } | ||
1698 | |||
1730 | if (in_nmi()) | 1699 | if (in_nmi()) |
1731 | entry = &__get_cpu_var(pmc_nmi_entry); | 1700 | entry = &__get_cpu_var(pmc_nmi_entry); |
1732 | else | 1701 | else |
@@ -1750,3 +1719,37 @@ void perf_arch_fetch_caller_regs(struct pt_regs *regs, unsigned long ip, int ski | |||
1750 | regs->cs = __KERNEL_CS; | 1719 | regs->cs = __KERNEL_CS; |
1751 | local_save_flags(regs->flags); | 1720 | local_save_flags(regs->flags); |
1752 | } | 1721 | } |
1722 | |||
1723 | unsigned long perf_instruction_pointer(struct pt_regs *regs) | ||
1724 | { | ||
1725 | unsigned long ip; | ||
1726 | |||
1727 | if (perf_guest_cbs && perf_guest_cbs->is_in_guest()) | ||
1728 | ip = perf_guest_cbs->get_guest_ip(); | ||
1729 | else | ||
1730 | ip = instruction_pointer(regs); | ||
1731 | |||
1732 | return ip; | ||
1733 | } | ||
1734 | |||
1735 | unsigned long perf_misc_flags(struct pt_regs *regs) | ||
1736 | { | ||
1737 | int misc = 0; | ||
1738 | |||
1739 | if (perf_guest_cbs && perf_guest_cbs->is_in_guest()) { | ||
1740 | if (perf_guest_cbs->is_user_mode()) | ||
1741 | misc |= PERF_RECORD_MISC_GUEST_USER; | ||
1742 | else | ||
1743 | misc |= PERF_RECORD_MISC_GUEST_KERNEL; | ||
1744 | } else { | ||
1745 | if (user_mode(regs)) | ||
1746 | misc |= PERF_RECORD_MISC_USER; | ||
1747 | else | ||
1748 | misc |= PERF_RECORD_MISC_KERNEL; | ||
1749 | } | ||
1750 | |||
1751 | if (regs->flags & PERF_EFLAGS_EXACT) | ||
1752 | misc |= PERF_RECORD_MISC_EXACT_IP; | ||
1753 | |||
1754 | return misc; | ||
1755 | } | ||
diff --git a/arch/x86/kernel/cpu/perf_event_amd.c b/arch/x86/kernel/cpu/perf_event_amd.c index db6f7d4056e1..611df11ba15e 100644 --- a/arch/x86/kernel/cpu/perf_event_amd.c +++ b/arch/x86/kernel/cpu/perf_event_amd.c | |||
@@ -2,7 +2,7 @@ | |||
2 | 2 | ||
3 | static DEFINE_RAW_SPINLOCK(amd_nb_lock); | 3 | static DEFINE_RAW_SPINLOCK(amd_nb_lock); |
4 | 4 | ||
5 | static __initconst u64 amd_hw_cache_event_ids | 5 | static __initconst const u64 amd_hw_cache_event_ids |
6 | [PERF_COUNT_HW_CACHE_MAX] | 6 | [PERF_COUNT_HW_CACHE_MAX] |
7 | [PERF_COUNT_HW_CACHE_OP_MAX] | 7 | [PERF_COUNT_HW_CACHE_OP_MAX] |
8 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = | 8 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = |
@@ -111,22 +111,19 @@ static u64 amd_pmu_event_map(int hw_event) | |||
111 | return amd_perfmon_event_map[hw_event]; | 111 | return amd_perfmon_event_map[hw_event]; |
112 | } | 112 | } |
113 | 113 | ||
114 | static u64 amd_pmu_raw_event(u64 hw_event) | 114 | static int amd_pmu_hw_config(struct perf_event *event) |
115 | { | 115 | { |
116 | #define K7_EVNTSEL_EVENT_MASK 0xF000000FFULL | 116 | int ret = x86_pmu_hw_config(event); |
117 | #define K7_EVNTSEL_UNIT_MASK 0x00000FF00ULL | 117 | |
118 | #define K7_EVNTSEL_EDGE_MASK 0x000040000ULL | 118 | if (ret) |
119 | #define K7_EVNTSEL_INV_MASK 0x000800000ULL | 119 | return ret; |
120 | #define K7_EVNTSEL_REG_MASK 0x0FF000000ULL | 120 | |
121 | 121 | if (event->attr.type != PERF_TYPE_RAW) | |
122 | #define K7_EVNTSEL_MASK \ | 122 | return 0; |
123 | (K7_EVNTSEL_EVENT_MASK | \ | 123 | |
124 | K7_EVNTSEL_UNIT_MASK | \ | 124 | event->hw.config |= event->attr.config & AMD64_RAW_EVENT_MASK; |
125 | K7_EVNTSEL_EDGE_MASK | \ | 125 | |
126 | K7_EVNTSEL_INV_MASK | \ | 126 | return 0; |
127 | K7_EVNTSEL_REG_MASK) | ||
128 | |||
129 | return hw_event & K7_EVNTSEL_MASK; | ||
130 | } | 127 | } |
131 | 128 | ||
132 | /* | 129 | /* |
@@ -165,7 +162,7 @@ static void amd_put_event_constraints(struct cpu_hw_events *cpuc, | |||
165 | * be removed on one CPU at a time AND PMU is disabled | 162 | * be removed on one CPU at a time AND PMU is disabled |
166 | * when we come here | 163 | * when we come here |
167 | */ | 164 | */ |
168 | for (i = 0; i < x86_pmu.num_events; i++) { | 165 | for (i = 0; i < x86_pmu.num_counters; i++) { |
169 | if (nb->owners[i] == event) { | 166 | if (nb->owners[i] == event) { |
170 | cmpxchg(nb->owners+i, event, NULL); | 167 | cmpxchg(nb->owners+i, event, NULL); |
171 | break; | 168 | break; |
@@ -215,7 +212,7 @@ amd_get_event_constraints(struct cpu_hw_events *cpuc, struct perf_event *event) | |||
215 | struct hw_perf_event *hwc = &event->hw; | 212 | struct hw_perf_event *hwc = &event->hw; |
216 | struct amd_nb *nb = cpuc->amd_nb; | 213 | struct amd_nb *nb = cpuc->amd_nb; |
217 | struct perf_event *old = NULL; | 214 | struct perf_event *old = NULL; |
218 | int max = x86_pmu.num_events; | 215 | int max = x86_pmu.num_counters; |
219 | int i, j, k = -1; | 216 | int i, j, k = -1; |
220 | 217 | ||
221 | /* | 218 | /* |
@@ -293,7 +290,7 @@ static struct amd_nb *amd_alloc_nb(int cpu, int nb_id) | |||
293 | /* | 290 | /* |
294 | * initialize all possible NB constraints | 291 | * initialize all possible NB constraints |
295 | */ | 292 | */ |
296 | for (i = 0; i < x86_pmu.num_events; i++) { | 293 | for (i = 0; i < x86_pmu.num_counters; i++) { |
297 | __set_bit(i, nb->event_constraints[i].idxmsk); | 294 | __set_bit(i, nb->event_constraints[i].idxmsk); |
298 | nb->event_constraints[i].weight = 1; | 295 | nb->event_constraints[i].weight = 1; |
299 | } | 296 | } |
@@ -371,21 +368,22 @@ static void amd_pmu_cpu_dead(int cpu) | |||
371 | raw_spin_unlock(&amd_nb_lock); | 368 | raw_spin_unlock(&amd_nb_lock); |
372 | } | 369 | } |
373 | 370 | ||
374 | static __initconst struct x86_pmu amd_pmu = { | 371 | static __initconst const struct x86_pmu amd_pmu = { |
375 | .name = "AMD", | 372 | .name = "AMD", |
376 | .handle_irq = x86_pmu_handle_irq, | 373 | .handle_irq = x86_pmu_handle_irq, |
377 | .disable_all = x86_pmu_disable_all, | 374 | .disable_all = x86_pmu_disable_all, |
378 | .enable_all = x86_pmu_enable_all, | 375 | .enable_all = x86_pmu_enable_all, |
379 | .enable = x86_pmu_enable_event, | 376 | .enable = x86_pmu_enable_event, |
380 | .disable = x86_pmu_disable_event, | 377 | .disable = x86_pmu_disable_event, |
378 | .hw_config = amd_pmu_hw_config, | ||
379 | .schedule_events = x86_schedule_events, | ||
381 | .eventsel = MSR_K7_EVNTSEL0, | 380 | .eventsel = MSR_K7_EVNTSEL0, |
382 | .perfctr = MSR_K7_PERFCTR0, | 381 | .perfctr = MSR_K7_PERFCTR0, |
383 | .event_map = amd_pmu_event_map, | 382 | .event_map = amd_pmu_event_map, |
384 | .raw_event = amd_pmu_raw_event, | ||
385 | .max_events = ARRAY_SIZE(amd_perfmon_event_map), | 383 | .max_events = ARRAY_SIZE(amd_perfmon_event_map), |
386 | .num_events = 4, | 384 | .num_counters = 4, |
387 | .event_bits = 48, | 385 | .cntval_bits = 48, |
388 | .event_mask = (1ULL << 48) - 1, | 386 | .cntval_mask = (1ULL << 48) - 1, |
389 | .apic = 1, | 387 | .apic = 1, |
390 | /* use highest bit to detect overflow */ | 388 | /* use highest bit to detect overflow */ |
391 | .max_period = (1ULL << 47) - 1, | 389 | .max_period = (1ULL << 47) - 1, |
diff --git a/arch/x86/kernel/cpu/perf_event_intel.c b/arch/x86/kernel/cpu/perf_event_intel.c index 9c794ac87837..fdbc652d3feb 100644 --- a/arch/x86/kernel/cpu/perf_event_intel.c +++ b/arch/x86/kernel/cpu/perf_event_intel.c | |||
@@ -88,7 +88,7 @@ static u64 intel_pmu_event_map(int hw_event) | |||
88 | return intel_perfmon_event_map[hw_event]; | 88 | return intel_perfmon_event_map[hw_event]; |
89 | } | 89 | } |
90 | 90 | ||
91 | static __initconst u64 westmere_hw_cache_event_ids | 91 | static __initconst const u64 westmere_hw_cache_event_ids |
92 | [PERF_COUNT_HW_CACHE_MAX] | 92 | [PERF_COUNT_HW_CACHE_MAX] |
93 | [PERF_COUNT_HW_CACHE_OP_MAX] | 93 | [PERF_COUNT_HW_CACHE_OP_MAX] |
94 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = | 94 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = |
@@ -179,7 +179,7 @@ static __initconst u64 westmere_hw_cache_event_ids | |||
179 | }, | 179 | }, |
180 | }; | 180 | }; |
181 | 181 | ||
182 | static __initconst u64 nehalem_hw_cache_event_ids | 182 | static __initconst const u64 nehalem_hw_cache_event_ids |
183 | [PERF_COUNT_HW_CACHE_MAX] | 183 | [PERF_COUNT_HW_CACHE_MAX] |
184 | [PERF_COUNT_HW_CACHE_OP_MAX] | 184 | [PERF_COUNT_HW_CACHE_OP_MAX] |
185 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = | 185 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = |
@@ -270,7 +270,7 @@ static __initconst u64 nehalem_hw_cache_event_ids | |||
270 | }, | 270 | }, |
271 | }; | 271 | }; |
272 | 272 | ||
273 | static __initconst u64 core2_hw_cache_event_ids | 273 | static __initconst const u64 core2_hw_cache_event_ids |
274 | [PERF_COUNT_HW_CACHE_MAX] | 274 | [PERF_COUNT_HW_CACHE_MAX] |
275 | [PERF_COUNT_HW_CACHE_OP_MAX] | 275 | [PERF_COUNT_HW_CACHE_OP_MAX] |
276 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = | 276 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = |
@@ -361,7 +361,7 @@ static __initconst u64 core2_hw_cache_event_ids | |||
361 | }, | 361 | }, |
362 | }; | 362 | }; |
363 | 363 | ||
364 | static __initconst u64 atom_hw_cache_event_ids | 364 | static __initconst const u64 atom_hw_cache_event_ids |
365 | [PERF_COUNT_HW_CACHE_MAX] | 365 | [PERF_COUNT_HW_CACHE_MAX] |
366 | [PERF_COUNT_HW_CACHE_OP_MAX] | 366 | [PERF_COUNT_HW_CACHE_OP_MAX] |
367 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = | 367 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = |
@@ -452,60 +452,6 @@ static __initconst u64 atom_hw_cache_event_ids | |||
452 | }, | 452 | }, |
453 | }; | 453 | }; |
454 | 454 | ||
455 | static u64 intel_pmu_raw_event(u64 hw_event) | ||
456 | { | ||
457 | #define CORE_EVNTSEL_EVENT_MASK 0x000000FFULL | ||
458 | #define CORE_EVNTSEL_UNIT_MASK 0x0000FF00ULL | ||
459 | #define CORE_EVNTSEL_EDGE_MASK 0x00040000ULL | ||
460 | #define CORE_EVNTSEL_INV_MASK 0x00800000ULL | ||
461 | #define CORE_EVNTSEL_REG_MASK 0xFF000000ULL | ||
462 | |||
463 | #define CORE_EVNTSEL_MASK \ | ||
464 | (INTEL_ARCH_EVTSEL_MASK | \ | ||
465 | INTEL_ARCH_UNIT_MASK | \ | ||
466 | INTEL_ARCH_EDGE_MASK | \ | ||
467 | INTEL_ARCH_INV_MASK | \ | ||
468 | INTEL_ARCH_CNT_MASK) | ||
469 | |||
470 | return hw_event & CORE_EVNTSEL_MASK; | ||
471 | } | ||
472 | |||
473 | static void intel_pmu_enable_bts(u64 config) | ||
474 | { | ||
475 | unsigned long debugctlmsr; | ||
476 | |||
477 | debugctlmsr = get_debugctlmsr(); | ||
478 | |||
479 | debugctlmsr |= X86_DEBUGCTL_TR; | ||
480 | debugctlmsr |= X86_DEBUGCTL_BTS; | ||
481 | debugctlmsr |= X86_DEBUGCTL_BTINT; | ||
482 | |||
483 | if (!(config & ARCH_PERFMON_EVENTSEL_OS)) | ||
484 | debugctlmsr |= X86_DEBUGCTL_BTS_OFF_OS; | ||
485 | |||
486 | if (!(config & ARCH_PERFMON_EVENTSEL_USR)) | ||
487 | debugctlmsr |= X86_DEBUGCTL_BTS_OFF_USR; | ||
488 | |||
489 | update_debugctlmsr(debugctlmsr); | ||
490 | } | ||
491 | |||
492 | static void intel_pmu_disable_bts(void) | ||
493 | { | ||
494 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
495 | unsigned long debugctlmsr; | ||
496 | |||
497 | if (!cpuc->ds) | ||
498 | return; | ||
499 | |||
500 | debugctlmsr = get_debugctlmsr(); | ||
501 | |||
502 | debugctlmsr &= | ||
503 | ~(X86_DEBUGCTL_TR | X86_DEBUGCTL_BTS | X86_DEBUGCTL_BTINT | | ||
504 | X86_DEBUGCTL_BTS_OFF_OS | X86_DEBUGCTL_BTS_OFF_USR); | ||
505 | |||
506 | update_debugctlmsr(debugctlmsr); | ||
507 | } | ||
508 | |||
509 | static void intel_pmu_disable_all(void) | 455 | static void intel_pmu_disable_all(void) |
510 | { | 456 | { |
511 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | 457 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); |
@@ -514,12 +460,17 @@ static void intel_pmu_disable_all(void) | |||
514 | 460 | ||
515 | if (test_bit(X86_PMC_IDX_FIXED_BTS, cpuc->active_mask)) | 461 | if (test_bit(X86_PMC_IDX_FIXED_BTS, cpuc->active_mask)) |
516 | intel_pmu_disable_bts(); | 462 | intel_pmu_disable_bts(); |
463 | |||
464 | intel_pmu_pebs_disable_all(); | ||
465 | intel_pmu_lbr_disable_all(); | ||
517 | } | 466 | } |
518 | 467 | ||
519 | static void intel_pmu_enable_all(void) | 468 | static void intel_pmu_enable_all(int added) |
520 | { | 469 | { |
521 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | 470 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); |
522 | 471 | ||
472 | intel_pmu_pebs_enable_all(); | ||
473 | intel_pmu_lbr_enable_all(); | ||
523 | wrmsrl(MSR_CORE_PERF_GLOBAL_CTRL, x86_pmu.intel_ctrl); | 474 | wrmsrl(MSR_CORE_PERF_GLOBAL_CTRL, x86_pmu.intel_ctrl); |
524 | 475 | ||
525 | if (test_bit(X86_PMC_IDX_FIXED_BTS, cpuc->active_mask)) { | 476 | if (test_bit(X86_PMC_IDX_FIXED_BTS, cpuc->active_mask)) { |
@@ -533,6 +484,42 @@ static void intel_pmu_enable_all(void) | |||
533 | } | 484 | } |
534 | } | 485 | } |
535 | 486 | ||
487 | /* | ||
488 | * Workaround for: | ||
489 | * Intel Errata AAK100 (model 26) | ||
490 | * Intel Errata AAP53 (model 30) | ||
491 | * Intel Errata BD53 (model 44) | ||
492 | * | ||
493 | * These chips need to be 'reset' when adding counters by programming | ||
494 | * the magic three (non counting) events 0x4300D2, 0x4300B1 and 0x4300B5 | ||
495 | * either in sequence on the same PMC or on different PMCs. | ||
496 | */ | ||
497 | static void intel_pmu_nhm_enable_all(int added) | ||
498 | { | ||
499 | if (added) { | ||
500 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
501 | int i; | ||
502 | |||
503 | wrmsrl(MSR_ARCH_PERFMON_EVENTSEL0 + 0, 0x4300D2); | ||
504 | wrmsrl(MSR_ARCH_PERFMON_EVENTSEL0 + 1, 0x4300B1); | ||
505 | wrmsrl(MSR_ARCH_PERFMON_EVENTSEL0 + 2, 0x4300B5); | ||
506 | |||
507 | wrmsrl(MSR_CORE_PERF_GLOBAL_CTRL, 0x3); | ||
508 | wrmsrl(MSR_CORE_PERF_GLOBAL_CTRL, 0x0); | ||
509 | |||
510 | for (i = 0; i < 3; i++) { | ||
511 | struct perf_event *event = cpuc->events[i]; | ||
512 | |||
513 | if (!event) | ||
514 | continue; | ||
515 | |||
516 | __x86_pmu_enable_event(&event->hw, | ||
517 | ARCH_PERFMON_EVENTSEL_ENABLE); | ||
518 | } | ||
519 | } | ||
520 | intel_pmu_enable_all(added); | ||
521 | } | ||
522 | |||
536 | static inline u64 intel_pmu_get_status(void) | 523 | static inline u64 intel_pmu_get_status(void) |
537 | { | 524 | { |
538 | u64 status; | 525 | u64 status; |
@@ -547,8 +534,7 @@ static inline void intel_pmu_ack_status(u64 ack) | |||
547 | wrmsrl(MSR_CORE_PERF_GLOBAL_OVF_CTRL, ack); | 534 | wrmsrl(MSR_CORE_PERF_GLOBAL_OVF_CTRL, ack); |
548 | } | 535 | } |
549 | 536 | ||
550 | static inline void | 537 | static void intel_pmu_disable_fixed(struct hw_perf_event *hwc) |
551 | intel_pmu_disable_fixed(struct hw_perf_event *hwc) | ||
552 | { | 538 | { |
553 | int idx = hwc->idx - X86_PMC_IDX_FIXED; | 539 | int idx = hwc->idx - X86_PMC_IDX_FIXED; |
554 | u64 ctrl_val, mask; | 540 | u64 ctrl_val, mask; |
@@ -557,71 +543,10 @@ intel_pmu_disable_fixed(struct hw_perf_event *hwc) | |||
557 | 543 | ||
558 | rdmsrl(hwc->config_base, ctrl_val); | 544 | rdmsrl(hwc->config_base, ctrl_val); |
559 | ctrl_val &= ~mask; | 545 | ctrl_val &= ~mask; |
560 | (void)checking_wrmsrl(hwc->config_base, ctrl_val); | 546 | wrmsrl(hwc->config_base, ctrl_val); |
561 | } | ||
562 | |||
563 | static void intel_pmu_drain_bts_buffer(void) | ||
564 | { | ||
565 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
566 | struct debug_store *ds = cpuc->ds; | ||
567 | struct bts_record { | ||
568 | u64 from; | ||
569 | u64 to; | ||
570 | u64 flags; | ||
571 | }; | ||
572 | struct perf_event *event = cpuc->events[X86_PMC_IDX_FIXED_BTS]; | ||
573 | struct bts_record *at, *top; | ||
574 | struct perf_output_handle handle; | ||
575 | struct perf_event_header header; | ||
576 | struct perf_sample_data data; | ||
577 | struct pt_regs regs; | ||
578 | |||
579 | if (!event) | ||
580 | return; | ||
581 | |||
582 | if (!ds) | ||
583 | return; | ||
584 | |||
585 | at = (struct bts_record *)(unsigned long)ds->bts_buffer_base; | ||
586 | top = (struct bts_record *)(unsigned long)ds->bts_index; | ||
587 | |||
588 | if (top <= at) | ||
589 | return; | ||
590 | |||
591 | ds->bts_index = ds->bts_buffer_base; | ||
592 | |||
593 | perf_sample_data_init(&data, 0); | ||
594 | |||
595 | data.period = event->hw.last_period; | ||
596 | regs.ip = 0; | ||
597 | |||
598 | /* | ||
599 | * Prepare a generic sample, i.e. fill in the invariant fields. | ||
600 | * We will overwrite the from and to address before we output | ||
601 | * the sample. | ||
602 | */ | ||
603 | perf_prepare_sample(&header, &data, event, ®s); | ||
604 | |||
605 | if (perf_output_begin(&handle, event, | ||
606 | header.size * (top - at), 1, 1)) | ||
607 | return; | ||
608 | |||
609 | for (; at < top; at++) { | ||
610 | data.ip = at->from; | ||
611 | data.addr = at->to; | ||
612 | |||
613 | perf_output_sample(&handle, &header, &data, event); | ||
614 | } | ||
615 | |||
616 | perf_output_end(&handle); | ||
617 | |||
618 | /* There's new data available. */ | ||
619 | event->hw.interrupts++; | ||
620 | event->pending_kill = POLL_IN; | ||
621 | } | 547 | } |
622 | 548 | ||
623 | static inline void | 549 | static void intel_pmu_disable_event(struct perf_event *event) |
624 | intel_pmu_disable_event(struct perf_event *event) | ||
625 | { | 550 | { |
626 | struct hw_perf_event *hwc = &event->hw; | 551 | struct hw_perf_event *hwc = &event->hw; |
627 | 552 | ||
@@ -637,14 +562,15 @@ intel_pmu_disable_event(struct perf_event *event) | |||
637 | } | 562 | } |
638 | 563 | ||
639 | x86_pmu_disable_event(event); | 564 | x86_pmu_disable_event(event); |
565 | |||
566 | if (unlikely(event->attr.precise_ip)) | ||
567 | intel_pmu_pebs_disable(event); | ||
640 | } | 568 | } |
641 | 569 | ||
642 | static inline void | 570 | static void intel_pmu_enable_fixed(struct hw_perf_event *hwc) |
643 | intel_pmu_enable_fixed(struct hw_perf_event *hwc) | ||
644 | { | 571 | { |
645 | int idx = hwc->idx - X86_PMC_IDX_FIXED; | 572 | int idx = hwc->idx - X86_PMC_IDX_FIXED; |
646 | u64 ctrl_val, bits, mask; | 573 | u64 ctrl_val, bits, mask; |
647 | int err; | ||
648 | 574 | ||
649 | /* | 575 | /* |
650 | * Enable IRQ generation (0x8), | 576 | * Enable IRQ generation (0x8), |
@@ -669,7 +595,7 @@ intel_pmu_enable_fixed(struct hw_perf_event *hwc) | |||
669 | rdmsrl(hwc->config_base, ctrl_val); | 595 | rdmsrl(hwc->config_base, ctrl_val); |
670 | ctrl_val &= ~mask; | 596 | ctrl_val &= ~mask; |
671 | ctrl_val |= bits; | 597 | ctrl_val |= bits; |
672 | err = checking_wrmsrl(hwc->config_base, ctrl_val); | 598 | wrmsrl(hwc->config_base, ctrl_val); |
673 | } | 599 | } |
674 | 600 | ||
675 | static void intel_pmu_enable_event(struct perf_event *event) | 601 | static void intel_pmu_enable_event(struct perf_event *event) |
@@ -689,7 +615,10 @@ static void intel_pmu_enable_event(struct perf_event *event) | |||
689 | return; | 615 | return; |
690 | } | 616 | } |
691 | 617 | ||
692 | __x86_pmu_enable_event(hwc); | 618 | if (unlikely(event->attr.precise_ip)) |
619 | intel_pmu_pebs_enable(event); | ||
620 | |||
621 | __x86_pmu_enable_event(hwc, ARCH_PERFMON_EVENTSEL_ENABLE); | ||
693 | } | 622 | } |
694 | 623 | ||
695 | /* | 624 | /* |
@@ -708,20 +637,20 @@ static void intel_pmu_reset(void) | |||
708 | unsigned long flags; | 637 | unsigned long flags; |
709 | int idx; | 638 | int idx; |
710 | 639 | ||
711 | if (!x86_pmu.num_events) | 640 | if (!x86_pmu.num_counters) |
712 | return; | 641 | return; |
713 | 642 | ||
714 | local_irq_save(flags); | 643 | local_irq_save(flags); |
715 | 644 | ||
716 | printk("clearing PMU state on CPU#%d\n", smp_processor_id()); | 645 | printk("clearing PMU state on CPU#%d\n", smp_processor_id()); |
717 | 646 | ||
718 | for (idx = 0; idx < x86_pmu.num_events; idx++) { | 647 | for (idx = 0; idx < x86_pmu.num_counters; idx++) { |
719 | checking_wrmsrl(x86_pmu.eventsel + idx, 0ull); | 648 | checking_wrmsrl(x86_pmu.eventsel + idx, 0ull); |
720 | checking_wrmsrl(x86_pmu.perfctr + idx, 0ull); | 649 | checking_wrmsrl(x86_pmu.perfctr + idx, 0ull); |
721 | } | 650 | } |
722 | for (idx = 0; idx < x86_pmu.num_events_fixed; idx++) { | 651 | for (idx = 0; idx < x86_pmu.num_counters_fixed; idx++) |
723 | checking_wrmsrl(MSR_ARCH_PERFMON_FIXED_CTR0 + idx, 0ull); | 652 | checking_wrmsrl(MSR_ARCH_PERFMON_FIXED_CTR0 + idx, 0ull); |
724 | } | 653 | |
725 | if (ds) | 654 | if (ds) |
726 | ds->bts_index = ds->bts_buffer_base; | 655 | ds->bts_index = ds->bts_buffer_base; |
727 | 656 | ||
@@ -747,7 +676,7 @@ static int intel_pmu_handle_irq(struct pt_regs *regs) | |||
747 | intel_pmu_drain_bts_buffer(); | 676 | intel_pmu_drain_bts_buffer(); |
748 | status = intel_pmu_get_status(); | 677 | status = intel_pmu_get_status(); |
749 | if (!status) { | 678 | if (!status) { |
750 | intel_pmu_enable_all(); | 679 | intel_pmu_enable_all(0); |
751 | return 0; | 680 | return 0; |
752 | } | 681 | } |
753 | 682 | ||
@@ -762,6 +691,15 @@ again: | |||
762 | 691 | ||
763 | inc_irq_stat(apic_perf_irqs); | 692 | inc_irq_stat(apic_perf_irqs); |
764 | ack = status; | 693 | ack = status; |
694 | |||
695 | intel_pmu_lbr_read(); | ||
696 | |||
697 | /* | ||
698 | * PEBS overflow sets bit 62 in the global status register | ||
699 | */ | ||
700 | if (__test_and_clear_bit(62, (unsigned long *)&status)) | ||
701 | x86_pmu.drain_pebs(regs); | ||
702 | |||
765 | for_each_set_bit(bit, (unsigned long *)&status, X86_PMC_IDX_MAX) { | 703 | for_each_set_bit(bit, (unsigned long *)&status, X86_PMC_IDX_MAX) { |
766 | struct perf_event *event = cpuc->events[bit]; | 704 | struct perf_event *event = cpuc->events[bit]; |
767 | 705 | ||
@@ -787,26 +725,22 @@ again: | |||
787 | goto again; | 725 | goto again; |
788 | 726 | ||
789 | done: | 727 | done: |
790 | intel_pmu_enable_all(); | 728 | intel_pmu_enable_all(0); |
791 | return 1; | 729 | return 1; |
792 | } | 730 | } |
793 | 731 | ||
794 | static struct event_constraint bts_constraint = | ||
795 | EVENT_CONSTRAINT(0, 1ULL << X86_PMC_IDX_FIXED_BTS, 0); | ||
796 | |||
797 | static struct event_constraint * | 732 | static struct event_constraint * |
798 | intel_special_constraints(struct perf_event *event) | 733 | intel_bts_constraints(struct perf_event *event) |
799 | { | 734 | { |
800 | unsigned int hw_event; | 735 | struct hw_perf_event *hwc = &event->hw; |
801 | 736 | unsigned int hw_event, bts_event; | |
802 | hw_event = event->hw.config & INTEL_ARCH_EVENT_MASK; | ||
803 | 737 | ||
804 | if (unlikely((hw_event == | 738 | hw_event = hwc->config & INTEL_ARCH_EVENT_MASK; |
805 | x86_pmu.event_map(PERF_COUNT_HW_BRANCH_INSTRUCTIONS)) && | 739 | bts_event = x86_pmu.event_map(PERF_COUNT_HW_BRANCH_INSTRUCTIONS); |
806 | (event->hw.sample_period == 1))) { | ||
807 | 740 | ||
741 | if (unlikely(hw_event == bts_event && hwc->sample_period == 1)) | ||
808 | return &bts_constraint; | 742 | return &bts_constraint; |
809 | } | 743 | |
810 | return NULL; | 744 | return NULL; |
811 | } | 745 | } |
812 | 746 | ||
@@ -815,24 +749,53 @@ intel_get_event_constraints(struct cpu_hw_events *cpuc, struct perf_event *event | |||
815 | { | 749 | { |
816 | struct event_constraint *c; | 750 | struct event_constraint *c; |
817 | 751 | ||
818 | c = intel_special_constraints(event); | 752 | c = intel_bts_constraints(event); |
753 | if (c) | ||
754 | return c; | ||
755 | |||
756 | c = intel_pebs_constraints(event); | ||
819 | if (c) | 757 | if (c) |
820 | return c; | 758 | return c; |
821 | 759 | ||
822 | return x86_get_event_constraints(cpuc, event); | 760 | return x86_get_event_constraints(cpuc, event); |
823 | } | 761 | } |
824 | 762 | ||
825 | static __initconst struct x86_pmu core_pmu = { | 763 | static int intel_pmu_hw_config(struct perf_event *event) |
764 | { | ||
765 | int ret = x86_pmu_hw_config(event); | ||
766 | |||
767 | if (ret) | ||
768 | return ret; | ||
769 | |||
770 | if (event->attr.type != PERF_TYPE_RAW) | ||
771 | return 0; | ||
772 | |||
773 | if (!(event->attr.config & ARCH_PERFMON_EVENTSEL_ANY)) | ||
774 | return 0; | ||
775 | |||
776 | if (x86_pmu.version < 3) | ||
777 | return -EINVAL; | ||
778 | |||
779 | if (perf_paranoid_cpu() && !capable(CAP_SYS_ADMIN)) | ||
780 | return -EACCES; | ||
781 | |||
782 | event->hw.config |= ARCH_PERFMON_EVENTSEL_ANY; | ||
783 | |||
784 | return 0; | ||
785 | } | ||
786 | |||
787 | static __initconst const struct x86_pmu core_pmu = { | ||
826 | .name = "core", | 788 | .name = "core", |
827 | .handle_irq = x86_pmu_handle_irq, | 789 | .handle_irq = x86_pmu_handle_irq, |
828 | .disable_all = x86_pmu_disable_all, | 790 | .disable_all = x86_pmu_disable_all, |
829 | .enable_all = x86_pmu_enable_all, | 791 | .enable_all = x86_pmu_enable_all, |
830 | .enable = x86_pmu_enable_event, | 792 | .enable = x86_pmu_enable_event, |
831 | .disable = x86_pmu_disable_event, | 793 | .disable = x86_pmu_disable_event, |
794 | .hw_config = x86_pmu_hw_config, | ||
795 | .schedule_events = x86_schedule_events, | ||
832 | .eventsel = MSR_ARCH_PERFMON_EVENTSEL0, | 796 | .eventsel = MSR_ARCH_PERFMON_EVENTSEL0, |
833 | .perfctr = MSR_ARCH_PERFMON_PERFCTR0, | 797 | .perfctr = MSR_ARCH_PERFMON_PERFCTR0, |
834 | .event_map = intel_pmu_event_map, | 798 | .event_map = intel_pmu_event_map, |
835 | .raw_event = intel_pmu_raw_event, | ||
836 | .max_events = ARRAY_SIZE(intel_perfmon_event_map), | 799 | .max_events = ARRAY_SIZE(intel_perfmon_event_map), |
837 | .apic = 1, | 800 | .apic = 1, |
838 | /* | 801 | /* |
@@ -845,17 +808,32 @@ static __initconst struct x86_pmu core_pmu = { | |||
845 | .event_constraints = intel_core_event_constraints, | 808 | .event_constraints = intel_core_event_constraints, |
846 | }; | 809 | }; |
847 | 810 | ||
848 | static __initconst struct x86_pmu intel_pmu = { | 811 | static void intel_pmu_cpu_starting(int cpu) |
812 | { | ||
813 | init_debug_store_on_cpu(cpu); | ||
814 | /* | ||
815 | * Deal with CPUs that don't clear their LBRs on power-up. | ||
816 | */ | ||
817 | intel_pmu_lbr_reset(); | ||
818 | } | ||
819 | |||
820 | static void intel_pmu_cpu_dying(int cpu) | ||
821 | { | ||
822 | fini_debug_store_on_cpu(cpu); | ||
823 | } | ||
824 | |||
825 | static __initconst const struct x86_pmu intel_pmu = { | ||
849 | .name = "Intel", | 826 | .name = "Intel", |
850 | .handle_irq = intel_pmu_handle_irq, | 827 | .handle_irq = intel_pmu_handle_irq, |
851 | .disable_all = intel_pmu_disable_all, | 828 | .disable_all = intel_pmu_disable_all, |
852 | .enable_all = intel_pmu_enable_all, | 829 | .enable_all = intel_pmu_enable_all, |
853 | .enable = intel_pmu_enable_event, | 830 | .enable = intel_pmu_enable_event, |
854 | .disable = intel_pmu_disable_event, | 831 | .disable = intel_pmu_disable_event, |
832 | .hw_config = intel_pmu_hw_config, | ||
833 | .schedule_events = x86_schedule_events, | ||
855 | .eventsel = MSR_ARCH_PERFMON_EVENTSEL0, | 834 | .eventsel = MSR_ARCH_PERFMON_EVENTSEL0, |
856 | .perfctr = MSR_ARCH_PERFMON_PERFCTR0, | 835 | .perfctr = MSR_ARCH_PERFMON_PERFCTR0, |
857 | .event_map = intel_pmu_event_map, | 836 | .event_map = intel_pmu_event_map, |
858 | .raw_event = intel_pmu_raw_event, | ||
859 | .max_events = ARRAY_SIZE(intel_perfmon_event_map), | 837 | .max_events = ARRAY_SIZE(intel_perfmon_event_map), |
860 | .apic = 1, | 838 | .apic = 1, |
861 | /* | 839 | /* |
@@ -864,14 +842,38 @@ static __initconst struct x86_pmu intel_pmu = { | |||
864 | * the generic event period: | 842 | * the generic event period: |
865 | */ | 843 | */ |
866 | .max_period = (1ULL << 31) - 1, | 844 | .max_period = (1ULL << 31) - 1, |
867 | .enable_bts = intel_pmu_enable_bts, | ||
868 | .disable_bts = intel_pmu_disable_bts, | ||
869 | .get_event_constraints = intel_get_event_constraints, | 845 | .get_event_constraints = intel_get_event_constraints, |
870 | 846 | ||
871 | .cpu_starting = init_debug_store_on_cpu, | 847 | .cpu_starting = intel_pmu_cpu_starting, |
872 | .cpu_dying = fini_debug_store_on_cpu, | 848 | .cpu_dying = intel_pmu_cpu_dying, |
873 | }; | 849 | }; |
874 | 850 | ||
851 | static void intel_clovertown_quirks(void) | ||
852 | { | ||
853 | /* | ||
854 | * PEBS is unreliable due to: | ||
855 | * | ||
856 | * AJ67 - PEBS may experience CPL leaks | ||
857 | * AJ68 - PEBS PMI may be delayed by one event | ||
858 | * AJ69 - GLOBAL_STATUS[62] will only be set when DEBUGCTL[12] | ||
859 | * AJ106 - FREEZE_LBRS_ON_PMI doesn't work in combination with PEBS | ||
860 | * | ||
861 | * AJ67 could be worked around by restricting the OS/USR flags. | ||
862 | * AJ69 could be worked around by setting PMU_FREEZE_ON_PMI. | ||
863 | * | ||
864 | * AJ106 could possibly be worked around by not allowing LBR | ||
865 | * usage from PEBS, including the fixup. | ||
866 | * AJ68 could possibly be worked around by always programming | ||
867 | * a pebs_event_reset[0] value and coping with the lost events. | ||
868 | * | ||
869 | * But taken together it might just make sense to not enable PEBS on | ||
870 | * these chips. | ||
871 | */ | ||
872 | printk(KERN_WARNING "PEBS disabled due to CPU errata.\n"); | ||
873 | x86_pmu.pebs = 0; | ||
874 | x86_pmu.pebs_constraints = NULL; | ||
875 | } | ||
876 | |||
875 | static __init int intel_pmu_init(void) | 877 | static __init int intel_pmu_init(void) |
876 | { | 878 | { |
877 | union cpuid10_edx edx; | 879 | union cpuid10_edx edx; |
@@ -881,12 +883,13 @@ static __init int intel_pmu_init(void) | |||
881 | int version; | 883 | int version; |
882 | 884 | ||
883 | if (!cpu_has(&boot_cpu_data, X86_FEATURE_ARCH_PERFMON)) { | 885 | if (!cpu_has(&boot_cpu_data, X86_FEATURE_ARCH_PERFMON)) { |
884 | /* check for P6 processor family */ | 886 | switch (boot_cpu_data.x86) { |
885 | if (boot_cpu_data.x86 == 6) { | 887 | case 0x6: |
886 | return p6_pmu_init(); | 888 | return p6_pmu_init(); |
887 | } else { | 889 | case 0xf: |
890 | return p4_pmu_init(); | ||
891 | } | ||
888 | return -ENODEV; | 892 | return -ENODEV; |
889 | } | ||
890 | } | 893 | } |
891 | 894 | ||
892 | /* | 895 | /* |
@@ -904,16 +907,28 @@ static __init int intel_pmu_init(void) | |||
904 | x86_pmu = intel_pmu; | 907 | x86_pmu = intel_pmu; |
905 | 908 | ||
906 | x86_pmu.version = version; | 909 | x86_pmu.version = version; |
907 | x86_pmu.num_events = eax.split.num_events; | 910 | x86_pmu.num_counters = eax.split.num_counters; |
908 | x86_pmu.event_bits = eax.split.bit_width; | 911 | x86_pmu.cntval_bits = eax.split.bit_width; |
909 | x86_pmu.event_mask = (1ULL << eax.split.bit_width) - 1; | 912 | x86_pmu.cntval_mask = (1ULL << eax.split.bit_width) - 1; |
910 | 913 | ||
911 | /* | 914 | /* |
912 | * Quirk: v2 perfmon does not report fixed-purpose events, so | 915 | * Quirk: v2 perfmon does not report fixed-purpose events, so |
913 | * assume at least 3 events: | 916 | * assume at least 3 events: |
914 | */ | 917 | */ |
915 | if (version > 1) | 918 | if (version > 1) |
916 | x86_pmu.num_events_fixed = max((int)edx.split.num_events_fixed, 3); | 919 | x86_pmu.num_counters_fixed = max((int)edx.split.num_counters_fixed, 3); |
920 | |||
921 | /* | ||
922 | * v2 and above have a perf capabilities MSR | ||
923 | */ | ||
924 | if (version > 1) { | ||
925 | u64 capabilities; | ||
926 | |||
927 | rdmsrl(MSR_IA32_PERF_CAPABILITIES, capabilities); | ||
928 | x86_pmu.intel_cap.capabilities = capabilities; | ||
929 | } | ||
930 | |||
931 | intel_ds_init(); | ||
917 | 932 | ||
918 | /* | 933 | /* |
919 | * Install the hw-cache-events table: | 934 | * Install the hw-cache-events table: |
@@ -924,12 +939,15 @@ static __init int intel_pmu_init(void) | |||
924 | break; | 939 | break; |
925 | 940 | ||
926 | case 15: /* original 65 nm celeron/pentium/core2/xeon, "Merom"/"Conroe" */ | 941 | case 15: /* original 65 nm celeron/pentium/core2/xeon, "Merom"/"Conroe" */ |
942 | x86_pmu.quirks = intel_clovertown_quirks; | ||
927 | case 22: /* single-core 65 nm celeron/core2solo "Merom-L"/"Conroe-L" */ | 943 | case 22: /* single-core 65 nm celeron/core2solo "Merom-L"/"Conroe-L" */ |
928 | case 23: /* current 45 nm celeron/core2/xeon "Penryn"/"Wolfdale" */ | 944 | case 23: /* current 45 nm celeron/core2/xeon "Penryn"/"Wolfdale" */ |
929 | case 29: /* six-core 45 nm xeon "Dunnington" */ | 945 | case 29: /* six-core 45 nm xeon "Dunnington" */ |
930 | memcpy(hw_cache_event_ids, core2_hw_cache_event_ids, | 946 | memcpy(hw_cache_event_ids, core2_hw_cache_event_ids, |
931 | sizeof(hw_cache_event_ids)); | 947 | sizeof(hw_cache_event_ids)); |
932 | 948 | ||
949 | intel_pmu_lbr_init_core(); | ||
950 | |||
933 | x86_pmu.event_constraints = intel_core2_event_constraints; | 951 | x86_pmu.event_constraints = intel_core2_event_constraints; |
934 | pr_cont("Core2 events, "); | 952 | pr_cont("Core2 events, "); |
935 | break; | 953 | break; |
@@ -940,13 +958,19 @@ static __init int intel_pmu_init(void) | |||
940 | memcpy(hw_cache_event_ids, nehalem_hw_cache_event_ids, | 958 | memcpy(hw_cache_event_ids, nehalem_hw_cache_event_ids, |
941 | sizeof(hw_cache_event_ids)); | 959 | sizeof(hw_cache_event_ids)); |
942 | 960 | ||
961 | intel_pmu_lbr_init_nhm(); | ||
962 | |||
943 | x86_pmu.event_constraints = intel_nehalem_event_constraints; | 963 | x86_pmu.event_constraints = intel_nehalem_event_constraints; |
944 | pr_cont("Nehalem/Corei7 events, "); | 964 | x86_pmu.enable_all = intel_pmu_nhm_enable_all; |
965 | pr_cont("Nehalem events, "); | ||
945 | break; | 966 | break; |
967 | |||
946 | case 28: /* Atom */ | 968 | case 28: /* Atom */ |
947 | memcpy(hw_cache_event_ids, atom_hw_cache_event_ids, | 969 | memcpy(hw_cache_event_ids, atom_hw_cache_event_ids, |
948 | sizeof(hw_cache_event_ids)); | 970 | sizeof(hw_cache_event_ids)); |
949 | 971 | ||
972 | intel_pmu_lbr_init_atom(); | ||
973 | |||
950 | x86_pmu.event_constraints = intel_gen_event_constraints; | 974 | x86_pmu.event_constraints = intel_gen_event_constraints; |
951 | pr_cont("Atom events, "); | 975 | pr_cont("Atom events, "); |
952 | break; | 976 | break; |
@@ -956,7 +980,10 @@ static __init int intel_pmu_init(void) | |||
956 | memcpy(hw_cache_event_ids, westmere_hw_cache_event_ids, | 980 | memcpy(hw_cache_event_ids, westmere_hw_cache_event_ids, |
957 | sizeof(hw_cache_event_ids)); | 981 | sizeof(hw_cache_event_ids)); |
958 | 982 | ||
983 | intel_pmu_lbr_init_nhm(); | ||
984 | |||
959 | x86_pmu.event_constraints = intel_westmere_event_constraints; | 985 | x86_pmu.event_constraints = intel_westmere_event_constraints; |
986 | x86_pmu.enable_all = intel_pmu_nhm_enable_all; | ||
960 | pr_cont("Westmere events, "); | 987 | pr_cont("Westmere events, "); |
961 | break; | 988 | break; |
962 | 989 | ||
diff --git a/arch/x86/kernel/cpu/perf_event_intel_ds.c b/arch/x86/kernel/cpu/perf_event_intel_ds.c new file mode 100644 index 000000000000..18018d1311cd --- /dev/null +++ b/arch/x86/kernel/cpu/perf_event_intel_ds.c | |||
@@ -0,0 +1,641 @@ | |||
1 | #ifdef CONFIG_CPU_SUP_INTEL | ||
2 | |||
3 | /* The maximal number of PEBS events: */ | ||
4 | #define MAX_PEBS_EVENTS 4 | ||
5 | |||
6 | /* The size of a BTS record in bytes: */ | ||
7 | #define BTS_RECORD_SIZE 24 | ||
8 | |||
9 | #define BTS_BUFFER_SIZE (PAGE_SIZE << 4) | ||
10 | #define PEBS_BUFFER_SIZE PAGE_SIZE | ||
11 | |||
12 | /* | ||
13 | * pebs_record_32 for p4 and core not supported | ||
14 | |||
15 | struct pebs_record_32 { | ||
16 | u32 flags, ip; | ||
17 | u32 ax, bc, cx, dx; | ||
18 | u32 si, di, bp, sp; | ||
19 | }; | ||
20 | |||
21 | */ | ||
22 | |||
23 | struct pebs_record_core { | ||
24 | u64 flags, ip; | ||
25 | u64 ax, bx, cx, dx; | ||
26 | u64 si, di, bp, sp; | ||
27 | u64 r8, r9, r10, r11; | ||
28 | u64 r12, r13, r14, r15; | ||
29 | }; | ||
30 | |||
31 | struct pebs_record_nhm { | ||
32 | u64 flags, ip; | ||
33 | u64 ax, bx, cx, dx; | ||
34 | u64 si, di, bp, sp; | ||
35 | u64 r8, r9, r10, r11; | ||
36 | u64 r12, r13, r14, r15; | ||
37 | u64 status, dla, dse, lat; | ||
38 | }; | ||
39 | |||
40 | /* | ||
41 | * A debug store configuration. | ||
42 | * | ||
43 | * We only support architectures that use 64bit fields. | ||
44 | */ | ||
45 | struct debug_store { | ||
46 | u64 bts_buffer_base; | ||
47 | u64 bts_index; | ||
48 | u64 bts_absolute_maximum; | ||
49 | u64 bts_interrupt_threshold; | ||
50 | u64 pebs_buffer_base; | ||
51 | u64 pebs_index; | ||
52 | u64 pebs_absolute_maximum; | ||
53 | u64 pebs_interrupt_threshold; | ||
54 | u64 pebs_event_reset[MAX_PEBS_EVENTS]; | ||
55 | }; | ||
56 | |||
57 | static void init_debug_store_on_cpu(int cpu) | ||
58 | { | ||
59 | struct debug_store *ds = per_cpu(cpu_hw_events, cpu).ds; | ||
60 | |||
61 | if (!ds) | ||
62 | return; | ||
63 | |||
64 | wrmsr_on_cpu(cpu, MSR_IA32_DS_AREA, | ||
65 | (u32)((u64)(unsigned long)ds), | ||
66 | (u32)((u64)(unsigned long)ds >> 32)); | ||
67 | } | ||
68 | |||
69 | static void fini_debug_store_on_cpu(int cpu) | ||
70 | { | ||
71 | if (!per_cpu(cpu_hw_events, cpu).ds) | ||
72 | return; | ||
73 | |||
74 | wrmsr_on_cpu(cpu, MSR_IA32_DS_AREA, 0, 0); | ||
75 | } | ||
76 | |||
77 | static void release_ds_buffers(void) | ||
78 | { | ||
79 | int cpu; | ||
80 | |||
81 | if (!x86_pmu.bts && !x86_pmu.pebs) | ||
82 | return; | ||
83 | |||
84 | get_online_cpus(); | ||
85 | |||
86 | for_each_online_cpu(cpu) | ||
87 | fini_debug_store_on_cpu(cpu); | ||
88 | |||
89 | for_each_possible_cpu(cpu) { | ||
90 | struct debug_store *ds = per_cpu(cpu_hw_events, cpu).ds; | ||
91 | |||
92 | if (!ds) | ||
93 | continue; | ||
94 | |||
95 | per_cpu(cpu_hw_events, cpu).ds = NULL; | ||
96 | |||
97 | kfree((void *)(unsigned long)ds->pebs_buffer_base); | ||
98 | kfree((void *)(unsigned long)ds->bts_buffer_base); | ||
99 | kfree(ds); | ||
100 | } | ||
101 | |||
102 | put_online_cpus(); | ||
103 | } | ||
104 | |||
105 | static int reserve_ds_buffers(void) | ||
106 | { | ||
107 | int cpu, err = 0; | ||
108 | |||
109 | if (!x86_pmu.bts && !x86_pmu.pebs) | ||
110 | return 0; | ||
111 | |||
112 | get_online_cpus(); | ||
113 | |||
114 | for_each_possible_cpu(cpu) { | ||
115 | struct debug_store *ds; | ||
116 | void *buffer; | ||
117 | int max, thresh; | ||
118 | |||
119 | err = -ENOMEM; | ||
120 | ds = kzalloc(sizeof(*ds), GFP_KERNEL); | ||
121 | if (unlikely(!ds)) | ||
122 | break; | ||
123 | per_cpu(cpu_hw_events, cpu).ds = ds; | ||
124 | |||
125 | if (x86_pmu.bts) { | ||
126 | buffer = kzalloc(BTS_BUFFER_SIZE, GFP_KERNEL); | ||
127 | if (unlikely(!buffer)) | ||
128 | break; | ||
129 | |||
130 | max = BTS_BUFFER_SIZE / BTS_RECORD_SIZE; | ||
131 | thresh = max / 16; | ||
132 | |||
133 | ds->bts_buffer_base = (u64)(unsigned long)buffer; | ||
134 | ds->bts_index = ds->bts_buffer_base; | ||
135 | ds->bts_absolute_maximum = ds->bts_buffer_base + | ||
136 | max * BTS_RECORD_SIZE; | ||
137 | ds->bts_interrupt_threshold = ds->bts_absolute_maximum - | ||
138 | thresh * BTS_RECORD_SIZE; | ||
139 | } | ||
140 | |||
141 | if (x86_pmu.pebs) { | ||
142 | buffer = kzalloc(PEBS_BUFFER_SIZE, GFP_KERNEL); | ||
143 | if (unlikely(!buffer)) | ||
144 | break; | ||
145 | |||
146 | max = PEBS_BUFFER_SIZE / x86_pmu.pebs_record_size; | ||
147 | |||
148 | ds->pebs_buffer_base = (u64)(unsigned long)buffer; | ||
149 | ds->pebs_index = ds->pebs_buffer_base; | ||
150 | ds->pebs_absolute_maximum = ds->pebs_buffer_base + | ||
151 | max * x86_pmu.pebs_record_size; | ||
152 | /* | ||
153 | * Always use single record PEBS | ||
154 | */ | ||
155 | ds->pebs_interrupt_threshold = ds->pebs_buffer_base + | ||
156 | x86_pmu.pebs_record_size; | ||
157 | } | ||
158 | |||
159 | err = 0; | ||
160 | } | ||
161 | |||
162 | if (err) | ||
163 | release_ds_buffers(); | ||
164 | else { | ||
165 | for_each_online_cpu(cpu) | ||
166 | init_debug_store_on_cpu(cpu); | ||
167 | } | ||
168 | |||
169 | put_online_cpus(); | ||
170 | |||
171 | return err; | ||
172 | } | ||
173 | |||
174 | /* | ||
175 | * BTS | ||
176 | */ | ||
177 | |||
178 | static struct event_constraint bts_constraint = | ||
179 | EVENT_CONSTRAINT(0, 1ULL << X86_PMC_IDX_FIXED_BTS, 0); | ||
180 | |||
181 | static void intel_pmu_enable_bts(u64 config) | ||
182 | { | ||
183 | unsigned long debugctlmsr; | ||
184 | |||
185 | debugctlmsr = get_debugctlmsr(); | ||
186 | |||
187 | debugctlmsr |= DEBUGCTLMSR_TR; | ||
188 | debugctlmsr |= DEBUGCTLMSR_BTS; | ||
189 | debugctlmsr |= DEBUGCTLMSR_BTINT; | ||
190 | |||
191 | if (!(config & ARCH_PERFMON_EVENTSEL_OS)) | ||
192 | debugctlmsr |= DEBUGCTLMSR_BTS_OFF_OS; | ||
193 | |||
194 | if (!(config & ARCH_PERFMON_EVENTSEL_USR)) | ||
195 | debugctlmsr |= DEBUGCTLMSR_BTS_OFF_USR; | ||
196 | |||
197 | update_debugctlmsr(debugctlmsr); | ||
198 | } | ||
199 | |||
200 | static void intel_pmu_disable_bts(void) | ||
201 | { | ||
202 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
203 | unsigned long debugctlmsr; | ||
204 | |||
205 | if (!cpuc->ds) | ||
206 | return; | ||
207 | |||
208 | debugctlmsr = get_debugctlmsr(); | ||
209 | |||
210 | debugctlmsr &= | ||
211 | ~(DEBUGCTLMSR_TR | DEBUGCTLMSR_BTS | DEBUGCTLMSR_BTINT | | ||
212 | DEBUGCTLMSR_BTS_OFF_OS | DEBUGCTLMSR_BTS_OFF_USR); | ||
213 | |||
214 | update_debugctlmsr(debugctlmsr); | ||
215 | } | ||
216 | |||
217 | static void intel_pmu_drain_bts_buffer(void) | ||
218 | { | ||
219 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
220 | struct debug_store *ds = cpuc->ds; | ||
221 | struct bts_record { | ||
222 | u64 from; | ||
223 | u64 to; | ||
224 | u64 flags; | ||
225 | }; | ||
226 | struct perf_event *event = cpuc->events[X86_PMC_IDX_FIXED_BTS]; | ||
227 | struct bts_record *at, *top; | ||
228 | struct perf_output_handle handle; | ||
229 | struct perf_event_header header; | ||
230 | struct perf_sample_data data; | ||
231 | struct pt_regs regs; | ||
232 | |||
233 | if (!event) | ||
234 | return; | ||
235 | |||
236 | if (!ds) | ||
237 | return; | ||
238 | |||
239 | at = (struct bts_record *)(unsigned long)ds->bts_buffer_base; | ||
240 | top = (struct bts_record *)(unsigned long)ds->bts_index; | ||
241 | |||
242 | if (top <= at) | ||
243 | return; | ||
244 | |||
245 | ds->bts_index = ds->bts_buffer_base; | ||
246 | |||
247 | perf_sample_data_init(&data, 0); | ||
248 | data.period = event->hw.last_period; | ||
249 | regs.ip = 0; | ||
250 | |||
251 | /* | ||
252 | * Prepare a generic sample, i.e. fill in the invariant fields. | ||
253 | * We will overwrite the from and to address before we output | ||
254 | * the sample. | ||
255 | */ | ||
256 | perf_prepare_sample(&header, &data, event, ®s); | ||
257 | |||
258 | if (perf_output_begin(&handle, event, header.size * (top - at), 1, 1)) | ||
259 | return; | ||
260 | |||
261 | for (; at < top; at++) { | ||
262 | data.ip = at->from; | ||
263 | data.addr = at->to; | ||
264 | |||
265 | perf_output_sample(&handle, &header, &data, event); | ||
266 | } | ||
267 | |||
268 | perf_output_end(&handle); | ||
269 | |||
270 | /* There's new data available. */ | ||
271 | event->hw.interrupts++; | ||
272 | event->pending_kill = POLL_IN; | ||
273 | } | ||
274 | |||
275 | /* | ||
276 | * PEBS | ||
277 | */ | ||
278 | |||
279 | static struct event_constraint intel_core_pebs_events[] = { | ||
280 | PEBS_EVENT_CONSTRAINT(0x00c0, 0x1), /* INSTR_RETIRED.ANY */ | ||
281 | PEBS_EVENT_CONSTRAINT(0xfec1, 0x1), /* X87_OPS_RETIRED.ANY */ | ||
282 | PEBS_EVENT_CONSTRAINT(0x00c5, 0x1), /* BR_INST_RETIRED.MISPRED */ | ||
283 | PEBS_EVENT_CONSTRAINT(0x1fc7, 0x1), /* SIMD_INST_RETURED.ANY */ | ||
284 | PEBS_EVENT_CONSTRAINT(0x01cb, 0x1), /* MEM_LOAD_RETIRED.L1D_MISS */ | ||
285 | PEBS_EVENT_CONSTRAINT(0x02cb, 0x1), /* MEM_LOAD_RETIRED.L1D_LINE_MISS */ | ||
286 | PEBS_EVENT_CONSTRAINT(0x04cb, 0x1), /* MEM_LOAD_RETIRED.L2_MISS */ | ||
287 | PEBS_EVENT_CONSTRAINT(0x08cb, 0x1), /* MEM_LOAD_RETIRED.L2_LINE_MISS */ | ||
288 | PEBS_EVENT_CONSTRAINT(0x10cb, 0x1), /* MEM_LOAD_RETIRED.DTLB_MISS */ | ||
289 | EVENT_CONSTRAINT_END | ||
290 | }; | ||
291 | |||
292 | static struct event_constraint intel_nehalem_pebs_events[] = { | ||
293 | PEBS_EVENT_CONSTRAINT(0x00c0, 0xf), /* INSTR_RETIRED.ANY */ | ||
294 | PEBS_EVENT_CONSTRAINT(0xfec1, 0xf), /* X87_OPS_RETIRED.ANY */ | ||
295 | PEBS_EVENT_CONSTRAINT(0x00c5, 0xf), /* BR_INST_RETIRED.MISPRED */ | ||
296 | PEBS_EVENT_CONSTRAINT(0x1fc7, 0xf), /* SIMD_INST_RETURED.ANY */ | ||
297 | PEBS_EVENT_CONSTRAINT(0x01cb, 0xf), /* MEM_LOAD_RETIRED.L1D_MISS */ | ||
298 | PEBS_EVENT_CONSTRAINT(0x02cb, 0xf), /* MEM_LOAD_RETIRED.L1D_LINE_MISS */ | ||
299 | PEBS_EVENT_CONSTRAINT(0x04cb, 0xf), /* MEM_LOAD_RETIRED.L2_MISS */ | ||
300 | PEBS_EVENT_CONSTRAINT(0x08cb, 0xf), /* MEM_LOAD_RETIRED.L2_LINE_MISS */ | ||
301 | PEBS_EVENT_CONSTRAINT(0x10cb, 0xf), /* MEM_LOAD_RETIRED.DTLB_MISS */ | ||
302 | EVENT_CONSTRAINT_END | ||
303 | }; | ||
304 | |||
305 | static struct event_constraint * | ||
306 | intel_pebs_constraints(struct perf_event *event) | ||
307 | { | ||
308 | struct event_constraint *c; | ||
309 | |||
310 | if (!event->attr.precise_ip) | ||
311 | return NULL; | ||
312 | |||
313 | if (x86_pmu.pebs_constraints) { | ||
314 | for_each_event_constraint(c, x86_pmu.pebs_constraints) { | ||
315 | if ((event->hw.config & c->cmask) == c->code) | ||
316 | return c; | ||
317 | } | ||
318 | } | ||
319 | |||
320 | return &emptyconstraint; | ||
321 | } | ||
322 | |||
323 | static void intel_pmu_pebs_enable(struct perf_event *event) | ||
324 | { | ||
325 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
326 | struct hw_perf_event *hwc = &event->hw; | ||
327 | |||
328 | hwc->config &= ~ARCH_PERFMON_EVENTSEL_INT; | ||
329 | |||
330 | cpuc->pebs_enabled |= 1ULL << hwc->idx; | ||
331 | WARN_ON_ONCE(cpuc->enabled); | ||
332 | |||
333 | if (x86_pmu.intel_cap.pebs_trap && event->attr.precise_ip > 1) | ||
334 | intel_pmu_lbr_enable(event); | ||
335 | } | ||
336 | |||
337 | static void intel_pmu_pebs_disable(struct perf_event *event) | ||
338 | { | ||
339 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
340 | struct hw_perf_event *hwc = &event->hw; | ||
341 | |||
342 | cpuc->pebs_enabled &= ~(1ULL << hwc->idx); | ||
343 | if (cpuc->enabled) | ||
344 | wrmsrl(MSR_IA32_PEBS_ENABLE, cpuc->pebs_enabled); | ||
345 | |||
346 | hwc->config |= ARCH_PERFMON_EVENTSEL_INT; | ||
347 | |||
348 | if (x86_pmu.intel_cap.pebs_trap && event->attr.precise_ip > 1) | ||
349 | intel_pmu_lbr_disable(event); | ||
350 | } | ||
351 | |||
352 | static void intel_pmu_pebs_enable_all(void) | ||
353 | { | ||
354 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
355 | |||
356 | if (cpuc->pebs_enabled) | ||
357 | wrmsrl(MSR_IA32_PEBS_ENABLE, cpuc->pebs_enabled); | ||
358 | } | ||
359 | |||
360 | static void intel_pmu_pebs_disable_all(void) | ||
361 | { | ||
362 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
363 | |||
364 | if (cpuc->pebs_enabled) | ||
365 | wrmsrl(MSR_IA32_PEBS_ENABLE, 0); | ||
366 | } | ||
367 | |||
368 | #include <asm/insn.h> | ||
369 | |||
370 | static inline bool kernel_ip(unsigned long ip) | ||
371 | { | ||
372 | #ifdef CONFIG_X86_32 | ||
373 | return ip > PAGE_OFFSET; | ||
374 | #else | ||
375 | return (long)ip < 0; | ||
376 | #endif | ||
377 | } | ||
378 | |||
379 | static int intel_pmu_pebs_fixup_ip(struct pt_regs *regs) | ||
380 | { | ||
381 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
382 | unsigned long from = cpuc->lbr_entries[0].from; | ||
383 | unsigned long old_to, to = cpuc->lbr_entries[0].to; | ||
384 | unsigned long ip = regs->ip; | ||
385 | |||
386 | /* | ||
387 | * We don't need to fixup if the PEBS assist is fault like | ||
388 | */ | ||
389 | if (!x86_pmu.intel_cap.pebs_trap) | ||
390 | return 1; | ||
391 | |||
392 | /* | ||
393 | * No LBR entry, no basic block, no rewinding | ||
394 | */ | ||
395 | if (!cpuc->lbr_stack.nr || !from || !to) | ||
396 | return 0; | ||
397 | |||
398 | /* | ||
399 | * Basic blocks should never cross user/kernel boundaries | ||
400 | */ | ||
401 | if (kernel_ip(ip) != kernel_ip(to)) | ||
402 | return 0; | ||
403 | |||
404 | /* | ||
405 | * unsigned math, either ip is before the start (impossible) or | ||
406 | * the basic block is larger than 1 page (sanity) | ||
407 | */ | ||
408 | if ((ip - to) > PAGE_SIZE) | ||
409 | return 0; | ||
410 | |||
411 | /* | ||
412 | * We sampled a branch insn, rewind using the LBR stack | ||
413 | */ | ||
414 | if (ip == to) { | ||
415 | regs->ip = from; | ||
416 | return 1; | ||
417 | } | ||
418 | |||
419 | do { | ||
420 | struct insn insn; | ||
421 | u8 buf[MAX_INSN_SIZE]; | ||
422 | void *kaddr; | ||
423 | |||
424 | old_to = to; | ||
425 | if (!kernel_ip(ip)) { | ||
426 | int bytes, size = MAX_INSN_SIZE; | ||
427 | |||
428 | bytes = copy_from_user_nmi(buf, (void __user *)to, size); | ||
429 | if (bytes != size) | ||
430 | return 0; | ||
431 | |||
432 | kaddr = buf; | ||
433 | } else | ||
434 | kaddr = (void *)to; | ||
435 | |||
436 | kernel_insn_init(&insn, kaddr); | ||
437 | insn_get_length(&insn); | ||
438 | to += insn.length; | ||
439 | } while (to < ip); | ||
440 | |||
441 | if (to == ip) { | ||
442 | regs->ip = old_to; | ||
443 | return 1; | ||
444 | } | ||
445 | |||
446 | /* | ||
447 | * Even though we decoded the basic block, the instruction stream | ||
448 | * never matched the given IP, either the TO or the IP got corrupted. | ||
449 | */ | ||
450 | return 0; | ||
451 | } | ||
452 | |||
453 | static int intel_pmu_save_and_restart(struct perf_event *event); | ||
454 | |||
455 | static void __intel_pmu_pebs_event(struct perf_event *event, | ||
456 | struct pt_regs *iregs, void *__pebs) | ||
457 | { | ||
458 | /* | ||
459 | * We cast to pebs_record_core since that is a subset of | ||
460 | * both formats and we don't use the other fields in this | ||
461 | * routine. | ||
462 | */ | ||
463 | struct pebs_record_core *pebs = __pebs; | ||
464 | struct perf_sample_data data; | ||
465 | struct pt_regs regs; | ||
466 | |||
467 | if (!intel_pmu_save_and_restart(event)) | ||
468 | return; | ||
469 | |||
470 | perf_sample_data_init(&data, 0); | ||
471 | data.period = event->hw.last_period; | ||
472 | |||
473 | /* | ||
474 | * We use the interrupt regs as a base because the PEBS record | ||
475 | * does not contain a full regs set, specifically it seems to | ||
476 | * lack segment descriptors, which get used by things like | ||
477 | * user_mode(). | ||
478 | * | ||
479 | * In the simple case fix up only the IP and BP,SP regs, for | ||
480 | * PERF_SAMPLE_IP and PERF_SAMPLE_CALLCHAIN to function properly. | ||
481 | * A possible PERF_SAMPLE_REGS will have to transfer all regs. | ||
482 | */ | ||
483 | regs = *iregs; | ||
484 | regs.ip = pebs->ip; | ||
485 | regs.bp = pebs->bp; | ||
486 | regs.sp = pebs->sp; | ||
487 | |||
488 | if (event->attr.precise_ip > 1 && intel_pmu_pebs_fixup_ip(®s)) | ||
489 | regs.flags |= PERF_EFLAGS_EXACT; | ||
490 | else | ||
491 | regs.flags &= ~PERF_EFLAGS_EXACT; | ||
492 | |||
493 | if (perf_event_overflow(event, 1, &data, ®s)) | ||
494 | x86_pmu_stop(event); | ||
495 | } | ||
496 | |||
497 | static void intel_pmu_drain_pebs_core(struct pt_regs *iregs) | ||
498 | { | ||
499 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
500 | struct debug_store *ds = cpuc->ds; | ||
501 | struct perf_event *event = cpuc->events[0]; /* PMC0 only */ | ||
502 | struct pebs_record_core *at, *top; | ||
503 | int n; | ||
504 | |||
505 | if (!ds || !x86_pmu.pebs) | ||
506 | return; | ||
507 | |||
508 | at = (struct pebs_record_core *)(unsigned long)ds->pebs_buffer_base; | ||
509 | top = (struct pebs_record_core *)(unsigned long)ds->pebs_index; | ||
510 | |||
511 | /* | ||
512 | * Whatever else happens, drain the thing | ||
513 | */ | ||
514 | ds->pebs_index = ds->pebs_buffer_base; | ||
515 | |||
516 | if (!test_bit(0, cpuc->active_mask)) | ||
517 | return; | ||
518 | |||
519 | WARN_ON_ONCE(!event); | ||
520 | |||
521 | if (!event->attr.precise_ip) | ||
522 | return; | ||
523 | |||
524 | n = top - at; | ||
525 | if (n <= 0) | ||
526 | return; | ||
527 | |||
528 | /* | ||
529 | * Should not happen, we program the threshold at 1 and do not | ||
530 | * set a reset value. | ||
531 | */ | ||
532 | WARN_ON_ONCE(n > 1); | ||
533 | at += n - 1; | ||
534 | |||
535 | __intel_pmu_pebs_event(event, iregs, at); | ||
536 | } | ||
537 | |||
538 | static void intel_pmu_drain_pebs_nhm(struct pt_regs *iregs) | ||
539 | { | ||
540 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
541 | struct debug_store *ds = cpuc->ds; | ||
542 | struct pebs_record_nhm *at, *top; | ||
543 | struct perf_event *event = NULL; | ||
544 | u64 status = 0; | ||
545 | int bit, n; | ||
546 | |||
547 | if (!ds || !x86_pmu.pebs) | ||
548 | return; | ||
549 | |||
550 | at = (struct pebs_record_nhm *)(unsigned long)ds->pebs_buffer_base; | ||
551 | top = (struct pebs_record_nhm *)(unsigned long)ds->pebs_index; | ||
552 | |||
553 | ds->pebs_index = ds->pebs_buffer_base; | ||
554 | |||
555 | n = top - at; | ||
556 | if (n <= 0) | ||
557 | return; | ||
558 | |||
559 | /* | ||
560 | * Should not happen, we program the threshold at 1 and do not | ||
561 | * set a reset value. | ||
562 | */ | ||
563 | WARN_ON_ONCE(n > MAX_PEBS_EVENTS); | ||
564 | |||
565 | for ( ; at < top; at++) { | ||
566 | for_each_set_bit(bit, (unsigned long *)&at->status, MAX_PEBS_EVENTS) { | ||
567 | event = cpuc->events[bit]; | ||
568 | if (!test_bit(bit, cpuc->active_mask)) | ||
569 | continue; | ||
570 | |||
571 | WARN_ON_ONCE(!event); | ||
572 | |||
573 | if (!event->attr.precise_ip) | ||
574 | continue; | ||
575 | |||
576 | if (__test_and_set_bit(bit, (unsigned long *)&status)) | ||
577 | continue; | ||
578 | |||
579 | break; | ||
580 | } | ||
581 | |||
582 | if (!event || bit >= MAX_PEBS_EVENTS) | ||
583 | continue; | ||
584 | |||
585 | __intel_pmu_pebs_event(event, iregs, at); | ||
586 | } | ||
587 | } | ||
588 | |||
589 | /* | ||
590 | * BTS, PEBS probe and setup | ||
591 | */ | ||
592 | |||
593 | static void intel_ds_init(void) | ||
594 | { | ||
595 | /* | ||
596 | * No support for 32bit formats | ||
597 | */ | ||
598 | if (!boot_cpu_has(X86_FEATURE_DTES64)) | ||
599 | return; | ||
600 | |||
601 | x86_pmu.bts = boot_cpu_has(X86_FEATURE_BTS); | ||
602 | x86_pmu.pebs = boot_cpu_has(X86_FEATURE_PEBS); | ||
603 | if (x86_pmu.pebs) { | ||
604 | char pebs_type = x86_pmu.intel_cap.pebs_trap ? '+' : '-'; | ||
605 | int format = x86_pmu.intel_cap.pebs_format; | ||
606 | |||
607 | switch (format) { | ||
608 | case 0: | ||
609 | printk(KERN_CONT "PEBS fmt0%c, ", pebs_type); | ||
610 | x86_pmu.pebs_record_size = sizeof(struct pebs_record_core); | ||
611 | x86_pmu.drain_pebs = intel_pmu_drain_pebs_core; | ||
612 | x86_pmu.pebs_constraints = intel_core_pebs_events; | ||
613 | break; | ||
614 | |||
615 | case 1: | ||
616 | printk(KERN_CONT "PEBS fmt1%c, ", pebs_type); | ||
617 | x86_pmu.pebs_record_size = sizeof(struct pebs_record_nhm); | ||
618 | x86_pmu.drain_pebs = intel_pmu_drain_pebs_nhm; | ||
619 | x86_pmu.pebs_constraints = intel_nehalem_pebs_events; | ||
620 | break; | ||
621 | |||
622 | default: | ||
623 | printk(KERN_CONT "no PEBS fmt%d%c, ", format, pebs_type); | ||
624 | x86_pmu.pebs = 0; | ||
625 | break; | ||
626 | } | ||
627 | } | ||
628 | } | ||
629 | |||
630 | #else /* CONFIG_CPU_SUP_INTEL */ | ||
631 | |||
632 | static int reserve_ds_buffers(void) | ||
633 | { | ||
634 | return 0; | ||
635 | } | ||
636 | |||
637 | static void release_ds_buffers(void) | ||
638 | { | ||
639 | } | ||
640 | |||
641 | #endif /* CONFIG_CPU_SUP_INTEL */ | ||
diff --git a/arch/x86/kernel/cpu/perf_event_intel_lbr.c b/arch/x86/kernel/cpu/perf_event_intel_lbr.c new file mode 100644 index 000000000000..d202c1bece1a --- /dev/null +++ b/arch/x86/kernel/cpu/perf_event_intel_lbr.c | |||
@@ -0,0 +1,218 @@ | |||
1 | #ifdef CONFIG_CPU_SUP_INTEL | ||
2 | |||
3 | enum { | ||
4 | LBR_FORMAT_32 = 0x00, | ||
5 | LBR_FORMAT_LIP = 0x01, | ||
6 | LBR_FORMAT_EIP = 0x02, | ||
7 | LBR_FORMAT_EIP_FLAGS = 0x03, | ||
8 | }; | ||
9 | |||
10 | /* | ||
11 | * We only support LBR implementations that have FREEZE_LBRS_ON_PMI | ||
12 | * otherwise it becomes near impossible to get a reliable stack. | ||
13 | */ | ||
14 | |||
15 | static void __intel_pmu_lbr_enable(void) | ||
16 | { | ||
17 | u64 debugctl; | ||
18 | |||
19 | rdmsrl(MSR_IA32_DEBUGCTLMSR, debugctl); | ||
20 | debugctl |= (DEBUGCTLMSR_LBR | DEBUGCTLMSR_FREEZE_LBRS_ON_PMI); | ||
21 | wrmsrl(MSR_IA32_DEBUGCTLMSR, debugctl); | ||
22 | } | ||
23 | |||
24 | static void __intel_pmu_lbr_disable(void) | ||
25 | { | ||
26 | u64 debugctl; | ||
27 | |||
28 | rdmsrl(MSR_IA32_DEBUGCTLMSR, debugctl); | ||
29 | debugctl &= ~(DEBUGCTLMSR_LBR | DEBUGCTLMSR_FREEZE_LBRS_ON_PMI); | ||
30 | wrmsrl(MSR_IA32_DEBUGCTLMSR, debugctl); | ||
31 | } | ||
32 | |||
33 | static void intel_pmu_lbr_reset_32(void) | ||
34 | { | ||
35 | int i; | ||
36 | |||
37 | for (i = 0; i < x86_pmu.lbr_nr; i++) | ||
38 | wrmsrl(x86_pmu.lbr_from + i, 0); | ||
39 | } | ||
40 | |||
41 | static void intel_pmu_lbr_reset_64(void) | ||
42 | { | ||
43 | int i; | ||
44 | |||
45 | for (i = 0; i < x86_pmu.lbr_nr; i++) { | ||
46 | wrmsrl(x86_pmu.lbr_from + i, 0); | ||
47 | wrmsrl(x86_pmu.lbr_to + i, 0); | ||
48 | } | ||
49 | } | ||
50 | |||
51 | static void intel_pmu_lbr_reset(void) | ||
52 | { | ||
53 | if (!x86_pmu.lbr_nr) | ||
54 | return; | ||
55 | |||
56 | if (x86_pmu.intel_cap.lbr_format == LBR_FORMAT_32) | ||
57 | intel_pmu_lbr_reset_32(); | ||
58 | else | ||
59 | intel_pmu_lbr_reset_64(); | ||
60 | } | ||
61 | |||
62 | static void intel_pmu_lbr_enable(struct perf_event *event) | ||
63 | { | ||
64 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
65 | |||
66 | if (!x86_pmu.lbr_nr) | ||
67 | return; | ||
68 | |||
69 | WARN_ON_ONCE(cpuc->enabled); | ||
70 | |||
71 | /* | ||
72 | * Reset the LBR stack if we changed task context to | ||
73 | * avoid data leaks. | ||
74 | */ | ||
75 | |||
76 | if (event->ctx->task && cpuc->lbr_context != event->ctx) { | ||
77 | intel_pmu_lbr_reset(); | ||
78 | cpuc->lbr_context = event->ctx; | ||
79 | } | ||
80 | |||
81 | cpuc->lbr_users++; | ||
82 | } | ||
83 | |||
84 | static void intel_pmu_lbr_disable(struct perf_event *event) | ||
85 | { | ||
86 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
87 | |||
88 | if (!x86_pmu.lbr_nr) | ||
89 | return; | ||
90 | |||
91 | cpuc->lbr_users--; | ||
92 | WARN_ON_ONCE(cpuc->lbr_users < 0); | ||
93 | |||
94 | if (cpuc->enabled && !cpuc->lbr_users) | ||
95 | __intel_pmu_lbr_disable(); | ||
96 | } | ||
97 | |||
98 | static void intel_pmu_lbr_enable_all(void) | ||
99 | { | ||
100 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
101 | |||
102 | if (cpuc->lbr_users) | ||
103 | __intel_pmu_lbr_enable(); | ||
104 | } | ||
105 | |||
106 | static void intel_pmu_lbr_disable_all(void) | ||
107 | { | ||
108 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
109 | |||
110 | if (cpuc->lbr_users) | ||
111 | __intel_pmu_lbr_disable(); | ||
112 | } | ||
113 | |||
114 | static inline u64 intel_pmu_lbr_tos(void) | ||
115 | { | ||
116 | u64 tos; | ||
117 | |||
118 | rdmsrl(x86_pmu.lbr_tos, tos); | ||
119 | |||
120 | return tos; | ||
121 | } | ||
122 | |||
123 | static void intel_pmu_lbr_read_32(struct cpu_hw_events *cpuc) | ||
124 | { | ||
125 | unsigned long mask = x86_pmu.lbr_nr - 1; | ||
126 | u64 tos = intel_pmu_lbr_tos(); | ||
127 | int i; | ||
128 | |||
129 | for (i = 0; i < x86_pmu.lbr_nr; i++) { | ||
130 | unsigned long lbr_idx = (tos - i) & mask; | ||
131 | union { | ||
132 | struct { | ||
133 | u32 from; | ||
134 | u32 to; | ||
135 | }; | ||
136 | u64 lbr; | ||
137 | } msr_lastbranch; | ||
138 | |||
139 | rdmsrl(x86_pmu.lbr_from + lbr_idx, msr_lastbranch.lbr); | ||
140 | |||
141 | cpuc->lbr_entries[i].from = msr_lastbranch.from; | ||
142 | cpuc->lbr_entries[i].to = msr_lastbranch.to; | ||
143 | cpuc->lbr_entries[i].flags = 0; | ||
144 | } | ||
145 | cpuc->lbr_stack.nr = i; | ||
146 | } | ||
147 | |||
148 | #define LBR_FROM_FLAG_MISPRED (1ULL << 63) | ||
149 | |||
150 | /* | ||
151 | * Due to lack of segmentation in Linux the effective address (offset) | ||
152 | * is the same as the linear address, allowing us to merge the LIP and EIP | ||
153 | * LBR formats. | ||
154 | */ | ||
155 | static void intel_pmu_lbr_read_64(struct cpu_hw_events *cpuc) | ||
156 | { | ||
157 | unsigned long mask = x86_pmu.lbr_nr - 1; | ||
158 | int lbr_format = x86_pmu.intel_cap.lbr_format; | ||
159 | u64 tos = intel_pmu_lbr_tos(); | ||
160 | int i; | ||
161 | |||
162 | for (i = 0; i < x86_pmu.lbr_nr; i++) { | ||
163 | unsigned long lbr_idx = (tos - i) & mask; | ||
164 | u64 from, to, flags = 0; | ||
165 | |||
166 | rdmsrl(x86_pmu.lbr_from + lbr_idx, from); | ||
167 | rdmsrl(x86_pmu.lbr_to + lbr_idx, to); | ||
168 | |||
169 | if (lbr_format == LBR_FORMAT_EIP_FLAGS) { | ||
170 | flags = !!(from & LBR_FROM_FLAG_MISPRED); | ||
171 | from = (u64)((((s64)from) << 1) >> 1); | ||
172 | } | ||
173 | |||
174 | cpuc->lbr_entries[i].from = from; | ||
175 | cpuc->lbr_entries[i].to = to; | ||
176 | cpuc->lbr_entries[i].flags = flags; | ||
177 | } | ||
178 | cpuc->lbr_stack.nr = i; | ||
179 | } | ||
180 | |||
181 | static void intel_pmu_lbr_read(void) | ||
182 | { | ||
183 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
184 | |||
185 | if (!cpuc->lbr_users) | ||
186 | return; | ||
187 | |||
188 | if (x86_pmu.intel_cap.lbr_format == LBR_FORMAT_32) | ||
189 | intel_pmu_lbr_read_32(cpuc); | ||
190 | else | ||
191 | intel_pmu_lbr_read_64(cpuc); | ||
192 | } | ||
193 | |||
194 | static void intel_pmu_lbr_init_core(void) | ||
195 | { | ||
196 | x86_pmu.lbr_nr = 4; | ||
197 | x86_pmu.lbr_tos = 0x01c9; | ||
198 | x86_pmu.lbr_from = 0x40; | ||
199 | x86_pmu.lbr_to = 0x60; | ||
200 | } | ||
201 | |||
202 | static void intel_pmu_lbr_init_nhm(void) | ||
203 | { | ||
204 | x86_pmu.lbr_nr = 16; | ||
205 | x86_pmu.lbr_tos = 0x01c9; | ||
206 | x86_pmu.lbr_from = 0x680; | ||
207 | x86_pmu.lbr_to = 0x6c0; | ||
208 | } | ||
209 | |||
210 | static void intel_pmu_lbr_init_atom(void) | ||
211 | { | ||
212 | x86_pmu.lbr_nr = 8; | ||
213 | x86_pmu.lbr_tos = 0x01c9; | ||
214 | x86_pmu.lbr_from = 0x40; | ||
215 | x86_pmu.lbr_to = 0x60; | ||
216 | } | ||
217 | |||
218 | #endif /* CONFIG_CPU_SUP_INTEL */ | ||
diff --git a/arch/x86/kernel/cpu/perf_event_p4.c b/arch/x86/kernel/cpu/perf_event_p4.c new file mode 100644 index 000000000000..424fc8de68e4 --- /dev/null +++ b/arch/x86/kernel/cpu/perf_event_p4.c | |||
@@ -0,0 +1,857 @@ | |||
1 | /* | ||
2 | * Netburst Perfomance Events (P4, old Xeon) | ||
3 | * | ||
4 | * Copyright (C) 2010 Parallels, Inc., Cyrill Gorcunov <gorcunov@openvz.org> | ||
5 | * Copyright (C) 2010 Intel Corporation, Lin Ming <ming.m.lin@intel.com> | ||
6 | * | ||
7 | * For licencing details see kernel-base/COPYING | ||
8 | */ | ||
9 | |||
10 | #ifdef CONFIG_CPU_SUP_INTEL | ||
11 | |||
12 | #include <asm/perf_event_p4.h> | ||
13 | |||
14 | #define P4_CNTR_LIMIT 3 | ||
15 | /* | ||
16 | * array indices: 0,1 - HT threads, used with HT enabled cpu | ||
17 | */ | ||
18 | struct p4_event_bind { | ||
19 | unsigned int opcode; /* Event code and ESCR selector */ | ||
20 | unsigned int escr_msr[2]; /* ESCR MSR for this event */ | ||
21 | char cntr[2][P4_CNTR_LIMIT]; /* counter index (offset), -1 on abscence */ | ||
22 | }; | ||
23 | |||
24 | struct p4_cache_event_bind { | ||
25 | unsigned int metric_pebs; | ||
26 | unsigned int metric_vert; | ||
27 | }; | ||
28 | |||
29 | #define P4_GEN_CACHE_EVENT_BIND(name) \ | ||
30 | [P4_CACHE__##name] = { \ | ||
31 | .metric_pebs = P4_PEBS__##name, \ | ||
32 | .metric_vert = P4_VERT__##name, \ | ||
33 | } | ||
34 | |||
35 | static struct p4_cache_event_bind p4_cache_event_bind_map[] = { | ||
36 | P4_GEN_CACHE_EVENT_BIND(1stl_cache_load_miss_retired), | ||
37 | P4_GEN_CACHE_EVENT_BIND(2ndl_cache_load_miss_retired), | ||
38 | P4_GEN_CACHE_EVENT_BIND(dtlb_load_miss_retired), | ||
39 | P4_GEN_CACHE_EVENT_BIND(dtlb_store_miss_retired), | ||
40 | }; | ||
41 | |||
42 | /* | ||
43 | * Note that we don't use CCCR1 here, there is an | ||
44 | * exception for P4_BSQ_ALLOCATION but we just have | ||
45 | * no workaround | ||
46 | * | ||
47 | * consider this binding as resources which particular | ||
48 | * event may borrow, it doesn't contain EventMask, | ||
49 | * Tags and friends -- they are left to a caller | ||
50 | */ | ||
51 | static struct p4_event_bind p4_event_bind_map[] = { | ||
52 | [P4_EVENT_TC_DELIVER_MODE] = { | ||
53 | .opcode = P4_OPCODE(P4_EVENT_TC_DELIVER_MODE), | ||
54 | .escr_msr = { MSR_P4_TC_ESCR0, MSR_P4_TC_ESCR1 }, | ||
55 | .cntr = { {4, 5, -1}, {6, 7, -1} }, | ||
56 | }, | ||
57 | [P4_EVENT_BPU_FETCH_REQUEST] = { | ||
58 | .opcode = P4_OPCODE(P4_EVENT_BPU_FETCH_REQUEST), | ||
59 | .escr_msr = { MSR_P4_BPU_ESCR0, MSR_P4_BPU_ESCR1 }, | ||
60 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
61 | }, | ||
62 | [P4_EVENT_ITLB_REFERENCE] = { | ||
63 | .opcode = P4_OPCODE(P4_EVENT_ITLB_REFERENCE), | ||
64 | .escr_msr = { MSR_P4_ITLB_ESCR0, MSR_P4_ITLB_ESCR1 }, | ||
65 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
66 | }, | ||
67 | [P4_EVENT_MEMORY_CANCEL] = { | ||
68 | .opcode = P4_OPCODE(P4_EVENT_MEMORY_CANCEL), | ||
69 | .escr_msr = { MSR_P4_DAC_ESCR0, MSR_P4_DAC_ESCR1 }, | ||
70 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
71 | }, | ||
72 | [P4_EVENT_MEMORY_COMPLETE] = { | ||
73 | .opcode = P4_OPCODE(P4_EVENT_MEMORY_COMPLETE), | ||
74 | .escr_msr = { MSR_P4_SAAT_ESCR0 , MSR_P4_SAAT_ESCR1 }, | ||
75 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
76 | }, | ||
77 | [P4_EVENT_LOAD_PORT_REPLAY] = { | ||
78 | .opcode = P4_OPCODE(P4_EVENT_LOAD_PORT_REPLAY), | ||
79 | .escr_msr = { MSR_P4_SAAT_ESCR0, MSR_P4_SAAT_ESCR1 }, | ||
80 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
81 | }, | ||
82 | [P4_EVENT_STORE_PORT_REPLAY] = { | ||
83 | .opcode = P4_OPCODE(P4_EVENT_STORE_PORT_REPLAY), | ||
84 | .escr_msr = { MSR_P4_SAAT_ESCR0 , MSR_P4_SAAT_ESCR1 }, | ||
85 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
86 | }, | ||
87 | [P4_EVENT_MOB_LOAD_REPLAY] = { | ||
88 | .opcode = P4_OPCODE(P4_EVENT_MOB_LOAD_REPLAY), | ||
89 | .escr_msr = { MSR_P4_MOB_ESCR0, MSR_P4_MOB_ESCR1 }, | ||
90 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
91 | }, | ||
92 | [P4_EVENT_PAGE_WALK_TYPE] = { | ||
93 | .opcode = P4_OPCODE(P4_EVENT_PAGE_WALK_TYPE), | ||
94 | .escr_msr = { MSR_P4_PMH_ESCR0, MSR_P4_PMH_ESCR1 }, | ||
95 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
96 | }, | ||
97 | [P4_EVENT_BSQ_CACHE_REFERENCE] = { | ||
98 | .opcode = P4_OPCODE(P4_EVENT_BSQ_CACHE_REFERENCE), | ||
99 | .escr_msr = { MSR_P4_BSU_ESCR0, MSR_P4_BSU_ESCR1 }, | ||
100 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
101 | }, | ||
102 | [P4_EVENT_IOQ_ALLOCATION] = { | ||
103 | .opcode = P4_OPCODE(P4_EVENT_IOQ_ALLOCATION), | ||
104 | .escr_msr = { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 }, | ||
105 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
106 | }, | ||
107 | [P4_EVENT_IOQ_ACTIVE_ENTRIES] = { /* shared ESCR */ | ||
108 | .opcode = P4_OPCODE(P4_EVENT_IOQ_ACTIVE_ENTRIES), | ||
109 | .escr_msr = { MSR_P4_FSB_ESCR1, MSR_P4_FSB_ESCR1 }, | ||
110 | .cntr = { {2, -1, -1}, {3, -1, -1} }, | ||
111 | }, | ||
112 | [P4_EVENT_FSB_DATA_ACTIVITY] = { | ||
113 | .opcode = P4_OPCODE(P4_EVENT_FSB_DATA_ACTIVITY), | ||
114 | .escr_msr = { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 }, | ||
115 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
116 | }, | ||
117 | [P4_EVENT_BSQ_ALLOCATION] = { /* shared ESCR, broken CCCR1 */ | ||
118 | .opcode = P4_OPCODE(P4_EVENT_BSQ_ALLOCATION), | ||
119 | .escr_msr = { MSR_P4_BSU_ESCR0, MSR_P4_BSU_ESCR0 }, | ||
120 | .cntr = { {0, -1, -1}, {1, -1, -1} }, | ||
121 | }, | ||
122 | [P4_EVENT_BSQ_ACTIVE_ENTRIES] = { /* shared ESCR */ | ||
123 | .opcode = P4_OPCODE(P4_EVENT_BSQ_ACTIVE_ENTRIES), | ||
124 | .escr_msr = { MSR_P4_BSU_ESCR1 , MSR_P4_BSU_ESCR1 }, | ||
125 | .cntr = { {2, -1, -1}, {3, -1, -1} }, | ||
126 | }, | ||
127 | [P4_EVENT_SSE_INPUT_ASSIST] = { | ||
128 | .opcode = P4_OPCODE(P4_EVENT_SSE_INPUT_ASSIST), | ||
129 | .escr_msr = { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 }, | ||
130 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
131 | }, | ||
132 | [P4_EVENT_PACKED_SP_UOP] = { | ||
133 | .opcode = P4_OPCODE(P4_EVENT_PACKED_SP_UOP), | ||
134 | .escr_msr = { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 }, | ||
135 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
136 | }, | ||
137 | [P4_EVENT_PACKED_DP_UOP] = { | ||
138 | .opcode = P4_OPCODE(P4_EVENT_PACKED_DP_UOP), | ||
139 | .escr_msr = { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 }, | ||
140 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
141 | }, | ||
142 | [P4_EVENT_SCALAR_SP_UOP] = { | ||
143 | .opcode = P4_OPCODE(P4_EVENT_SCALAR_SP_UOP), | ||
144 | .escr_msr = { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 }, | ||
145 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
146 | }, | ||
147 | [P4_EVENT_SCALAR_DP_UOP] = { | ||
148 | .opcode = P4_OPCODE(P4_EVENT_SCALAR_DP_UOP), | ||
149 | .escr_msr = { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 }, | ||
150 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
151 | }, | ||
152 | [P4_EVENT_64BIT_MMX_UOP] = { | ||
153 | .opcode = P4_OPCODE(P4_EVENT_64BIT_MMX_UOP), | ||
154 | .escr_msr = { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 }, | ||
155 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
156 | }, | ||
157 | [P4_EVENT_128BIT_MMX_UOP] = { | ||
158 | .opcode = P4_OPCODE(P4_EVENT_128BIT_MMX_UOP), | ||
159 | .escr_msr = { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 }, | ||
160 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
161 | }, | ||
162 | [P4_EVENT_X87_FP_UOP] = { | ||
163 | .opcode = P4_OPCODE(P4_EVENT_X87_FP_UOP), | ||
164 | .escr_msr = { MSR_P4_FIRM_ESCR0, MSR_P4_FIRM_ESCR1 }, | ||
165 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
166 | }, | ||
167 | [P4_EVENT_TC_MISC] = { | ||
168 | .opcode = P4_OPCODE(P4_EVENT_TC_MISC), | ||
169 | .escr_msr = { MSR_P4_TC_ESCR0, MSR_P4_TC_ESCR1 }, | ||
170 | .cntr = { {4, 5, -1}, {6, 7, -1} }, | ||
171 | }, | ||
172 | [P4_EVENT_GLOBAL_POWER_EVENTS] = { | ||
173 | .opcode = P4_OPCODE(P4_EVENT_GLOBAL_POWER_EVENTS), | ||
174 | .escr_msr = { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 }, | ||
175 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
176 | }, | ||
177 | [P4_EVENT_TC_MS_XFER] = { | ||
178 | .opcode = P4_OPCODE(P4_EVENT_TC_MS_XFER), | ||
179 | .escr_msr = { MSR_P4_MS_ESCR0, MSR_P4_MS_ESCR1 }, | ||
180 | .cntr = { {4, 5, -1}, {6, 7, -1} }, | ||
181 | }, | ||
182 | [P4_EVENT_UOP_QUEUE_WRITES] = { | ||
183 | .opcode = P4_OPCODE(P4_EVENT_UOP_QUEUE_WRITES), | ||
184 | .escr_msr = { MSR_P4_MS_ESCR0, MSR_P4_MS_ESCR1 }, | ||
185 | .cntr = { {4, 5, -1}, {6, 7, -1} }, | ||
186 | }, | ||
187 | [P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE] = { | ||
188 | .opcode = P4_OPCODE(P4_EVENT_RETIRED_MISPRED_BRANCH_TYPE), | ||
189 | .escr_msr = { MSR_P4_TBPU_ESCR0 , MSR_P4_TBPU_ESCR0 }, | ||
190 | .cntr = { {4, 5, -1}, {6, 7, -1} }, | ||
191 | }, | ||
192 | [P4_EVENT_RETIRED_BRANCH_TYPE] = { | ||
193 | .opcode = P4_OPCODE(P4_EVENT_RETIRED_BRANCH_TYPE), | ||
194 | .escr_msr = { MSR_P4_TBPU_ESCR0 , MSR_P4_TBPU_ESCR1 }, | ||
195 | .cntr = { {4, 5, -1}, {6, 7, -1} }, | ||
196 | }, | ||
197 | [P4_EVENT_RESOURCE_STALL] = { | ||
198 | .opcode = P4_OPCODE(P4_EVENT_RESOURCE_STALL), | ||
199 | .escr_msr = { MSR_P4_ALF_ESCR0, MSR_P4_ALF_ESCR1 }, | ||
200 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
201 | }, | ||
202 | [P4_EVENT_WC_BUFFER] = { | ||
203 | .opcode = P4_OPCODE(P4_EVENT_WC_BUFFER), | ||
204 | .escr_msr = { MSR_P4_DAC_ESCR0, MSR_P4_DAC_ESCR1 }, | ||
205 | .cntr = { {8, 9, -1}, {10, 11, -1} }, | ||
206 | }, | ||
207 | [P4_EVENT_B2B_CYCLES] = { | ||
208 | .opcode = P4_OPCODE(P4_EVENT_B2B_CYCLES), | ||
209 | .escr_msr = { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 }, | ||
210 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
211 | }, | ||
212 | [P4_EVENT_BNR] = { | ||
213 | .opcode = P4_OPCODE(P4_EVENT_BNR), | ||
214 | .escr_msr = { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 }, | ||
215 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
216 | }, | ||
217 | [P4_EVENT_SNOOP] = { | ||
218 | .opcode = P4_OPCODE(P4_EVENT_SNOOP), | ||
219 | .escr_msr = { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 }, | ||
220 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
221 | }, | ||
222 | [P4_EVENT_RESPONSE] = { | ||
223 | .opcode = P4_OPCODE(P4_EVENT_RESPONSE), | ||
224 | .escr_msr = { MSR_P4_FSB_ESCR0, MSR_P4_FSB_ESCR1 }, | ||
225 | .cntr = { {0, -1, -1}, {2, -1, -1} }, | ||
226 | }, | ||
227 | [P4_EVENT_FRONT_END_EVENT] = { | ||
228 | .opcode = P4_OPCODE(P4_EVENT_FRONT_END_EVENT), | ||
229 | .escr_msr = { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 }, | ||
230 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
231 | }, | ||
232 | [P4_EVENT_EXECUTION_EVENT] = { | ||
233 | .opcode = P4_OPCODE(P4_EVENT_EXECUTION_EVENT), | ||
234 | .escr_msr = { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 }, | ||
235 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
236 | }, | ||
237 | [P4_EVENT_REPLAY_EVENT] = { | ||
238 | .opcode = P4_OPCODE(P4_EVENT_REPLAY_EVENT), | ||
239 | .escr_msr = { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 }, | ||
240 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
241 | }, | ||
242 | [P4_EVENT_INSTR_RETIRED] = { | ||
243 | .opcode = P4_OPCODE(P4_EVENT_INSTR_RETIRED), | ||
244 | .escr_msr = { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 }, | ||
245 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
246 | }, | ||
247 | [P4_EVENT_UOPS_RETIRED] = { | ||
248 | .opcode = P4_OPCODE(P4_EVENT_UOPS_RETIRED), | ||
249 | .escr_msr = { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 }, | ||
250 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
251 | }, | ||
252 | [P4_EVENT_UOP_TYPE] = { | ||
253 | .opcode = P4_OPCODE(P4_EVENT_UOP_TYPE), | ||
254 | .escr_msr = { MSR_P4_RAT_ESCR0, MSR_P4_RAT_ESCR1 }, | ||
255 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
256 | }, | ||
257 | [P4_EVENT_BRANCH_RETIRED] = { | ||
258 | .opcode = P4_OPCODE(P4_EVENT_BRANCH_RETIRED), | ||
259 | .escr_msr = { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 }, | ||
260 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
261 | }, | ||
262 | [P4_EVENT_MISPRED_BRANCH_RETIRED] = { | ||
263 | .opcode = P4_OPCODE(P4_EVENT_MISPRED_BRANCH_RETIRED), | ||
264 | .escr_msr = { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 }, | ||
265 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
266 | }, | ||
267 | [P4_EVENT_X87_ASSIST] = { | ||
268 | .opcode = P4_OPCODE(P4_EVENT_X87_ASSIST), | ||
269 | .escr_msr = { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 }, | ||
270 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
271 | }, | ||
272 | [P4_EVENT_MACHINE_CLEAR] = { | ||
273 | .opcode = P4_OPCODE(P4_EVENT_MACHINE_CLEAR), | ||
274 | .escr_msr = { MSR_P4_CRU_ESCR2, MSR_P4_CRU_ESCR3 }, | ||
275 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
276 | }, | ||
277 | [P4_EVENT_INSTR_COMPLETED] = { | ||
278 | .opcode = P4_OPCODE(P4_EVENT_INSTR_COMPLETED), | ||
279 | .escr_msr = { MSR_P4_CRU_ESCR0, MSR_P4_CRU_ESCR1 }, | ||
280 | .cntr = { {12, 13, 16}, {14, 15, 17} }, | ||
281 | }, | ||
282 | }; | ||
283 | |||
284 | #define P4_GEN_CACHE_EVENT(event, bit, cache_event) \ | ||
285 | p4_config_pack_escr(P4_ESCR_EVENT(event) | \ | ||
286 | P4_ESCR_EMASK_BIT(event, bit)) | \ | ||
287 | p4_config_pack_cccr(cache_event | \ | ||
288 | P4_CCCR_ESEL(P4_OPCODE_ESEL(P4_OPCODE(event)))) | ||
289 | |||
290 | static __initconst const u64 p4_hw_cache_event_ids | ||
291 | [PERF_COUNT_HW_CACHE_MAX] | ||
292 | [PERF_COUNT_HW_CACHE_OP_MAX] | ||
293 | [PERF_COUNT_HW_CACHE_RESULT_MAX] = | ||
294 | { | ||
295 | [ C(L1D ) ] = { | ||
296 | [ C(OP_READ) ] = { | ||
297 | [ C(RESULT_ACCESS) ] = 0x0, | ||
298 | [ C(RESULT_MISS) ] = P4_GEN_CACHE_EVENT(P4_EVENT_REPLAY_EVENT, NBOGUS, | ||
299 | P4_CACHE__1stl_cache_load_miss_retired), | ||
300 | }, | ||
301 | }, | ||
302 | [ C(LL ) ] = { | ||
303 | [ C(OP_READ) ] = { | ||
304 | [ C(RESULT_ACCESS) ] = 0x0, | ||
305 | [ C(RESULT_MISS) ] = P4_GEN_CACHE_EVENT(P4_EVENT_REPLAY_EVENT, NBOGUS, | ||
306 | P4_CACHE__2ndl_cache_load_miss_retired), | ||
307 | }, | ||
308 | }, | ||
309 | [ C(DTLB) ] = { | ||
310 | [ C(OP_READ) ] = { | ||
311 | [ C(RESULT_ACCESS) ] = 0x0, | ||
312 | [ C(RESULT_MISS) ] = P4_GEN_CACHE_EVENT(P4_EVENT_REPLAY_EVENT, NBOGUS, | ||
313 | P4_CACHE__dtlb_load_miss_retired), | ||
314 | }, | ||
315 | [ C(OP_WRITE) ] = { | ||
316 | [ C(RESULT_ACCESS) ] = 0x0, | ||
317 | [ C(RESULT_MISS) ] = P4_GEN_CACHE_EVENT(P4_EVENT_REPLAY_EVENT, NBOGUS, | ||
318 | P4_CACHE__dtlb_store_miss_retired), | ||
319 | }, | ||
320 | }, | ||
321 | [ C(ITLB) ] = { | ||
322 | [ C(OP_READ) ] = { | ||
323 | [ C(RESULT_ACCESS) ] = P4_GEN_CACHE_EVENT(P4_EVENT_ITLB_REFERENCE, HIT, | ||
324 | P4_CACHE__itlb_reference_hit), | ||
325 | [ C(RESULT_MISS) ] = P4_GEN_CACHE_EVENT(P4_EVENT_ITLB_REFERENCE, MISS, | ||
326 | P4_CACHE__itlb_reference_miss), | ||
327 | }, | ||
328 | [ C(OP_WRITE) ] = { | ||
329 | [ C(RESULT_ACCESS) ] = -1, | ||
330 | [ C(RESULT_MISS) ] = -1, | ||
331 | }, | ||
332 | [ C(OP_PREFETCH) ] = { | ||
333 | [ C(RESULT_ACCESS) ] = -1, | ||
334 | [ C(RESULT_MISS) ] = -1, | ||
335 | }, | ||
336 | }, | ||
337 | }; | ||
338 | |||
339 | static u64 p4_general_events[PERF_COUNT_HW_MAX] = { | ||
340 | /* non-halted CPU clocks */ | ||
341 | [PERF_COUNT_HW_CPU_CYCLES] = | ||
342 | p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_GLOBAL_POWER_EVENTS) | | ||
343 | P4_ESCR_EMASK_BIT(P4_EVENT_GLOBAL_POWER_EVENTS, RUNNING)), | ||
344 | |||
345 | /* | ||
346 | * retired instructions | ||
347 | * in a sake of simplicity we don't use the FSB tagging | ||
348 | */ | ||
349 | [PERF_COUNT_HW_INSTRUCTIONS] = | ||
350 | p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_INSTR_RETIRED) | | ||
351 | P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, NBOGUSNTAG) | | ||
352 | P4_ESCR_EMASK_BIT(P4_EVENT_INSTR_RETIRED, BOGUSNTAG)), | ||
353 | |||
354 | /* cache hits */ | ||
355 | [PERF_COUNT_HW_CACHE_REFERENCES] = | ||
356 | p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_BSQ_CACHE_REFERENCE) | | ||
357 | P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITS) | | ||
358 | P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITE) | | ||
359 | P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_HITM) | | ||
360 | P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITS) | | ||
361 | P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITE) | | ||
362 | P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_HITM)), | ||
363 | |||
364 | /* cache misses */ | ||
365 | [PERF_COUNT_HW_CACHE_MISSES] = | ||
366 | p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_BSQ_CACHE_REFERENCE) | | ||
367 | P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_2ndL_MISS) | | ||
368 | P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, RD_3rdL_MISS) | | ||
369 | P4_ESCR_EMASK_BIT(P4_EVENT_BSQ_CACHE_REFERENCE, WR_2ndL_MISS)), | ||
370 | |||
371 | /* branch instructions retired */ | ||
372 | [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = | ||
373 | p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_RETIRED_BRANCH_TYPE) | | ||
374 | P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, CONDITIONAL) | | ||
375 | P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, CALL) | | ||
376 | P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, RETURN) | | ||
377 | P4_ESCR_EMASK_BIT(P4_EVENT_RETIRED_BRANCH_TYPE, INDIRECT)), | ||
378 | |||
379 | /* mispredicted branches retired */ | ||
380 | [PERF_COUNT_HW_BRANCH_MISSES] = | ||
381 | p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_MISPRED_BRANCH_RETIRED) | | ||
382 | P4_ESCR_EMASK_BIT(P4_EVENT_MISPRED_BRANCH_RETIRED, NBOGUS)), | ||
383 | |||
384 | /* bus ready clocks (cpu is driving #DRDY_DRV\#DRDY_OWN): */ | ||
385 | [PERF_COUNT_HW_BUS_CYCLES] = | ||
386 | p4_config_pack_escr(P4_ESCR_EVENT(P4_EVENT_FSB_DATA_ACTIVITY) | | ||
387 | P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_DRV) | | ||
388 | P4_ESCR_EMASK_BIT(P4_EVENT_FSB_DATA_ACTIVITY, DRDY_OWN)) | | ||
389 | p4_config_pack_cccr(P4_CCCR_EDGE | P4_CCCR_COMPARE), | ||
390 | }; | ||
391 | |||
392 | static struct p4_event_bind *p4_config_get_bind(u64 config) | ||
393 | { | ||
394 | unsigned int evnt = p4_config_unpack_event(config); | ||
395 | struct p4_event_bind *bind = NULL; | ||
396 | |||
397 | if (evnt < ARRAY_SIZE(p4_event_bind_map)) | ||
398 | bind = &p4_event_bind_map[evnt]; | ||
399 | |||
400 | return bind; | ||
401 | } | ||
402 | |||
403 | static u64 p4_pmu_event_map(int hw_event) | ||
404 | { | ||
405 | struct p4_event_bind *bind; | ||
406 | unsigned int esel; | ||
407 | u64 config; | ||
408 | |||
409 | config = p4_general_events[hw_event]; | ||
410 | bind = p4_config_get_bind(config); | ||
411 | esel = P4_OPCODE_ESEL(bind->opcode); | ||
412 | config |= p4_config_pack_cccr(P4_CCCR_ESEL(esel)); | ||
413 | |||
414 | return config; | ||
415 | } | ||
416 | |||
417 | static int p4_hw_config(struct perf_event *event) | ||
418 | { | ||
419 | int cpu = get_cpu(); | ||
420 | int rc = 0; | ||
421 | unsigned int evnt; | ||
422 | u32 escr, cccr; | ||
423 | |||
424 | /* | ||
425 | * the reason we use cpu that early is that: if we get scheduled | ||
426 | * first time on the same cpu -- we will not need swap thread | ||
427 | * specific flags in config (and will save some cpu cycles) | ||
428 | */ | ||
429 | |||
430 | cccr = p4_default_cccr_conf(cpu); | ||
431 | escr = p4_default_escr_conf(cpu, event->attr.exclude_kernel, | ||
432 | event->attr.exclude_user); | ||
433 | event->hw.config = p4_config_pack_escr(escr) | | ||
434 | p4_config_pack_cccr(cccr); | ||
435 | |||
436 | if (p4_ht_active() && p4_ht_thread(cpu)) | ||
437 | event->hw.config = p4_set_ht_bit(event->hw.config); | ||
438 | |||
439 | if (event->attr.type == PERF_TYPE_RAW) { | ||
440 | |||
441 | /* user data may have out-of-bound event index */ | ||
442 | evnt = p4_config_unpack_event(event->attr.config); | ||
443 | if (evnt >= ARRAY_SIZE(p4_event_bind_map)) { | ||
444 | rc = -EINVAL; | ||
445 | goto out; | ||
446 | } | ||
447 | |||
448 | /* | ||
449 | * We don't control raw events so it's up to the caller | ||
450 | * to pass sane values (and we don't count the thread number | ||
451 | * on HT machine but allow HT-compatible specifics to be | ||
452 | * passed on) | ||
453 | * | ||
454 | * XXX: HT wide things should check perf_paranoid_cpu() && | ||
455 | * CAP_SYS_ADMIN | ||
456 | */ | ||
457 | event->hw.config |= event->attr.config & | ||
458 | (p4_config_pack_escr(P4_ESCR_MASK_HT) | | ||
459 | p4_config_pack_cccr(P4_CCCR_MASK_HT)); | ||
460 | } | ||
461 | |||
462 | rc = x86_setup_perfctr(event); | ||
463 | out: | ||
464 | put_cpu(); | ||
465 | return rc; | ||
466 | } | ||
467 | |||
468 | static inline void p4_pmu_clear_cccr_ovf(struct hw_perf_event *hwc) | ||
469 | { | ||
470 | unsigned long dummy; | ||
471 | |||
472 | rdmsrl(hwc->config_base + hwc->idx, dummy); | ||
473 | if (dummy & P4_CCCR_OVF) { | ||
474 | (void)checking_wrmsrl(hwc->config_base + hwc->idx, | ||
475 | ((u64)dummy) & ~P4_CCCR_OVF); | ||
476 | } | ||
477 | } | ||
478 | |||
479 | static inline void p4_pmu_disable_event(struct perf_event *event) | ||
480 | { | ||
481 | struct hw_perf_event *hwc = &event->hw; | ||
482 | |||
483 | /* | ||
484 | * If event gets disabled while counter is in overflowed | ||
485 | * state we need to clear P4_CCCR_OVF, otherwise interrupt get | ||
486 | * asserted again and again | ||
487 | */ | ||
488 | (void)checking_wrmsrl(hwc->config_base + hwc->idx, | ||
489 | (u64)(p4_config_unpack_cccr(hwc->config)) & | ||
490 | ~P4_CCCR_ENABLE & ~P4_CCCR_OVF & ~P4_CCCR_RESERVED); | ||
491 | } | ||
492 | |||
493 | static void p4_pmu_disable_all(void) | ||
494 | { | ||
495 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
496 | int idx; | ||
497 | |||
498 | for (idx = 0; idx < x86_pmu.num_counters; idx++) { | ||
499 | struct perf_event *event = cpuc->events[idx]; | ||
500 | if (!test_bit(idx, cpuc->active_mask)) | ||
501 | continue; | ||
502 | p4_pmu_disable_event(event); | ||
503 | } | ||
504 | } | ||
505 | |||
506 | static void p4_pmu_enable_event(struct perf_event *event) | ||
507 | { | ||
508 | struct hw_perf_event *hwc = &event->hw; | ||
509 | int thread = p4_ht_config_thread(hwc->config); | ||
510 | u64 escr_conf = p4_config_unpack_escr(p4_clear_ht_bit(hwc->config)); | ||
511 | unsigned int idx = p4_config_unpack_event(hwc->config); | ||
512 | unsigned int idx_cache = p4_config_unpack_cache_event(hwc->config); | ||
513 | struct p4_event_bind *bind; | ||
514 | struct p4_cache_event_bind *bind_cache; | ||
515 | u64 escr_addr, cccr; | ||
516 | |||
517 | bind = &p4_event_bind_map[idx]; | ||
518 | escr_addr = (u64)bind->escr_msr[thread]; | ||
519 | |||
520 | /* | ||
521 | * - we dont support cascaded counters yet | ||
522 | * - and counter 1 is broken (erratum) | ||
523 | */ | ||
524 | WARN_ON_ONCE(p4_is_event_cascaded(hwc->config)); | ||
525 | WARN_ON_ONCE(hwc->idx == 1); | ||
526 | |||
527 | /* we need a real Event value */ | ||
528 | escr_conf &= ~P4_ESCR_EVENT_MASK; | ||
529 | escr_conf |= P4_ESCR_EVENT(P4_OPCODE_EVNT(bind->opcode)); | ||
530 | |||
531 | cccr = p4_config_unpack_cccr(hwc->config); | ||
532 | |||
533 | /* | ||
534 | * it could be Cache event so that we need to | ||
535 | * set metrics into additional MSRs | ||
536 | */ | ||
537 | BUILD_BUG_ON(P4_CACHE__MAX > P4_CCCR_CACHE_OPS_MASK); | ||
538 | if (idx_cache > P4_CACHE__NONE && | ||
539 | idx_cache < ARRAY_SIZE(p4_cache_event_bind_map)) { | ||
540 | bind_cache = &p4_cache_event_bind_map[idx_cache]; | ||
541 | (void)checking_wrmsrl(MSR_IA32_PEBS_ENABLE, (u64)bind_cache->metric_pebs); | ||
542 | (void)checking_wrmsrl(MSR_P4_PEBS_MATRIX_VERT, (u64)bind_cache->metric_vert); | ||
543 | } | ||
544 | |||
545 | (void)checking_wrmsrl(escr_addr, escr_conf); | ||
546 | (void)checking_wrmsrl(hwc->config_base + hwc->idx, | ||
547 | (cccr & ~P4_CCCR_RESERVED) | P4_CCCR_ENABLE); | ||
548 | } | ||
549 | |||
550 | static void p4_pmu_enable_all(int added) | ||
551 | { | ||
552 | struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); | ||
553 | int idx; | ||
554 | |||
555 | for (idx = 0; idx < x86_pmu.num_counters; idx++) { | ||
556 | struct perf_event *event = cpuc->events[idx]; | ||
557 | if (!test_bit(idx, cpuc->active_mask)) | ||
558 | continue; | ||
559 | p4_pmu_enable_event(event); | ||
560 | } | ||
561 | } | ||
562 | |||
563 | static int p4_pmu_handle_irq(struct pt_regs *regs) | ||
564 | { | ||
565 | struct perf_sample_data data; | ||
566 | struct cpu_hw_events *cpuc; | ||
567 | struct perf_event *event; | ||
568 | struct hw_perf_event *hwc; | ||
569 | int idx, handled = 0; | ||
570 | u64 val; | ||
571 | |||
572 | data.addr = 0; | ||
573 | data.raw = NULL; | ||
574 | |||
575 | cpuc = &__get_cpu_var(cpu_hw_events); | ||
576 | |||
577 | for (idx = 0; idx < x86_pmu.num_counters; idx++) { | ||
578 | |||
579 | if (!test_bit(idx, cpuc->active_mask)) | ||
580 | continue; | ||
581 | |||
582 | event = cpuc->events[idx]; | ||
583 | hwc = &event->hw; | ||
584 | |||
585 | WARN_ON_ONCE(hwc->idx != idx); | ||
586 | |||
587 | /* | ||
588 | * FIXME: Redundant call, actually not needed | ||
589 | * but just to check if we're screwed | ||
590 | */ | ||
591 | p4_pmu_clear_cccr_ovf(hwc); | ||
592 | |||
593 | val = x86_perf_event_update(event); | ||
594 | if (val & (1ULL << (x86_pmu.cntval_bits - 1))) | ||
595 | continue; | ||
596 | |||
597 | /* | ||
598 | * event overflow | ||
599 | */ | ||
600 | handled = 1; | ||
601 | data.period = event->hw.last_period; | ||
602 | |||
603 | if (!x86_perf_event_set_period(event)) | ||
604 | continue; | ||
605 | if (perf_event_overflow(event, 1, &data, regs)) | ||
606 | p4_pmu_disable_event(event); | ||
607 | } | ||
608 | |||
609 | if (handled) { | ||
610 | /* p4 quirk: unmask it again */ | ||
611 | apic_write(APIC_LVTPC, apic_read(APIC_LVTPC) & ~APIC_LVT_MASKED); | ||
612 | inc_irq_stat(apic_perf_irqs); | ||
613 | } | ||
614 | |||
615 | return handled; | ||
616 | } | ||
617 | |||
618 | /* | ||
619 | * swap thread specific fields according to a thread | ||
620 | * we are going to run on | ||
621 | */ | ||
622 | static void p4_pmu_swap_config_ts(struct hw_perf_event *hwc, int cpu) | ||
623 | { | ||
624 | u32 escr, cccr; | ||
625 | |||
626 | /* | ||
627 | * we either lucky and continue on same cpu or no HT support | ||
628 | */ | ||
629 | if (!p4_should_swap_ts(hwc->config, cpu)) | ||
630 | return; | ||
631 | |||
632 | /* | ||
633 | * the event is migrated from an another logical | ||
634 | * cpu, so we need to swap thread specific flags | ||
635 | */ | ||
636 | |||
637 | escr = p4_config_unpack_escr(hwc->config); | ||
638 | cccr = p4_config_unpack_cccr(hwc->config); | ||
639 | |||
640 | if (p4_ht_thread(cpu)) { | ||
641 | cccr &= ~P4_CCCR_OVF_PMI_T0; | ||
642 | cccr |= P4_CCCR_OVF_PMI_T1; | ||
643 | if (escr & P4_ESCR_T0_OS) { | ||
644 | escr &= ~P4_ESCR_T0_OS; | ||
645 | escr |= P4_ESCR_T1_OS; | ||
646 | } | ||
647 | if (escr & P4_ESCR_T0_USR) { | ||
648 | escr &= ~P4_ESCR_T0_USR; | ||
649 | escr |= P4_ESCR_T1_USR; | ||
650 | } | ||
651 | hwc->config = p4_config_pack_escr(escr); | ||
652 | hwc->config |= p4_config_pack_cccr(cccr); | ||
653 | hwc->config |= P4_CONFIG_HT; | ||
654 | } else { | ||
655 | cccr &= ~P4_CCCR_OVF_PMI_T1; | ||
656 | cccr |= P4_CCCR_OVF_PMI_T0; | ||
657 | if (escr & P4_ESCR_T1_OS) { | ||
658 | escr &= ~P4_ESCR_T1_OS; | ||
659 | escr |= P4_ESCR_T0_OS; | ||
660 | } | ||
661 | if (escr & P4_ESCR_T1_USR) { | ||
662 | escr &= ~P4_ESCR_T1_USR; | ||
663 | escr |= P4_ESCR_T0_USR; | ||
664 | } | ||
665 | hwc->config = p4_config_pack_escr(escr); | ||
666 | hwc->config |= p4_config_pack_cccr(cccr); | ||
667 | hwc->config &= ~P4_CONFIG_HT; | ||
668 | } | ||
669 | } | ||
670 | |||
671 | /* | ||
672 | * ESCR address hashing is tricky, ESCRs are not sequential | ||
673 | * in memory but all starts from MSR_P4_BSU_ESCR0 (0x03e0) and | ||
674 | * the metric between any ESCRs is laid in range [0xa0,0xe1] | ||
675 | * | ||
676 | * so we make ~70% filled hashtable | ||
677 | */ | ||
678 | |||
679 | #define P4_ESCR_MSR_BASE 0x000003a0 | ||
680 | #define P4_ESCR_MSR_MAX 0x000003e1 | ||
681 | #define P4_ESCR_MSR_TABLE_SIZE (P4_ESCR_MSR_MAX - P4_ESCR_MSR_BASE + 1) | ||
682 | #define P4_ESCR_MSR_IDX(msr) (msr - P4_ESCR_MSR_BASE) | ||
683 | #define P4_ESCR_MSR_TABLE_ENTRY(msr) [P4_ESCR_MSR_IDX(msr)] = msr | ||
684 | |||
685 | static const unsigned int p4_escr_table[P4_ESCR_MSR_TABLE_SIZE] = { | ||
686 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_ALF_ESCR0), | ||
687 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_ALF_ESCR1), | ||
688 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_BPU_ESCR0), | ||
689 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_BPU_ESCR1), | ||
690 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_BSU_ESCR0), | ||
691 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_BSU_ESCR1), | ||
692 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR0), | ||
693 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR1), | ||
694 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR2), | ||
695 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR3), | ||
696 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR4), | ||
697 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_CRU_ESCR5), | ||
698 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_DAC_ESCR0), | ||
699 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_DAC_ESCR1), | ||
700 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FIRM_ESCR0), | ||
701 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FIRM_ESCR1), | ||
702 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FLAME_ESCR0), | ||
703 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FLAME_ESCR1), | ||
704 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FSB_ESCR0), | ||
705 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_FSB_ESCR1), | ||
706 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IQ_ESCR0), | ||
707 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IQ_ESCR1), | ||
708 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IS_ESCR0), | ||
709 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IS_ESCR1), | ||
710 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_ITLB_ESCR0), | ||
711 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_ITLB_ESCR1), | ||
712 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IX_ESCR0), | ||
713 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_IX_ESCR1), | ||
714 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_MOB_ESCR0), | ||
715 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_MOB_ESCR1), | ||
716 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_MS_ESCR0), | ||
717 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_MS_ESCR1), | ||
718 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_PMH_ESCR0), | ||
719 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_PMH_ESCR1), | ||
720 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_RAT_ESCR0), | ||
721 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_RAT_ESCR1), | ||
722 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_SAAT_ESCR0), | ||
723 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_SAAT_ESCR1), | ||
724 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_SSU_ESCR0), | ||
725 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_SSU_ESCR1), | ||
726 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_TBPU_ESCR0), | ||
727 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_TBPU_ESCR1), | ||
728 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_TC_ESCR0), | ||
729 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_TC_ESCR1), | ||
730 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_U2L_ESCR0), | ||
731 | P4_ESCR_MSR_TABLE_ENTRY(MSR_P4_U2L_ESCR1), | ||
732 | }; | ||
733 | |||
734 | static int p4_get_escr_idx(unsigned int addr) | ||
735 | { | ||
736 | unsigned int idx = P4_ESCR_MSR_IDX(addr); | ||
737 | |||
738 | if (unlikely(idx >= P4_ESCR_MSR_TABLE_SIZE || | ||
739 | !p4_escr_table[idx])) { | ||
740 | WARN_ONCE(1, "P4 PMU: Wrong address passed: %x\n", addr); | ||
741 | return -1; | ||
742 | } | ||
743 | |||
744 | return idx; | ||
745 | } | ||
746 | |||
747 | static int p4_next_cntr(int thread, unsigned long *used_mask, | ||
748 | struct p4_event_bind *bind) | ||
749 | { | ||
750 | int i, j; | ||
751 | |||
752 | for (i = 0; i < P4_CNTR_LIMIT; i++) { | ||
753 | j = bind->cntr[thread][i]; | ||
754 | if (j != -1 && !test_bit(j, used_mask)) | ||
755 | return j; | ||
756 | } | ||
757 | |||
758 | return -1; | ||
759 | } | ||
760 | |||
761 | static int p4_pmu_schedule_events(struct cpu_hw_events *cpuc, int n, int *assign) | ||
762 | { | ||
763 | unsigned long used_mask[BITS_TO_LONGS(X86_PMC_IDX_MAX)]; | ||
764 | unsigned long escr_mask[BITS_TO_LONGS(P4_ESCR_MSR_TABLE_SIZE)]; | ||
765 | int cpu = raw_smp_processor_id(); | ||
766 | struct hw_perf_event *hwc; | ||
767 | struct p4_event_bind *bind; | ||
768 | unsigned int i, thread, num; | ||
769 | int cntr_idx, escr_idx; | ||
770 | |||
771 | bitmap_zero(used_mask, X86_PMC_IDX_MAX); | ||
772 | bitmap_zero(escr_mask, P4_ESCR_MSR_TABLE_SIZE); | ||
773 | |||
774 | for (i = 0, num = n; i < n; i++, num--) { | ||
775 | |||
776 | hwc = &cpuc->event_list[i]->hw; | ||
777 | thread = p4_ht_thread(cpu); | ||
778 | bind = p4_config_get_bind(hwc->config); | ||
779 | escr_idx = p4_get_escr_idx(bind->escr_msr[thread]); | ||
780 | if (unlikely(escr_idx == -1)) | ||
781 | goto done; | ||
782 | |||
783 | if (hwc->idx != -1 && !p4_should_swap_ts(hwc->config, cpu)) { | ||
784 | cntr_idx = hwc->idx; | ||
785 | if (assign) | ||
786 | assign[i] = hwc->idx; | ||
787 | goto reserve; | ||
788 | } | ||
789 | |||
790 | cntr_idx = p4_next_cntr(thread, used_mask, bind); | ||
791 | if (cntr_idx == -1 || test_bit(escr_idx, escr_mask)) | ||
792 | goto done; | ||
793 | |||
794 | p4_pmu_swap_config_ts(hwc, cpu); | ||
795 | if (assign) | ||
796 | assign[i] = cntr_idx; | ||
797 | reserve: | ||
798 | set_bit(cntr_idx, used_mask); | ||
799 | set_bit(escr_idx, escr_mask); | ||
800 | } | ||
801 | |||
802 | done: | ||
803 | return num ? -ENOSPC : 0; | ||
804 | } | ||
805 | |||
806 | static __initconst const struct x86_pmu p4_pmu = { | ||
807 | .name = "Netburst P4/Xeon", | ||
808 | .handle_irq = p4_pmu_handle_irq, | ||
809 | .disable_all = p4_pmu_disable_all, | ||
810 | .enable_all = p4_pmu_enable_all, | ||
811 | .enable = p4_pmu_enable_event, | ||
812 | .disable = p4_pmu_disable_event, | ||
813 | .eventsel = MSR_P4_BPU_CCCR0, | ||
814 | .perfctr = MSR_P4_BPU_PERFCTR0, | ||
815 | .event_map = p4_pmu_event_map, | ||
816 | .max_events = ARRAY_SIZE(p4_general_events), | ||
817 | .get_event_constraints = x86_get_event_constraints, | ||
818 | /* | ||
819 | * IF HT disabled we may need to use all | ||
820 | * ARCH_P4_MAX_CCCR counters simulaneously | ||
821 | * though leave it restricted at moment assuming | ||
822 | * HT is on | ||
823 | */ | ||
824 | .num_counters = ARCH_P4_MAX_CCCR, | ||
825 | .apic = 1, | ||
826 | .cntval_bits = 40, | ||
827 | .cntval_mask = (1ULL << 40) - 1, | ||
828 | .max_period = (1ULL << 39) - 1, | ||
829 | .hw_config = p4_hw_config, | ||
830 | .schedule_events = p4_pmu_schedule_events, | ||
831 | }; | ||
832 | |||
833 | static __init int p4_pmu_init(void) | ||
834 | { | ||
835 | unsigned int low, high; | ||
836 | |||
837 | /* If we get stripped -- indexig fails */ | ||
838 | BUILD_BUG_ON(ARCH_P4_MAX_CCCR > X86_PMC_MAX_GENERIC); | ||
839 | |||
840 | rdmsr(MSR_IA32_MISC_ENABLE, low, high); | ||
841 | if (!(low & (1 << 7))) { | ||
842 | pr_cont("unsupported Netburst CPU model %d ", | ||
843 | boot_cpu_data.x86_model); | ||
844 | return -ENODEV; | ||
845 | } | ||
846 | |||
847 | memcpy(hw_cache_event_ids, p4_hw_cache_event_ids, | ||
848 | sizeof(hw_cache_event_ids)); | ||
849 | |||
850 | pr_cont("Netburst events, "); | ||
851 | |||
852 | x86_pmu = p4_pmu; | ||
853 | |||
854 | return 0; | ||
855 | } | ||
856 | |||
857 | #endif /* CONFIG_CPU_SUP_INTEL */ | ||
diff --git a/arch/x86/kernel/cpu/perf_event_p6.c b/arch/x86/kernel/cpu/perf_event_p6.c index a330485d14da..34ba07be2cda 100644 --- a/arch/x86/kernel/cpu/perf_event_p6.c +++ b/arch/x86/kernel/cpu/perf_event_p6.c | |||
@@ -27,24 +27,6 @@ static u64 p6_pmu_event_map(int hw_event) | |||
27 | */ | 27 | */ |
28 | #define P6_NOP_EVENT 0x0000002EULL | 28 | #define P6_NOP_EVENT 0x0000002EULL |
29 | 29 | ||
30 | static u64 p6_pmu_raw_event(u64 hw_event) | ||
31 | { | ||
32 | #define P6_EVNTSEL_EVENT_MASK 0x000000FFULL | ||
33 | #define P6_EVNTSEL_UNIT_MASK 0x0000FF00ULL | ||
34 | #define P6_EVNTSEL_EDGE_MASK 0x00040000ULL | ||
35 | #define P6_EVNTSEL_INV_MASK 0x00800000ULL | ||
36 | #define P6_EVNTSEL_REG_MASK 0xFF000000ULL | ||
37 | |||
38 | #define P6_EVNTSEL_MASK \ | ||
39 | (P6_EVNTSEL_EVENT_MASK | \ | ||
40 | P6_EVNTSEL_UNIT_MASK | \ | ||
41 | P6_EVNTSEL_EDGE_MASK | \ | ||
42 | P6_EVNTSEL_INV_MASK | \ | ||
43 | P6_EVNTSEL_REG_MASK) | ||
44 | |||
45 | return hw_event & P6_EVNTSEL_MASK; | ||
46 | } | ||
47 | |||
48 | static struct event_constraint p6_event_constraints[] = | 30 | static struct event_constraint p6_event_constraints[] = |
49 | { | 31 | { |
50 | INTEL_EVENT_CONSTRAINT(0xc1, 0x1), /* FLOPS */ | 32 | INTEL_EVENT_CONSTRAINT(0xc1, 0x1), /* FLOPS */ |
@@ -66,7 +48,7 @@ static void p6_pmu_disable_all(void) | |||
66 | wrmsrl(MSR_P6_EVNTSEL0, val); | 48 | wrmsrl(MSR_P6_EVNTSEL0, val); |
67 | } | 49 | } |
68 | 50 | ||
69 | static void p6_pmu_enable_all(void) | 51 | static void p6_pmu_enable_all(int added) |
70 | { | 52 | { |
71 | unsigned long val; | 53 | unsigned long val; |
72 | 54 | ||
@@ -102,22 +84,23 @@ static void p6_pmu_enable_event(struct perf_event *event) | |||
102 | (void)checking_wrmsrl(hwc->config_base + hwc->idx, val); | 84 | (void)checking_wrmsrl(hwc->config_base + hwc->idx, val); |
103 | } | 85 | } |
104 | 86 | ||
105 | static __initconst struct x86_pmu p6_pmu = { | 87 | static __initconst const struct x86_pmu p6_pmu = { |
106 | .name = "p6", | 88 | .name = "p6", |
107 | .handle_irq = x86_pmu_handle_irq, | 89 | .handle_irq = x86_pmu_handle_irq, |
108 | .disable_all = p6_pmu_disable_all, | 90 | .disable_all = p6_pmu_disable_all, |
109 | .enable_all = p6_pmu_enable_all, | 91 | .enable_all = p6_pmu_enable_all, |
110 | .enable = p6_pmu_enable_event, | 92 | .enable = p6_pmu_enable_event, |
111 | .disable = p6_pmu_disable_event, | 93 | .disable = p6_pmu_disable_event, |
94 | .hw_config = x86_pmu_hw_config, | ||
95 | .schedule_events = x86_schedule_events, | ||
112 | .eventsel = MSR_P6_EVNTSEL0, | 96 | .eventsel = MSR_P6_EVNTSEL0, |
113 | .perfctr = MSR_P6_PERFCTR0, | 97 | .perfctr = MSR_P6_PERFCTR0, |
114 | .event_map = p6_pmu_event_map, | 98 | .event_map = p6_pmu_event_map, |
115 | .raw_event = p6_pmu_raw_event, | ||
116 | .max_events = ARRAY_SIZE(p6_perfmon_event_map), | 99 | .max_events = ARRAY_SIZE(p6_perfmon_event_map), |
117 | .apic = 1, | 100 | .apic = 1, |
118 | .max_period = (1ULL << 31) - 1, | 101 | .max_period = (1ULL << 31) - 1, |
119 | .version = 0, | 102 | .version = 0, |
120 | .num_events = 2, | 103 | .num_counters = 2, |
121 | /* | 104 | /* |
122 | * Events have 40 bits implemented. However they are designed such | 105 | * Events have 40 bits implemented. However they are designed such |
123 | * that bits [32-39] are sign extensions of bit 31. As such the | 106 | * that bits [32-39] are sign extensions of bit 31. As such the |
@@ -125,8 +108,8 @@ static __initconst struct x86_pmu p6_pmu = { | |||
125 | * | 108 | * |
126 | * See IA-32 Intel Architecture Software developer manual Vol 3B | 109 | * See IA-32 Intel Architecture Software developer manual Vol 3B |
127 | */ | 110 | */ |
128 | .event_bits = 32, | 111 | .cntval_bits = 32, |
129 | .event_mask = (1ULL << 32) - 1, | 112 | .cntval_mask = (1ULL << 32) - 1, |
130 | .get_event_constraints = x86_get_event_constraints, | 113 | .get_event_constraints = x86_get_event_constraints, |
131 | .event_constraints = p6_event_constraints, | 114 | .event_constraints = p6_event_constraints, |
132 | }; | 115 | }; |
diff --git a/arch/x86/kernel/ds.c b/arch/x86/kernel/ds.c deleted file mode 100644 index 1c47390dd0e5..000000000000 --- a/arch/x86/kernel/ds.c +++ /dev/null | |||
@@ -1,1437 +0,0 @@ | |||
1 | /* | ||
2 | * Debug Store support | ||
3 | * | ||
4 | * This provides a low-level interface to the hardware's Debug Store | ||
5 | * feature that is used for branch trace store (BTS) and | ||
6 | * precise-event based sampling (PEBS). | ||
7 | * | ||
8 | * It manages: | ||
9 | * - DS and BTS hardware configuration | ||
10 | * - buffer overflow handling (to be done) | ||
11 | * - buffer access | ||
12 | * | ||
13 | * It does not do: | ||
14 | * - security checking (is the caller allowed to trace the task) | ||
15 | * - buffer allocation (memory accounting) | ||
16 | * | ||
17 | * | ||
18 | * Copyright (C) 2007-2009 Intel Corporation. | ||
19 | * Markus Metzger <markus.t.metzger@intel.com>, 2007-2009 | ||
20 | */ | ||
21 | |||
22 | #include <linux/kernel.h> | ||
23 | #include <linux/string.h> | ||
24 | #include <linux/errno.h> | ||
25 | #include <linux/sched.h> | ||
26 | #include <linux/slab.h> | ||
27 | #include <linux/mm.h> | ||
28 | #include <linux/trace_clock.h> | ||
29 | |||
30 | #include <asm/ds.h> | ||
31 | |||
32 | #include "ds_selftest.h" | ||
33 | |||
34 | /* | ||
35 | * The configuration for a particular DS hardware implementation: | ||
36 | */ | ||
37 | struct ds_configuration { | ||
38 | /* The name of the configuration: */ | ||
39 | const char *name; | ||
40 | |||
41 | /* The size of pointer-typed fields in DS, BTS, and PEBS: */ | ||
42 | unsigned char sizeof_ptr_field; | ||
43 | |||
44 | /* The size of a BTS/PEBS record in bytes: */ | ||
45 | unsigned char sizeof_rec[2]; | ||
46 | |||
47 | /* The number of pebs counter reset values in the DS structure. */ | ||
48 | unsigned char nr_counter_reset; | ||
49 | |||
50 | /* Control bit-masks indexed by enum ds_feature: */ | ||
51 | unsigned long ctl[dsf_ctl_max]; | ||
52 | }; | ||
53 | static struct ds_configuration ds_cfg __read_mostly; | ||
54 | |||
55 | |||
56 | /* Maximal size of a DS configuration: */ | ||
57 | #define MAX_SIZEOF_DS 0x80 | ||
58 | |||
59 | /* Maximal size of a BTS record: */ | ||
60 | #define MAX_SIZEOF_BTS (3 * 8) | ||
61 | |||
62 | /* BTS and PEBS buffer alignment: */ | ||
63 | #define DS_ALIGNMENT (1 << 3) | ||
64 | |||
65 | /* Number of buffer pointers in DS: */ | ||
66 | #define NUM_DS_PTR_FIELDS 8 | ||
67 | |||
68 | /* Size of a pebs reset value in DS: */ | ||
69 | #define PEBS_RESET_FIELD_SIZE 8 | ||
70 | |||
71 | /* Mask of control bits in the DS MSR register: */ | ||
72 | #define BTS_CONTROL \ | ||
73 | ( ds_cfg.ctl[dsf_bts] | \ | ||
74 | ds_cfg.ctl[dsf_bts_kernel] | \ | ||
75 | ds_cfg.ctl[dsf_bts_user] | \ | ||
76 | ds_cfg.ctl[dsf_bts_overflow] ) | ||
77 | |||
78 | /* | ||
79 | * A BTS or PEBS tracer. | ||
80 | * | ||
81 | * This holds the configuration of the tracer and serves as a handle | ||
82 | * to identify tracers. | ||
83 | */ | ||
84 | struct ds_tracer { | ||
85 | /* The DS context (partially) owned by this tracer. */ | ||
86 | struct ds_context *context; | ||
87 | /* The buffer provided on ds_request() and its size in bytes. */ | ||
88 | void *buffer; | ||
89 | size_t size; | ||
90 | }; | ||
91 | |||
92 | struct bts_tracer { | ||
93 | /* The common DS part: */ | ||
94 | struct ds_tracer ds; | ||
95 | |||
96 | /* The trace including the DS configuration: */ | ||
97 | struct bts_trace trace; | ||
98 | |||
99 | /* Buffer overflow notification function: */ | ||
100 | bts_ovfl_callback_t ovfl; | ||
101 | |||
102 | /* Active flags affecting trace collection. */ | ||
103 | unsigned int flags; | ||
104 | }; | ||
105 | |||
106 | struct pebs_tracer { | ||
107 | /* The common DS part: */ | ||
108 | struct ds_tracer ds; | ||
109 | |||
110 | /* The trace including the DS configuration: */ | ||
111 | struct pebs_trace trace; | ||
112 | |||
113 | /* Buffer overflow notification function: */ | ||
114 | pebs_ovfl_callback_t ovfl; | ||
115 | }; | ||
116 | |||
117 | /* | ||
118 | * Debug Store (DS) save area configuration (see Intel64 and IA32 | ||
119 | * Architectures Software Developer's Manual, section 18.5) | ||
120 | * | ||
121 | * The DS configuration consists of the following fields; different | ||
122 | * architetures vary in the size of those fields. | ||
123 | * | ||
124 | * - double-word aligned base linear address of the BTS buffer | ||
125 | * - write pointer into the BTS buffer | ||
126 | * - end linear address of the BTS buffer (one byte beyond the end of | ||
127 | * the buffer) | ||
128 | * - interrupt pointer into BTS buffer | ||
129 | * (interrupt occurs when write pointer passes interrupt pointer) | ||
130 | * - double-word aligned base linear address of the PEBS buffer | ||
131 | * - write pointer into the PEBS buffer | ||
132 | * - end linear address of the PEBS buffer (one byte beyond the end of | ||
133 | * the buffer) | ||
134 | * - interrupt pointer into PEBS buffer | ||
135 | * (interrupt occurs when write pointer passes interrupt pointer) | ||
136 | * - value to which counter is reset following counter overflow | ||
137 | * | ||
138 | * Later architectures use 64bit pointers throughout, whereas earlier | ||
139 | * architectures use 32bit pointers in 32bit mode. | ||
140 | * | ||
141 | * | ||
142 | * We compute the base address for the first 8 fields based on: | ||
143 | * - the field size stored in the DS configuration | ||
144 | * - the relative field position | ||
145 | * - an offset giving the start of the respective region | ||
146 | * | ||
147 | * This offset is further used to index various arrays holding | ||
148 | * information for BTS and PEBS at the respective index. | ||
149 | * | ||
150 | * On later 32bit processors, we only access the lower 32bit of the | ||
151 | * 64bit pointer fields. The upper halves will be zeroed out. | ||
152 | */ | ||
153 | |||
154 | enum ds_field { | ||
155 | ds_buffer_base = 0, | ||
156 | ds_index, | ||
157 | ds_absolute_maximum, | ||
158 | ds_interrupt_threshold, | ||
159 | }; | ||
160 | |||
161 | enum ds_qualifier { | ||
162 | ds_bts = 0, | ||
163 | ds_pebs | ||
164 | }; | ||
165 | |||
166 | static inline unsigned long | ||
167 | ds_get(const unsigned char *base, enum ds_qualifier qual, enum ds_field field) | ||
168 | { | ||
169 | base += (ds_cfg.sizeof_ptr_field * (field + (4 * qual))); | ||
170 | return *(unsigned long *)base; | ||
171 | } | ||
172 | |||
173 | static inline void | ||
174 | ds_set(unsigned char *base, enum ds_qualifier qual, enum ds_field field, | ||
175 | unsigned long value) | ||
176 | { | ||
177 | base += (ds_cfg.sizeof_ptr_field * (field + (4 * qual))); | ||
178 | (*(unsigned long *)base) = value; | ||
179 | } | ||
180 | |||
181 | |||
182 | /* | ||
183 | * Locking is done only for allocating BTS or PEBS resources. | ||
184 | */ | ||
185 | static DEFINE_SPINLOCK(ds_lock); | ||
186 | |||
187 | /* | ||
188 | * We either support (system-wide) per-cpu or per-thread allocation. | ||
189 | * We distinguish the two based on the task_struct pointer, where a | ||
190 | * NULL pointer indicates per-cpu allocation for the current cpu. | ||
191 | * | ||
192 | * Allocations are use-counted. As soon as resources are allocated, | ||
193 | * further allocations must be of the same type (per-cpu or | ||
194 | * per-thread). We model this by counting allocations (i.e. the number | ||
195 | * of tracers of a certain type) for one type negatively: | ||
196 | * =0 no tracers | ||
197 | * >0 number of per-thread tracers | ||
198 | * <0 number of per-cpu tracers | ||
199 | * | ||
200 | * Tracers essentially gives the number of ds contexts for a certain | ||
201 | * type of allocation. | ||
202 | */ | ||
203 | static atomic_t tracers = ATOMIC_INIT(0); | ||
204 | |||
205 | static inline int get_tracer(struct task_struct *task) | ||
206 | { | ||
207 | int error; | ||
208 | |||
209 | spin_lock_irq(&ds_lock); | ||
210 | |||
211 | if (task) { | ||
212 | error = -EPERM; | ||
213 | if (atomic_read(&tracers) < 0) | ||
214 | goto out; | ||
215 | atomic_inc(&tracers); | ||
216 | } else { | ||
217 | error = -EPERM; | ||
218 | if (atomic_read(&tracers) > 0) | ||
219 | goto out; | ||
220 | atomic_dec(&tracers); | ||
221 | } | ||
222 | |||
223 | error = 0; | ||
224 | out: | ||
225 | spin_unlock_irq(&ds_lock); | ||
226 | return error; | ||
227 | } | ||
228 | |||
229 | static inline void put_tracer(struct task_struct *task) | ||
230 | { | ||
231 | if (task) | ||
232 | atomic_dec(&tracers); | ||
233 | else | ||
234 | atomic_inc(&tracers); | ||
235 | } | ||
236 | |||
237 | /* | ||
238 | * The DS context is either attached to a thread or to a cpu: | ||
239 | * - in the former case, the thread_struct contains a pointer to the | ||
240 | * attached context. | ||
241 | * - in the latter case, we use a static array of per-cpu context | ||
242 | * pointers. | ||
243 | * | ||
244 | * Contexts are use-counted. They are allocated on first access and | ||
245 | * deallocated when the last user puts the context. | ||
246 | */ | ||
247 | struct ds_context { | ||
248 | /* The DS configuration; goes into MSR_IA32_DS_AREA: */ | ||
249 | unsigned char ds[MAX_SIZEOF_DS]; | ||
250 | |||
251 | /* The owner of the BTS and PEBS configuration, respectively: */ | ||
252 | struct bts_tracer *bts_master; | ||
253 | struct pebs_tracer *pebs_master; | ||
254 | |||
255 | /* Use count: */ | ||
256 | unsigned long count; | ||
257 | |||
258 | /* Pointer to the context pointer field: */ | ||
259 | struct ds_context **this; | ||
260 | |||
261 | /* The traced task; NULL for cpu tracing: */ | ||
262 | struct task_struct *task; | ||
263 | |||
264 | /* The traced cpu; only valid if task is NULL: */ | ||
265 | int cpu; | ||
266 | }; | ||
267 | |||
268 | static DEFINE_PER_CPU(struct ds_context *, cpu_ds_context); | ||
269 | |||
270 | |||
271 | static struct ds_context *ds_get_context(struct task_struct *task, int cpu) | ||
272 | { | ||
273 | struct ds_context **p_context = | ||
274 | (task ? &task->thread.ds_ctx : &per_cpu(cpu_ds_context, cpu)); | ||
275 | struct ds_context *context = NULL; | ||
276 | struct ds_context *new_context = NULL; | ||
277 | |||
278 | /* Chances are small that we already have a context. */ | ||
279 | new_context = kzalloc(sizeof(*new_context), GFP_KERNEL); | ||
280 | if (!new_context) | ||
281 | return NULL; | ||
282 | |||
283 | spin_lock_irq(&ds_lock); | ||
284 | |||
285 | context = *p_context; | ||
286 | if (likely(!context)) { | ||
287 | context = new_context; | ||
288 | |||
289 | context->this = p_context; | ||
290 | context->task = task; | ||
291 | context->cpu = cpu; | ||
292 | context->count = 0; | ||
293 | |||
294 | *p_context = context; | ||
295 | } | ||
296 | |||
297 | context->count++; | ||
298 | |||
299 | spin_unlock_irq(&ds_lock); | ||
300 | |||
301 | if (context != new_context) | ||
302 | kfree(new_context); | ||
303 | |||
304 | return context; | ||
305 | } | ||
306 | |||
307 | static void ds_put_context(struct ds_context *context) | ||
308 | { | ||
309 | struct task_struct *task; | ||
310 | unsigned long irq; | ||
311 | |||
312 | if (!context) | ||
313 | return; | ||
314 | |||
315 | spin_lock_irqsave(&ds_lock, irq); | ||
316 | |||
317 | if (--context->count) { | ||
318 | spin_unlock_irqrestore(&ds_lock, irq); | ||
319 | return; | ||
320 | } | ||
321 | |||
322 | *(context->this) = NULL; | ||
323 | |||
324 | task = context->task; | ||
325 | |||
326 | if (task) | ||
327 | clear_tsk_thread_flag(task, TIF_DS_AREA_MSR); | ||
328 | |||
329 | /* | ||
330 | * We leave the (now dangling) pointer to the DS configuration in | ||
331 | * the DS_AREA msr. This is as good or as bad as replacing it with | ||
332 | * NULL - the hardware would crash if we enabled tracing. | ||
333 | * | ||
334 | * This saves us some problems with having to write an msr on a | ||
335 | * different cpu while preventing others from doing the same for the | ||
336 | * next context for that same cpu. | ||
337 | */ | ||
338 | |||
339 | spin_unlock_irqrestore(&ds_lock, irq); | ||
340 | |||
341 | /* The context might still be in use for context switching. */ | ||
342 | if (task && (task != current)) | ||
343 | wait_task_context_switch(task); | ||
344 | |||
345 | kfree(context); | ||
346 | } | ||
347 | |||
348 | static void ds_install_ds_area(struct ds_context *context) | ||
349 | { | ||
350 | unsigned long ds; | ||
351 | |||
352 | ds = (unsigned long)context->ds; | ||
353 | |||
354 | /* | ||
355 | * There is a race between the bts master and the pebs master. | ||
356 | * | ||
357 | * The thread/cpu access is synchronized via get/put_cpu() for | ||
358 | * task tracing and via wrmsr_on_cpu for cpu tracing. | ||
359 | * | ||
360 | * If bts and pebs are collected for the same task or same cpu, | ||
361 | * the same confiuration is written twice. | ||
362 | */ | ||
363 | if (context->task) { | ||
364 | get_cpu(); | ||
365 | if (context->task == current) | ||
366 | wrmsrl(MSR_IA32_DS_AREA, ds); | ||
367 | set_tsk_thread_flag(context->task, TIF_DS_AREA_MSR); | ||
368 | put_cpu(); | ||
369 | } else | ||
370 | wrmsr_on_cpu(context->cpu, MSR_IA32_DS_AREA, | ||
371 | (u32)((u64)ds), (u32)((u64)ds >> 32)); | ||
372 | } | ||
373 | |||
374 | /* | ||
375 | * Call the tracer's callback on a buffer overflow. | ||
376 | * | ||
377 | * context: the ds context | ||
378 | * qual: the buffer type | ||
379 | */ | ||
380 | static void ds_overflow(struct ds_context *context, enum ds_qualifier qual) | ||
381 | { | ||
382 | switch (qual) { | ||
383 | case ds_bts: | ||
384 | if (context->bts_master && | ||
385 | context->bts_master->ovfl) | ||
386 | context->bts_master->ovfl(context->bts_master); | ||
387 | break; | ||
388 | case ds_pebs: | ||
389 | if (context->pebs_master && | ||
390 | context->pebs_master->ovfl) | ||
391 | context->pebs_master->ovfl(context->pebs_master); | ||
392 | break; | ||
393 | } | ||
394 | } | ||
395 | |||
396 | |||
397 | /* | ||
398 | * Write raw data into the BTS or PEBS buffer. | ||
399 | * | ||
400 | * The remainder of any partially written record is zeroed out. | ||
401 | * | ||
402 | * context: the DS context | ||
403 | * qual: the buffer type | ||
404 | * record: the data to write | ||
405 | * size: the size of the data | ||
406 | */ | ||
407 | static int ds_write(struct ds_context *context, enum ds_qualifier qual, | ||
408 | const void *record, size_t size) | ||
409 | { | ||
410 | int bytes_written = 0; | ||
411 | |||
412 | if (!record) | ||
413 | return -EINVAL; | ||
414 | |||
415 | while (size) { | ||
416 | unsigned long base, index, end, write_end, int_th; | ||
417 | unsigned long write_size, adj_write_size; | ||
418 | |||
419 | /* | ||
420 | * Write as much as possible without producing an | ||
421 | * overflow interrupt. | ||
422 | * | ||
423 | * Interrupt_threshold must either be | ||
424 | * - bigger than absolute_maximum or | ||
425 | * - point to a record between buffer_base and absolute_maximum | ||
426 | * | ||
427 | * Index points to a valid record. | ||
428 | */ | ||
429 | base = ds_get(context->ds, qual, ds_buffer_base); | ||
430 | index = ds_get(context->ds, qual, ds_index); | ||
431 | end = ds_get(context->ds, qual, ds_absolute_maximum); | ||
432 | int_th = ds_get(context->ds, qual, ds_interrupt_threshold); | ||
433 | |||
434 | write_end = min(end, int_th); | ||
435 | |||
436 | /* | ||
437 | * If we are already beyond the interrupt threshold, | ||
438 | * we fill the entire buffer. | ||
439 | */ | ||
440 | if (write_end <= index) | ||
441 | write_end = end; | ||
442 | |||
443 | if (write_end <= index) | ||
444 | break; | ||
445 | |||
446 | write_size = min((unsigned long) size, write_end - index); | ||
447 | memcpy((void *)index, record, write_size); | ||
448 | |||
449 | record = (const char *)record + write_size; | ||
450 | size -= write_size; | ||
451 | bytes_written += write_size; | ||
452 | |||
453 | adj_write_size = write_size / ds_cfg.sizeof_rec[qual]; | ||
454 | adj_write_size *= ds_cfg.sizeof_rec[qual]; | ||
455 | |||
456 | /* Zero out trailing bytes. */ | ||
457 | memset((char *)index + write_size, 0, | ||
458 | adj_write_size - write_size); | ||
459 | index += adj_write_size; | ||
460 | |||
461 | if (index >= end) | ||
462 | index = base; | ||
463 | ds_set(context->ds, qual, ds_index, index); | ||
464 | |||
465 | if (index >= int_th) | ||
466 | ds_overflow(context, qual); | ||
467 | } | ||
468 | |||
469 | return bytes_written; | ||
470 | } | ||
471 | |||
472 | |||
473 | /* | ||
474 | * Branch Trace Store (BTS) uses the following format. Different | ||
475 | * architectures vary in the size of those fields. | ||
476 | * - source linear address | ||
477 | * - destination linear address | ||
478 | * - flags | ||
479 | * | ||
480 | * Later architectures use 64bit pointers throughout, whereas earlier | ||
481 | * architectures use 32bit pointers in 32bit mode. | ||
482 | * | ||
483 | * We compute the base address for the fields based on: | ||
484 | * - the field size stored in the DS configuration | ||
485 | * - the relative field position | ||
486 | * | ||
487 | * In order to store additional information in the BTS buffer, we use | ||
488 | * a special source address to indicate that the record requires | ||
489 | * special interpretation. | ||
490 | * | ||
491 | * Netburst indicated via a bit in the flags field whether the branch | ||
492 | * was predicted; this is ignored. | ||
493 | * | ||
494 | * We use two levels of abstraction: | ||
495 | * - the raw data level defined here | ||
496 | * - an arch-independent level defined in ds.h | ||
497 | */ | ||
498 | |||
499 | enum bts_field { | ||
500 | bts_from, | ||
501 | bts_to, | ||
502 | bts_flags, | ||
503 | |||
504 | bts_qual = bts_from, | ||
505 | bts_clock = bts_to, | ||
506 | bts_pid = bts_flags, | ||
507 | |||
508 | bts_qual_mask = (bts_qual_max - 1), | ||
509 | bts_escape = ((unsigned long)-1 & ~bts_qual_mask) | ||
510 | }; | ||
511 | |||
512 | static inline unsigned long bts_get(const char *base, unsigned long field) | ||
513 | { | ||
514 | base += (ds_cfg.sizeof_ptr_field * field); | ||
515 | return *(unsigned long *)base; | ||
516 | } | ||
517 | |||
518 | static inline void bts_set(char *base, unsigned long field, unsigned long val) | ||
519 | { | ||
520 | base += (ds_cfg.sizeof_ptr_field * field); | ||
521 | (*(unsigned long *)base) = val; | ||
522 | } | ||
523 | |||
524 | |||
525 | /* | ||
526 | * The raw BTS data is architecture dependent. | ||
527 | * | ||
528 | * For higher-level users, we give an arch-independent view. | ||
529 | * - ds.h defines struct bts_struct | ||
530 | * - bts_read translates one raw bts record into a bts_struct | ||
531 | * - bts_write translates one bts_struct into the raw format and | ||
532 | * writes it into the top of the parameter tracer's buffer. | ||
533 | * | ||
534 | * return: bytes read/written on success; -Eerrno, otherwise | ||
535 | */ | ||
536 | static int | ||
537 | bts_read(struct bts_tracer *tracer, const void *at, struct bts_struct *out) | ||
538 | { | ||
539 | if (!tracer) | ||
540 | return -EINVAL; | ||
541 | |||
542 | if (at < tracer->trace.ds.begin) | ||
543 | return -EINVAL; | ||
544 | |||
545 | if (tracer->trace.ds.end < (at + tracer->trace.ds.size)) | ||
546 | return -EINVAL; | ||
547 | |||
548 | memset(out, 0, sizeof(*out)); | ||
549 | if ((bts_get(at, bts_qual) & ~bts_qual_mask) == bts_escape) { | ||
550 | out->qualifier = (bts_get(at, bts_qual) & bts_qual_mask); | ||
551 | out->variant.event.clock = bts_get(at, bts_clock); | ||
552 | out->variant.event.pid = bts_get(at, bts_pid); | ||
553 | } else { | ||
554 | out->qualifier = bts_branch; | ||
555 | out->variant.lbr.from = bts_get(at, bts_from); | ||
556 | out->variant.lbr.to = bts_get(at, bts_to); | ||
557 | |||
558 | if (!out->variant.lbr.from && !out->variant.lbr.to) | ||
559 | out->qualifier = bts_invalid; | ||
560 | } | ||
561 | |||
562 | return ds_cfg.sizeof_rec[ds_bts]; | ||
563 | } | ||
564 | |||
565 | static int bts_write(struct bts_tracer *tracer, const struct bts_struct *in) | ||
566 | { | ||
567 | unsigned char raw[MAX_SIZEOF_BTS]; | ||
568 | |||
569 | if (!tracer) | ||
570 | return -EINVAL; | ||
571 | |||
572 | if (MAX_SIZEOF_BTS < ds_cfg.sizeof_rec[ds_bts]) | ||
573 | return -EOVERFLOW; | ||
574 | |||
575 | switch (in->qualifier) { | ||
576 | case bts_invalid: | ||
577 | bts_set(raw, bts_from, 0); | ||
578 | bts_set(raw, bts_to, 0); | ||
579 | bts_set(raw, bts_flags, 0); | ||
580 | break; | ||
581 | case bts_branch: | ||
582 | bts_set(raw, bts_from, in->variant.lbr.from); | ||
583 | bts_set(raw, bts_to, in->variant.lbr.to); | ||
584 | bts_set(raw, bts_flags, 0); | ||
585 | break; | ||
586 | case bts_task_arrives: | ||
587 | case bts_task_departs: | ||
588 | bts_set(raw, bts_qual, (bts_escape | in->qualifier)); | ||
589 | bts_set(raw, bts_clock, in->variant.event.clock); | ||
590 | bts_set(raw, bts_pid, in->variant.event.pid); | ||
591 | break; | ||
592 | default: | ||
593 | return -EINVAL; | ||
594 | } | ||
595 | |||
596 | return ds_write(tracer->ds.context, ds_bts, raw, | ||
597 | ds_cfg.sizeof_rec[ds_bts]); | ||
598 | } | ||
599 | |||
600 | |||
601 | static void ds_write_config(struct ds_context *context, | ||
602 | struct ds_trace *cfg, enum ds_qualifier qual) | ||
603 | { | ||
604 | unsigned char *ds = context->ds; | ||
605 | |||
606 | ds_set(ds, qual, ds_buffer_base, (unsigned long)cfg->begin); | ||
607 | ds_set(ds, qual, ds_index, (unsigned long)cfg->top); | ||
608 | ds_set(ds, qual, ds_absolute_maximum, (unsigned long)cfg->end); | ||
609 | ds_set(ds, qual, ds_interrupt_threshold, (unsigned long)cfg->ith); | ||
610 | } | ||
611 | |||
612 | static void ds_read_config(struct ds_context *context, | ||
613 | struct ds_trace *cfg, enum ds_qualifier qual) | ||
614 | { | ||
615 | unsigned char *ds = context->ds; | ||
616 | |||
617 | cfg->begin = (void *)ds_get(ds, qual, ds_buffer_base); | ||
618 | cfg->top = (void *)ds_get(ds, qual, ds_index); | ||
619 | cfg->end = (void *)ds_get(ds, qual, ds_absolute_maximum); | ||
620 | cfg->ith = (void *)ds_get(ds, qual, ds_interrupt_threshold); | ||
621 | } | ||
622 | |||
623 | static void ds_init_ds_trace(struct ds_trace *trace, enum ds_qualifier qual, | ||
624 | void *base, size_t size, size_t ith, | ||
625 | unsigned int flags) { | ||
626 | unsigned long buffer, adj; | ||
627 | |||
628 | /* | ||
629 | * Adjust the buffer address and size to meet alignment | ||
630 | * constraints: | ||
631 | * - buffer is double-word aligned | ||
632 | * - size is multiple of record size | ||
633 | * | ||
634 | * We checked the size at the very beginning; we have enough | ||
635 | * space to do the adjustment. | ||
636 | */ | ||
637 | buffer = (unsigned long)base; | ||
638 | |||
639 | adj = ALIGN(buffer, DS_ALIGNMENT) - buffer; | ||
640 | buffer += adj; | ||
641 | size -= adj; | ||
642 | |||
643 | trace->n = size / ds_cfg.sizeof_rec[qual]; | ||
644 | trace->size = ds_cfg.sizeof_rec[qual]; | ||
645 | |||
646 | size = (trace->n * trace->size); | ||
647 | |||
648 | trace->begin = (void *)buffer; | ||
649 | trace->top = trace->begin; | ||
650 | trace->end = (void *)(buffer + size); | ||
651 | /* | ||
652 | * The value for 'no threshold' is -1, which will set the | ||
653 | * threshold outside of the buffer, just like we want it. | ||
654 | */ | ||
655 | ith *= ds_cfg.sizeof_rec[qual]; | ||
656 | trace->ith = (void *)(buffer + size - ith); | ||
657 | |||
658 | trace->flags = flags; | ||
659 | } | ||
660 | |||
661 | |||
662 | static int ds_request(struct ds_tracer *tracer, struct ds_trace *trace, | ||
663 | enum ds_qualifier qual, struct task_struct *task, | ||
664 | int cpu, void *base, size_t size, size_t th) | ||
665 | { | ||
666 | struct ds_context *context; | ||
667 | int error; | ||
668 | size_t req_size; | ||
669 | |||
670 | error = -EOPNOTSUPP; | ||
671 | if (!ds_cfg.sizeof_rec[qual]) | ||
672 | goto out; | ||
673 | |||
674 | error = -EINVAL; | ||
675 | if (!base) | ||
676 | goto out; | ||
677 | |||
678 | req_size = ds_cfg.sizeof_rec[qual]; | ||
679 | /* We might need space for alignment adjustments. */ | ||
680 | if (!IS_ALIGNED((unsigned long)base, DS_ALIGNMENT)) | ||
681 | req_size += DS_ALIGNMENT; | ||
682 | |||
683 | error = -EINVAL; | ||
684 | if (size < req_size) | ||
685 | goto out; | ||
686 | |||
687 | if (th != (size_t)-1) { | ||
688 | th *= ds_cfg.sizeof_rec[qual]; | ||
689 | |||
690 | error = -EINVAL; | ||
691 | if (size <= th) | ||
692 | goto out; | ||
693 | } | ||
694 | |||
695 | tracer->buffer = base; | ||
696 | tracer->size = size; | ||
697 | |||
698 | error = -ENOMEM; | ||
699 | context = ds_get_context(task, cpu); | ||
700 | if (!context) | ||
701 | goto out; | ||
702 | tracer->context = context; | ||
703 | |||
704 | /* | ||
705 | * Defer any tracer-specific initialization work for the context until | ||
706 | * context ownership has been clarified. | ||
707 | */ | ||
708 | |||
709 | error = 0; | ||
710 | out: | ||
711 | return error; | ||
712 | } | ||
713 | |||
714 | static struct bts_tracer *ds_request_bts(struct task_struct *task, int cpu, | ||
715 | void *base, size_t size, | ||
716 | bts_ovfl_callback_t ovfl, size_t th, | ||
717 | unsigned int flags) | ||
718 | { | ||
719 | struct bts_tracer *tracer; | ||
720 | int error; | ||
721 | |||
722 | /* Buffer overflow notification is not yet implemented. */ | ||
723 | error = -EOPNOTSUPP; | ||
724 | if (ovfl) | ||
725 | goto out; | ||
726 | |||
727 | error = get_tracer(task); | ||
728 | if (error < 0) | ||
729 | goto out; | ||
730 | |||
731 | error = -ENOMEM; | ||
732 | tracer = kzalloc(sizeof(*tracer), GFP_KERNEL); | ||
733 | if (!tracer) | ||
734 | goto out_put_tracer; | ||
735 | tracer->ovfl = ovfl; | ||
736 | |||
737 | /* Do some more error checking and acquire a tracing context. */ | ||
738 | error = ds_request(&tracer->ds, &tracer->trace.ds, | ||
739 | ds_bts, task, cpu, base, size, th); | ||
740 | if (error < 0) | ||
741 | goto out_tracer; | ||
742 | |||
743 | /* Claim the bts part of the tracing context we acquired above. */ | ||
744 | spin_lock_irq(&ds_lock); | ||
745 | |||
746 | error = -EPERM; | ||
747 | if (tracer->ds.context->bts_master) | ||
748 | goto out_unlock; | ||
749 | tracer->ds.context->bts_master = tracer; | ||
750 | |||
751 | spin_unlock_irq(&ds_lock); | ||
752 | |||
753 | /* | ||
754 | * Now that we own the bts part of the context, let's complete the | ||
755 | * initialization for that part. | ||
756 | */ | ||
757 | ds_init_ds_trace(&tracer->trace.ds, ds_bts, base, size, th, flags); | ||
758 | ds_write_config(tracer->ds.context, &tracer->trace.ds, ds_bts); | ||
759 | ds_install_ds_area(tracer->ds.context); | ||
760 | |||
761 | tracer->trace.read = bts_read; | ||
762 | tracer->trace.write = bts_write; | ||
763 | |||
764 | /* Start tracing. */ | ||
765 | ds_resume_bts(tracer); | ||
766 | |||
767 | return tracer; | ||
768 | |||
769 | out_unlock: | ||
770 | spin_unlock_irq(&ds_lock); | ||
771 | ds_put_context(tracer->ds.context); | ||
772 | out_tracer: | ||
773 | kfree(tracer); | ||
774 | out_put_tracer: | ||
775 | put_tracer(task); | ||
776 | out: | ||
777 | return ERR_PTR(error); | ||
778 | } | ||
779 | |||
780 | struct bts_tracer *ds_request_bts_task(struct task_struct *task, | ||
781 | void *base, size_t size, | ||
782 | bts_ovfl_callback_t ovfl, | ||
783 | size_t th, unsigned int flags) | ||
784 | { | ||
785 | return ds_request_bts(task, 0, base, size, ovfl, th, flags); | ||
786 | } | ||
787 | |||
788 | struct bts_tracer *ds_request_bts_cpu(int cpu, void *base, size_t size, | ||
789 | bts_ovfl_callback_t ovfl, | ||
790 | size_t th, unsigned int flags) | ||
791 | { | ||
792 | return ds_request_bts(NULL, cpu, base, size, ovfl, th, flags); | ||
793 | } | ||
794 | |||
795 | static struct pebs_tracer *ds_request_pebs(struct task_struct *task, int cpu, | ||
796 | void *base, size_t size, | ||
797 | pebs_ovfl_callback_t ovfl, size_t th, | ||
798 | unsigned int flags) | ||
799 | { | ||
800 | struct pebs_tracer *tracer; | ||
801 | int error; | ||
802 | |||
803 | /* Buffer overflow notification is not yet implemented. */ | ||
804 | error = -EOPNOTSUPP; | ||
805 | if (ovfl) | ||
806 | goto out; | ||
807 | |||
808 | error = get_tracer(task); | ||
809 | if (error < 0) | ||
810 | goto out; | ||
811 | |||
812 | error = -ENOMEM; | ||
813 | tracer = kzalloc(sizeof(*tracer), GFP_KERNEL); | ||
814 | if (!tracer) | ||
815 | goto out_put_tracer; | ||
816 | tracer->ovfl = ovfl; | ||
817 | |||
818 | /* Do some more error checking and acquire a tracing context. */ | ||
819 | error = ds_request(&tracer->ds, &tracer->trace.ds, | ||
820 | ds_pebs, task, cpu, base, size, th); | ||
821 | if (error < 0) | ||
822 | goto out_tracer; | ||
823 | |||
824 | /* Claim the pebs part of the tracing context we acquired above. */ | ||
825 | spin_lock_irq(&ds_lock); | ||
826 | |||
827 | error = -EPERM; | ||
828 | if (tracer->ds.context->pebs_master) | ||
829 | goto out_unlock; | ||
830 | tracer->ds.context->pebs_master = tracer; | ||
831 | |||
832 | spin_unlock_irq(&ds_lock); | ||
833 | |||
834 | /* | ||
835 | * Now that we own the pebs part of the context, let's complete the | ||
836 | * initialization for that part. | ||
837 | */ | ||
838 | ds_init_ds_trace(&tracer->trace.ds, ds_pebs, base, size, th, flags); | ||
839 | ds_write_config(tracer->ds.context, &tracer->trace.ds, ds_pebs); | ||
840 | ds_install_ds_area(tracer->ds.context); | ||
841 | |||
842 | /* Start tracing. */ | ||
843 | ds_resume_pebs(tracer); | ||
844 | |||
845 | return tracer; | ||
846 | |||
847 | out_unlock: | ||
848 | spin_unlock_irq(&ds_lock); | ||
849 | ds_put_context(tracer->ds.context); | ||
850 | out_tracer: | ||
851 | kfree(tracer); | ||
852 | out_put_tracer: | ||
853 | put_tracer(task); | ||
854 | out: | ||
855 | return ERR_PTR(error); | ||
856 | } | ||
857 | |||
858 | struct pebs_tracer *ds_request_pebs_task(struct task_struct *task, | ||
859 | void *base, size_t size, | ||
860 | pebs_ovfl_callback_t ovfl, | ||
861 | size_t th, unsigned int flags) | ||
862 | { | ||
863 | return ds_request_pebs(task, 0, base, size, ovfl, th, flags); | ||
864 | } | ||
865 | |||
866 | struct pebs_tracer *ds_request_pebs_cpu(int cpu, void *base, size_t size, | ||
867 | pebs_ovfl_callback_t ovfl, | ||
868 | size_t th, unsigned int flags) | ||
869 | { | ||
870 | return ds_request_pebs(NULL, cpu, base, size, ovfl, th, flags); | ||
871 | } | ||
872 | |||
873 | static void ds_free_bts(struct bts_tracer *tracer) | ||
874 | { | ||
875 | struct task_struct *task; | ||
876 | |||
877 | task = tracer->ds.context->task; | ||
878 | |||
879 | WARN_ON_ONCE(tracer->ds.context->bts_master != tracer); | ||
880 | tracer->ds.context->bts_master = NULL; | ||
881 | |||
882 | /* Make sure tracing stopped and the tracer is not in use. */ | ||
883 | if (task && (task != current)) | ||
884 | wait_task_context_switch(task); | ||
885 | |||
886 | ds_put_context(tracer->ds.context); | ||
887 | put_tracer(task); | ||
888 | |||
889 | kfree(tracer); | ||
890 | } | ||
891 | |||
892 | void ds_release_bts(struct bts_tracer *tracer) | ||
893 | { | ||
894 | might_sleep(); | ||
895 | |||
896 | if (!tracer) | ||
897 | return; | ||
898 | |||
899 | ds_suspend_bts(tracer); | ||
900 | ds_free_bts(tracer); | ||
901 | } | ||
902 | |||
903 | int ds_release_bts_noirq(struct bts_tracer *tracer) | ||
904 | { | ||
905 | struct task_struct *task; | ||
906 | unsigned long irq; | ||
907 | int error; | ||
908 | |||
909 | if (!tracer) | ||
910 | return 0; | ||
911 | |||
912 | task = tracer->ds.context->task; | ||
913 | |||
914 | local_irq_save(irq); | ||
915 | |||
916 | error = -EPERM; | ||
917 | if (!task && | ||
918 | (tracer->ds.context->cpu != smp_processor_id())) | ||
919 | goto out; | ||
920 | |||
921 | error = -EPERM; | ||
922 | if (task && (task != current)) | ||
923 | goto out; | ||
924 | |||
925 | ds_suspend_bts_noirq(tracer); | ||
926 | ds_free_bts(tracer); | ||
927 | |||
928 | error = 0; | ||
929 | out: | ||
930 | local_irq_restore(irq); | ||
931 | return error; | ||
932 | } | ||
933 | |||
934 | static void update_task_debugctlmsr(struct task_struct *task, | ||
935 | unsigned long debugctlmsr) | ||
936 | { | ||
937 | task->thread.debugctlmsr = debugctlmsr; | ||
938 | |||
939 | get_cpu(); | ||
940 | if (task == current) | ||
941 | update_debugctlmsr(debugctlmsr); | ||
942 | put_cpu(); | ||
943 | } | ||
944 | |||
945 | void ds_suspend_bts(struct bts_tracer *tracer) | ||
946 | { | ||
947 | struct task_struct *task; | ||
948 | unsigned long debugctlmsr; | ||
949 | int cpu; | ||
950 | |||
951 | if (!tracer) | ||
952 | return; | ||
953 | |||
954 | tracer->flags = 0; | ||
955 | |||
956 | task = tracer->ds.context->task; | ||
957 | cpu = tracer->ds.context->cpu; | ||
958 | |||
959 | WARN_ON(!task && irqs_disabled()); | ||
960 | |||
961 | debugctlmsr = (task ? | ||
962 | task->thread.debugctlmsr : | ||
963 | get_debugctlmsr_on_cpu(cpu)); | ||
964 | debugctlmsr &= ~BTS_CONTROL; | ||
965 | |||
966 | if (task) | ||
967 | update_task_debugctlmsr(task, debugctlmsr); | ||
968 | else | ||
969 | update_debugctlmsr_on_cpu(cpu, debugctlmsr); | ||
970 | } | ||
971 | |||
972 | int ds_suspend_bts_noirq(struct bts_tracer *tracer) | ||
973 | { | ||
974 | struct task_struct *task; | ||
975 | unsigned long debugctlmsr, irq; | ||
976 | int cpu, error = 0; | ||
977 | |||
978 | if (!tracer) | ||
979 | return 0; | ||
980 | |||
981 | tracer->flags = 0; | ||
982 | |||
983 | task = tracer->ds.context->task; | ||
984 | cpu = tracer->ds.context->cpu; | ||
985 | |||
986 | local_irq_save(irq); | ||
987 | |||
988 | error = -EPERM; | ||
989 | if (!task && (cpu != smp_processor_id())) | ||
990 | goto out; | ||
991 | |||
992 | debugctlmsr = (task ? | ||
993 | task->thread.debugctlmsr : | ||
994 | get_debugctlmsr()); | ||
995 | debugctlmsr &= ~BTS_CONTROL; | ||
996 | |||
997 | if (task) | ||
998 | update_task_debugctlmsr(task, debugctlmsr); | ||
999 | else | ||
1000 | update_debugctlmsr(debugctlmsr); | ||
1001 | |||
1002 | error = 0; | ||
1003 | out: | ||
1004 | local_irq_restore(irq); | ||
1005 | return error; | ||
1006 | } | ||
1007 | |||
1008 | static unsigned long ds_bts_control(struct bts_tracer *tracer) | ||
1009 | { | ||
1010 | unsigned long control; | ||
1011 | |||
1012 | control = ds_cfg.ctl[dsf_bts]; | ||
1013 | if (!(tracer->trace.ds.flags & BTS_KERNEL)) | ||
1014 | control |= ds_cfg.ctl[dsf_bts_kernel]; | ||
1015 | if (!(tracer->trace.ds.flags & BTS_USER)) | ||
1016 | control |= ds_cfg.ctl[dsf_bts_user]; | ||
1017 | |||
1018 | return control; | ||
1019 | } | ||
1020 | |||
1021 | void ds_resume_bts(struct bts_tracer *tracer) | ||
1022 | { | ||
1023 | struct task_struct *task; | ||
1024 | unsigned long debugctlmsr; | ||
1025 | int cpu; | ||
1026 | |||
1027 | if (!tracer) | ||
1028 | return; | ||
1029 | |||
1030 | tracer->flags = tracer->trace.ds.flags; | ||
1031 | |||
1032 | task = tracer->ds.context->task; | ||
1033 | cpu = tracer->ds.context->cpu; | ||
1034 | |||
1035 | WARN_ON(!task && irqs_disabled()); | ||
1036 | |||
1037 | debugctlmsr = (task ? | ||
1038 | task->thread.debugctlmsr : | ||
1039 | get_debugctlmsr_on_cpu(cpu)); | ||
1040 | debugctlmsr |= ds_bts_control(tracer); | ||
1041 | |||
1042 | if (task) | ||
1043 | update_task_debugctlmsr(task, debugctlmsr); | ||
1044 | else | ||
1045 | update_debugctlmsr_on_cpu(cpu, debugctlmsr); | ||
1046 | } | ||
1047 | |||
1048 | int ds_resume_bts_noirq(struct bts_tracer *tracer) | ||
1049 | { | ||
1050 | struct task_struct *task; | ||
1051 | unsigned long debugctlmsr, irq; | ||
1052 | int cpu, error = 0; | ||
1053 | |||
1054 | if (!tracer) | ||
1055 | return 0; | ||
1056 | |||
1057 | tracer->flags = tracer->trace.ds.flags; | ||
1058 | |||
1059 | task = tracer->ds.context->task; | ||
1060 | cpu = tracer->ds.context->cpu; | ||
1061 | |||
1062 | local_irq_save(irq); | ||
1063 | |||
1064 | error = -EPERM; | ||
1065 | if (!task && (cpu != smp_processor_id())) | ||
1066 | goto out; | ||
1067 | |||
1068 | debugctlmsr = (task ? | ||
1069 | task->thread.debugctlmsr : | ||
1070 | get_debugctlmsr()); | ||
1071 | debugctlmsr |= ds_bts_control(tracer); | ||
1072 | |||
1073 | if (task) | ||
1074 | update_task_debugctlmsr(task, debugctlmsr); | ||
1075 | else | ||
1076 | update_debugctlmsr(debugctlmsr); | ||
1077 | |||
1078 | error = 0; | ||
1079 | out: | ||
1080 | local_irq_restore(irq); | ||
1081 | return error; | ||
1082 | } | ||
1083 | |||
1084 | static void ds_free_pebs(struct pebs_tracer *tracer) | ||
1085 | { | ||
1086 | struct task_struct *task; | ||
1087 | |||
1088 | task = tracer->ds.context->task; | ||
1089 | |||
1090 | WARN_ON_ONCE(tracer->ds.context->pebs_master != tracer); | ||
1091 | tracer->ds.context->pebs_master = NULL; | ||
1092 | |||
1093 | ds_put_context(tracer->ds.context); | ||
1094 | put_tracer(task); | ||
1095 | |||
1096 | kfree(tracer); | ||
1097 | } | ||
1098 | |||
1099 | void ds_release_pebs(struct pebs_tracer *tracer) | ||
1100 | { | ||
1101 | might_sleep(); | ||
1102 | |||
1103 | if (!tracer) | ||
1104 | return; | ||
1105 | |||
1106 | ds_suspend_pebs(tracer); | ||
1107 | ds_free_pebs(tracer); | ||
1108 | } | ||
1109 | |||
1110 | int ds_release_pebs_noirq(struct pebs_tracer *tracer) | ||
1111 | { | ||
1112 | struct task_struct *task; | ||
1113 | unsigned long irq; | ||
1114 | int error; | ||
1115 | |||
1116 | if (!tracer) | ||
1117 | return 0; | ||
1118 | |||
1119 | task = tracer->ds.context->task; | ||
1120 | |||
1121 | local_irq_save(irq); | ||
1122 | |||
1123 | error = -EPERM; | ||
1124 | if (!task && | ||
1125 | (tracer->ds.context->cpu != smp_processor_id())) | ||
1126 | goto out; | ||
1127 | |||
1128 | error = -EPERM; | ||
1129 | if (task && (task != current)) | ||
1130 | goto out; | ||
1131 | |||
1132 | ds_suspend_pebs_noirq(tracer); | ||
1133 | ds_free_pebs(tracer); | ||
1134 | |||
1135 | error = 0; | ||
1136 | out: | ||
1137 | local_irq_restore(irq); | ||
1138 | return error; | ||
1139 | } | ||
1140 | |||
1141 | void ds_suspend_pebs(struct pebs_tracer *tracer) | ||
1142 | { | ||
1143 | |||
1144 | } | ||
1145 | |||
1146 | int ds_suspend_pebs_noirq(struct pebs_tracer *tracer) | ||
1147 | { | ||
1148 | return 0; | ||
1149 | } | ||
1150 | |||
1151 | void ds_resume_pebs(struct pebs_tracer *tracer) | ||
1152 | { | ||
1153 | |||
1154 | } | ||
1155 | |||
1156 | int ds_resume_pebs_noirq(struct pebs_tracer *tracer) | ||
1157 | { | ||
1158 | return 0; | ||
1159 | } | ||
1160 | |||
1161 | const struct bts_trace *ds_read_bts(struct bts_tracer *tracer) | ||
1162 | { | ||
1163 | if (!tracer) | ||
1164 | return NULL; | ||
1165 | |||
1166 | ds_read_config(tracer->ds.context, &tracer->trace.ds, ds_bts); | ||
1167 | return &tracer->trace; | ||
1168 | } | ||
1169 | |||
1170 | const struct pebs_trace *ds_read_pebs(struct pebs_tracer *tracer) | ||
1171 | { | ||
1172 | if (!tracer) | ||
1173 | return NULL; | ||
1174 | |||
1175 | ds_read_config(tracer->ds.context, &tracer->trace.ds, ds_pebs); | ||
1176 | |||
1177 | tracer->trace.counters = ds_cfg.nr_counter_reset; | ||
1178 | memcpy(tracer->trace.counter_reset, | ||
1179 | tracer->ds.context->ds + | ||
1180 | (NUM_DS_PTR_FIELDS * ds_cfg.sizeof_ptr_field), | ||
1181 | ds_cfg.nr_counter_reset * PEBS_RESET_FIELD_SIZE); | ||
1182 | |||
1183 | return &tracer->trace; | ||
1184 | } | ||
1185 | |||
1186 | int ds_reset_bts(struct bts_tracer *tracer) | ||
1187 | { | ||
1188 | if (!tracer) | ||
1189 | return -EINVAL; | ||
1190 | |||
1191 | tracer->trace.ds.top = tracer->trace.ds.begin; | ||
1192 | |||
1193 | ds_set(tracer->ds.context->ds, ds_bts, ds_index, | ||
1194 | (unsigned long)tracer->trace.ds.top); | ||
1195 | |||
1196 | return 0; | ||
1197 | } | ||
1198 | |||
1199 | int ds_reset_pebs(struct pebs_tracer *tracer) | ||
1200 | { | ||
1201 | if (!tracer) | ||
1202 | return -EINVAL; | ||
1203 | |||
1204 | tracer->trace.ds.top = tracer->trace.ds.begin; | ||
1205 | |||
1206 | ds_set(tracer->ds.context->ds, ds_pebs, ds_index, | ||
1207 | (unsigned long)tracer->trace.ds.top); | ||
1208 | |||
1209 | return 0; | ||
1210 | } | ||
1211 | |||
1212 | int ds_set_pebs_reset(struct pebs_tracer *tracer, | ||
1213 | unsigned int counter, u64 value) | ||
1214 | { | ||
1215 | if (!tracer) | ||
1216 | return -EINVAL; | ||
1217 | |||
1218 | if (ds_cfg.nr_counter_reset < counter) | ||
1219 | return -EINVAL; | ||
1220 | |||
1221 | *(u64 *)(tracer->ds.context->ds + | ||
1222 | (NUM_DS_PTR_FIELDS * ds_cfg.sizeof_ptr_field) + | ||
1223 | (counter * PEBS_RESET_FIELD_SIZE)) = value; | ||
1224 | |||
1225 | return 0; | ||
1226 | } | ||
1227 | |||
1228 | static const struct ds_configuration ds_cfg_netburst = { | ||
1229 | .name = "Netburst", | ||
1230 | .ctl[dsf_bts] = (1 << 2) | (1 << 3), | ||
1231 | .ctl[dsf_bts_kernel] = (1 << 5), | ||
1232 | .ctl[dsf_bts_user] = (1 << 6), | ||
1233 | .nr_counter_reset = 1, | ||
1234 | }; | ||
1235 | static const struct ds_configuration ds_cfg_pentium_m = { | ||
1236 | .name = "Pentium M", | ||
1237 | .ctl[dsf_bts] = (1 << 6) | (1 << 7), | ||
1238 | .nr_counter_reset = 1, | ||
1239 | }; | ||
1240 | static const struct ds_configuration ds_cfg_core2_atom = { | ||
1241 | .name = "Core 2/Atom", | ||
1242 | .ctl[dsf_bts] = (1 << 6) | (1 << 7), | ||
1243 | .ctl[dsf_bts_kernel] = (1 << 9), | ||
1244 | .ctl[dsf_bts_user] = (1 << 10), | ||
1245 | .nr_counter_reset = 1, | ||
1246 | }; | ||
1247 | static const struct ds_configuration ds_cfg_core_i7 = { | ||
1248 | .name = "Core i7", | ||
1249 | .ctl[dsf_bts] = (1 << 6) | (1 << 7), | ||
1250 | .ctl[dsf_bts_kernel] = (1 << 9), | ||
1251 | .ctl[dsf_bts_user] = (1 << 10), | ||
1252 | .nr_counter_reset = 4, | ||
1253 | }; | ||
1254 | |||
1255 | static void | ||
1256 | ds_configure(const struct ds_configuration *cfg, | ||
1257 | struct cpuinfo_x86 *cpu) | ||
1258 | { | ||
1259 | unsigned long nr_pebs_fields = 0; | ||
1260 | |||
1261 | printk(KERN_INFO "[ds] using %s configuration\n", cfg->name); | ||
1262 | |||
1263 | #ifdef __i386__ | ||
1264 | nr_pebs_fields = 10; | ||
1265 | #else | ||
1266 | nr_pebs_fields = 18; | ||
1267 | #endif | ||
1268 | |||
1269 | /* | ||
1270 | * Starting with version 2, architectural performance | ||
1271 | * monitoring supports a format specifier. | ||
1272 | */ | ||
1273 | if ((cpuid_eax(0xa) & 0xff) > 1) { | ||
1274 | unsigned long perf_capabilities, format; | ||
1275 | |||
1276 | rdmsrl(MSR_IA32_PERF_CAPABILITIES, perf_capabilities); | ||
1277 | |||
1278 | format = (perf_capabilities >> 8) & 0xf; | ||
1279 | |||
1280 | switch (format) { | ||
1281 | case 0: | ||
1282 | nr_pebs_fields = 18; | ||
1283 | break; | ||
1284 | case 1: | ||
1285 | nr_pebs_fields = 22; | ||
1286 | break; | ||
1287 | default: | ||
1288 | printk(KERN_INFO | ||
1289 | "[ds] unknown PEBS format: %lu\n", format); | ||
1290 | nr_pebs_fields = 0; | ||
1291 | break; | ||
1292 | } | ||
1293 | } | ||
1294 | |||
1295 | memset(&ds_cfg, 0, sizeof(ds_cfg)); | ||
1296 | ds_cfg = *cfg; | ||
1297 | |||
1298 | ds_cfg.sizeof_ptr_field = | ||
1299 | (cpu_has(cpu, X86_FEATURE_DTES64) ? 8 : 4); | ||
1300 | |||
1301 | ds_cfg.sizeof_rec[ds_bts] = ds_cfg.sizeof_ptr_field * 3; | ||
1302 | ds_cfg.sizeof_rec[ds_pebs] = ds_cfg.sizeof_ptr_field * nr_pebs_fields; | ||
1303 | |||
1304 | if (!cpu_has(cpu, X86_FEATURE_BTS)) { | ||
1305 | ds_cfg.sizeof_rec[ds_bts] = 0; | ||
1306 | printk(KERN_INFO "[ds] bts not available\n"); | ||
1307 | } | ||
1308 | if (!cpu_has(cpu, X86_FEATURE_PEBS)) { | ||
1309 | ds_cfg.sizeof_rec[ds_pebs] = 0; | ||
1310 | printk(KERN_INFO "[ds] pebs not available\n"); | ||
1311 | } | ||
1312 | |||
1313 | printk(KERN_INFO "[ds] sizes: address: %u bit, ", | ||
1314 | 8 * ds_cfg.sizeof_ptr_field); | ||
1315 | printk("bts/pebs record: %u/%u bytes\n", | ||
1316 | ds_cfg.sizeof_rec[ds_bts], ds_cfg.sizeof_rec[ds_pebs]); | ||
1317 | |||
1318 | WARN_ON_ONCE(MAX_PEBS_COUNTERS < ds_cfg.nr_counter_reset); | ||
1319 | } | ||
1320 | |||
1321 | void __cpuinit ds_init_intel(struct cpuinfo_x86 *c) | ||
1322 | { | ||
1323 | /* Only configure the first cpu. Others are identical. */ | ||
1324 | if (ds_cfg.name) | ||
1325 | return; | ||
1326 | |||
1327 | switch (c->x86) { | ||
1328 | case 0x6: | ||
1329 | switch (c->x86_model) { | ||
1330 | case 0x9: | ||
1331 | case 0xd: /* Pentium M */ | ||
1332 | ds_configure(&ds_cfg_pentium_m, c); | ||
1333 | break; | ||
1334 | case 0xf: | ||
1335 | case 0x17: /* Core2 */ | ||
1336 | case 0x1c: /* Atom */ | ||
1337 | ds_configure(&ds_cfg_core2_atom, c); | ||
1338 | break; | ||
1339 | case 0x1a: /* Core i7 */ | ||
1340 | ds_configure(&ds_cfg_core_i7, c); | ||
1341 | break; | ||
1342 | default: | ||
1343 | /* Sorry, don't know about them. */ | ||
1344 | break; | ||
1345 | } | ||
1346 | break; | ||
1347 | case 0xf: | ||
1348 | switch (c->x86_model) { | ||
1349 | case 0x0: | ||
1350 | case 0x1: | ||
1351 | case 0x2: /* Netburst */ | ||
1352 | ds_configure(&ds_cfg_netburst, c); | ||
1353 | break; | ||
1354 | default: | ||
1355 | /* Sorry, don't know about them. */ | ||
1356 | break; | ||
1357 | } | ||
1358 | break; | ||
1359 | default: | ||
1360 | /* Sorry, don't know about them. */ | ||
1361 | break; | ||
1362 | } | ||
1363 | } | ||
1364 | |||
1365 | static inline void ds_take_timestamp(struct ds_context *context, | ||
1366 | enum bts_qualifier qualifier, | ||
1367 | struct task_struct *task) | ||
1368 | { | ||
1369 | struct bts_tracer *tracer = context->bts_master; | ||
1370 | struct bts_struct ts; | ||
1371 | |||
1372 | /* Prevent compilers from reading the tracer pointer twice. */ | ||
1373 | barrier(); | ||
1374 | |||
1375 | if (!tracer || !(tracer->flags & BTS_TIMESTAMPS)) | ||
1376 | return; | ||
1377 | |||
1378 | memset(&ts, 0, sizeof(ts)); | ||
1379 | ts.qualifier = qualifier; | ||
1380 | ts.variant.event.clock = trace_clock_global(); | ||
1381 | ts.variant.event.pid = task->pid; | ||
1382 | |||
1383 | bts_write(tracer, &ts); | ||
1384 | } | ||
1385 | |||
1386 | /* | ||
1387 | * Change the DS configuration from tracing prev to tracing next. | ||
1388 | */ | ||
1389 | void ds_switch_to(struct task_struct *prev, struct task_struct *next) | ||
1390 | { | ||
1391 | struct ds_context *prev_ctx = prev->thread.ds_ctx; | ||
1392 | struct ds_context *next_ctx = next->thread.ds_ctx; | ||
1393 | unsigned long debugctlmsr = next->thread.debugctlmsr; | ||
1394 | |||
1395 | /* Make sure all data is read before we start. */ | ||
1396 | barrier(); | ||
1397 | |||
1398 | if (prev_ctx) { | ||
1399 | update_debugctlmsr(0); | ||
1400 | |||
1401 | ds_take_timestamp(prev_ctx, bts_task_departs, prev); | ||
1402 | } | ||
1403 | |||
1404 | if (next_ctx) { | ||
1405 | ds_take_timestamp(next_ctx, bts_task_arrives, next); | ||
1406 | |||
1407 | wrmsrl(MSR_IA32_DS_AREA, (unsigned long)next_ctx->ds); | ||
1408 | } | ||
1409 | |||
1410 | update_debugctlmsr(debugctlmsr); | ||
1411 | } | ||
1412 | |||
1413 | static __init int ds_selftest(void) | ||
1414 | { | ||
1415 | if (ds_cfg.sizeof_rec[ds_bts]) { | ||
1416 | int error; | ||
1417 | |||
1418 | error = ds_selftest_bts(); | ||
1419 | if (error) { | ||
1420 | WARN(1, "[ds] selftest failed. disabling bts.\n"); | ||
1421 | ds_cfg.sizeof_rec[ds_bts] = 0; | ||
1422 | } | ||
1423 | } | ||
1424 | |||
1425 | if (ds_cfg.sizeof_rec[ds_pebs]) { | ||
1426 | int error; | ||
1427 | |||
1428 | error = ds_selftest_pebs(); | ||
1429 | if (error) { | ||
1430 | WARN(1, "[ds] selftest failed. disabling pebs.\n"); | ||
1431 | ds_cfg.sizeof_rec[ds_pebs] = 0; | ||
1432 | } | ||
1433 | } | ||
1434 | |||
1435 | return 0; | ||
1436 | } | ||
1437 | device_initcall(ds_selftest); | ||
diff --git a/arch/x86/kernel/ds_selftest.c b/arch/x86/kernel/ds_selftest.c deleted file mode 100644 index 6bc7c199ab99..000000000000 --- a/arch/x86/kernel/ds_selftest.c +++ /dev/null | |||
@@ -1,408 +0,0 @@ | |||
1 | /* | ||
2 | * Debug Store support - selftest | ||
3 | * | ||
4 | * | ||
5 | * Copyright (C) 2009 Intel Corporation. | ||
6 | * Markus Metzger <markus.t.metzger@intel.com>, 2009 | ||
7 | */ | ||
8 | |||
9 | #include "ds_selftest.h" | ||
10 | |||
11 | #include <linux/kernel.h> | ||
12 | #include <linux/string.h> | ||
13 | #include <linux/smp.h> | ||
14 | #include <linux/cpu.h> | ||
15 | |||
16 | #include <asm/ds.h> | ||
17 | |||
18 | |||
19 | #define BUFFER_SIZE 521 /* Intentionally chose an odd size. */ | ||
20 | #define SMALL_BUFFER_SIZE 24 /* A single bts entry. */ | ||
21 | |||
22 | struct ds_selftest_bts_conf { | ||
23 | struct bts_tracer *tracer; | ||
24 | int error; | ||
25 | int (*suspend)(struct bts_tracer *); | ||
26 | int (*resume)(struct bts_tracer *); | ||
27 | }; | ||
28 | |||
29 | static int ds_selftest_bts_consistency(const struct bts_trace *trace) | ||
30 | { | ||
31 | int error = 0; | ||
32 | |||
33 | if (!trace) { | ||
34 | printk(KERN_CONT "failed to access trace..."); | ||
35 | /* Bail out. Other tests are pointless. */ | ||
36 | return -1; | ||
37 | } | ||
38 | |||
39 | if (!trace->read) { | ||
40 | printk(KERN_CONT "bts read not available..."); | ||
41 | error = -1; | ||
42 | } | ||
43 | |||
44 | /* Do some sanity checks on the trace configuration. */ | ||
45 | if (!trace->ds.n) { | ||
46 | printk(KERN_CONT "empty bts buffer..."); | ||
47 | error = -1; | ||
48 | } | ||
49 | if (!trace->ds.size) { | ||
50 | printk(KERN_CONT "bad bts trace setup..."); | ||
51 | error = -1; | ||
52 | } | ||
53 | if (trace->ds.end != | ||
54 | (char *)trace->ds.begin + (trace->ds.n * trace->ds.size)) { | ||
55 | printk(KERN_CONT "bad bts buffer setup..."); | ||
56 | error = -1; | ||
57 | } | ||
58 | /* | ||
59 | * We allow top in [begin; end], since its not clear when the | ||
60 | * overflow adjustment happens: after the increment or before the | ||
61 | * write. | ||
62 | */ | ||
63 | if ((trace->ds.top < trace->ds.begin) || | ||
64 | (trace->ds.end < trace->ds.top)) { | ||
65 | printk(KERN_CONT "bts top out of bounds..."); | ||
66 | error = -1; | ||
67 | } | ||
68 | |||
69 | return error; | ||
70 | } | ||
71 | |||
72 | static int ds_selftest_bts_read(struct bts_tracer *tracer, | ||
73 | const struct bts_trace *trace, | ||
74 | const void *from, const void *to) | ||
75 | { | ||
76 | const unsigned char *at; | ||
77 | |||
78 | /* | ||
79 | * Check a few things which do not belong to this test. | ||
80 | * They should be covered by other tests. | ||
81 | */ | ||
82 | if (!trace) | ||
83 | return -1; | ||
84 | |||
85 | if (!trace->read) | ||
86 | return -1; | ||
87 | |||
88 | if (to < from) | ||
89 | return -1; | ||
90 | |||
91 | if (from < trace->ds.begin) | ||
92 | return -1; | ||
93 | |||
94 | if (trace->ds.end < to) | ||
95 | return -1; | ||
96 | |||
97 | if (!trace->ds.size) | ||
98 | return -1; | ||
99 | |||
100 | /* Now to the test itself. */ | ||
101 | for (at = from; (void *)at < to; at += trace->ds.size) { | ||
102 | struct bts_struct bts; | ||
103 | unsigned long index; | ||
104 | int error; | ||
105 | |||
106 | if (((void *)at - trace->ds.begin) % trace->ds.size) { | ||
107 | printk(KERN_CONT | ||
108 | "read from non-integer index..."); | ||
109 | return -1; | ||
110 | } | ||
111 | index = ((void *)at - trace->ds.begin) / trace->ds.size; | ||
112 | |||
113 | memset(&bts, 0, sizeof(bts)); | ||
114 | error = trace->read(tracer, at, &bts); | ||
115 | if (error < 0) { | ||
116 | printk(KERN_CONT | ||
117 | "error reading bts trace at [%lu] (0x%p)...", | ||
118 | index, at); | ||
119 | return error; | ||
120 | } | ||
121 | |||
122 | switch (bts.qualifier) { | ||
123 | case BTS_BRANCH: | ||
124 | break; | ||
125 | default: | ||
126 | printk(KERN_CONT | ||
127 | "unexpected bts entry %llu at [%lu] (0x%p)...", | ||
128 | bts.qualifier, index, at); | ||
129 | return -1; | ||
130 | } | ||
131 | } | ||
132 | |||
133 | return 0; | ||
134 | } | ||
135 | |||
136 | static void ds_selftest_bts_cpu(void *arg) | ||
137 | { | ||
138 | struct ds_selftest_bts_conf *conf = arg; | ||
139 | const struct bts_trace *trace; | ||
140 | void *top; | ||
141 | |||
142 | if (IS_ERR(conf->tracer)) { | ||
143 | conf->error = PTR_ERR(conf->tracer); | ||
144 | conf->tracer = NULL; | ||
145 | |||
146 | printk(KERN_CONT | ||
147 | "initialization failed (err: %d)...", conf->error); | ||
148 | return; | ||
149 | } | ||
150 | |||
151 | /* We should meanwhile have enough trace. */ | ||
152 | conf->error = conf->suspend(conf->tracer); | ||
153 | if (conf->error < 0) | ||
154 | return; | ||
155 | |||
156 | /* Let's see if we can access the trace. */ | ||
157 | trace = ds_read_bts(conf->tracer); | ||
158 | |||
159 | conf->error = ds_selftest_bts_consistency(trace); | ||
160 | if (conf->error < 0) | ||
161 | return; | ||
162 | |||
163 | /* If everything went well, we should have a few trace entries. */ | ||
164 | if (trace->ds.top == trace->ds.begin) { | ||
165 | /* | ||
166 | * It is possible but highly unlikely that we got a | ||
167 | * buffer overflow and end up at exactly the same | ||
168 | * position we started from. | ||
169 | * Let's issue a warning, but continue. | ||
170 | */ | ||
171 | printk(KERN_CONT "no trace/overflow..."); | ||
172 | } | ||
173 | |||
174 | /* Let's try to read the trace we collected. */ | ||
175 | conf->error = | ||
176 | ds_selftest_bts_read(conf->tracer, trace, | ||
177 | trace->ds.begin, trace->ds.top); | ||
178 | if (conf->error < 0) | ||
179 | return; | ||
180 | |||
181 | /* | ||
182 | * Let's read the trace again. | ||
183 | * Since we suspended tracing, we should get the same result. | ||
184 | */ | ||
185 | top = trace->ds.top; | ||
186 | |||
187 | trace = ds_read_bts(conf->tracer); | ||
188 | conf->error = ds_selftest_bts_consistency(trace); | ||
189 | if (conf->error < 0) | ||
190 | return; | ||
191 | |||
192 | if (top != trace->ds.top) { | ||
193 | printk(KERN_CONT "suspend not working..."); | ||
194 | conf->error = -1; | ||
195 | return; | ||
196 | } | ||
197 | |||
198 | /* Let's collect some more trace - see if resume is working. */ | ||
199 | conf->error = conf->resume(conf->tracer); | ||
200 | if (conf->error < 0) | ||
201 | return; | ||
202 | |||
203 | conf->error = conf->suspend(conf->tracer); | ||
204 | if (conf->error < 0) | ||
205 | return; | ||
206 | |||
207 | trace = ds_read_bts(conf->tracer); | ||
208 | |||
209 | conf->error = ds_selftest_bts_consistency(trace); | ||
210 | if (conf->error < 0) | ||
211 | return; | ||
212 | |||
213 | if (trace->ds.top == top) { | ||
214 | /* | ||
215 | * It is possible but highly unlikely that we got a | ||
216 | * buffer overflow and end up at exactly the same | ||
217 | * position we started from. | ||
218 | * Let's issue a warning and check the full trace. | ||
219 | */ | ||
220 | printk(KERN_CONT | ||
221 | "no resume progress/overflow..."); | ||
222 | |||
223 | conf->error = | ||
224 | ds_selftest_bts_read(conf->tracer, trace, | ||
225 | trace->ds.begin, trace->ds.end); | ||
226 | } else if (trace->ds.top < top) { | ||
227 | /* | ||
228 | * We had a buffer overflow - the entire buffer should | ||
229 | * contain trace records. | ||
230 | */ | ||
231 | conf->error = | ||
232 | ds_selftest_bts_read(conf->tracer, trace, | ||
233 | trace->ds.begin, trace->ds.end); | ||
234 | } else { | ||
235 | /* | ||
236 | * It is quite likely that the buffer did not overflow. | ||
237 | * Let's just check the delta trace. | ||
238 | */ | ||
239 | conf->error = | ||
240 | ds_selftest_bts_read(conf->tracer, trace, top, | ||
241 | trace->ds.top); | ||
242 | } | ||
243 | if (conf->error < 0) | ||
244 | return; | ||
245 | |||
246 | conf->error = 0; | ||
247 | } | ||
248 | |||
249 | static int ds_suspend_bts_wrap(struct bts_tracer *tracer) | ||
250 | { | ||
251 | ds_suspend_bts(tracer); | ||
252 | return 0; | ||
253 | } | ||
254 | |||
255 | static int ds_resume_bts_wrap(struct bts_tracer *tracer) | ||
256 | { | ||
257 | ds_resume_bts(tracer); | ||
258 | return 0; | ||
259 | } | ||
260 | |||
261 | static void ds_release_bts_noirq_wrap(void *tracer) | ||
262 | { | ||
263 | (void)ds_release_bts_noirq(tracer); | ||
264 | } | ||
265 | |||
266 | static int ds_selftest_bts_bad_release_noirq(int cpu, | ||
267 | struct bts_tracer *tracer) | ||
268 | { | ||
269 | int error = -EPERM; | ||
270 | |||
271 | /* Try to release the tracer on the wrong cpu. */ | ||
272 | get_cpu(); | ||
273 | if (cpu != smp_processor_id()) { | ||
274 | error = ds_release_bts_noirq(tracer); | ||
275 | if (error != -EPERM) | ||
276 | printk(KERN_CONT "release on wrong cpu..."); | ||
277 | } | ||
278 | put_cpu(); | ||
279 | |||
280 | return error ? 0 : -1; | ||
281 | } | ||
282 | |||
283 | static int ds_selftest_bts_bad_request_cpu(int cpu, void *buffer) | ||
284 | { | ||
285 | struct bts_tracer *tracer; | ||
286 | int error; | ||
287 | |||
288 | /* Try to request cpu tracing while task tracing is active. */ | ||
289 | tracer = ds_request_bts_cpu(cpu, buffer, BUFFER_SIZE, NULL, | ||
290 | (size_t)-1, BTS_KERNEL); | ||
291 | error = PTR_ERR(tracer); | ||
292 | if (!IS_ERR(tracer)) { | ||
293 | ds_release_bts(tracer); | ||
294 | error = 0; | ||
295 | } | ||
296 | |||
297 | if (error != -EPERM) | ||
298 | printk(KERN_CONT "cpu/task tracing overlap..."); | ||
299 | |||
300 | return error ? 0 : -1; | ||
301 | } | ||
302 | |||
303 | static int ds_selftest_bts_bad_request_task(void *buffer) | ||
304 | { | ||
305 | struct bts_tracer *tracer; | ||
306 | int error; | ||
307 | |||
308 | /* Try to request cpu tracing while task tracing is active. */ | ||
309 | tracer = ds_request_bts_task(current, buffer, BUFFER_SIZE, NULL, | ||
310 | (size_t)-1, BTS_KERNEL); | ||
311 | error = PTR_ERR(tracer); | ||
312 | if (!IS_ERR(tracer)) { | ||
313 | error = 0; | ||
314 | ds_release_bts(tracer); | ||
315 | } | ||
316 | |||
317 | if (error != -EPERM) | ||
318 | printk(KERN_CONT "task/cpu tracing overlap..."); | ||
319 | |||
320 | return error ? 0 : -1; | ||
321 | } | ||
322 | |||
323 | int ds_selftest_bts(void) | ||
324 | { | ||
325 | struct ds_selftest_bts_conf conf; | ||
326 | unsigned char buffer[BUFFER_SIZE], *small_buffer; | ||
327 | unsigned long irq; | ||
328 | int cpu; | ||
329 | |||
330 | printk(KERN_INFO "[ds] bts selftest..."); | ||
331 | conf.error = 0; | ||
332 | |||
333 | small_buffer = (unsigned char *)ALIGN((unsigned long)buffer, 8) + 8; | ||
334 | |||
335 | get_online_cpus(); | ||
336 | for_each_online_cpu(cpu) { | ||
337 | conf.suspend = ds_suspend_bts_wrap; | ||
338 | conf.resume = ds_resume_bts_wrap; | ||
339 | conf.tracer = | ||
340 | ds_request_bts_cpu(cpu, buffer, BUFFER_SIZE, | ||
341 | NULL, (size_t)-1, BTS_KERNEL); | ||
342 | ds_selftest_bts_cpu(&conf); | ||
343 | if (conf.error >= 0) | ||
344 | conf.error = ds_selftest_bts_bad_request_task(buffer); | ||
345 | ds_release_bts(conf.tracer); | ||
346 | if (conf.error < 0) | ||
347 | goto out; | ||
348 | |||
349 | conf.suspend = ds_suspend_bts_noirq; | ||
350 | conf.resume = ds_resume_bts_noirq; | ||
351 | conf.tracer = | ||
352 | ds_request_bts_cpu(cpu, buffer, BUFFER_SIZE, | ||
353 | NULL, (size_t)-1, BTS_KERNEL); | ||
354 | smp_call_function_single(cpu, ds_selftest_bts_cpu, &conf, 1); | ||
355 | if (conf.error >= 0) { | ||
356 | conf.error = | ||
357 | ds_selftest_bts_bad_release_noirq(cpu, | ||
358 | conf.tracer); | ||
359 | /* We must not release the tracer twice. */ | ||
360 | if (conf.error < 0) | ||
361 | conf.tracer = NULL; | ||
362 | } | ||
363 | if (conf.error >= 0) | ||
364 | conf.error = ds_selftest_bts_bad_request_task(buffer); | ||
365 | smp_call_function_single(cpu, ds_release_bts_noirq_wrap, | ||
366 | conf.tracer, 1); | ||
367 | if (conf.error < 0) | ||
368 | goto out; | ||
369 | } | ||
370 | |||
371 | conf.suspend = ds_suspend_bts_wrap; | ||
372 | conf.resume = ds_resume_bts_wrap; | ||
373 | conf.tracer = | ||
374 | ds_request_bts_task(current, buffer, BUFFER_SIZE, | ||
375 | NULL, (size_t)-1, BTS_KERNEL); | ||
376 | ds_selftest_bts_cpu(&conf); | ||
377 | if (conf.error >= 0) | ||
378 | conf.error = ds_selftest_bts_bad_request_cpu(0, buffer); | ||
379 | ds_release_bts(conf.tracer); | ||
380 | if (conf.error < 0) | ||
381 | goto out; | ||
382 | |||
383 | conf.suspend = ds_suspend_bts_noirq; | ||
384 | conf.resume = ds_resume_bts_noirq; | ||
385 | conf.tracer = | ||
386 | ds_request_bts_task(current, small_buffer, SMALL_BUFFER_SIZE, | ||
387 | NULL, (size_t)-1, BTS_KERNEL); | ||
388 | local_irq_save(irq); | ||
389 | ds_selftest_bts_cpu(&conf); | ||
390 | if (conf.error >= 0) | ||
391 | conf.error = ds_selftest_bts_bad_request_cpu(0, buffer); | ||
392 | ds_release_bts_noirq(conf.tracer); | ||
393 | local_irq_restore(irq); | ||
394 | if (conf.error < 0) | ||
395 | goto out; | ||
396 | |||
397 | conf.error = 0; | ||
398 | out: | ||
399 | put_online_cpus(); | ||
400 | printk(KERN_CONT "%s.\n", (conf.error ? "failed" : "passed")); | ||
401 | |||
402 | return conf.error; | ||
403 | } | ||
404 | |||
405 | int ds_selftest_pebs(void) | ||
406 | { | ||
407 | return 0; | ||
408 | } | ||
diff --git a/arch/x86/kernel/ds_selftest.h b/arch/x86/kernel/ds_selftest.h deleted file mode 100644 index 2ba8745c6663..000000000000 --- a/arch/x86/kernel/ds_selftest.h +++ /dev/null | |||
@@ -1,15 +0,0 @@ | |||
1 | /* | ||
2 | * Debug Store support - selftest | ||
3 | * | ||
4 | * | ||
5 | * Copyright (C) 2009 Intel Corporation. | ||
6 | * Markus Metzger <markus.t.metzger@intel.com>, 2009 | ||
7 | */ | ||
8 | |||
9 | #ifdef CONFIG_X86_DS_SELFTEST | ||
10 | extern int ds_selftest_bts(void); | ||
11 | extern int ds_selftest_pebs(void); | ||
12 | #else | ||
13 | static inline int ds_selftest_bts(void) { return 0; } | ||
14 | static inline int ds_selftest_pebs(void) { return 0; } | ||
15 | #endif | ||
diff --git a/arch/x86/kernel/dumpstack.c b/arch/x86/kernel/dumpstack.c index 6d817554780a..c89a386930b7 100644 --- a/arch/x86/kernel/dumpstack.c +++ b/arch/x86/kernel/dumpstack.c | |||
@@ -224,11 +224,6 @@ unsigned __kprobes long oops_begin(void) | |||
224 | int cpu; | 224 | int cpu; |
225 | unsigned long flags; | 225 | unsigned long flags; |
226 | 226 | ||
227 | /* notify the hw-branch tracer so it may disable tracing and | ||
228 | add the last trace to the trace buffer - | ||
229 | the earlier this happens, the more useful the trace. */ | ||
230 | trace_hw_branch_oops(); | ||
231 | |||
232 | oops_enter(); | 227 | oops_enter(); |
233 | 228 | ||
234 | /* racy, but better than risking deadlock. */ | 229 | /* racy, but better than risking deadlock. */ |
diff --git a/arch/x86/kernel/hw_breakpoint.c b/arch/x86/kernel/hw_breakpoint.c index d6cc065f519f..a8f1b803d2fd 100644 --- a/arch/x86/kernel/hw_breakpoint.c +++ b/arch/x86/kernel/hw_breakpoint.c | |||
@@ -189,25 +189,16 @@ static int get_hbp_len(u8 hbp_len) | |||
189 | } | 189 | } |
190 | 190 | ||
191 | /* | 191 | /* |
192 | * Check for virtual address in user space. | ||
193 | */ | ||
194 | int arch_check_va_in_userspace(unsigned long va, u8 hbp_len) | ||
195 | { | ||
196 | unsigned int len; | ||
197 | |||
198 | len = get_hbp_len(hbp_len); | ||
199 | |||
200 | return (va <= TASK_SIZE - len); | ||
201 | } | ||
202 | |||
203 | /* | ||
204 | * Check for virtual address in kernel space. | 192 | * Check for virtual address in kernel space. |
205 | */ | 193 | */ |
206 | static int arch_check_va_in_kernelspace(unsigned long va, u8 hbp_len) | 194 | int arch_check_bp_in_kernelspace(struct perf_event *bp) |
207 | { | 195 | { |
208 | unsigned int len; | 196 | unsigned int len; |
197 | unsigned long va; | ||
198 | struct arch_hw_breakpoint *info = counter_arch_bp(bp); | ||
209 | 199 | ||
210 | len = get_hbp_len(hbp_len); | 200 | va = info->address; |
201 | len = get_hbp_len(info->len); | ||
211 | 202 | ||
212 | return (va >= TASK_SIZE) && ((va + len - 1) >= TASK_SIZE); | 203 | return (va >= TASK_SIZE) && ((va + len - 1) >= TASK_SIZE); |
213 | } | 204 | } |
@@ -300,8 +291,7 @@ static int arch_build_bp_info(struct perf_event *bp) | |||
300 | /* | 291 | /* |
301 | * Validate the arch-specific HW Breakpoint register settings | 292 | * Validate the arch-specific HW Breakpoint register settings |
302 | */ | 293 | */ |
303 | int arch_validate_hwbkpt_settings(struct perf_event *bp, | 294 | int arch_validate_hwbkpt_settings(struct perf_event *bp) |
304 | struct task_struct *tsk) | ||
305 | { | 295 | { |
306 | struct arch_hw_breakpoint *info = counter_arch_bp(bp); | 296 | struct arch_hw_breakpoint *info = counter_arch_bp(bp); |
307 | unsigned int align; | 297 | unsigned int align; |
@@ -314,16 +304,6 @@ int arch_validate_hwbkpt_settings(struct perf_event *bp, | |||
314 | 304 | ||
315 | ret = -EINVAL; | 305 | ret = -EINVAL; |
316 | 306 | ||
317 | if (info->type == X86_BREAKPOINT_EXECUTE) | ||
318 | /* | ||
319 | * Ptrace-refactoring code | ||
320 | * For now, we'll allow instruction breakpoint only for user-space | ||
321 | * addresses | ||
322 | */ | ||
323 | if ((!arch_check_va_in_userspace(info->address, info->len)) && | ||
324 | info->len != X86_BREAKPOINT_EXECUTE) | ||
325 | return ret; | ||
326 | |||
327 | switch (info->len) { | 307 | switch (info->len) { |
328 | case X86_BREAKPOINT_LEN_1: | 308 | case X86_BREAKPOINT_LEN_1: |
329 | align = 0; | 309 | align = 0; |
@@ -350,15 +330,6 @@ int arch_validate_hwbkpt_settings(struct perf_event *bp, | |||
350 | if (info->address & align) | 330 | if (info->address & align) |
351 | return -EINVAL; | 331 | return -EINVAL; |
352 | 332 | ||
353 | /* Check that the virtual address is in the proper range */ | ||
354 | if (tsk) { | ||
355 | if (!arch_check_va_in_userspace(info->address, info->len)) | ||
356 | return -EFAULT; | ||
357 | } else { | ||
358 | if (!arch_check_va_in_kernelspace(info->address, info->len)) | ||
359 | return -EFAULT; | ||
360 | } | ||
361 | |||
362 | return 0; | 333 | return 0; |
363 | } | 334 | } |
364 | 335 | ||
diff --git a/arch/x86/kernel/kprobes.c b/arch/x86/kernel/kprobes.c index 1658efdfb4e5..345a4b1fe144 100644 --- a/arch/x86/kernel/kprobes.c +++ b/arch/x86/kernel/kprobes.c | |||
@@ -422,14 +422,22 @@ static void __kprobes set_current_kprobe(struct kprobe *p, struct pt_regs *regs, | |||
422 | 422 | ||
423 | static void __kprobes clear_btf(void) | 423 | static void __kprobes clear_btf(void) |
424 | { | 424 | { |
425 | if (test_thread_flag(TIF_DEBUGCTLMSR)) | 425 | if (test_thread_flag(TIF_BLOCKSTEP)) { |
426 | update_debugctlmsr(0); | 426 | unsigned long debugctl = get_debugctlmsr(); |
427 | |||
428 | debugctl &= ~DEBUGCTLMSR_BTF; | ||
429 | update_debugctlmsr(debugctl); | ||
430 | } | ||
427 | } | 431 | } |
428 | 432 | ||
429 | static void __kprobes restore_btf(void) | 433 | static void __kprobes restore_btf(void) |
430 | { | 434 | { |
431 | if (test_thread_flag(TIF_DEBUGCTLMSR)) | 435 | if (test_thread_flag(TIF_BLOCKSTEP)) { |
432 | update_debugctlmsr(current->thread.debugctlmsr); | 436 | unsigned long debugctl = get_debugctlmsr(); |
437 | |||
438 | debugctl |= DEBUGCTLMSR_BTF; | ||
439 | update_debugctlmsr(debugctl); | ||
440 | } | ||
433 | } | 441 | } |
434 | 442 | ||
435 | void __kprobes arch_prepare_kretprobe(struct kretprobe_instance *ri, | 443 | void __kprobes arch_prepare_kretprobe(struct kretprobe_instance *ri, |
diff --git a/arch/x86/kernel/process.c b/arch/x86/kernel/process.c index 0415c3ef91b5..cc6877535ef4 100644 --- a/arch/x86/kernel/process.c +++ b/arch/x86/kernel/process.c | |||
@@ -20,7 +20,6 @@ | |||
20 | #include <asm/idle.h> | 20 | #include <asm/idle.h> |
21 | #include <asm/uaccess.h> | 21 | #include <asm/uaccess.h> |
22 | #include <asm/i387.h> | 22 | #include <asm/i387.h> |
23 | #include <asm/ds.h> | ||
24 | #include <asm/debugreg.h> | 23 | #include <asm/debugreg.h> |
25 | 24 | ||
26 | unsigned long idle_halt; | 25 | unsigned long idle_halt; |
@@ -50,8 +49,6 @@ void free_thread_xstate(struct task_struct *tsk) | |||
50 | kmem_cache_free(task_xstate_cachep, tsk->thread.xstate); | 49 | kmem_cache_free(task_xstate_cachep, tsk->thread.xstate); |
51 | tsk->thread.xstate = NULL; | 50 | tsk->thread.xstate = NULL; |
52 | } | 51 | } |
53 | |||
54 | WARN(tsk->thread.ds_ctx, "leaking DS context\n"); | ||
55 | } | 52 | } |
56 | 53 | ||
57 | void free_thread_info(struct thread_info *ti) | 54 | void free_thread_info(struct thread_info *ti) |
@@ -198,11 +195,16 @@ void __switch_to_xtra(struct task_struct *prev_p, struct task_struct *next_p, | |||
198 | prev = &prev_p->thread; | 195 | prev = &prev_p->thread; |
199 | next = &next_p->thread; | 196 | next = &next_p->thread; |
200 | 197 | ||
201 | if (test_tsk_thread_flag(next_p, TIF_DS_AREA_MSR) || | 198 | if (test_tsk_thread_flag(prev_p, TIF_BLOCKSTEP) ^ |
202 | test_tsk_thread_flag(prev_p, TIF_DS_AREA_MSR)) | 199 | test_tsk_thread_flag(next_p, TIF_BLOCKSTEP)) { |
203 | ds_switch_to(prev_p, next_p); | 200 | unsigned long debugctl = get_debugctlmsr(); |
204 | else if (next->debugctlmsr != prev->debugctlmsr) | 201 | |
205 | update_debugctlmsr(next->debugctlmsr); | 202 | debugctl &= ~DEBUGCTLMSR_BTF; |
203 | if (test_tsk_thread_flag(next_p, TIF_BLOCKSTEP)) | ||
204 | debugctl |= DEBUGCTLMSR_BTF; | ||
205 | |||
206 | update_debugctlmsr(debugctl); | ||
207 | } | ||
206 | 208 | ||
207 | if (test_tsk_thread_flag(prev_p, TIF_NOTSC) ^ | 209 | if (test_tsk_thread_flag(prev_p, TIF_NOTSC) ^ |
208 | test_tsk_thread_flag(next_p, TIF_NOTSC)) { | 210 | test_tsk_thread_flag(next_p, TIF_NOTSC)) { |
diff --git a/arch/x86/kernel/process_32.c b/arch/x86/kernel/process_32.c index f6c62667e30c..75090c589b7a 100644 --- a/arch/x86/kernel/process_32.c +++ b/arch/x86/kernel/process_32.c | |||
@@ -55,7 +55,6 @@ | |||
55 | #include <asm/cpu.h> | 55 | #include <asm/cpu.h> |
56 | #include <asm/idle.h> | 56 | #include <asm/idle.h> |
57 | #include <asm/syscalls.h> | 57 | #include <asm/syscalls.h> |
58 | #include <asm/ds.h> | ||
59 | #include <asm/debugreg.h> | 58 | #include <asm/debugreg.h> |
60 | 59 | ||
61 | asmlinkage void ret_from_fork(void) __asm__("ret_from_fork"); | 60 | asmlinkage void ret_from_fork(void) __asm__("ret_from_fork"); |
@@ -238,13 +237,6 @@ int copy_thread(unsigned long clone_flags, unsigned long sp, | |||
238 | kfree(p->thread.io_bitmap_ptr); | 237 | kfree(p->thread.io_bitmap_ptr); |
239 | p->thread.io_bitmap_max = 0; | 238 | p->thread.io_bitmap_max = 0; |
240 | } | 239 | } |
241 | |||
242 | clear_tsk_thread_flag(p, TIF_DS_AREA_MSR); | ||
243 | p->thread.ds_ctx = NULL; | ||
244 | |||
245 | clear_tsk_thread_flag(p, TIF_DEBUGCTLMSR); | ||
246 | p->thread.debugctlmsr = 0; | ||
247 | |||
248 | return err; | 240 | return err; |
249 | } | 241 | } |
250 | 242 | ||
diff --git a/arch/x86/kernel/process_64.c b/arch/x86/kernel/process_64.c index 17cb3295cbf7..50cc84ac0a0d 100644 --- a/arch/x86/kernel/process_64.c +++ b/arch/x86/kernel/process_64.c | |||
@@ -49,7 +49,6 @@ | |||
49 | #include <asm/ia32.h> | 49 | #include <asm/ia32.h> |
50 | #include <asm/idle.h> | 50 | #include <asm/idle.h> |
51 | #include <asm/syscalls.h> | 51 | #include <asm/syscalls.h> |
52 | #include <asm/ds.h> | ||
53 | #include <asm/debugreg.h> | 52 | #include <asm/debugreg.h> |
54 | 53 | ||
55 | asmlinkage extern void ret_from_fork(void); | 54 | asmlinkage extern void ret_from_fork(void); |
@@ -313,13 +312,6 @@ int copy_thread(unsigned long clone_flags, unsigned long sp, | |||
313 | if (err) | 312 | if (err) |
314 | goto out; | 313 | goto out; |
315 | } | 314 | } |
316 | |||
317 | clear_tsk_thread_flag(p, TIF_DS_AREA_MSR); | ||
318 | p->thread.ds_ctx = NULL; | ||
319 | |||
320 | clear_tsk_thread_flag(p, TIF_DEBUGCTLMSR); | ||
321 | p->thread.debugctlmsr = 0; | ||
322 | |||
323 | err = 0; | 315 | err = 0; |
324 | out: | 316 | out: |
325 | if (err && p->thread.io_bitmap_ptr) { | 317 | if (err && p->thread.io_bitmap_ptr) { |
diff --git a/arch/x86/kernel/ptrace.c b/arch/x86/kernel/ptrace.c index 2e9b55027b7e..70c4872cd8aa 100644 --- a/arch/x86/kernel/ptrace.c +++ b/arch/x86/kernel/ptrace.c | |||
@@ -2,9 +2,6 @@ | |||
2 | /* | 2 | /* |
3 | * Pentium III FXSR, SSE support | 3 | * Pentium III FXSR, SSE support |
4 | * Gareth Hughes <gareth@valinux.com>, May 2000 | 4 | * Gareth Hughes <gareth@valinux.com>, May 2000 |
5 | * | ||
6 | * BTS tracing | ||
7 | * Markus Metzger <markus.t.metzger@intel.com>, Dec 2007 | ||
8 | */ | 5 | */ |
9 | 6 | ||
10 | #include <linux/kernel.h> | 7 | #include <linux/kernel.h> |
@@ -22,7 +19,6 @@ | |||
22 | #include <linux/audit.h> | 19 | #include <linux/audit.h> |
23 | #include <linux/seccomp.h> | 20 | #include <linux/seccomp.h> |
24 | #include <linux/signal.h> | 21 | #include <linux/signal.h> |
25 | #include <linux/workqueue.h> | ||
26 | #include <linux/perf_event.h> | 22 | #include <linux/perf_event.h> |
27 | #include <linux/hw_breakpoint.h> | 23 | #include <linux/hw_breakpoint.h> |
28 | 24 | ||
@@ -36,7 +32,6 @@ | |||
36 | #include <asm/desc.h> | 32 | #include <asm/desc.h> |
37 | #include <asm/prctl.h> | 33 | #include <asm/prctl.h> |
38 | #include <asm/proto.h> | 34 | #include <asm/proto.h> |
39 | #include <asm/ds.h> | ||
40 | #include <asm/hw_breakpoint.h> | 35 | #include <asm/hw_breakpoint.h> |
41 | 36 | ||
42 | #include "tls.h" | 37 | #include "tls.h" |
@@ -693,7 +688,7 @@ static int ptrace_set_breakpoint_addr(struct task_struct *tsk, int nr, | |||
693 | struct perf_event_attr attr; | 688 | struct perf_event_attr attr; |
694 | 689 | ||
695 | if (!t->ptrace_bps[nr]) { | 690 | if (!t->ptrace_bps[nr]) { |
696 | hw_breakpoint_init(&attr); | 691 | ptrace_breakpoint_init(&attr); |
697 | /* | 692 | /* |
698 | * Put stub len and type to register (reserve) an inactive but | 693 | * Put stub len and type to register (reserve) an inactive but |
699 | * correct bp | 694 | * correct bp |
@@ -789,342 +784,6 @@ static int ioperm_get(struct task_struct *target, | |||
789 | 0, IO_BITMAP_BYTES); | 784 | 0, IO_BITMAP_BYTES); |
790 | } | 785 | } |
791 | 786 | ||
792 | #ifdef CONFIG_X86_PTRACE_BTS | ||
793 | /* | ||
794 | * A branch trace store context. | ||
795 | * | ||
796 | * Contexts may only be installed by ptrace_bts_config() and only for | ||
797 | * ptraced tasks. | ||
798 | * | ||
799 | * Contexts are destroyed when the tracee is detached from the tracer. | ||
800 | * The actual destruction work requires interrupts enabled, so the | ||
801 | * work is deferred and will be scheduled during __ptrace_unlink(). | ||
802 | * | ||
803 | * Contexts hold an additional task_struct reference on the traced | ||
804 | * task, as well as a reference on the tracer's mm. | ||
805 | * | ||
806 | * Ptrace already holds a task_struct for the duration of ptrace operations, | ||
807 | * but since destruction is deferred, it may be executed after both | ||
808 | * tracer and tracee exited. | ||
809 | */ | ||
810 | struct bts_context { | ||
811 | /* The branch trace handle. */ | ||
812 | struct bts_tracer *tracer; | ||
813 | |||
814 | /* The buffer used to store the branch trace and its size. */ | ||
815 | void *buffer; | ||
816 | unsigned int size; | ||
817 | |||
818 | /* The mm that paid for the above buffer. */ | ||
819 | struct mm_struct *mm; | ||
820 | |||
821 | /* The task this context belongs to. */ | ||
822 | struct task_struct *task; | ||
823 | |||
824 | /* The signal to send on a bts buffer overflow. */ | ||
825 | unsigned int bts_ovfl_signal; | ||
826 | |||
827 | /* The work struct to destroy a context. */ | ||
828 | struct work_struct work; | ||
829 | }; | ||
830 | |||
831 | static int alloc_bts_buffer(struct bts_context *context, unsigned int size) | ||
832 | { | ||
833 | void *buffer = NULL; | ||
834 | int err = -ENOMEM; | ||
835 | |||
836 | err = account_locked_memory(current->mm, current->signal->rlim, size); | ||
837 | if (err < 0) | ||
838 | return err; | ||
839 | |||
840 | buffer = kzalloc(size, GFP_KERNEL); | ||
841 | if (!buffer) | ||
842 | goto out_refund; | ||
843 | |||
844 | context->buffer = buffer; | ||
845 | context->size = size; | ||
846 | context->mm = get_task_mm(current); | ||
847 | |||
848 | return 0; | ||
849 | |||
850 | out_refund: | ||
851 | refund_locked_memory(current->mm, size); | ||
852 | return err; | ||
853 | } | ||
854 | |||
855 | static inline void free_bts_buffer(struct bts_context *context) | ||
856 | { | ||
857 | if (!context->buffer) | ||
858 | return; | ||
859 | |||
860 | kfree(context->buffer); | ||
861 | context->buffer = NULL; | ||
862 | |||
863 | refund_locked_memory(context->mm, context->size); | ||
864 | context->size = 0; | ||
865 | |||
866 | mmput(context->mm); | ||
867 | context->mm = NULL; | ||
868 | } | ||
869 | |||
870 | static void free_bts_context_work(struct work_struct *w) | ||
871 | { | ||
872 | struct bts_context *context; | ||
873 | |||
874 | context = container_of(w, struct bts_context, work); | ||
875 | |||
876 | ds_release_bts(context->tracer); | ||
877 | put_task_struct(context->task); | ||
878 | free_bts_buffer(context); | ||
879 | kfree(context); | ||
880 | } | ||
881 | |||
882 | static inline void free_bts_context(struct bts_context *context) | ||
883 | { | ||
884 | INIT_WORK(&context->work, free_bts_context_work); | ||
885 | schedule_work(&context->work); | ||
886 | } | ||
887 | |||
888 | static inline struct bts_context *alloc_bts_context(struct task_struct *task) | ||
889 | { | ||
890 | struct bts_context *context = kzalloc(sizeof(*context), GFP_KERNEL); | ||
891 | if (context) { | ||
892 | context->task = task; | ||
893 | task->bts = context; | ||
894 | |||
895 | get_task_struct(task); | ||
896 | } | ||
897 | |||
898 | return context; | ||
899 | } | ||
900 | |||
901 | static int ptrace_bts_read_record(struct task_struct *child, size_t index, | ||
902 | struct bts_struct __user *out) | ||
903 | { | ||
904 | struct bts_context *context; | ||
905 | const struct bts_trace *trace; | ||
906 | struct bts_struct bts; | ||
907 | const unsigned char *at; | ||
908 | int error; | ||
909 | |||
910 | context = child->bts; | ||
911 | if (!context) | ||
912 | return -ESRCH; | ||
913 | |||
914 | trace = ds_read_bts(context->tracer); | ||
915 | if (!trace) | ||
916 | return -ESRCH; | ||
917 | |||
918 | at = trace->ds.top - ((index + 1) * trace->ds.size); | ||
919 | if ((void *)at < trace->ds.begin) | ||
920 | at += (trace->ds.n * trace->ds.size); | ||
921 | |||
922 | if (!trace->read) | ||
923 | return -EOPNOTSUPP; | ||
924 | |||
925 | error = trace->read(context->tracer, at, &bts); | ||
926 | if (error < 0) | ||
927 | return error; | ||
928 | |||
929 | if (copy_to_user(out, &bts, sizeof(bts))) | ||
930 | return -EFAULT; | ||
931 | |||
932 | return sizeof(bts); | ||
933 | } | ||
934 | |||
935 | static int ptrace_bts_drain(struct task_struct *child, | ||
936 | long size, | ||
937 | struct bts_struct __user *out) | ||
938 | { | ||
939 | struct bts_context *context; | ||
940 | const struct bts_trace *trace; | ||
941 | const unsigned char *at; | ||
942 | int error, drained = 0; | ||
943 | |||
944 | context = child->bts; | ||
945 | if (!context) | ||
946 | return -ESRCH; | ||
947 | |||
948 | trace = ds_read_bts(context->tracer); | ||
949 | if (!trace) | ||
950 | return -ESRCH; | ||
951 | |||
952 | if (!trace->read) | ||
953 | return -EOPNOTSUPP; | ||
954 | |||
955 | if (size < (trace->ds.top - trace->ds.begin)) | ||
956 | return -EIO; | ||
957 | |||
958 | for (at = trace->ds.begin; (void *)at < trace->ds.top; | ||
959 | out++, drained++, at += trace->ds.size) { | ||
960 | struct bts_struct bts; | ||
961 | |||
962 | error = trace->read(context->tracer, at, &bts); | ||
963 | if (error < 0) | ||
964 | return error; | ||
965 | |||
966 | if (copy_to_user(out, &bts, sizeof(bts))) | ||
967 | return -EFAULT; | ||
968 | } | ||
969 | |||
970 | memset(trace->ds.begin, 0, trace->ds.n * trace->ds.size); | ||
971 | |||
972 | error = ds_reset_bts(context->tracer); | ||
973 | if (error < 0) | ||
974 | return error; | ||
975 | |||
976 | return drained; | ||
977 | } | ||
978 | |||
979 | static int ptrace_bts_config(struct task_struct *child, | ||
980 | long cfg_size, | ||
981 | const struct ptrace_bts_config __user *ucfg) | ||
982 | { | ||
983 | struct bts_context *context; | ||
984 | struct ptrace_bts_config cfg; | ||
985 | unsigned int flags = 0; | ||
986 | |||
987 | if (cfg_size < sizeof(cfg)) | ||
988 | return -EIO; | ||
989 | |||
990 | if (copy_from_user(&cfg, ucfg, sizeof(cfg))) | ||
991 | return -EFAULT; | ||
992 | |||
993 | context = child->bts; | ||
994 | if (!context) | ||
995 | context = alloc_bts_context(child); | ||
996 | if (!context) | ||
997 | return -ENOMEM; | ||
998 | |||
999 | if (cfg.flags & PTRACE_BTS_O_SIGNAL) { | ||
1000 | if (!cfg.signal) | ||
1001 | return -EINVAL; | ||
1002 | |||
1003 | return -EOPNOTSUPP; | ||
1004 | context->bts_ovfl_signal = cfg.signal; | ||
1005 | } | ||
1006 | |||
1007 | ds_release_bts(context->tracer); | ||
1008 | context->tracer = NULL; | ||
1009 | |||
1010 | if ((cfg.flags & PTRACE_BTS_O_ALLOC) && (cfg.size != context->size)) { | ||
1011 | int err; | ||
1012 | |||
1013 | free_bts_buffer(context); | ||
1014 | if (!cfg.size) | ||
1015 | return 0; | ||
1016 | |||
1017 | err = alloc_bts_buffer(context, cfg.size); | ||
1018 | if (err < 0) | ||
1019 | return err; | ||
1020 | } | ||
1021 | |||
1022 | if (cfg.flags & PTRACE_BTS_O_TRACE) | ||
1023 | flags |= BTS_USER; | ||
1024 | |||
1025 | if (cfg.flags & PTRACE_BTS_O_SCHED) | ||
1026 | flags |= BTS_TIMESTAMPS; | ||
1027 | |||
1028 | context->tracer = | ||
1029 | ds_request_bts_task(child, context->buffer, context->size, | ||
1030 | NULL, (size_t)-1, flags); | ||
1031 | if (unlikely(IS_ERR(context->tracer))) { | ||
1032 | int error = PTR_ERR(context->tracer); | ||
1033 | |||
1034 | free_bts_buffer(context); | ||
1035 | context->tracer = NULL; | ||
1036 | return error; | ||
1037 | } | ||
1038 | |||
1039 | return sizeof(cfg); | ||
1040 | } | ||
1041 | |||
1042 | static int ptrace_bts_status(struct task_struct *child, | ||
1043 | long cfg_size, | ||
1044 | struct ptrace_bts_config __user *ucfg) | ||
1045 | { | ||
1046 | struct bts_context *context; | ||
1047 | const struct bts_trace *trace; | ||
1048 | struct ptrace_bts_config cfg; | ||
1049 | |||
1050 | context = child->bts; | ||
1051 | if (!context) | ||
1052 | return -ESRCH; | ||
1053 | |||
1054 | if (cfg_size < sizeof(cfg)) | ||
1055 | return -EIO; | ||
1056 | |||
1057 | trace = ds_read_bts(context->tracer); | ||
1058 | if (!trace) | ||
1059 | return -ESRCH; | ||
1060 | |||
1061 | memset(&cfg, 0, sizeof(cfg)); | ||
1062 | cfg.size = trace->ds.end - trace->ds.begin; | ||
1063 | cfg.signal = context->bts_ovfl_signal; | ||
1064 | cfg.bts_size = sizeof(struct bts_struct); | ||
1065 | |||
1066 | if (cfg.signal) | ||
1067 | cfg.flags |= PTRACE_BTS_O_SIGNAL; | ||
1068 | |||
1069 | if (trace->ds.flags & BTS_USER) | ||
1070 | cfg.flags |= PTRACE_BTS_O_TRACE; | ||
1071 | |||
1072 | if (trace->ds.flags & BTS_TIMESTAMPS) | ||
1073 | cfg.flags |= PTRACE_BTS_O_SCHED; | ||
1074 | |||
1075 | if (copy_to_user(ucfg, &cfg, sizeof(cfg))) | ||
1076 | return -EFAULT; | ||
1077 | |||
1078 | return sizeof(cfg); | ||
1079 | } | ||
1080 | |||
1081 | static int ptrace_bts_clear(struct task_struct *child) | ||
1082 | { | ||
1083 | struct bts_context *context; | ||
1084 | const struct bts_trace *trace; | ||
1085 | |||
1086 | context = child->bts; | ||
1087 | if (!context) | ||
1088 | return -ESRCH; | ||
1089 | |||
1090 | trace = ds_read_bts(context->tracer); | ||
1091 | if (!trace) | ||
1092 | return -ESRCH; | ||
1093 | |||
1094 | memset(trace->ds.begin, 0, trace->ds.n * trace->ds.size); | ||
1095 | |||
1096 | return ds_reset_bts(context->tracer); | ||
1097 | } | ||
1098 | |||
1099 | static int ptrace_bts_size(struct task_struct *child) | ||
1100 | { | ||
1101 | struct bts_context *context; | ||
1102 | const struct bts_trace *trace; | ||
1103 | |||
1104 | context = child->bts; | ||
1105 | if (!context) | ||
1106 | return -ESRCH; | ||
1107 | |||
1108 | trace = ds_read_bts(context->tracer); | ||
1109 | if (!trace) | ||
1110 | return -ESRCH; | ||
1111 | |||
1112 | return (trace->ds.top - trace->ds.begin) / trace->ds.size; | ||
1113 | } | ||
1114 | |||
1115 | /* | ||
1116 | * Called from __ptrace_unlink() after the child has been moved back | ||
1117 | * to its original parent. | ||
1118 | */ | ||
1119 | void ptrace_bts_untrace(struct task_struct *child) | ||
1120 | { | ||
1121 | if (unlikely(child->bts)) { | ||
1122 | free_bts_context(child->bts); | ||
1123 | child->bts = NULL; | ||
1124 | } | ||
1125 | } | ||
1126 | #endif /* CONFIG_X86_PTRACE_BTS */ | ||
1127 | |||
1128 | /* | 787 | /* |
1129 | * Called by kernel/ptrace.c when detaching.. | 788 | * Called by kernel/ptrace.c when detaching.. |
1130 | * | 789 | * |
@@ -1252,39 +911,6 @@ long arch_ptrace(struct task_struct *child, long request, long addr, long data) | |||
1252 | break; | 911 | break; |
1253 | #endif | 912 | #endif |
1254 | 913 | ||
1255 | /* | ||
1256 | * These bits need more cooking - not enabled yet: | ||
1257 | */ | ||
1258 | #ifdef CONFIG_X86_PTRACE_BTS | ||
1259 | case PTRACE_BTS_CONFIG: | ||
1260 | ret = ptrace_bts_config | ||
1261 | (child, data, (struct ptrace_bts_config __user *)addr); | ||
1262 | break; | ||
1263 | |||
1264 | case PTRACE_BTS_STATUS: | ||
1265 | ret = ptrace_bts_status | ||
1266 | (child, data, (struct ptrace_bts_config __user *)addr); | ||
1267 | break; | ||
1268 | |||
1269 | case PTRACE_BTS_SIZE: | ||
1270 | ret = ptrace_bts_size(child); | ||
1271 | break; | ||
1272 | |||
1273 | case PTRACE_BTS_GET: | ||
1274 | ret = ptrace_bts_read_record | ||
1275 | (child, data, (struct bts_struct __user *) addr); | ||
1276 | break; | ||
1277 | |||
1278 | case PTRACE_BTS_CLEAR: | ||
1279 | ret = ptrace_bts_clear(child); | ||
1280 | break; | ||
1281 | |||
1282 | case PTRACE_BTS_DRAIN: | ||
1283 | ret = ptrace_bts_drain | ||
1284 | (child, data, (struct bts_struct __user *) addr); | ||
1285 | break; | ||
1286 | #endif /* CONFIG_X86_PTRACE_BTS */ | ||
1287 | |||
1288 | default: | 914 | default: |
1289 | ret = ptrace_request(child, request, addr, data); | 915 | ret = ptrace_request(child, request, addr, data); |
1290 | break; | 916 | break; |
@@ -1544,14 +1170,6 @@ long compat_arch_ptrace(struct task_struct *child, compat_long_t request, | |||
1544 | 1170 | ||
1545 | case PTRACE_GET_THREAD_AREA: | 1171 | case PTRACE_GET_THREAD_AREA: |
1546 | case PTRACE_SET_THREAD_AREA: | 1172 | case PTRACE_SET_THREAD_AREA: |
1547 | #ifdef CONFIG_X86_PTRACE_BTS | ||
1548 | case PTRACE_BTS_CONFIG: | ||
1549 | case PTRACE_BTS_STATUS: | ||
1550 | case PTRACE_BTS_SIZE: | ||
1551 | case PTRACE_BTS_GET: | ||
1552 | case PTRACE_BTS_CLEAR: | ||
1553 | case PTRACE_BTS_DRAIN: | ||
1554 | #endif /* CONFIG_X86_PTRACE_BTS */ | ||
1555 | return arch_ptrace(child, request, addr, data); | 1173 | return arch_ptrace(child, request, addr, data); |
1556 | 1174 | ||
1557 | default: | 1175 | default: |
diff --git a/arch/x86/kernel/step.c b/arch/x86/kernel/step.c index 3149032ff107..58de45ee08b6 100644 --- a/arch/x86/kernel/step.c +++ b/arch/x86/kernel/step.c | |||
@@ -158,22 +158,6 @@ static int enable_single_step(struct task_struct *child) | |||
158 | } | 158 | } |
159 | 159 | ||
160 | /* | 160 | /* |
161 | * Install this value in MSR_IA32_DEBUGCTLMSR whenever child is running. | ||
162 | */ | ||
163 | static void write_debugctlmsr(struct task_struct *child, unsigned long val) | ||
164 | { | ||
165 | if (child->thread.debugctlmsr == val) | ||
166 | return; | ||
167 | |||
168 | child->thread.debugctlmsr = val; | ||
169 | |||
170 | if (child != current) | ||
171 | return; | ||
172 | |||
173 | update_debugctlmsr(val); | ||
174 | } | ||
175 | |||
176 | /* | ||
177 | * Enable single or block step. | 161 | * Enable single or block step. |
178 | */ | 162 | */ |
179 | static void enable_step(struct task_struct *child, bool block) | 163 | static void enable_step(struct task_struct *child, bool block) |
@@ -186,15 +170,17 @@ static void enable_step(struct task_struct *child, bool block) | |||
186 | * that uses user-mode single stepping itself. | 170 | * that uses user-mode single stepping itself. |
187 | */ | 171 | */ |
188 | if (enable_single_step(child) && block) { | 172 | if (enable_single_step(child) && block) { |
189 | set_tsk_thread_flag(child, TIF_DEBUGCTLMSR); | 173 | unsigned long debugctl = get_debugctlmsr(); |
190 | write_debugctlmsr(child, | 174 | |
191 | child->thread.debugctlmsr | DEBUGCTLMSR_BTF); | 175 | debugctl |= DEBUGCTLMSR_BTF; |
192 | } else { | 176 | update_debugctlmsr(debugctl); |
193 | write_debugctlmsr(child, | 177 | set_tsk_thread_flag(child, TIF_BLOCKSTEP); |
194 | child->thread.debugctlmsr & ~DEBUGCTLMSR_BTF); | 178 | } else if (test_tsk_thread_flag(child, TIF_BLOCKSTEP)) { |
195 | 179 | unsigned long debugctl = get_debugctlmsr(); | |
196 | if (!child->thread.debugctlmsr) | 180 | |
197 | clear_tsk_thread_flag(child, TIF_DEBUGCTLMSR); | 181 | debugctl &= ~DEBUGCTLMSR_BTF; |
182 | update_debugctlmsr(debugctl); | ||
183 | clear_tsk_thread_flag(child, TIF_BLOCKSTEP); | ||
198 | } | 184 | } |
199 | } | 185 | } |
200 | 186 | ||
@@ -213,11 +199,13 @@ void user_disable_single_step(struct task_struct *child) | |||
213 | /* | 199 | /* |
214 | * Make sure block stepping (BTF) is disabled. | 200 | * Make sure block stepping (BTF) is disabled. |
215 | */ | 201 | */ |
216 | write_debugctlmsr(child, | 202 | if (test_tsk_thread_flag(child, TIF_BLOCKSTEP)) { |
217 | child->thread.debugctlmsr & ~DEBUGCTLMSR_BTF); | 203 | unsigned long debugctl = get_debugctlmsr(); |
218 | 204 | ||
219 | if (!child->thread.debugctlmsr) | 205 | debugctl &= ~DEBUGCTLMSR_BTF; |
220 | clear_tsk_thread_flag(child, TIF_DEBUGCTLMSR); | 206 | update_debugctlmsr(debugctl); |
207 | clear_tsk_thread_flag(child, TIF_BLOCKSTEP); | ||
208 | } | ||
221 | 209 | ||
222 | /* Always clear TIF_SINGLESTEP... */ | 210 | /* Always clear TIF_SINGLESTEP... */ |
223 | clear_tsk_thread_flag(child, TIF_SINGLESTEP); | 211 | clear_tsk_thread_flag(child, TIF_SINGLESTEP); |
diff --git a/arch/x86/kernel/traps.c b/arch/x86/kernel/traps.c index 1168e4454188..36f1bd9f8e76 100644 --- a/arch/x86/kernel/traps.c +++ b/arch/x86/kernel/traps.c | |||
@@ -543,11 +543,11 @@ dotraplinkage void __kprobes do_debug(struct pt_regs *regs, long error_code) | |||
543 | 543 | ||
544 | /* DR6 may or may not be cleared by the CPU */ | 544 | /* DR6 may or may not be cleared by the CPU */ |
545 | set_debugreg(0, 6); | 545 | set_debugreg(0, 6); |
546 | |||
546 | /* | 547 | /* |
547 | * The processor cleared BTF, so don't mark that we need it set. | 548 | * The processor cleared BTF, so don't mark that we need it set. |
548 | */ | 549 | */ |
549 | clear_tsk_thread_flag(tsk, TIF_DEBUGCTLMSR); | 550 | clear_tsk_thread_flag(tsk, TIF_BLOCKSTEP); |
550 | tsk->thread.debugctlmsr = 0; | ||
551 | 551 | ||
552 | /* Store the virtualized DR6 value */ | 552 | /* Store the virtualized DR6 value */ |
553 | tsk->thread.debugreg6 = dr6; | 553 | tsk->thread.debugreg6 = dr6; |
diff --git a/arch/x86/kvm/vmx.c b/arch/x86/kvm/vmx.c index 2f8db0ec8ae4..edca080407a5 100644 --- a/arch/x86/kvm/vmx.c +++ b/arch/x86/kvm/vmx.c | |||
@@ -3659,8 +3659,11 @@ static void vmx_complete_interrupts(struct vcpu_vmx *vmx) | |||
3659 | 3659 | ||
3660 | /* We need to handle NMIs before interrupts are enabled */ | 3660 | /* We need to handle NMIs before interrupts are enabled */ |
3661 | if ((exit_intr_info & INTR_INFO_INTR_TYPE_MASK) == INTR_TYPE_NMI_INTR && | 3661 | if ((exit_intr_info & INTR_INFO_INTR_TYPE_MASK) == INTR_TYPE_NMI_INTR && |
3662 | (exit_intr_info & INTR_INFO_VALID_MASK)) | 3662 | (exit_intr_info & INTR_INFO_VALID_MASK)) { |
3663 | kvm_before_handle_nmi(&vmx->vcpu); | ||
3663 | asm("int $2"); | 3664 | asm("int $2"); |
3665 | kvm_after_handle_nmi(&vmx->vcpu); | ||
3666 | } | ||
3664 | 3667 | ||
3665 | idtv_info_valid = idt_vectoring_info & VECTORING_INFO_VALID_MASK; | 3668 | idtv_info_valid = idt_vectoring_info & VECTORING_INFO_VALID_MASK; |
3666 | 3669 | ||
diff --git a/arch/x86/kvm/x86.c b/arch/x86/kvm/x86.c index c4f35b545c1d..dd9bc8fb81ab 100644 --- a/arch/x86/kvm/x86.c +++ b/arch/x86/kvm/x86.c | |||
@@ -40,6 +40,7 @@ | |||
40 | #include <linux/user-return-notifier.h> | 40 | #include <linux/user-return-notifier.h> |
41 | #include <linux/srcu.h> | 41 | #include <linux/srcu.h> |
42 | #include <linux/slab.h> | 42 | #include <linux/slab.h> |
43 | #include <linux/perf_event.h> | ||
43 | #include <trace/events/kvm.h> | 44 | #include <trace/events/kvm.h> |
44 | #undef TRACE_INCLUDE_FILE | 45 | #undef TRACE_INCLUDE_FILE |
45 | #define CREATE_TRACE_POINTS | 46 | #define CREATE_TRACE_POINTS |
@@ -3747,6 +3748,51 @@ static void kvm_timer_init(void) | |||
3747 | } | 3748 | } |
3748 | } | 3749 | } |
3749 | 3750 | ||
3751 | static DEFINE_PER_CPU(struct kvm_vcpu *, current_vcpu); | ||
3752 | |||
3753 | static int kvm_is_in_guest(void) | ||
3754 | { | ||
3755 | return percpu_read(current_vcpu) != NULL; | ||
3756 | } | ||
3757 | |||
3758 | static int kvm_is_user_mode(void) | ||
3759 | { | ||
3760 | int user_mode = 3; | ||
3761 | |||
3762 | if (percpu_read(current_vcpu)) | ||
3763 | user_mode = kvm_x86_ops->get_cpl(percpu_read(current_vcpu)); | ||
3764 | |||
3765 | return user_mode != 0; | ||
3766 | } | ||
3767 | |||
3768 | static unsigned long kvm_get_guest_ip(void) | ||
3769 | { | ||
3770 | unsigned long ip = 0; | ||
3771 | |||
3772 | if (percpu_read(current_vcpu)) | ||
3773 | ip = kvm_rip_read(percpu_read(current_vcpu)); | ||
3774 | |||
3775 | return ip; | ||
3776 | } | ||
3777 | |||
3778 | static struct perf_guest_info_callbacks kvm_guest_cbs = { | ||
3779 | .is_in_guest = kvm_is_in_guest, | ||
3780 | .is_user_mode = kvm_is_user_mode, | ||
3781 | .get_guest_ip = kvm_get_guest_ip, | ||
3782 | }; | ||
3783 | |||
3784 | void kvm_before_handle_nmi(struct kvm_vcpu *vcpu) | ||
3785 | { | ||
3786 | percpu_write(current_vcpu, vcpu); | ||
3787 | } | ||
3788 | EXPORT_SYMBOL_GPL(kvm_before_handle_nmi); | ||
3789 | |||
3790 | void kvm_after_handle_nmi(struct kvm_vcpu *vcpu) | ||
3791 | { | ||
3792 | percpu_write(current_vcpu, NULL); | ||
3793 | } | ||
3794 | EXPORT_SYMBOL_GPL(kvm_after_handle_nmi); | ||
3795 | |||
3750 | int kvm_arch_init(void *opaque) | 3796 | int kvm_arch_init(void *opaque) |
3751 | { | 3797 | { |
3752 | int r; | 3798 | int r; |
@@ -3783,6 +3829,8 @@ int kvm_arch_init(void *opaque) | |||
3783 | 3829 | ||
3784 | kvm_timer_init(); | 3830 | kvm_timer_init(); |
3785 | 3831 | ||
3832 | perf_register_guest_info_callbacks(&kvm_guest_cbs); | ||
3833 | |||
3786 | return 0; | 3834 | return 0; |
3787 | 3835 | ||
3788 | out: | 3836 | out: |
@@ -3791,6 +3839,8 @@ out: | |||
3791 | 3839 | ||
3792 | void kvm_arch_exit(void) | 3840 | void kvm_arch_exit(void) |
3793 | { | 3841 | { |
3842 | perf_unregister_guest_info_callbacks(&kvm_guest_cbs); | ||
3843 | |||
3794 | if (!boot_cpu_has(X86_FEATURE_CONSTANT_TSC)) | 3844 | if (!boot_cpu_has(X86_FEATURE_CONSTANT_TSC)) |
3795 | cpufreq_unregister_notifier(&kvmclock_cpufreq_notifier_block, | 3845 | cpufreq_unregister_notifier(&kvmclock_cpufreq_notifier_block, |
3796 | CPUFREQ_TRANSITION_NOTIFIER); | 3846 | CPUFREQ_TRANSITION_NOTIFIER); |
diff --git a/arch/x86/kvm/x86.h b/arch/x86/kvm/x86.h index 2d101639bd8d..b7a404722d2b 100644 --- a/arch/x86/kvm/x86.h +++ b/arch/x86/kvm/x86.h | |||
@@ -65,4 +65,7 @@ static inline int is_paging(struct kvm_vcpu *vcpu) | |||
65 | return kvm_read_cr0_bits(vcpu, X86_CR0_PG); | 65 | return kvm_read_cr0_bits(vcpu, X86_CR0_PG); |
66 | } | 66 | } |
67 | 67 | ||
68 | void kvm_before_handle_nmi(struct kvm_vcpu *vcpu); | ||
69 | void kvm_after_handle_nmi(struct kvm_vcpu *vcpu); | ||
70 | |||
68 | #endif | 71 | #endif |
diff --git a/arch/x86/lib/Makefile b/arch/x86/lib/Makefile index 419386c24b82..cbaf8f2b83df 100644 --- a/arch/x86/lib/Makefile +++ b/arch/x86/lib/Makefile | |||
@@ -20,7 +20,7 @@ lib-y := delay.o | |||
20 | lib-y += thunk_$(BITS).o | 20 | lib-y += thunk_$(BITS).o |
21 | lib-y += usercopy_$(BITS).o getuser.o putuser.o | 21 | lib-y += usercopy_$(BITS).o getuser.o putuser.o |
22 | lib-y += memcpy_$(BITS).o | 22 | lib-y += memcpy_$(BITS).o |
23 | lib-$(CONFIG_KPROBES) += insn.o inat.o | 23 | lib-$(CONFIG_INSTRUCTION_DECODER) += insn.o inat.o |
24 | 24 | ||
25 | obj-y += msr.o msr-reg.o msr-reg-export.o | 25 | obj-y += msr.o msr-reg.o msr-reg-export.o |
26 | 26 | ||
diff --git a/arch/x86/oprofile/op_model_ppro.c b/arch/x86/oprofile/op_model_ppro.c index 1fd17cfb956b..d769cda54082 100644 --- a/arch/x86/oprofile/op_model_ppro.c +++ b/arch/x86/oprofile/op_model_ppro.c | |||
@@ -238,11 +238,11 @@ static void arch_perfmon_setup_counters(void) | |||
238 | if (eax.split.version_id == 0 && current_cpu_data.x86 == 6 && | 238 | if (eax.split.version_id == 0 && current_cpu_data.x86 == 6 && |
239 | current_cpu_data.x86_model == 15) { | 239 | current_cpu_data.x86_model == 15) { |
240 | eax.split.version_id = 2; | 240 | eax.split.version_id = 2; |
241 | eax.split.num_events = 2; | 241 | eax.split.num_counters = 2; |
242 | eax.split.bit_width = 40; | 242 | eax.split.bit_width = 40; |
243 | } | 243 | } |
244 | 244 | ||
245 | num_counters = eax.split.num_events; | 245 | num_counters = eax.split.num_counters; |
246 | 246 | ||
247 | op_arch_perfmon_spec.num_counters = num_counters; | 247 | op_arch_perfmon_spec.num_counters = num_counters; |
248 | op_arch_perfmon_spec.num_controls = num_counters; | 248 | op_arch_perfmon_spec.num_controls = num_counters; |
diff --git a/include/linux/ftrace.h b/include/linux/ftrace.h index 01e6adea07ec..cc12b3c556b3 100644 --- a/include/linux/ftrace.h +++ b/include/linux/ftrace.h | |||
@@ -504,18 +504,6 @@ extern int ftrace_dump_on_oops; | |||
504 | #define INIT_TRACE_RECURSION | 504 | #define INIT_TRACE_RECURSION |
505 | #endif | 505 | #endif |
506 | 506 | ||
507 | #ifdef CONFIG_HW_BRANCH_TRACER | ||
508 | |||
509 | void trace_hw_branch(u64 from, u64 to); | ||
510 | void trace_hw_branch_oops(void); | ||
511 | |||
512 | #else /* CONFIG_HW_BRANCH_TRACER */ | ||
513 | |||
514 | static inline void trace_hw_branch(u64 from, u64 to) {} | ||
515 | static inline void trace_hw_branch_oops(void) {} | ||
516 | |||
517 | #endif /* CONFIG_HW_BRANCH_TRACER */ | ||
518 | |||
519 | #ifdef CONFIG_FTRACE_SYSCALLS | 507 | #ifdef CONFIG_FTRACE_SYSCALLS |
520 | 508 | ||
521 | unsigned long arch_syscall_addr(int nr); | 509 | unsigned long arch_syscall_addr(int nr); |
diff --git a/include/linux/hw_breakpoint.h b/include/linux/hw_breakpoint.h index c70d27af03f9..a2d6ea49ec56 100644 --- a/include/linux/hw_breakpoint.h +++ b/include/linux/hw_breakpoint.h | |||
@@ -9,9 +9,22 @@ enum { | |||
9 | }; | 9 | }; |
10 | 10 | ||
11 | enum { | 11 | enum { |
12 | HW_BREAKPOINT_R = 1, | 12 | HW_BREAKPOINT_EMPTY = 0, |
13 | HW_BREAKPOINT_W = 2, | 13 | HW_BREAKPOINT_R = 1, |
14 | HW_BREAKPOINT_X = 4, | 14 | HW_BREAKPOINT_W = 2, |
15 | HW_BREAKPOINT_RW = HW_BREAKPOINT_R | HW_BREAKPOINT_W, | ||
16 | HW_BREAKPOINT_X = 4, | ||
17 | HW_BREAKPOINT_INVALID = HW_BREAKPOINT_RW | HW_BREAKPOINT_X, | ||
18 | }; | ||
19 | |||
20 | enum bp_type_idx { | ||
21 | TYPE_INST = 0, | ||
22 | #ifdef CONFIG_HAVE_MIXED_BREAKPOINTS_REGS | ||
23 | TYPE_DATA = 0, | ||
24 | #else | ||
25 | TYPE_DATA = 1, | ||
26 | #endif | ||
27 | TYPE_MAX | ||
15 | }; | 28 | }; |
16 | 29 | ||
17 | #ifdef __KERNEL__ | 30 | #ifdef __KERNEL__ |
@@ -34,6 +47,12 @@ static inline void hw_breakpoint_init(struct perf_event_attr *attr) | |||
34 | attr->sample_period = 1; | 47 | attr->sample_period = 1; |
35 | } | 48 | } |
36 | 49 | ||
50 | static inline void ptrace_breakpoint_init(struct perf_event_attr *attr) | ||
51 | { | ||
52 | hw_breakpoint_init(attr); | ||
53 | attr->exclude_kernel = 1; | ||
54 | } | ||
55 | |||
37 | static inline unsigned long hw_breakpoint_addr(struct perf_event *bp) | 56 | static inline unsigned long hw_breakpoint_addr(struct perf_event *bp) |
38 | { | 57 | { |
39 | return bp->attr.bp_addr; | 58 | return bp->attr.bp_addr; |
diff --git a/include/linux/mm.h b/include/linux/mm.h index 462acaf36f3a..fb19bb92b809 100644 --- a/include/linux/mm.h +++ b/include/linux/mm.h | |||
@@ -19,7 +19,6 @@ struct anon_vma; | |||
19 | struct file_ra_state; | 19 | struct file_ra_state; |
20 | struct user_struct; | 20 | struct user_struct; |
21 | struct writeback_control; | 21 | struct writeback_control; |
22 | struct rlimit; | ||
23 | 22 | ||
24 | #ifndef CONFIG_DISCONTIGMEM /* Don't use mapnrs, do it properly */ | 23 | #ifndef CONFIG_DISCONTIGMEM /* Don't use mapnrs, do it properly */ |
25 | extern unsigned long max_mapnr; | 24 | extern unsigned long max_mapnr; |
@@ -1449,9 +1448,6 @@ int vmemmap_populate_basepages(struct page *start_page, | |||
1449 | int vmemmap_populate(struct page *start_page, unsigned long pages, int node); | 1448 | int vmemmap_populate(struct page *start_page, unsigned long pages, int node); |
1450 | void vmemmap_populate_print_last(void); | 1449 | void vmemmap_populate_print_last(void); |
1451 | 1450 | ||
1452 | extern int account_locked_memory(struct mm_struct *mm, struct rlimit *rlim, | ||
1453 | size_t size); | ||
1454 | extern void refund_locked_memory(struct mm_struct *mm, size_t size); | ||
1455 | 1451 | ||
1456 | enum mf_flags { | 1452 | enum mf_flags { |
1457 | MF_COUNT_INCREASED = 1 << 0, | 1453 | MF_COUNT_INCREASED = 1 << 0, |
diff --git a/include/linux/perf_event.h b/include/linux/perf_event.h index c8e375440403..3fd5c82e0e18 100644 --- a/include/linux/perf_event.h +++ b/include/linux/perf_event.h | |||
@@ -203,8 +203,19 @@ struct perf_event_attr { | |||
203 | enable_on_exec : 1, /* next exec enables */ | 203 | enable_on_exec : 1, /* next exec enables */ |
204 | task : 1, /* trace fork/exit */ | 204 | task : 1, /* trace fork/exit */ |
205 | watermark : 1, /* wakeup_watermark */ | 205 | watermark : 1, /* wakeup_watermark */ |
206 | 206 | /* | |
207 | __reserved_1 : 49; | 207 | * precise_ip: |
208 | * | ||
209 | * 0 - SAMPLE_IP can have arbitrary skid | ||
210 | * 1 - SAMPLE_IP must have constant skid | ||
211 | * 2 - SAMPLE_IP requested to have 0 skid | ||
212 | * 3 - SAMPLE_IP must have 0 skid | ||
213 | * | ||
214 | * See also PERF_RECORD_MISC_EXACT_IP | ||
215 | */ | ||
216 | precise_ip : 2, /* skid constraint */ | ||
217 | |||
218 | __reserved_1 : 47; | ||
208 | 219 | ||
209 | union { | 220 | union { |
210 | __u32 wakeup_events; /* wakeup every n events */ | 221 | __u32 wakeup_events; /* wakeup every n events */ |
@@ -287,11 +298,24 @@ struct perf_event_mmap_page { | |||
287 | __u64 data_tail; /* user-space written tail */ | 298 | __u64 data_tail; /* user-space written tail */ |
288 | }; | 299 | }; |
289 | 300 | ||
290 | #define PERF_RECORD_MISC_CPUMODE_MASK (3 << 0) | 301 | #define PERF_RECORD_MISC_CPUMODE_MASK (7 << 0) |
291 | #define PERF_RECORD_MISC_CPUMODE_UNKNOWN (0 << 0) | 302 | #define PERF_RECORD_MISC_CPUMODE_UNKNOWN (0 << 0) |
292 | #define PERF_RECORD_MISC_KERNEL (1 << 0) | 303 | #define PERF_RECORD_MISC_KERNEL (1 << 0) |
293 | #define PERF_RECORD_MISC_USER (2 << 0) | 304 | #define PERF_RECORD_MISC_USER (2 << 0) |
294 | #define PERF_RECORD_MISC_HYPERVISOR (3 << 0) | 305 | #define PERF_RECORD_MISC_HYPERVISOR (3 << 0) |
306 | #define PERF_RECORD_MISC_GUEST_KERNEL (4 << 0) | ||
307 | #define PERF_RECORD_MISC_GUEST_USER (5 << 0) | ||
308 | |||
309 | /* | ||
310 | * Indicates that the content of PERF_SAMPLE_IP points to | ||
311 | * the actual instruction that triggered the event. See also | ||
312 | * perf_event_attr::precise_ip. | ||
313 | */ | ||
314 | #define PERF_RECORD_MISC_EXACT_IP (1 << 14) | ||
315 | /* | ||
316 | * Reserve the last bit to indicate some extended misc field | ||
317 | */ | ||
318 | #define PERF_RECORD_MISC_EXT_RESERVED (1 << 15) | ||
295 | 319 | ||
296 | struct perf_event_header { | 320 | struct perf_event_header { |
297 | __u32 type; | 321 | __u32 type; |
@@ -439,6 +463,12 @@ enum perf_callchain_context { | |||
439 | # include <asm/perf_event.h> | 463 | # include <asm/perf_event.h> |
440 | #endif | 464 | #endif |
441 | 465 | ||
466 | struct perf_guest_info_callbacks { | ||
467 | int (*is_in_guest) (void); | ||
468 | int (*is_user_mode) (void); | ||
469 | unsigned long (*get_guest_ip) (void); | ||
470 | }; | ||
471 | |||
442 | #ifdef CONFIG_HAVE_HW_BREAKPOINT | 472 | #ifdef CONFIG_HAVE_HW_BREAKPOINT |
443 | #include <asm/hw_breakpoint.h> | 473 | #include <asm/hw_breakpoint.h> |
444 | #endif | 474 | #endif |
@@ -468,6 +498,17 @@ struct perf_raw_record { | |||
468 | void *data; | 498 | void *data; |
469 | }; | 499 | }; |
470 | 500 | ||
501 | struct perf_branch_entry { | ||
502 | __u64 from; | ||
503 | __u64 to; | ||
504 | __u64 flags; | ||
505 | }; | ||
506 | |||
507 | struct perf_branch_stack { | ||
508 | __u64 nr; | ||
509 | struct perf_branch_entry entries[0]; | ||
510 | }; | ||
511 | |||
471 | struct task_struct; | 512 | struct task_struct; |
472 | 513 | ||
473 | /** | 514 | /** |
@@ -506,6 +547,8 @@ struct hw_perf_event { | |||
506 | 547 | ||
507 | struct perf_event; | 548 | struct perf_event; |
508 | 549 | ||
550 | #define PERF_EVENT_TXN_STARTED 1 | ||
551 | |||
509 | /** | 552 | /** |
510 | * struct pmu - generic performance monitoring unit | 553 | * struct pmu - generic performance monitoring unit |
511 | */ | 554 | */ |
@@ -516,6 +559,16 @@ struct pmu { | |||
516 | void (*stop) (struct perf_event *event); | 559 | void (*stop) (struct perf_event *event); |
517 | void (*read) (struct perf_event *event); | 560 | void (*read) (struct perf_event *event); |
518 | void (*unthrottle) (struct perf_event *event); | 561 | void (*unthrottle) (struct perf_event *event); |
562 | |||
563 | /* | ||
564 | * group events scheduling is treated as a transaction, | ||
565 | * add group events as a whole and perform one schedulability test. | ||
566 | * If test fails, roll back the whole group | ||
567 | */ | ||
568 | |||
569 | void (*start_txn) (const struct pmu *pmu); | ||
570 | void (*cancel_txn) (const struct pmu *pmu); | ||
571 | int (*commit_txn) (const struct pmu *pmu); | ||
519 | }; | 572 | }; |
520 | 573 | ||
521 | /** | 574 | /** |
@@ -571,6 +624,14 @@ enum perf_group_flag { | |||
571 | PERF_GROUP_SOFTWARE = 0x1, | 624 | PERF_GROUP_SOFTWARE = 0x1, |
572 | }; | 625 | }; |
573 | 626 | ||
627 | #define SWEVENT_HLIST_BITS 8 | ||
628 | #define SWEVENT_HLIST_SIZE (1 << SWEVENT_HLIST_BITS) | ||
629 | |||
630 | struct swevent_hlist { | ||
631 | struct hlist_head heads[SWEVENT_HLIST_SIZE]; | ||
632 | struct rcu_head rcu_head; | ||
633 | }; | ||
634 | |||
574 | /** | 635 | /** |
575 | * struct perf_event - performance event kernel representation: | 636 | * struct perf_event - performance event kernel representation: |
576 | */ | 637 | */ |
@@ -579,6 +640,7 @@ struct perf_event { | |||
579 | struct list_head group_entry; | 640 | struct list_head group_entry; |
580 | struct list_head event_entry; | 641 | struct list_head event_entry; |
581 | struct list_head sibling_list; | 642 | struct list_head sibling_list; |
643 | struct hlist_node hlist_entry; | ||
582 | int nr_siblings; | 644 | int nr_siblings; |
583 | int group_flags; | 645 | int group_flags; |
584 | struct perf_event *group_leader; | 646 | struct perf_event *group_leader; |
@@ -726,6 +788,9 @@ struct perf_cpu_context { | |||
726 | int active_oncpu; | 788 | int active_oncpu; |
727 | int max_pertask; | 789 | int max_pertask; |
728 | int exclusive; | 790 | int exclusive; |
791 | struct swevent_hlist *swevent_hlist; | ||
792 | struct mutex hlist_mutex; | ||
793 | int hlist_refcount; | ||
729 | 794 | ||
730 | /* | 795 | /* |
731 | * Recursion avoidance: | 796 | * Recursion avoidance: |
@@ -769,9 +834,6 @@ extern void perf_disable(void); | |||
769 | extern void perf_enable(void); | 834 | extern void perf_enable(void); |
770 | extern int perf_event_task_disable(void); | 835 | extern int perf_event_task_disable(void); |
771 | extern int perf_event_task_enable(void); | 836 | extern int perf_event_task_enable(void); |
772 | extern int hw_perf_group_sched_in(struct perf_event *group_leader, | ||
773 | struct perf_cpu_context *cpuctx, | ||
774 | struct perf_event_context *ctx); | ||
775 | extern void perf_event_update_userpage(struct perf_event *event); | 837 | extern void perf_event_update_userpage(struct perf_event *event); |
776 | extern int perf_event_release_kernel(struct perf_event *event); | 838 | extern int perf_event_release_kernel(struct perf_event *event); |
777 | extern struct perf_event * | 839 | extern struct perf_event * |
@@ -902,6 +964,10 @@ static inline void perf_event_mmap(struct vm_area_struct *vma) | |||
902 | __perf_event_mmap(vma); | 964 | __perf_event_mmap(vma); |
903 | } | 965 | } |
904 | 966 | ||
967 | extern struct perf_guest_info_callbacks *perf_guest_cbs; | ||
968 | extern int perf_register_guest_info_callbacks(struct perf_guest_info_callbacks *callbacks); | ||
969 | extern int perf_unregister_guest_info_callbacks(struct perf_guest_info_callbacks *callbacks); | ||
970 | |||
905 | extern void perf_event_comm(struct task_struct *tsk); | 971 | extern void perf_event_comm(struct task_struct *tsk); |
906 | extern void perf_event_fork(struct task_struct *tsk); | 972 | extern void perf_event_fork(struct task_struct *tsk); |
907 | 973 | ||
@@ -971,6 +1037,11 @@ perf_sw_event(u32 event_id, u64 nr, int nmi, | |||
971 | static inline void | 1037 | static inline void |
972 | perf_bp_event(struct perf_event *event, void *data) { } | 1038 | perf_bp_event(struct perf_event *event, void *data) { } |
973 | 1039 | ||
1040 | static inline int perf_register_guest_info_callbacks | ||
1041 | (struct perf_guest_info_callbacks *callbacks) { return 0; } | ||
1042 | static inline int perf_unregister_guest_info_callbacks | ||
1043 | (struct perf_guest_info_callbacks *callbacks) { return 0; } | ||
1044 | |||
974 | static inline void perf_event_mmap(struct vm_area_struct *vma) { } | 1045 | static inline void perf_event_mmap(struct vm_area_struct *vma) { } |
975 | static inline void perf_event_comm(struct task_struct *tsk) { } | 1046 | static inline void perf_event_comm(struct task_struct *tsk) { } |
976 | static inline void perf_event_fork(struct task_struct *tsk) { } | 1047 | static inline void perf_event_fork(struct task_struct *tsk) { } |
diff --git a/include/linux/ptrace.h b/include/linux/ptrace.h index e1fb60729979..4272521e29e9 100644 --- a/include/linux/ptrace.h +++ b/include/linux/ptrace.h | |||
@@ -345,18 +345,6 @@ static inline void user_single_step_siginfo(struct task_struct *tsk, | |||
345 | #define arch_ptrace_stop(code, info) do { } while (0) | 345 | #define arch_ptrace_stop(code, info) do { } while (0) |
346 | #endif | 346 | #endif |
347 | 347 | ||
348 | #ifndef arch_ptrace_untrace | ||
349 | /* | ||
350 | * Do machine-specific work before untracing child. | ||
351 | * | ||
352 | * This is called for a normal detach as well as from ptrace_exit() | ||
353 | * when the tracing task dies. | ||
354 | * | ||
355 | * Called with write_lock(&tasklist_lock) held. | ||
356 | */ | ||
357 | #define arch_ptrace_untrace(task) do { } while (0) | ||
358 | #endif | ||
359 | |||
360 | extern int task_current_syscall(struct task_struct *target, long *callno, | 348 | extern int task_current_syscall(struct task_struct *target, long *callno, |
361 | unsigned long args[6], unsigned int maxargs, | 349 | unsigned long args[6], unsigned int maxargs, |
362 | unsigned long *sp, unsigned long *pc); | 350 | unsigned long *sp, unsigned long *pc); |
diff --git a/include/linux/sched.h b/include/linux/sched.h index 2b7b81df78b3..28b71ee133f0 100644 --- a/include/linux/sched.h +++ b/include/linux/sched.h | |||
@@ -99,7 +99,6 @@ struct futex_pi_state; | |||
99 | struct robust_list_head; | 99 | struct robust_list_head; |
100 | struct bio_list; | 100 | struct bio_list; |
101 | struct fs_struct; | 101 | struct fs_struct; |
102 | struct bts_context; | ||
103 | struct perf_event_context; | 102 | struct perf_event_context; |
104 | 103 | ||
105 | /* | 104 | /* |
@@ -1272,12 +1271,6 @@ struct task_struct { | |||
1272 | struct list_head ptraced; | 1271 | struct list_head ptraced; |
1273 | struct list_head ptrace_entry; | 1272 | struct list_head ptrace_entry; |
1274 | 1273 | ||
1275 | /* | ||
1276 | * This is the tracer handle for the ptrace BTS extension. | ||
1277 | * This field actually belongs to the ptracer task. | ||
1278 | */ | ||
1279 | struct bts_context *bts; | ||
1280 | |||
1281 | /* PID/PID hash table linkage. */ | 1274 | /* PID/PID hash table linkage. */ |
1282 | struct pid_link pids[PIDTYPE_MAX]; | 1275 | struct pid_link pids[PIDTYPE_MAX]; |
1283 | struct list_head thread_group; | 1276 | struct list_head thread_group; |
@@ -2122,10 +2115,8 @@ extern void set_task_comm(struct task_struct *tsk, char *from); | |||
2122 | extern char *get_task_comm(char *to, struct task_struct *tsk); | 2115 | extern char *get_task_comm(char *to, struct task_struct *tsk); |
2123 | 2116 | ||
2124 | #ifdef CONFIG_SMP | 2117 | #ifdef CONFIG_SMP |
2125 | extern void wait_task_context_switch(struct task_struct *p); | ||
2126 | extern unsigned long wait_task_inactive(struct task_struct *, long match_state); | 2118 | extern unsigned long wait_task_inactive(struct task_struct *, long match_state); |
2127 | #else | 2119 | #else |
2128 | static inline void wait_task_context_switch(struct task_struct *p) {} | ||
2129 | static inline unsigned long wait_task_inactive(struct task_struct *p, | 2120 | static inline unsigned long wait_task_inactive(struct task_struct *p, |
2130 | long match_state) | 2121 | long match_state) |
2131 | { | 2122 | { |
diff --git a/include/trace/events/lock.h b/include/trace/events/lock.h index 5c1dcfc16c60..2821b86de63b 100644 --- a/include/trace/events/lock.h +++ b/include/trace/events/lock.h | |||
@@ -35,15 +35,15 @@ TRACE_EVENT(lock_acquire, | |||
35 | __get_str(name)) | 35 | __get_str(name)) |
36 | ); | 36 | ); |
37 | 37 | ||
38 | TRACE_EVENT(lock_release, | 38 | DECLARE_EVENT_CLASS(lock, |
39 | 39 | ||
40 | TP_PROTO(struct lockdep_map *lock, int nested, unsigned long ip), | 40 | TP_PROTO(struct lockdep_map *lock, unsigned long ip), |
41 | 41 | ||
42 | TP_ARGS(lock, nested, ip), | 42 | TP_ARGS(lock, ip), |
43 | 43 | ||
44 | TP_STRUCT__entry( | 44 | TP_STRUCT__entry( |
45 | __string(name, lock->name) | 45 | __string( name, lock->name ) |
46 | __field(void *, lockdep_addr) | 46 | __field( void *, lockdep_addr ) |
47 | ), | 47 | ), |
48 | 48 | ||
49 | TP_fast_assign( | 49 | TP_fast_assign( |
@@ -51,51 +51,30 @@ TRACE_EVENT(lock_release, | |||
51 | __entry->lockdep_addr = lock; | 51 | __entry->lockdep_addr = lock; |
52 | ), | 52 | ), |
53 | 53 | ||
54 | TP_printk("%p %s", | 54 | TP_printk("%p %s", __entry->lockdep_addr, __get_str(name)) |
55 | __entry->lockdep_addr, __get_str(name)) | ||
56 | ); | 55 | ); |
57 | 56 | ||
58 | #ifdef CONFIG_LOCK_STAT | 57 | DEFINE_EVENT(lock, lock_release, |
59 | |||
60 | TRACE_EVENT(lock_contended, | ||
61 | 58 | ||
62 | TP_PROTO(struct lockdep_map *lock, unsigned long ip), | 59 | TP_PROTO(struct lockdep_map *lock, unsigned long ip), |
63 | 60 | ||
64 | TP_ARGS(lock, ip), | 61 | TP_ARGS(lock, ip) |
62 | ); | ||
65 | 63 | ||
66 | TP_STRUCT__entry( | 64 | #ifdef CONFIG_LOCK_STAT |
67 | __string(name, lock->name) | ||
68 | __field(void *, lockdep_addr) | ||
69 | ), | ||
70 | 65 | ||
71 | TP_fast_assign( | 66 | DEFINE_EVENT(lock, lock_contended, |
72 | __assign_str(name, lock->name); | ||
73 | __entry->lockdep_addr = lock; | ||
74 | ), | ||
75 | 67 | ||
76 | TP_printk("%p %s", | 68 | TP_PROTO(struct lockdep_map *lock, unsigned long ip), |
77 | __entry->lockdep_addr, __get_str(name)) | ||
78 | ); | ||
79 | 69 | ||
80 | TRACE_EVENT(lock_acquired, | 70 | TP_ARGS(lock, ip) |
81 | TP_PROTO(struct lockdep_map *lock, unsigned long ip, s64 waittime), | 71 | ); |
82 | 72 | ||
83 | TP_ARGS(lock, ip, waittime), | 73 | DEFINE_EVENT(lock, lock_acquired, |
84 | 74 | ||
85 | TP_STRUCT__entry( | 75 | TP_PROTO(struct lockdep_map *lock, unsigned long ip), |
86 | __string(name, lock->name) | ||
87 | __field(s64, wait_nsec) | ||
88 | __field(void *, lockdep_addr) | ||
89 | ), | ||
90 | 76 | ||
91 | TP_fast_assign( | 77 | TP_ARGS(lock, ip) |
92 | __assign_str(name, lock->name); | ||
93 | __entry->wait_nsec = waittime; | ||
94 | __entry->lockdep_addr = lock; | ||
95 | ), | ||
96 | TP_printk("%p %s (%llu ns)", __entry->lockdep_addr, | ||
97 | __get_str(name), | ||
98 | __entry->wait_nsec) | ||
99 | ); | 78 | ); |
100 | 79 | ||
101 | #endif | 80 | #endif |
diff --git a/include/trace/ftrace.h b/include/trace/ftrace.h index 75dd7787fb37..16253db38d73 100644 --- a/include/trace/ftrace.h +++ b/include/trace/ftrace.h | |||
@@ -763,13 +763,12 @@ __attribute__((section("_ftrace_events"))) event_##call = { \ | |||
763 | #define DECLARE_EVENT_CLASS(call, proto, args, tstruct, assign, print) \ | 763 | #define DECLARE_EVENT_CLASS(call, proto, args, tstruct, assign, print) \ |
764 | static notrace void \ | 764 | static notrace void \ |
765 | perf_trace_templ_##call(struct ftrace_event_call *event_call, \ | 765 | perf_trace_templ_##call(struct ftrace_event_call *event_call, \ |
766 | proto) \ | 766 | struct pt_regs *__regs, proto) \ |
767 | { \ | 767 | { \ |
768 | struct ftrace_data_offsets_##call __maybe_unused __data_offsets;\ | 768 | struct ftrace_data_offsets_##call __maybe_unused __data_offsets;\ |
769 | struct ftrace_raw_##call *entry; \ | 769 | struct ftrace_raw_##call *entry; \ |
770 | u64 __addr = 0, __count = 1; \ | 770 | u64 __addr = 0, __count = 1; \ |
771 | unsigned long irq_flags; \ | 771 | unsigned long irq_flags; \ |
772 | struct pt_regs *__regs; \ | ||
773 | int __entry_size; \ | 772 | int __entry_size; \ |
774 | int __data_size; \ | 773 | int __data_size; \ |
775 | int rctx; \ | 774 | int rctx; \ |
@@ -790,20 +789,22 @@ perf_trace_templ_##call(struct ftrace_event_call *event_call, \ | |||
790 | \ | 789 | \ |
791 | { assign; } \ | 790 | { assign; } \ |
792 | \ | 791 | \ |
793 | __regs = &__get_cpu_var(perf_trace_regs); \ | ||
794 | perf_fetch_caller_regs(__regs, 2); \ | ||
795 | \ | ||
796 | perf_trace_buf_submit(entry, __entry_size, rctx, __addr, \ | 792 | perf_trace_buf_submit(entry, __entry_size, rctx, __addr, \ |
797 | __count, irq_flags, __regs); \ | 793 | __count, irq_flags, __regs); \ |
798 | } | 794 | } |
799 | 795 | ||
800 | #undef DEFINE_EVENT | 796 | #undef DEFINE_EVENT |
801 | #define DEFINE_EVENT(template, call, proto, args) \ | 797 | #define DEFINE_EVENT(template, call, proto, args) \ |
802 | static notrace void perf_trace_##call(proto) \ | 798 | static notrace void perf_trace_##call(proto) \ |
803 | { \ | 799 | { \ |
804 | struct ftrace_event_call *event_call = &event_##call; \ | 800 | struct ftrace_event_call *event_call = &event_##call; \ |
805 | \ | 801 | struct pt_regs *__regs = &get_cpu_var(perf_trace_regs); \ |
806 | perf_trace_templ_##template(event_call, args); \ | 802 | \ |
803 | perf_fetch_caller_regs(__regs, 1); \ | ||
804 | \ | ||
805 | perf_trace_templ_##template(event_call, __regs, args); \ | ||
806 | \ | ||
807 | put_cpu_var(perf_trace_regs); \ | ||
807 | } | 808 | } |
808 | 809 | ||
809 | #undef DEFINE_EVENT_PRINT | 810 | #undef DEFINE_EVENT_PRINT |
diff --git a/kernel/fork.c b/kernel/fork.c index 4c14942a0ee3..4d57d9e3a6e9 100644 --- a/kernel/fork.c +++ b/kernel/fork.c | |||
@@ -1112,8 +1112,6 @@ static struct task_struct *copy_process(unsigned long clone_flags, | |||
1112 | p->memcg_batch.memcg = NULL; | 1112 | p->memcg_batch.memcg = NULL; |
1113 | #endif | 1113 | #endif |
1114 | 1114 | ||
1115 | p->bts = NULL; | ||
1116 | |||
1117 | /* Perform scheduler related setup. Assign this task to a CPU. */ | 1115 | /* Perform scheduler related setup. Assign this task to a CPU. */ |
1118 | sched_fork(p, clone_flags); | 1116 | sched_fork(p, clone_flags); |
1119 | 1117 | ||
diff --git a/kernel/hw_breakpoint.c b/kernel/hw_breakpoint.c index 03808ed342a6..7a56b22e0602 100644 --- a/kernel/hw_breakpoint.c +++ b/kernel/hw_breakpoint.c | |||
@@ -40,23 +40,29 @@ | |||
40 | #include <linux/percpu.h> | 40 | #include <linux/percpu.h> |
41 | #include <linux/sched.h> | 41 | #include <linux/sched.h> |
42 | #include <linux/init.h> | 42 | #include <linux/init.h> |
43 | #include <linux/slab.h> | ||
43 | #include <linux/cpu.h> | 44 | #include <linux/cpu.h> |
44 | #include <linux/smp.h> | 45 | #include <linux/smp.h> |
45 | 46 | ||
46 | #include <linux/hw_breakpoint.h> | 47 | #include <linux/hw_breakpoint.h> |
47 | 48 | ||
49 | |||
48 | /* | 50 | /* |
49 | * Constraints data | 51 | * Constraints data |
50 | */ | 52 | */ |
51 | 53 | ||
52 | /* Number of pinned cpu breakpoints in a cpu */ | 54 | /* Number of pinned cpu breakpoints in a cpu */ |
53 | static DEFINE_PER_CPU(unsigned int, nr_cpu_bp_pinned); | 55 | static DEFINE_PER_CPU(unsigned int, nr_cpu_bp_pinned[TYPE_MAX]); |
54 | 56 | ||
55 | /* Number of pinned task breakpoints in a cpu */ | 57 | /* Number of pinned task breakpoints in a cpu */ |
56 | static DEFINE_PER_CPU(unsigned int, nr_task_bp_pinned[HBP_NUM]); | 58 | static DEFINE_PER_CPU(unsigned int *, nr_task_bp_pinned[TYPE_MAX]); |
57 | 59 | ||
58 | /* Number of non-pinned cpu/task breakpoints in a cpu */ | 60 | /* Number of non-pinned cpu/task breakpoints in a cpu */ |
59 | static DEFINE_PER_CPU(unsigned int, nr_bp_flexible); | 61 | static DEFINE_PER_CPU(unsigned int, nr_bp_flexible[TYPE_MAX]); |
62 | |||
63 | static int nr_slots[TYPE_MAX]; | ||
64 | |||
65 | static int constraints_initialized; | ||
60 | 66 | ||
61 | /* Gather the number of total pinned and un-pinned bp in a cpuset */ | 67 | /* Gather the number of total pinned and un-pinned bp in a cpuset */ |
62 | struct bp_busy_slots { | 68 | struct bp_busy_slots { |
@@ -67,16 +73,29 @@ struct bp_busy_slots { | |||
67 | /* Serialize accesses to the above constraints */ | 73 | /* Serialize accesses to the above constraints */ |
68 | static DEFINE_MUTEX(nr_bp_mutex); | 74 | static DEFINE_MUTEX(nr_bp_mutex); |
69 | 75 | ||
76 | __weak int hw_breakpoint_weight(struct perf_event *bp) | ||
77 | { | ||
78 | return 1; | ||
79 | } | ||
80 | |||
81 | static inline enum bp_type_idx find_slot_idx(struct perf_event *bp) | ||
82 | { | ||
83 | if (bp->attr.bp_type & HW_BREAKPOINT_RW) | ||
84 | return TYPE_DATA; | ||
85 | |||
86 | return TYPE_INST; | ||
87 | } | ||
88 | |||
70 | /* | 89 | /* |
71 | * Report the maximum number of pinned breakpoints a task | 90 | * Report the maximum number of pinned breakpoints a task |
72 | * have in this cpu | 91 | * have in this cpu |
73 | */ | 92 | */ |
74 | static unsigned int max_task_bp_pinned(int cpu) | 93 | static unsigned int max_task_bp_pinned(int cpu, enum bp_type_idx type) |
75 | { | 94 | { |
76 | int i; | 95 | int i; |
77 | unsigned int *tsk_pinned = per_cpu(nr_task_bp_pinned, cpu); | 96 | unsigned int *tsk_pinned = per_cpu(nr_task_bp_pinned[type], cpu); |
78 | 97 | ||
79 | for (i = HBP_NUM -1; i >= 0; i--) { | 98 | for (i = nr_slots[type] - 1; i >= 0; i--) { |
80 | if (tsk_pinned[i] > 0) | 99 | if (tsk_pinned[i] > 0) |
81 | return i + 1; | 100 | return i + 1; |
82 | } | 101 | } |
@@ -84,7 +103,7 @@ static unsigned int max_task_bp_pinned(int cpu) | |||
84 | return 0; | 103 | return 0; |
85 | } | 104 | } |
86 | 105 | ||
87 | static int task_bp_pinned(struct task_struct *tsk) | 106 | static int task_bp_pinned(struct task_struct *tsk, enum bp_type_idx type) |
88 | { | 107 | { |
89 | struct perf_event_context *ctx = tsk->perf_event_ctxp; | 108 | struct perf_event_context *ctx = tsk->perf_event_ctxp; |
90 | struct list_head *list; | 109 | struct list_head *list; |
@@ -105,7 +124,8 @@ static int task_bp_pinned(struct task_struct *tsk) | |||
105 | */ | 124 | */ |
106 | list_for_each_entry(bp, list, event_entry) { | 125 | list_for_each_entry(bp, list, event_entry) { |
107 | if (bp->attr.type == PERF_TYPE_BREAKPOINT) | 126 | if (bp->attr.type == PERF_TYPE_BREAKPOINT) |
108 | count++; | 127 | if (find_slot_idx(bp) == type) |
128 | count += hw_breakpoint_weight(bp); | ||
109 | } | 129 | } |
110 | 130 | ||
111 | raw_spin_unlock_irqrestore(&ctx->lock, flags); | 131 | raw_spin_unlock_irqrestore(&ctx->lock, flags); |
@@ -118,18 +138,19 @@ static int task_bp_pinned(struct task_struct *tsk) | |||
118 | * a given cpu (cpu > -1) or in all of them (cpu = -1). | 138 | * a given cpu (cpu > -1) or in all of them (cpu = -1). |
119 | */ | 139 | */ |
120 | static void | 140 | static void |
121 | fetch_bp_busy_slots(struct bp_busy_slots *slots, struct perf_event *bp) | 141 | fetch_bp_busy_slots(struct bp_busy_slots *slots, struct perf_event *bp, |
142 | enum bp_type_idx type) | ||
122 | { | 143 | { |
123 | int cpu = bp->cpu; | 144 | int cpu = bp->cpu; |
124 | struct task_struct *tsk = bp->ctx->task; | 145 | struct task_struct *tsk = bp->ctx->task; |
125 | 146 | ||
126 | if (cpu >= 0) { | 147 | if (cpu >= 0) { |
127 | slots->pinned = per_cpu(nr_cpu_bp_pinned, cpu); | 148 | slots->pinned = per_cpu(nr_cpu_bp_pinned[type], cpu); |
128 | if (!tsk) | 149 | if (!tsk) |
129 | slots->pinned += max_task_bp_pinned(cpu); | 150 | slots->pinned += max_task_bp_pinned(cpu, type); |
130 | else | 151 | else |
131 | slots->pinned += task_bp_pinned(tsk); | 152 | slots->pinned += task_bp_pinned(tsk, type); |
132 | slots->flexible = per_cpu(nr_bp_flexible, cpu); | 153 | slots->flexible = per_cpu(nr_bp_flexible[type], cpu); |
133 | 154 | ||
134 | return; | 155 | return; |
135 | } | 156 | } |
@@ -137,16 +158,16 @@ fetch_bp_busy_slots(struct bp_busy_slots *slots, struct perf_event *bp) | |||
137 | for_each_online_cpu(cpu) { | 158 | for_each_online_cpu(cpu) { |
138 | unsigned int nr; | 159 | unsigned int nr; |
139 | 160 | ||
140 | nr = per_cpu(nr_cpu_bp_pinned, cpu); | 161 | nr = per_cpu(nr_cpu_bp_pinned[type], cpu); |
141 | if (!tsk) | 162 | if (!tsk) |
142 | nr += max_task_bp_pinned(cpu); | 163 | nr += max_task_bp_pinned(cpu, type); |
143 | else | 164 | else |
144 | nr += task_bp_pinned(tsk); | 165 | nr += task_bp_pinned(tsk, type); |
145 | 166 | ||
146 | if (nr > slots->pinned) | 167 | if (nr > slots->pinned) |
147 | slots->pinned = nr; | 168 | slots->pinned = nr; |
148 | 169 | ||
149 | nr = per_cpu(nr_bp_flexible, cpu); | 170 | nr = per_cpu(nr_bp_flexible[type], cpu); |
150 | 171 | ||
151 | if (nr > slots->flexible) | 172 | if (nr > slots->flexible) |
152 | slots->flexible = nr; | 173 | slots->flexible = nr; |
@@ -154,31 +175,49 @@ fetch_bp_busy_slots(struct bp_busy_slots *slots, struct perf_event *bp) | |||
154 | } | 175 | } |
155 | 176 | ||
156 | /* | 177 | /* |
178 | * For now, continue to consider flexible as pinned, until we can | ||
179 | * ensure no flexible event can ever be scheduled before a pinned event | ||
180 | * in a same cpu. | ||
181 | */ | ||
182 | static void | ||
183 | fetch_this_slot(struct bp_busy_slots *slots, int weight) | ||
184 | { | ||
185 | slots->pinned += weight; | ||
186 | } | ||
187 | |||
188 | /* | ||
157 | * Add a pinned breakpoint for the given task in our constraint table | 189 | * Add a pinned breakpoint for the given task in our constraint table |
158 | */ | 190 | */ |
159 | static void toggle_bp_task_slot(struct task_struct *tsk, int cpu, bool enable) | 191 | static void toggle_bp_task_slot(struct task_struct *tsk, int cpu, bool enable, |
192 | enum bp_type_idx type, int weight) | ||
160 | { | 193 | { |
161 | unsigned int *tsk_pinned; | 194 | unsigned int *tsk_pinned; |
162 | int count = 0; | 195 | int old_count = 0; |
196 | int old_idx = 0; | ||
197 | int idx = 0; | ||
163 | 198 | ||
164 | count = task_bp_pinned(tsk); | 199 | old_count = task_bp_pinned(tsk, type); |
200 | old_idx = old_count - 1; | ||
201 | idx = old_idx + weight; | ||
165 | 202 | ||
166 | tsk_pinned = per_cpu(nr_task_bp_pinned, cpu); | 203 | tsk_pinned = per_cpu(nr_task_bp_pinned[type], cpu); |
167 | if (enable) { | 204 | if (enable) { |
168 | tsk_pinned[count]++; | 205 | tsk_pinned[idx]++; |
169 | if (count > 0) | 206 | if (old_count > 0) |
170 | tsk_pinned[count-1]--; | 207 | tsk_pinned[old_idx]--; |
171 | } else { | 208 | } else { |
172 | tsk_pinned[count]--; | 209 | tsk_pinned[idx]--; |
173 | if (count > 0) | 210 | if (old_count > 0) |
174 | tsk_pinned[count-1]++; | 211 | tsk_pinned[old_idx]++; |
175 | } | 212 | } |
176 | } | 213 | } |
177 | 214 | ||
178 | /* | 215 | /* |
179 | * Add/remove the given breakpoint in our constraint table | 216 | * Add/remove the given breakpoint in our constraint table |
180 | */ | 217 | */ |
181 | static void toggle_bp_slot(struct perf_event *bp, bool enable) | 218 | static void |
219 | toggle_bp_slot(struct perf_event *bp, bool enable, enum bp_type_idx type, | ||
220 | int weight) | ||
182 | { | 221 | { |
183 | int cpu = bp->cpu; | 222 | int cpu = bp->cpu; |
184 | struct task_struct *tsk = bp->ctx->task; | 223 | struct task_struct *tsk = bp->ctx->task; |
@@ -186,20 +225,20 @@ static void toggle_bp_slot(struct perf_event *bp, bool enable) | |||
186 | /* Pinned counter task profiling */ | 225 | /* Pinned counter task profiling */ |
187 | if (tsk) { | 226 | if (tsk) { |
188 | if (cpu >= 0) { | 227 | if (cpu >= 0) { |
189 | toggle_bp_task_slot(tsk, cpu, enable); | 228 | toggle_bp_task_slot(tsk, cpu, enable, type, weight); |
190 | return; | 229 | return; |
191 | } | 230 | } |
192 | 231 | ||
193 | for_each_online_cpu(cpu) | 232 | for_each_online_cpu(cpu) |
194 | toggle_bp_task_slot(tsk, cpu, enable); | 233 | toggle_bp_task_slot(tsk, cpu, enable, type, weight); |
195 | return; | 234 | return; |
196 | } | 235 | } |
197 | 236 | ||
198 | /* Pinned counter cpu profiling */ | 237 | /* Pinned counter cpu profiling */ |
199 | if (enable) | 238 | if (enable) |
200 | per_cpu(nr_cpu_bp_pinned, bp->cpu)++; | 239 | per_cpu(nr_cpu_bp_pinned[type], bp->cpu) += weight; |
201 | else | 240 | else |
202 | per_cpu(nr_cpu_bp_pinned, bp->cpu)--; | 241 | per_cpu(nr_cpu_bp_pinned[type], bp->cpu) -= weight; |
203 | } | 242 | } |
204 | 243 | ||
205 | /* | 244 | /* |
@@ -246,14 +285,29 @@ static void toggle_bp_slot(struct perf_event *bp, bool enable) | |||
246 | static int __reserve_bp_slot(struct perf_event *bp) | 285 | static int __reserve_bp_slot(struct perf_event *bp) |
247 | { | 286 | { |
248 | struct bp_busy_slots slots = {0}; | 287 | struct bp_busy_slots slots = {0}; |
288 | enum bp_type_idx type; | ||
289 | int weight; | ||
249 | 290 | ||
250 | fetch_bp_busy_slots(&slots, bp); | 291 | /* We couldn't initialize breakpoint constraints on boot */ |
292 | if (!constraints_initialized) | ||
293 | return -ENOMEM; | ||
294 | |||
295 | /* Basic checks */ | ||
296 | if (bp->attr.bp_type == HW_BREAKPOINT_EMPTY || | ||
297 | bp->attr.bp_type == HW_BREAKPOINT_INVALID) | ||
298 | return -EINVAL; | ||
299 | |||
300 | type = find_slot_idx(bp); | ||
301 | weight = hw_breakpoint_weight(bp); | ||
302 | |||
303 | fetch_bp_busy_slots(&slots, bp, type); | ||
304 | fetch_this_slot(&slots, weight); | ||
251 | 305 | ||
252 | /* Flexible counters need to keep at least one slot */ | 306 | /* Flexible counters need to keep at least one slot */ |
253 | if (slots.pinned + (!!slots.flexible) == HBP_NUM) | 307 | if (slots.pinned + (!!slots.flexible) > nr_slots[type]) |
254 | return -ENOSPC; | 308 | return -ENOSPC; |
255 | 309 | ||
256 | toggle_bp_slot(bp, true); | 310 | toggle_bp_slot(bp, true, type, weight); |
257 | 311 | ||
258 | return 0; | 312 | return 0; |
259 | } | 313 | } |
@@ -273,7 +327,12 @@ int reserve_bp_slot(struct perf_event *bp) | |||
273 | 327 | ||
274 | static void __release_bp_slot(struct perf_event *bp) | 328 | static void __release_bp_slot(struct perf_event *bp) |
275 | { | 329 | { |
276 | toggle_bp_slot(bp, false); | 330 | enum bp_type_idx type; |
331 | int weight; | ||
332 | |||
333 | type = find_slot_idx(bp); | ||
334 | weight = hw_breakpoint_weight(bp); | ||
335 | toggle_bp_slot(bp, false, type, weight); | ||
277 | } | 336 | } |
278 | 337 | ||
279 | void release_bp_slot(struct perf_event *bp) | 338 | void release_bp_slot(struct perf_event *bp) |
@@ -308,6 +367,28 @@ int dbg_release_bp_slot(struct perf_event *bp) | |||
308 | return 0; | 367 | return 0; |
309 | } | 368 | } |
310 | 369 | ||
370 | static int validate_hw_breakpoint(struct perf_event *bp) | ||
371 | { | ||
372 | int ret; | ||
373 | |||
374 | ret = arch_validate_hwbkpt_settings(bp); | ||
375 | if (ret) | ||
376 | return ret; | ||
377 | |||
378 | if (arch_check_bp_in_kernelspace(bp)) { | ||
379 | if (bp->attr.exclude_kernel) | ||
380 | return -EINVAL; | ||
381 | /* | ||
382 | * Don't let unprivileged users set a breakpoint in the trap | ||
383 | * path to avoid trap recursion attacks. | ||
384 | */ | ||
385 | if (!capable(CAP_SYS_ADMIN)) | ||
386 | return -EPERM; | ||
387 | } | ||
388 | |||
389 | return 0; | ||
390 | } | ||
391 | |||
311 | int register_perf_hw_breakpoint(struct perf_event *bp) | 392 | int register_perf_hw_breakpoint(struct perf_event *bp) |
312 | { | 393 | { |
313 | int ret; | 394 | int ret; |
@@ -316,17 +397,7 @@ int register_perf_hw_breakpoint(struct perf_event *bp) | |||
316 | if (ret) | 397 | if (ret) |
317 | return ret; | 398 | return ret; |
318 | 399 | ||
319 | /* | 400 | ret = validate_hw_breakpoint(bp); |
320 | * Ptrace breakpoints can be temporary perf events only | ||
321 | * meant to reserve a slot. In this case, it is created disabled and | ||
322 | * we don't want to check the params right now (as we put a null addr) | ||
323 | * But perf tools create events as disabled and we want to check | ||
324 | * the params for them. | ||
325 | * This is a quick hack that will be removed soon, once we remove | ||
326 | * the tmp breakpoints from ptrace | ||
327 | */ | ||
328 | if (!bp->attr.disabled || !bp->overflow_handler) | ||
329 | ret = arch_validate_hwbkpt_settings(bp, bp->ctx->task); | ||
330 | 401 | ||
331 | /* if arch_validate_hwbkpt_settings() fails then release bp slot */ | 402 | /* if arch_validate_hwbkpt_settings() fails then release bp slot */ |
332 | if (ret) | 403 | if (ret) |
@@ -373,7 +444,7 @@ int modify_user_hw_breakpoint(struct perf_event *bp, struct perf_event_attr *att | |||
373 | if (attr->disabled) | 444 | if (attr->disabled) |
374 | goto end; | 445 | goto end; |
375 | 446 | ||
376 | err = arch_validate_hwbkpt_settings(bp, bp->ctx->task); | 447 | err = validate_hw_breakpoint(bp); |
377 | if (!err) | 448 | if (!err) |
378 | perf_event_enable(bp); | 449 | perf_event_enable(bp); |
379 | 450 | ||
@@ -480,7 +551,36 @@ static struct notifier_block hw_breakpoint_exceptions_nb = { | |||
480 | 551 | ||
481 | static int __init init_hw_breakpoint(void) | 552 | static int __init init_hw_breakpoint(void) |
482 | { | 553 | { |
554 | unsigned int **task_bp_pinned; | ||
555 | int cpu, err_cpu; | ||
556 | int i; | ||
557 | |||
558 | for (i = 0; i < TYPE_MAX; i++) | ||
559 | nr_slots[i] = hw_breakpoint_slots(i); | ||
560 | |||
561 | for_each_possible_cpu(cpu) { | ||
562 | for (i = 0; i < TYPE_MAX; i++) { | ||
563 | task_bp_pinned = &per_cpu(nr_task_bp_pinned[i], cpu); | ||
564 | *task_bp_pinned = kzalloc(sizeof(int) * nr_slots[i], | ||
565 | GFP_KERNEL); | ||
566 | if (!*task_bp_pinned) | ||
567 | goto err_alloc; | ||
568 | } | ||
569 | } | ||
570 | |||
571 | constraints_initialized = 1; | ||
572 | |||
483 | return register_die_notifier(&hw_breakpoint_exceptions_nb); | 573 | return register_die_notifier(&hw_breakpoint_exceptions_nb); |
574 | |||
575 | err_alloc: | ||
576 | for_each_possible_cpu(err_cpu) { | ||
577 | if (err_cpu == cpu) | ||
578 | break; | ||
579 | for (i = 0; i < TYPE_MAX; i++) | ||
580 | kfree(per_cpu(nr_task_bp_pinned[i], cpu)); | ||
581 | } | ||
582 | |||
583 | return -ENOMEM; | ||
484 | } | 584 | } |
485 | core_initcall(init_hw_breakpoint); | 585 | core_initcall(init_hw_breakpoint); |
486 | 586 | ||
diff --git a/kernel/kprobes.c b/kernel/kprobes.c index 0ed46f3e51e9..282035f3ae96 100644 --- a/kernel/kprobes.c +++ b/kernel/kprobes.c | |||
@@ -1588,6 +1588,72 @@ static void __kprobes kill_kprobe(struct kprobe *p) | |||
1588 | arch_remove_kprobe(p); | 1588 | arch_remove_kprobe(p); |
1589 | } | 1589 | } |
1590 | 1590 | ||
1591 | /* Disable one kprobe */ | ||
1592 | int __kprobes disable_kprobe(struct kprobe *kp) | ||
1593 | { | ||
1594 | int ret = 0; | ||
1595 | struct kprobe *p; | ||
1596 | |||
1597 | mutex_lock(&kprobe_mutex); | ||
1598 | |||
1599 | /* Check whether specified probe is valid. */ | ||
1600 | p = __get_valid_kprobe(kp); | ||
1601 | if (unlikely(p == NULL)) { | ||
1602 | ret = -EINVAL; | ||
1603 | goto out; | ||
1604 | } | ||
1605 | |||
1606 | /* If the probe is already disabled (or gone), just return */ | ||
1607 | if (kprobe_disabled(kp)) | ||
1608 | goto out; | ||
1609 | |||
1610 | kp->flags |= KPROBE_FLAG_DISABLED; | ||
1611 | if (p != kp) | ||
1612 | /* When kp != p, p is always enabled. */ | ||
1613 | try_to_disable_aggr_kprobe(p); | ||
1614 | |||
1615 | if (!kprobes_all_disarmed && kprobe_disabled(p)) | ||
1616 | disarm_kprobe(p); | ||
1617 | out: | ||
1618 | mutex_unlock(&kprobe_mutex); | ||
1619 | return ret; | ||
1620 | } | ||
1621 | EXPORT_SYMBOL_GPL(disable_kprobe); | ||
1622 | |||
1623 | /* Enable one kprobe */ | ||
1624 | int __kprobes enable_kprobe(struct kprobe *kp) | ||
1625 | { | ||
1626 | int ret = 0; | ||
1627 | struct kprobe *p; | ||
1628 | |||
1629 | mutex_lock(&kprobe_mutex); | ||
1630 | |||
1631 | /* Check whether specified probe is valid. */ | ||
1632 | p = __get_valid_kprobe(kp); | ||
1633 | if (unlikely(p == NULL)) { | ||
1634 | ret = -EINVAL; | ||
1635 | goto out; | ||
1636 | } | ||
1637 | |||
1638 | if (kprobe_gone(kp)) { | ||
1639 | /* This kprobe has gone, we couldn't enable it. */ | ||
1640 | ret = -EINVAL; | ||
1641 | goto out; | ||
1642 | } | ||
1643 | |||
1644 | if (p != kp) | ||
1645 | kp->flags &= ~KPROBE_FLAG_DISABLED; | ||
1646 | |||
1647 | if (!kprobes_all_disarmed && kprobe_disabled(p)) { | ||
1648 | p->flags &= ~KPROBE_FLAG_DISABLED; | ||
1649 | arm_kprobe(p); | ||
1650 | } | ||
1651 | out: | ||
1652 | mutex_unlock(&kprobe_mutex); | ||
1653 | return ret; | ||
1654 | } | ||
1655 | EXPORT_SYMBOL_GPL(enable_kprobe); | ||
1656 | |||
1591 | void __kprobes dump_kprobe(struct kprobe *kp) | 1657 | void __kprobes dump_kprobe(struct kprobe *kp) |
1592 | { | 1658 | { |
1593 | printk(KERN_WARNING "Dumping kprobe:\n"); | 1659 | printk(KERN_WARNING "Dumping kprobe:\n"); |
@@ -1805,72 +1871,6 @@ static const struct file_operations debugfs_kprobes_operations = { | |||
1805 | .release = seq_release, | 1871 | .release = seq_release, |
1806 | }; | 1872 | }; |
1807 | 1873 | ||
1808 | /* Disable one kprobe */ | ||
1809 | int __kprobes disable_kprobe(struct kprobe *kp) | ||
1810 | { | ||
1811 | int ret = 0; | ||
1812 | struct kprobe *p; | ||
1813 | |||
1814 | mutex_lock(&kprobe_mutex); | ||
1815 | |||
1816 | /* Check whether specified probe is valid. */ | ||
1817 | p = __get_valid_kprobe(kp); | ||
1818 | if (unlikely(p == NULL)) { | ||
1819 | ret = -EINVAL; | ||
1820 | goto out; | ||
1821 | } | ||
1822 | |||
1823 | /* If the probe is already disabled (or gone), just return */ | ||
1824 | if (kprobe_disabled(kp)) | ||
1825 | goto out; | ||
1826 | |||
1827 | kp->flags |= KPROBE_FLAG_DISABLED; | ||
1828 | if (p != kp) | ||
1829 | /* When kp != p, p is always enabled. */ | ||
1830 | try_to_disable_aggr_kprobe(p); | ||
1831 | |||
1832 | if (!kprobes_all_disarmed && kprobe_disabled(p)) | ||
1833 | disarm_kprobe(p); | ||
1834 | out: | ||
1835 | mutex_unlock(&kprobe_mutex); | ||
1836 | return ret; | ||
1837 | } | ||
1838 | EXPORT_SYMBOL_GPL(disable_kprobe); | ||
1839 | |||
1840 | /* Enable one kprobe */ | ||
1841 | int __kprobes enable_kprobe(struct kprobe *kp) | ||
1842 | { | ||
1843 | int ret = 0; | ||
1844 | struct kprobe *p; | ||
1845 | |||
1846 | mutex_lock(&kprobe_mutex); | ||
1847 | |||
1848 | /* Check whether specified probe is valid. */ | ||
1849 | p = __get_valid_kprobe(kp); | ||
1850 | if (unlikely(p == NULL)) { | ||
1851 | ret = -EINVAL; | ||
1852 | goto out; | ||
1853 | } | ||
1854 | |||
1855 | if (kprobe_gone(kp)) { | ||
1856 | /* This kprobe has gone, we couldn't enable it. */ | ||
1857 | ret = -EINVAL; | ||
1858 | goto out; | ||
1859 | } | ||
1860 | |||
1861 | if (p != kp) | ||
1862 | kp->flags &= ~KPROBE_FLAG_DISABLED; | ||
1863 | |||
1864 | if (!kprobes_all_disarmed && kprobe_disabled(p)) { | ||
1865 | p->flags &= ~KPROBE_FLAG_DISABLED; | ||
1866 | arm_kprobe(p); | ||
1867 | } | ||
1868 | out: | ||
1869 | mutex_unlock(&kprobe_mutex); | ||
1870 | return ret; | ||
1871 | } | ||
1872 | EXPORT_SYMBOL_GPL(enable_kprobe); | ||
1873 | |||
1874 | static void __kprobes arm_all_kprobes(void) | 1874 | static void __kprobes arm_all_kprobes(void) |
1875 | { | 1875 | { |
1876 | struct hlist_head *head; | 1876 | struct hlist_head *head; |
diff --git a/kernel/lockdep.c b/kernel/lockdep.c index 4349e9793419..ec21304856d1 100644 --- a/kernel/lockdep.c +++ b/kernel/lockdep.c | |||
@@ -3232,7 +3232,7 @@ void lock_release(struct lockdep_map *lock, int nested, | |||
3232 | raw_local_irq_save(flags); | 3232 | raw_local_irq_save(flags); |
3233 | check_flags(flags); | 3233 | check_flags(flags); |
3234 | current->lockdep_recursion = 1; | 3234 | current->lockdep_recursion = 1; |
3235 | trace_lock_release(lock, nested, ip); | 3235 | trace_lock_release(lock, ip); |
3236 | __lock_release(lock, nested, ip); | 3236 | __lock_release(lock, nested, ip); |
3237 | current->lockdep_recursion = 0; | 3237 | current->lockdep_recursion = 0; |
3238 | raw_local_irq_restore(flags); | 3238 | raw_local_irq_restore(flags); |
@@ -3385,7 +3385,7 @@ found_it: | |||
3385 | hlock->holdtime_stamp = now; | 3385 | hlock->holdtime_stamp = now; |
3386 | } | 3386 | } |
3387 | 3387 | ||
3388 | trace_lock_acquired(lock, ip, waittime); | 3388 | trace_lock_acquired(lock, ip); |
3389 | 3389 | ||
3390 | stats = get_lock_stats(hlock_class(hlock)); | 3390 | stats = get_lock_stats(hlock_class(hlock)); |
3391 | if (waittime) { | 3391 | if (waittime) { |
diff --git a/kernel/perf_event.c b/kernel/perf_event.c index 3d1552d3c12b..a4fa381db3c2 100644 --- a/kernel/perf_event.c +++ b/kernel/perf_event.c | |||
@@ -16,6 +16,7 @@ | |||
16 | #include <linux/file.h> | 16 | #include <linux/file.h> |
17 | #include <linux/poll.h> | 17 | #include <linux/poll.h> |
18 | #include <linux/slab.h> | 18 | #include <linux/slab.h> |
19 | #include <linux/hash.h> | ||
19 | #include <linux/sysfs.h> | 20 | #include <linux/sysfs.h> |
20 | #include <linux/dcache.h> | 21 | #include <linux/dcache.h> |
21 | #include <linux/percpu.h> | 22 | #include <linux/percpu.h> |
@@ -82,14 +83,6 @@ extern __weak const struct pmu *hw_perf_event_init(struct perf_event *event) | |||
82 | void __weak hw_perf_disable(void) { barrier(); } | 83 | void __weak hw_perf_disable(void) { barrier(); } |
83 | void __weak hw_perf_enable(void) { barrier(); } | 84 | void __weak hw_perf_enable(void) { barrier(); } |
84 | 85 | ||
85 | int __weak | ||
86 | hw_perf_group_sched_in(struct perf_event *group_leader, | ||
87 | struct perf_cpu_context *cpuctx, | ||
88 | struct perf_event_context *ctx) | ||
89 | { | ||
90 | return 0; | ||
91 | } | ||
92 | |||
93 | void __weak perf_event_print_debug(void) { } | 86 | void __weak perf_event_print_debug(void) { } |
94 | 87 | ||
95 | static DEFINE_PER_CPU(int, perf_disable_count); | 88 | static DEFINE_PER_CPU(int, perf_disable_count); |
@@ -262,6 +255,18 @@ static void update_event_times(struct perf_event *event) | |||
262 | event->total_time_running = run_end - event->tstamp_running; | 255 | event->total_time_running = run_end - event->tstamp_running; |
263 | } | 256 | } |
264 | 257 | ||
258 | /* | ||
259 | * Update total_time_enabled and total_time_running for all events in a group. | ||
260 | */ | ||
261 | static void update_group_times(struct perf_event *leader) | ||
262 | { | ||
263 | struct perf_event *event; | ||
264 | |||
265 | update_event_times(leader); | ||
266 | list_for_each_entry(event, &leader->sibling_list, group_entry) | ||
267 | update_event_times(event); | ||
268 | } | ||
269 | |||
265 | static struct list_head * | 270 | static struct list_head * |
266 | ctx_group_list(struct perf_event *event, struct perf_event_context *ctx) | 271 | ctx_group_list(struct perf_event *event, struct perf_event_context *ctx) |
267 | { | 272 | { |
@@ -315,8 +320,6 @@ list_add_event(struct perf_event *event, struct perf_event_context *ctx) | |||
315 | static void | 320 | static void |
316 | list_del_event(struct perf_event *event, struct perf_event_context *ctx) | 321 | list_del_event(struct perf_event *event, struct perf_event_context *ctx) |
317 | { | 322 | { |
318 | struct perf_event *sibling, *tmp; | ||
319 | |||
320 | if (list_empty(&event->group_entry)) | 323 | if (list_empty(&event->group_entry)) |
321 | return; | 324 | return; |
322 | ctx->nr_events--; | 325 | ctx->nr_events--; |
@@ -329,7 +332,7 @@ list_del_event(struct perf_event *event, struct perf_event_context *ctx) | |||
329 | if (event->group_leader != event) | 332 | if (event->group_leader != event) |
330 | event->group_leader->nr_siblings--; | 333 | event->group_leader->nr_siblings--; |
331 | 334 | ||
332 | update_event_times(event); | 335 | update_group_times(event); |
333 | 336 | ||
334 | /* | 337 | /* |
335 | * If event was in error state, then keep it | 338 | * If event was in error state, then keep it |
@@ -340,6 +343,12 @@ list_del_event(struct perf_event *event, struct perf_event_context *ctx) | |||
340 | */ | 343 | */ |
341 | if (event->state > PERF_EVENT_STATE_OFF) | 344 | if (event->state > PERF_EVENT_STATE_OFF) |
342 | event->state = PERF_EVENT_STATE_OFF; | 345 | event->state = PERF_EVENT_STATE_OFF; |
346 | } | ||
347 | |||
348 | static void | ||
349 | perf_destroy_group(struct perf_event *event, struct perf_event_context *ctx) | ||
350 | { | ||
351 | struct perf_event *sibling, *tmp; | ||
343 | 352 | ||
344 | /* | 353 | /* |
345 | * If this was a group event with sibling events then | 354 | * If this was a group event with sibling events then |
@@ -505,18 +514,6 @@ retry: | |||
505 | } | 514 | } |
506 | 515 | ||
507 | /* | 516 | /* |
508 | * Update total_time_enabled and total_time_running for all events in a group. | ||
509 | */ | ||
510 | static void update_group_times(struct perf_event *leader) | ||
511 | { | ||
512 | struct perf_event *event; | ||
513 | |||
514 | update_event_times(leader); | ||
515 | list_for_each_entry(event, &leader->sibling_list, group_entry) | ||
516 | update_event_times(event); | ||
517 | } | ||
518 | |||
519 | /* | ||
520 | * Cross CPU call to disable a performance event | 517 | * Cross CPU call to disable a performance event |
521 | */ | 518 | */ |
522 | static void __perf_event_disable(void *info) | 519 | static void __perf_event_disable(void *info) |
@@ -640,15 +637,20 @@ group_sched_in(struct perf_event *group_event, | |||
640 | struct perf_cpu_context *cpuctx, | 637 | struct perf_cpu_context *cpuctx, |
641 | struct perf_event_context *ctx) | 638 | struct perf_event_context *ctx) |
642 | { | 639 | { |
643 | struct perf_event *event, *partial_group; | 640 | struct perf_event *event, *partial_group = NULL; |
641 | const struct pmu *pmu = group_event->pmu; | ||
642 | bool txn = false; | ||
644 | int ret; | 643 | int ret; |
645 | 644 | ||
646 | if (group_event->state == PERF_EVENT_STATE_OFF) | 645 | if (group_event->state == PERF_EVENT_STATE_OFF) |
647 | return 0; | 646 | return 0; |
648 | 647 | ||
649 | ret = hw_perf_group_sched_in(group_event, cpuctx, ctx); | 648 | /* Check if group transaction availabe */ |
650 | if (ret) | 649 | if (pmu->start_txn) |
651 | return ret < 0 ? ret : 0; | 650 | txn = true; |
651 | |||
652 | if (txn) | ||
653 | pmu->start_txn(pmu); | ||
652 | 654 | ||
653 | if (event_sched_in(group_event, cpuctx, ctx)) | 655 | if (event_sched_in(group_event, cpuctx, ctx)) |
654 | return -EAGAIN; | 656 | return -EAGAIN; |
@@ -663,9 +665,19 @@ group_sched_in(struct perf_event *group_event, | |||
663 | } | 665 | } |
664 | } | 666 | } |
665 | 667 | ||
666 | return 0; | 668 | if (!txn) |
669 | return 0; | ||
670 | |||
671 | ret = pmu->commit_txn(pmu); | ||
672 | if (!ret) { | ||
673 | pmu->cancel_txn(pmu); | ||
674 | return 0; | ||
675 | } | ||
667 | 676 | ||
668 | group_error: | 677 | group_error: |
678 | if (txn) | ||
679 | pmu->cancel_txn(pmu); | ||
680 | |||
669 | /* | 681 | /* |
670 | * Groups can be scheduled in as one unit only, so undo any | 682 | * Groups can be scheduled in as one unit only, so undo any |
671 | * partial group before returning: | 683 | * partial group before returning: |
@@ -1367,6 +1379,8 @@ void perf_event_task_sched_in(struct task_struct *task) | |||
1367 | if (cpuctx->task_ctx == ctx) | 1379 | if (cpuctx->task_ctx == ctx) |
1368 | return; | 1380 | return; |
1369 | 1381 | ||
1382 | perf_disable(); | ||
1383 | |||
1370 | /* | 1384 | /* |
1371 | * We want to keep the following priority order: | 1385 | * We want to keep the following priority order: |
1372 | * cpu pinned (that don't need to move), task pinned, | 1386 | * cpu pinned (that don't need to move), task pinned, |
@@ -1379,6 +1393,8 @@ void perf_event_task_sched_in(struct task_struct *task) | |||
1379 | ctx_sched_in(ctx, cpuctx, EVENT_FLEXIBLE); | 1393 | ctx_sched_in(ctx, cpuctx, EVENT_FLEXIBLE); |
1380 | 1394 | ||
1381 | cpuctx->task_ctx = ctx; | 1395 | cpuctx->task_ctx = ctx; |
1396 | |||
1397 | perf_enable(); | ||
1382 | } | 1398 | } |
1383 | 1399 | ||
1384 | #define MAX_INTERRUPTS (~0ULL) | 1400 | #define MAX_INTERRUPTS (~0ULL) |
@@ -1856,9 +1872,30 @@ int perf_event_release_kernel(struct perf_event *event) | |||
1856 | { | 1872 | { |
1857 | struct perf_event_context *ctx = event->ctx; | 1873 | struct perf_event_context *ctx = event->ctx; |
1858 | 1874 | ||
1875 | /* | ||
1876 | * Remove from the PMU, can't get re-enabled since we got | ||
1877 | * here because the last ref went. | ||
1878 | */ | ||
1879 | perf_event_disable(event); | ||
1880 | |||
1859 | WARN_ON_ONCE(ctx->parent_ctx); | 1881 | WARN_ON_ONCE(ctx->parent_ctx); |
1860 | mutex_lock(&ctx->mutex); | 1882 | /* |
1861 | perf_event_remove_from_context(event); | 1883 | * There are two ways this annotation is useful: |
1884 | * | ||
1885 | * 1) there is a lock recursion from perf_event_exit_task | ||
1886 | * see the comment there. | ||
1887 | * | ||
1888 | * 2) there is a lock-inversion with mmap_sem through | ||
1889 | * perf_event_read_group(), which takes faults while | ||
1890 | * holding ctx->mutex, however this is called after | ||
1891 | * the last filedesc died, so there is no possibility | ||
1892 | * to trigger the AB-BA case. | ||
1893 | */ | ||
1894 | mutex_lock_nested(&ctx->mutex, SINGLE_DEPTH_NESTING); | ||
1895 | raw_spin_lock_irq(&ctx->lock); | ||
1896 | list_del_event(event, ctx); | ||
1897 | perf_destroy_group(event, ctx); | ||
1898 | raw_spin_unlock_irq(&ctx->lock); | ||
1862 | mutex_unlock(&ctx->mutex); | 1899 | mutex_unlock(&ctx->mutex); |
1863 | 1900 | ||
1864 | mutex_lock(&event->owner->perf_event_mutex); | 1901 | mutex_lock(&event->owner->perf_event_mutex); |
@@ -2642,6 +2679,7 @@ static int perf_fasync(int fd, struct file *filp, int on) | |||
2642 | } | 2679 | } |
2643 | 2680 | ||
2644 | static const struct file_operations perf_fops = { | 2681 | static const struct file_operations perf_fops = { |
2682 | .llseek = no_llseek, | ||
2645 | .release = perf_release, | 2683 | .release = perf_release, |
2646 | .read = perf_read, | 2684 | .read = perf_read, |
2647 | .poll = perf_poll, | 2685 | .poll = perf_poll, |
@@ -2792,6 +2830,27 @@ void perf_arch_fetch_caller_regs(struct pt_regs *regs, unsigned long ip, int ski | |||
2792 | 2830 | ||
2793 | 2831 | ||
2794 | /* | 2832 | /* |
2833 | * We assume there is only KVM supporting the callbacks. | ||
2834 | * Later on, we might change it to a list if there is | ||
2835 | * another virtualization implementation supporting the callbacks. | ||
2836 | */ | ||
2837 | struct perf_guest_info_callbacks *perf_guest_cbs; | ||
2838 | |||
2839 | int perf_register_guest_info_callbacks(struct perf_guest_info_callbacks *cbs) | ||
2840 | { | ||
2841 | perf_guest_cbs = cbs; | ||
2842 | return 0; | ||
2843 | } | ||
2844 | EXPORT_SYMBOL_GPL(perf_register_guest_info_callbacks); | ||
2845 | |||
2846 | int perf_unregister_guest_info_callbacks(struct perf_guest_info_callbacks *cbs) | ||
2847 | { | ||
2848 | perf_guest_cbs = NULL; | ||
2849 | return 0; | ||
2850 | } | ||
2851 | EXPORT_SYMBOL_GPL(perf_unregister_guest_info_callbacks); | ||
2852 | |||
2853 | /* | ||
2795 | * Output | 2854 | * Output |
2796 | */ | 2855 | */ |
2797 | static bool perf_output_space(struct perf_mmap_data *data, unsigned long tail, | 2856 | static bool perf_output_space(struct perf_mmap_data *data, unsigned long tail, |
@@ -3743,7 +3802,7 @@ void __perf_event_mmap(struct vm_area_struct *vma) | |||
3743 | .event_id = { | 3802 | .event_id = { |
3744 | .header = { | 3803 | .header = { |
3745 | .type = PERF_RECORD_MMAP, | 3804 | .type = PERF_RECORD_MMAP, |
3746 | .misc = 0, | 3805 | .misc = PERF_RECORD_MISC_USER, |
3747 | /* .size */ | 3806 | /* .size */ |
3748 | }, | 3807 | }, |
3749 | /* .pid */ | 3808 | /* .pid */ |
@@ -3961,36 +4020,6 @@ static void perf_swevent_add(struct perf_event *event, u64 nr, | |||
3961 | perf_swevent_overflow(event, 0, nmi, data, regs); | 4020 | perf_swevent_overflow(event, 0, nmi, data, regs); |
3962 | } | 4021 | } |
3963 | 4022 | ||
3964 | static int perf_swevent_is_counting(struct perf_event *event) | ||
3965 | { | ||
3966 | /* | ||
3967 | * The event is active, we're good! | ||
3968 | */ | ||
3969 | if (event->state == PERF_EVENT_STATE_ACTIVE) | ||
3970 | return 1; | ||
3971 | |||
3972 | /* | ||
3973 | * The event is off/error, not counting. | ||
3974 | */ | ||
3975 | if (event->state != PERF_EVENT_STATE_INACTIVE) | ||
3976 | return 0; | ||
3977 | |||
3978 | /* | ||
3979 | * The event is inactive, if the context is active | ||
3980 | * we're part of a group that didn't make it on the 'pmu', | ||
3981 | * not counting. | ||
3982 | */ | ||
3983 | if (event->ctx->is_active) | ||
3984 | return 0; | ||
3985 | |||
3986 | /* | ||
3987 | * We're inactive and the context is too, this means the | ||
3988 | * task is scheduled out, we're counting events that happen | ||
3989 | * to us, like migration events. | ||
3990 | */ | ||
3991 | return 1; | ||
3992 | } | ||
3993 | |||
3994 | static int perf_tp_event_match(struct perf_event *event, | 4023 | static int perf_tp_event_match(struct perf_event *event, |
3995 | struct perf_sample_data *data); | 4024 | struct perf_sample_data *data); |
3996 | 4025 | ||
@@ -4014,12 +4043,6 @@ static int perf_swevent_match(struct perf_event *event, | |||
4014 | struct perf_sample_data *data, | 4043 | struct perf_sample_data *data, |
4015 | struct pt_regs *regs) | 4044 | struct pt_regs *regs) |
4016 | { | 4045 | { |
4017 | if (event->cpu != -1 && event->cpu != smp_processor_id()) | ||
4018 | return 0; | ||
4019 | |||
4020 | if (!perf_swevent_is_counting(event)) | ||
4021 | return 0; | ||
4022 | |||
4023 | if (event->attr.type != type) | 4046 | if (event->attr.type != type) |
4024 | return 0; | 4047 | return 0; |
4025 | 4048 | ||
@@ -4036,18 +4059,53 @@ static int perf_swevent_match(struct perf_event *event, | |||
4036 | return 1; | 4059 | return 1; |
4037 | } | 4060 | } |
4038 | 4061 | ||
4039 | static void perf_swevent_ctx_event(struct perf_event_context *ctx, | 4062 | static inline u64 swevent_hash(u64 type, u32 event_id) |
4040 | enum perf_type_id type, | ||
4041 | u32 event_id, u64 nr, int nmi, | ||
4042 | struct perf_sample_data *data, | ||
4043 | struct pt_regs *regs) | ||
4044 | { | 4063 | { |
4064 | u64 val = event_id | (type << 32); | ||
4065 | |||
4066 | return hash_64(val, SWEVENT_HLIST_BITS); | ||
4067 | } | ||
4068 | |||
4069 | static struct hlist_head * | ||
4070 | find_swevent_head(struct perf_cpu_context *ctx, u64 type, u32 event_id) | ||
4071 | { | ||
4072 | u64 hash; | ||
4073 | struct swevent_hlist *hlist; | ||
4074 | |||
4075 | hash = swevent_hash(type, event_id); | ||
4076 | |||
4077 | hlist = rcu_dereference(ctx->swevent_hlist); | ||
4078 | if (!hlist) | ||
4079 | return NULL; | ||
4080 | |||
4081 | return &hlist->heads[hash]; | ||
4082 | } | ||
4083 | |||
4084 | static void do_perf_sw_event(enum perf_type_id type, u32 event_id, | ||
4085 | u64 nr, int nmi, | ||
4086 | struct perf_sample_data *data, | ||
4087 | struct pt_regs *regs) | ||
4088 | { | ||
4089 | struct perf_cpu_context *cpuctx; | ||
4045 | struct perf_event *event; | 4090 | struct perf_event *event; |
4091 | struct hlist_node *node; | ||
4092 | struct hlist_head *head; | ||
4046 | 4093 | ||
4047 | list_for_each_entry_rcu(event, &ctx->event_list, event_entry) { | 4094 | cpuctx = &__get_cpu_var(perf_cpu_context); |
4095 | |||
4096 | rcu_read_lock(); | ||
4097 | |||
4098 | head = find_swevent_head(cpuctx, type, event_id); | ||
4099 | |||
4100 | if (!head) | ||
4101 | goto end; | ||
4102 | |||
4103 | hlist_for_each_entry_rcu(event, node, head, hlist_entry) { | ||
4048 | if (perf_swevent_match(event, type, event_id, data, regs)) | 4104 | if (perf_swevent_match(event, type, event_id, data, regs)) |
4049 | perf_swevent_add(event, nr, nmi, data, regs); | 4105 | perf_swevent_add(event, nr, nmi, data, regs); |
4050 | } | 4106 | } |
4107 | end: | ||
4108 | rcu_read_unlock(); | ||
4051 | } | 4109 | } |
4052 | 4110 | ||
4053 | int perf_swevent_get_recursion_context(void) | 4111 | int perf_swevent_get_recursion_context(void) |
@@ -4085,27 +4143,6 @@ void perf_swevent_put_recursion_context(int rctx) | |||
4085 | } | 4143 | } |
4086 | EXPORT_SYMBOL_GPL(perf_swevent_put_recursion_context); | 4144 | EXPORT_SYMBOL_GPL(perf_swevent_put_recursion_context); |
4087 | 4145 | ||
4088 | static void do_perf_sw_event(enum perf_type_id type, u32 event_id, | ||
4089 | u64 nr, int nmi, | ||
4090 | struct perf_sample_data *data, | ||
4091 | struct pt_regs *regs) | ||
4092 | { | ||
4093 | struct perf_cpu_context *cpuctx; | ||
4094 | struct perf_event_context *ctx; | ||
4095 | |||
4096 | cpuctx = &__get_cpu_var(perf_cpu_context); | ||
4097 | rcu_read_lock(); | ||
4098 | perf_swevent_ctx_event(&cpuctx->ctx, type, event_id, | ||
4099 | nr, nmi, data, regs); | ||
4100 | /* | ||
4101 | * doesn't really matter which of the child contexts the | ||
4102 | * events ends up in. | ||
4103 | */ | ||
4104 | ctx = rcu_dereference(current->perf_event_ctxp); | ||
4105 | if (ctx) | ||
4106 | perf_swevent_ctx_event(ctx, type, event_id, nr, nmi, data, regs); | ||
4107 | rcu_read_unlock(); | ||
4108 | } | ||
4109 | 4146 | ||
4110 | void __perf_sw_event(u32 event_id, u64 nr, int nmi, | 4147 | void __perf_sw_event(u32 event_id, u64 nr, int nmi, |
4111 | struct pt_regs *regs, u64 addr) | 4148 | struct pt_regs *regs, u64 addr) |
@@ -4131,16 +4168,28 @@ static void perf_swevent_read(struct perf_event *event) | |||
4131 | static int perf_swevent_enable(struct perf_event *event) | 4168 | static int perf_swevent_enable(struct perf_event *event) |
4132 | { | 4169 | { |
4133 | struct hw_perf_event *hwc = &event->hw; | 4170 | struct hw_perf_event *hwc = &event->hw; |
4171 | struct perf_cpu_context *cpuctx; | ||
4172 | struct hlist_head *head; | ||
4173 | |||
4174 | cpuctx = &__get_cpu_var(perf_cpu_context); | ||
4134 | 4175 | ||
4135 | if (hwc->sample_period) { | 4176 | if (hwc->sample_period) { |
4136 | hwc->last_period = hwc->sample_period; | 4177 | hwc->last_period = hwc->sample_period; |
4137 | perf_swevent_set_period(event); | 4178 | perf_swevent_set_period(event); |
4138 | } | 4179 | } |
4180 | |||
4181 | head = find_swevent_head(cpuctx, event->attr.type, event->attr.config); | ||
4182 | if (WARN_ON_ONCE(!head)) | ||
4183 | return -EINVAL; | ||
4184 | |||
4185 | hlist_add_head_rcu(&event->hlist_entry, head); | ||
4186 | |||
4139 | return 0; | 4187 | return 0; |
4140 | } | 4188 | } |
4141 | 4189 | ||
4142 | static void perf_swevent_disable(struct perf_event *event) | 4190 | static void perf_swevent_disable(struct perf_event *event) |
4143 | { | 4191 | { |
4192 | hlist_del_rcu(&event->hlist_entry); | ||
4144 | } | 4193 | } |
4145 | 4194 | ||
4146 | static const struct pmu perf_ops_generic = { | 4195 | static const struct pmu perf_ops_generic = { |
@@ -4168,15 +4217,8 @@ static enum hrtimer_restart perf_swevent_hrtimer(struct hrtimer *hrtimer) | |||
4168 | perf_sample_data_init(&data, 0); | 4217 | perf_sample_data_init(&data, 0); |
4169 | data.period = event->hw.last_period; | 4218 | data.period = event->hw.last_period; |
4170 | regs = get_irq_regs(); | 4219 | regs = get_irq_regs(); |
4171 | /* | ||
4172 | * In case we exclude kernel IPs or are somehow not in interrupt | ||
4173 | * context, provide the next best thing, the user IP. | ||
4174 | */ | ||
4175 | if ((event->attr.exclude_kernel || !regs) && | ||
4176 | !event->attr.exclude_user) | ||
4177 | regs = task_pt_regs(current); | ||
4178 | 4220 | ||
4179 | if (regs) { | 4221 | if (regs && !perf_exclude_event(event, regs)) { |
4180 | if (!(event->attr.exclude_idle && current->pid == 0)) | 4222 | if (!(event->attr.exclude_idle && current->pid == 0)) |
4181 | if (perf_event_overflow(event, 0, &data, regs)) | 4223 | if (perf_event_overflow(event, 0, &data, regs)) |
4182 | ret = HRTIMER_NORESTART; | 4224 | ret = HRTIMER_NORESTART; |
@@ -4324,6 +4366,105 @@ static const struct pmu perf_ops_task_clock = { | |||
4324 | .read = task_clock_perf_event_read, | 4366 | .read = task_clock_perf_event_read, |
4325 | }; | 4367 | }; |
4326 | 4368 | ||
4369 | static void swevent_hlist_release_rcu(struct rcu_head *rcu_head) | ||
4370 | { | ||
4371 | struct swevent_hlist *hlist; | ||
4372 | |||
4373 | hlist = container_of(rcu_head, struct swevent_hlist, rcu_head); | ||
4374 | kfree(hlist); | ||
4375 | } | ||
4376 | |||
4377 | static void swevent_hlist_release(struct perf_cpu_context *cpuctx) | ||
4378 | { | ||
4379 | struct swevent_hlist *hlist; | ||
4380 | |||
4381 | if (!cpuctx->swevent_hlist) | ||
4382 | return; | ||
4383 | |||
4384 | hlist = cpuctx->swevent_hlist; | ||
4385 | rcu_assign_pointer(cpuctx->swevent_hlist, NULL); | ||
4386 | call_rcu(&hlist->rcu_head, swevent_hlist_release_rcu); | ||
4387 | } | ||
4388 | |||
4389 | static void swevent_hlist_put_cpu(struct perf_event *event, int cpu) | ||
4390 | { | ||
4391 | struct perf_cpu_context *cpuctx = &per_cpu(perf_cpu_context, cpu); | ||
4392 | |||
4393 | mutex_lock(&cpuctx->hlist_mutex); | ||
4394 | |||
4395 | if (!--cpuctx->hlist_refcount) | ||
4396 | swevent_hlist_release(cpuctx); | ||
4397 | |||
4398 | mutex_unlock(&cpuctx->hlist_mutex); | ||
4399 | } | ||
4400 | |||
4401 | static void swevent_hlist_put(struct perf_event *event) | ||
4402 | { | ||
4403 | int cpu; | ||
4404 | |||
4405 | if (event->cpu != -1) { | ||
4406 | swevent_hlist_put_cpu(event, event->cpu); | ||
4407 | return; | ||
4408 | } | ||
4409 | |||
4410 | for_each_possible_cpu(cpu) | ||
4411 | swevent_hlist_put_cpu(event, cpu); | ||
4412 | } | ||
4413 | |||
4414 | static int swevent_hlist_get_cpu(struct perf_event *event, int cpu) | ||
4415 | { | ||
4416 | struct perf_cpu_context *cpuctx = &per_cpu(perf_cpu_context, cpu); | ||
4417 | int err = 0; | ||
4418 | |||
4419 | mutex_lock(&cpuctx->hlist_mutex); | ||
4420 | |||
4421 | if (!cpuctx->swevent_hlist && cpu_online(cpu)) { | ||
4422 | struct swevent_hlist *hlist; | ||
4423 | |||
4424 | hlist = kzalloc(sizeof(*hlist), GFP_KERNEL); | ||
4425 | if (!hlist) { | ||
4426 | err = -ENOMEM; | ||
4427 | goto exit; | ||
4428 | } | ||
4429 | rcu_assign_pointer(cpuctx->swevent_hlist, hlist); | ||
4430 | } | ||
4431 | cpuctx->hlist_refcount++; | ||
4432 | exit: | ||
4433 | mutex_unlock(&cpuctx->hlist_mutex); | ||
4434 | |||
4435 | return err; | ||
4436 | } | ||
4437 | |||
4438 | static int swevent_hlist_get(struct perf_event *event) | ||
4439 | { | ||
4440 | int err; | ||
4441 | int cpu, failed_cpu; | ||
4442 | |||
4443 | if (event->cpu != -1) | ||
4444 | return swevent_hlist_get_cpu(event, event->cpu); | ||
4445 | |||
4446 | get_online_cpus(); | ||
4447 | for_each_possible_cpu(cpu) { | ||
4448 | err = swevent_hlist_get_cpu(event, cpu); | ||
4449 | if (err) { | ||
4450 | failed_cpu = cpu; | ||
4451 | goto fail; | ||
4452 | } | ||
4453 | } | ||
4454 | put_online_cpus(); | ||
4455 | |||
4456 | return 0; | ||
4457 | fail: | ||
4458 | for_each_possible_cpu(cpu) { | ||
4459 | if (cpu == failed_cpu) | ||
4460 | break; | ||
4461 | swevent_hlist_put_cpu(event, cpu); | ||
4462 | } | ||
4463 | |||
4464 | put_online_cpus(); | ||
4465 | return err; | ||
4466 | } | ||
4467 | |||
4327 | #ifdef CONFIG_EVENT_TRACING | 4468 | #ifdef CONFIG_EVENT_TRACING |
4328 | 4469 | ||
4329 | void perf_tp_event(int event_id, u64 addr, u64 count, void *record, | 4470 | void perf_tp_event(int event_id, u64 addr, u64 count, void *record, |
@@ -4357,10 +4498,13 @@ static int perf_tp_event_match(struct perf_event *event, | |||
4357 | static void tp_perf_event_destroy(struct perf_event *event) | 4498 | static void tp_perf_event_destroy(struct perf_event *event) |
4358 | { | 4499 | { |
4359 | perf_trace_disable(event->attr.config); | 4500 | perf_trace_disable(event->attr.config); |
4501 | swevent_hlist_put(event); | ||
4360 | } | 4502 | } |
4361 | 4503 | ||
4362 | static const struct pmu *tp_perf_event_init(struct perf_event *event) | 4504 | static const struct pmu *tp_perf_event_init(struct perf_event *event) |
4363 | { | 4505 | { |
4506 | int err; | ||
4507 | |||
4364 | /* | 4508 | /* |
4365 | * Raw tracepoint data is a severe data leak, only allow root to | 4509 | * Raw tracepoint data is a severe data leak, only allow root to |
4366 | * have these. | 4510 | * have these. |
@@ -4374,6 +4518,11 @@ static const struct pmu *tp_perf_event_init(struct perf_event *event) | |||
4374 | return NULL; | 4518 | return NULL; |
4375 | 4519 | ||
4376 | event->destroy = tp_perf_event_destroy; | 4520 | event->destroy = tp_perf_event_destroy; |
4521 | err = swevent_hlist_get(event); | ||
4522 | if (err) { | ||
4523 | perf_trace_disable(event->attr.config); | ||
4524 | return ERR_PTR(err); | ||
4525 | } | ||
4377 | 4526 | ||
4378 | return &perf_ops_generic; | 4527 | return &perf_ops_generic; |
4379 | } | 4528 | } |
@@ -4474,6 +4623,7 @@ static void sw_perf_event_destroy(struct perf_event *event) | |||
4474 | WARN_ON(event->parent); | 4623 | WARN_ON(event->parent); |
4475 | 4624 | ||
4476 | atomic_dec(&perf_swevent_enabled[event_id]); | 4625 | atomic_dec(&perf_swevent_enabled[event_id]); |
4626 | swevent_hlist_put(event); | ||
4477 | } | 4627 | } |
4478 | 4628 | ||
4479 | static const struct pmu *sw_perf_event_init(struct perf_event *event) | 4629 | static const struct pmu *sw_perf_event_init(struct perf_event *event) |
@@ -4512,6 +4662,12 @@ static const struct pmu *sw_perf_event_init(struct perf_event *event) | |||
4512 | case PERF_COUNT_SW_ALIGNMENT_FAULTS: | 4662 | case PERF_COUNT_SW_ALIGNMENT_FAULTS: |
4513 | case PERF_COUNT_SW_EMULATION_FAULTS: | 4663 | case PERF_COUNT_SW_EMULATION_FAULTS: |
4514 | if (!event->parent) { | 4664 | if (!event->parent) { |
4665 | int err; | ||
4666 | |||
4667 | err = swevent_hlist_get(event); | ||
4668 | if (err) | ||
4669 | return ERR_PTR(err); | ||
4670 | |||
4515 | atomic_inc(&perf_swevent_enabled[event_id]); | 4671 | atomic_inc(&perf_swevent_enabled[event_id]); |
4516 | event->destroy = sw_perf_event_destroy; | 4672 | event->destroy = sw_perf_event_destroy; |
4517 | } | 4673 | } |
@@ -5176,7 +5332,7 @@ void perf_event_exit_task(struct task_struct *child) | |||
5176 | * | 5332 | * |
5177 | * But since its the parent context it won't be the same instance. | 5333 | * But since its the parent context it won't be the same instance. |
5178 | */ | 5334 | */ |
5179 | mutex_lock_nested(&child_ctx->mutex, SINGLE_DEPTH_NESTING); | 5335 | mutex_lock(&child_ctx->mutex); |
5180 | 5336 | ||
5181 | again: | 5337 | again: |
5182 | list_for_each_entry_safe(child_event, tmp, &child_ctx->pinned_groups, | 5338 | list_for_each_entry_safe(child_event, tmp, &child_ctx->pinned_groups, |
@@ -5384,6 +5540,7 @@ static void __init perf_event_init_all_cpus(void) | |||
5384 | 5540 | ||
5385 | for_each_possible_cpu(cpu) { | 5541 | for_each_possible_cpu(cpu) { |
5386 | cpuctx = &per_cpu(perf_cpu_context, cpu); | 5542 | cpuctx = &per_cpu(perf_cpu_context, cpu); |
5543 | mutex_init(&cpuctx->hlist_mutex); | ||
5387 | __perf_event_init_context(&cpuctx->ctx, NULL); | 5544 | __perf_event_init_context(&cpuctx->ctx, NULL); |
5388 | } | 5545 | } |
5389 | } | 5546 | } |
@@ -5397,6 +5554,16 @@ static void __cpuinit perf_event_init_cpu(int cpu) | |||
5397 | spin_lock(&perf_resource_lock); | 5554 | spin_lock(&perf_resource_lock); |
5398 | cpuctx->max_pertask = perf_max_events - perf_reserved_percpu; | 5555 | cpuctx->max_pertask = perf_max_events - perf_reserved_percpu; |
5399 | spin_unlock(&perf_resource_lock); | 5556 | spin_unlock(&perf_resource_lock); |
5557 | |||
5558 | mutex_lock(&cpuctx->hlist_mutex); | ||
5559 | if (cpuctx->hlist_refcount > 0) { | ||
5560 | struct swevent_hlist *hlist; | ||
5561 | |||
5562 | hlist = kzalloc(sizeof(*hlist), GFP_KERNEL); | ||
5563 | WARN_ON_ONCE(!hlist); | ||
5564 | rcu_assign_pointer(cpuctx->swevent_hlist, hlist); | ||
5565 | } | ||
5566 | mutex_unlock(&cpuctx->hlist_mutex); | ||
5400 | } | 5567 | } |
5401 | 5568 | ||
5402 | #ifdef CONFIG_HOTPLUG_CPU | 5569 | #ifdef CONFIG_HOTPLUG_CPU |
@@ -5416,6 +5583,10 @@ static void perf_event_exit_cpu(int cpu) | |||
5416 | struct perf_cpu_context *cpuctx = &per_cpu(perf_cpu_context, cpu); | 5583 | struct perf_cpu_context *cpuctx = &per_cpu(perf_cpu_context, cpu); |
5417 | struct perf_event_context *ctx = &cpuctx->ctx; | 5584 | struct perf_event_context *ctx = &cpuctx->ctx; |
5418 | 5585 | ||
5586 | mutex_lock(&cpuctx->hlist_mutex); | ||
5587 | swevent_hlist_release(cpuctx); | ||
5588 | mutex_unlock(&cpuctx->hlist_mutex); | ||
5589 | |||
5419 | mutex_lock(&ctx->mutex); | 5590 | mutex_lock(&ctx->mutex); |
5420 | smp_call_function_single(cpu, __perf_event_exit_cpu, NULL, 1); | 5591 | smp_call_function_single(cpu, __perf_event_exit_cpu, NULL, 1); |
5421 | mutex_unlock(&ctx->mutex); | 5592 | mutex_unlock(&ctx->mutex); |
diff --git a/kernel/ptrace.c b/kernel/ptrace.c index 2f0f50b450a3..6af9cdd558b7 100644 --- a/kernel/ptrace.c +++ b/kernel/ptrace.c | |||
@@ -75,7 +75,6 @@ void __ptrace_unlink(struct task_struct *child) | |||
75 | child->parent = child->real_parent; | 75 | child->parent = child->real_parent; |
76 | list_del_init(&child->ptrace_entry); | 76 | list_del_init(&child->ptrace_entry); |
77 | 77 | ||
78 | arch_ptrace_untrace(child); | ||
79 | if (task_is_traced(child)) | 78 | if (task_is_traced(child)) |
80 | ptrace_untrace(child); | 79 | ptrace_untrace(child); |
81 | } | 80 | } |
diff --git a/kernel/sched.c b/kernel/sched.c index d8a213ccdc3b..5cd607ec8405 100644 --- a/kernel/sched.c +++ b/kernel/sched.c | |||
@@ -2088,49 +2088,6 @@ migrate_task(struct task_struct *p, int dest_cpu, struct migration_req *req) | |||
2088 | } | 2088 | } |
2089 | 2089 | ||
2090 | /* | 2090 | /* |
2091 | * wait_task_context_switch - wait for a thread to complete at least one | ||
2092 | * context switch. | ||
2093 | * | ||
2094 | * @p must not be current. | ||
2095 | */ | ||
2096 | void wait_task_context_switch(struct task_struct *p) | ||
2097 | { | ||
2098 | unsigned long nvcsw, nivcsw, flags; | ||
2099 | int running; | ||
2100 | struct rq *rq; | ||
2101 | |||
2102 | nvcsw = p->nvcsw; | ||
2103 | nivcsw = p->nivcsw; | ||
2104 | for (;;) { | ||
2105 | /* | ||
2106 | * The runqueue is assigned before the actual context | ||
2107 | * switch. We need to take the runqueue lock. | ||
2108 | * | ||
2109 | * We could check initially without the lock but it is | ||
2110 | * very likely that we need to take the lock in every | ||
2111 | * iteration. | ||
2112 | */ | ||
2113 | rq = task_rq_lock(p, &flags); | ||
2114 | running = task_running(rq, p); | ||
2115 | task_rq_unlock(rq, &flags); | ||
2116 | |||
2117 | if (likely(!running)) | ||
2118 | break; | ||
2119 | /* | ||
2120 | * The switch count is incremented before the actual | ||
2121 | * context switch. We thus wait for two switches to be | ||
2122 | * sure at least one completed. | ||
2123 | */ | ||
2124 | if ((p->nvcsw - nvcsw) > 1) | ||
2125 | break; | ||
2126 | if ((p->nivcsw - nivcsw) > 1) | ||
2127 | break; | ||
2128 | |||
2129 | cpu_relax(); | ||
2130 | } | ||
2131 | } | ||
2132 | |||
2133 | /* | ||
2134 | * wait_task_inactive - wait for a thread to unschedule. | 2091 | * wait_task_inactive - wait for a thread to unschedule. |
2135 | * | 2092 | * |
2136 | * If @match_state is nonzero, it's the @p->state value just checked and | 2093 | * If @match_state is nonzero, it's the @p->state value just checked and |
diff --git a/kernel/trace/Kconfig b/kernel/trace/Kconfig index 13e13d428cd3..8b1797c4545b 100644 --- a/kernel/trace/Kconfig +++ b/kernel/trace/Kconfig | |||
@@ -44,9 +44,6 @@ config HAVE_FTRACE_MCOUNT_RECORD | |||
44 | help | 44 | help |
45 | See Documentation/trace/ftrace-design.txt | 45 | See Documentation/trace/ftrace-design.txt |
46 | 46 | ||
47 | config HAVE_HW_BRANCH_TRACER | ||
48 | bool | ||
49 | |||
50 | config HAVE_SYSCALL_TRACEPOINTS | 47 | config HAVE_SYSCALL_TRACEPOINTS |
51 | bool | 48 | bool |
52 | help | 49 | help |
@@ -374,14 +371,6 @@ config STACK_TRACER | |||
374 | 371 | ||
375 | Say N if unsure. | 372 | Say N if unsure. |
376 | 373 | ||
377 | config HW_BRANCH_TRACER | ||
378 | depends on HAVE_HW_BRANCH_TRACER | ||
379 | bool "Trace hw branches" | ||
380 | select GENERIC_TRACER | ||
381 | help | ||
382 | This tracer records all branches on the system in a circular | ||
383 | buffer, giving access to the last N branches for each cpu. | ||
384 | |||
385 | config KMEMTRACE | 374 | config KMEMTRACE |
386 | bool "Trace SLAB allocations" | 375 | bool "Trace SLAB allocations" |
387 | select GENERIC_TRACER | 376 | select GENERIC_TRACER |
diff --git a/kernel/trace/Makefile b/kernel/trace/Makefile index 78edc6490038..ffb1a5b0550e 100644 --- a/kernel/trace/Makefile +++ b/kernel/trace/Makefile | |||
@@ -41,7 +41,6 @@ obj-$(CONFIG_MMIOTRACE) += trace_mmiotrace.o | |||
41 | obj-$(CONFIG_BOOT_TRACER) += trace_boot.o | 41 | obj-$(CONFIG_BOOT_TRACER) += trace_boot.o |
42 | obj-$(CONFIG_FUNCTION_GRAPH_TRACER) += trace_functions_graph.o | 42 | obj-$(CONFIG_FUNCTION_GRAPH_TRACER) += trace_functions_graph.o |
43 | obj-$(CONFIG_TRACE_BRANCH_PROFILING) += trace_branch.o | 43 | obj-$(CONFIG_TRACE_BRANCH_PROFILING) += trace_branch.o |
44 | obj-$(CONFIG_HW_BRANCH_TRACER) += trace_hw_branches.o | ||
45 | obj-$(CONFIG_KMEMTRACE) += kmemtrace.o | 44 | obj-$(CONFIG_KMEMTRACE) += kmemtrace.o |
46 | obj-$(CONFIG_WORKQUEUE_TRACER) += trace_workqueue.o | 45 | obj-$(CONFIG_WORKQUEUE_TRACER) += trace_workqueue.o |
47 | obj-$(CONFIG_BLK_DEV_IO_TRACE) += blktrace.o | 46 | obj-$(CONFIG_BLK_DEV_IO_TRACE) += blktrace.o |
diff --git a/kernel/trace/trace.h b/kernel/trace/trace.h index 2825ef2c0b15..3ebdb6bd2362 100644 --- a/kernel/trace/trace.h +++ b/kernel/trace/trace.h | |||
@@ -34,7 +34,6 @@ enum trace_type { | |||
34 | TRACE_GRAPH_RET, | 34 | TRACE_GRAPH_RET, |
35 | TRACE_GRAPH_ENT, | 35 | TRACE_GRAPH_ENT, |
36 | TRACE_USER_STACK, | 36 | TRACE_USER_STACK, |
37 | TRACE_HW_BRANCHES, | ||
38 | TRACE_KMEM_ALLOC, | 37 | TRACE_KMEM_ALLOC, |
39 | TRACE_KMEM_FREE, | 38 | TRACE_KMEM_FREE, |
40 | TRACE_BLK, | 39 | TRACE_BLK, |
@@ -103,29 +102,17 @@ struct syscall_trace_exit { | |||
103 | long ret; | 102 | long ret; |
104 | }; | 103 | }; |
105 | 104 | ||
106 | struct kprobe_trace_entry { | 105 | struct kprobe_trace_entry_head { |
107 | struct trace_entry ent; | 106 | struct trace_entry ent; |
108 | unsigned long ip; | 107 | unsigned long ip; |
109 | int nargs; | ||
110 | unsigned long args[]; | ||
111 | }; | 108 | }; |
112 | 109 | ||
113 | #define SIZEOF_KPROBE_TRACE_ENTRY(n) \ | 110 | struct kretprobe_trace_entry_head { |
114 | (offsetof(struct kprobe_trace_entry, args) + \ | ||
115 | (sizeof(unsigned long) * (n))) | ||
116 | |||
117 | struct kretprobe_trace_entry { | ||
118 | struct trace_entry ent; | 111 | struct trace_entry ent; |
119 | unsigned long func; | 112 | unsigned long func; |
120 | unsigned long ret_ip; | 113 | unsigned long ret_ip; |
121 | int nargs; | ||
122 | unsigned long args[]; | ||
123 | }; | 114 | }; |
124 | 115 | ||
125 | #define SIZEOF_KRETPROBE_TRACE_ENTRY(n) \ | ||
126 | (offsetof(struct kretprobe_trace_entry, args) + \ | ||
127 | (sizeof(unsigned long) * (n))) | ||
128 | |||
129 | /* | 116 | /* |
130 | * trace_flag_type is an enumeration that holds different | 117 | * trace_flag_type is an enumeration that holds different |
131 | * states when a trace occurs. These are: | 118 | * states when a trace occurs. These are: |
@@ -229,7 +216,6 @@ extern void __ftrace_bad_type(void); | |||
229 | TRACE_GRAPH_ENT); \ | 216 | TRACE_GRAPH_ENT); \ |
230 | IF_ASSIGN(var, ent, struct ftrace_graph_ret_entry, \ | 217 | IF_ASSIGN(var, ent, struct ftrace_graph_ret_entry, \ |
231 | TRACE_GRAPH_RET); \ | 218 | TRACE_GRAPH_RET); \ |
232 | IF_ASSIGN(var, ent, struct hw_branch_entry, TRACE_HW_BRANCHES);\ | ||
233 | IF_ASSIGN(var, ent, struct kmemtrace_alloc_entry, \ | 219 | IF_ASSIGN(var, ent, struct kmemtrace_alloc_entry, \ |
234 | TRACE_KMEM_ALLOC); \ | 220 | TRACE_KMEM_ALLOC); \ |
235 | IF_ASSIGN(var, ent, struct kmemtrace_free_entry, \ | 221 | IF_ASSIGN(var, ent, struct kmemtrace_free_entry, \ |
@@ -467,8 +453,6 @@ extern int trace_selftest_startup_sysprof(struct tracer *trace, | |||
467 | struct trace_array *tr); | 453 | struct trace_array *tr); |
468 | extern int trace_selftest_startup_branch(struct tracer *trace, | 454 | extern int trace_selftest_startup_branch(struct tracer *trace, |
469 | struct trace_array *tr); | 455 | struct trace_array *tr); |
470 | extern int trace_selftest_startup_hw_branches(struct tracer *trace, | ||
471 | struct trace_array *tr); | ||
472 | extern int trace_selftest_startup_ksym(struct tracer *trace, | 456 | extern int trace_selftest_startup_ksym(struct tracer *trace, |
473 | struct trace_array *tr); | 457 | struct trace_array *tr); |
474 | #endif /* CONFIG_FTRACE_STARTUP_TEST */ | 458 | #endif /* CONFIG_FTRACE_STARTUP_TEST */ |
diff --git a/kernel/trace/trace_entries.h b/kernel/trace/trace_entries.h index c16a08f399df..dc008c1240da 100644 --- a/kernel/trace/trace_entries.h +++ b/kernel/trace/trace_entries.h | |||
@@ -318,18 +318,6 @@ FTRACE_ENTRY(branch, trace_branch, | |||
318 | __entry->func, __entry->file, __entry->correct) | 318 | __entry->func, __entry->file, __entry->correct) |
319 | ); | 319 | ); |
320 | 320 | ||
321 | FTRACE_ENTRY(hw_branch, hw_branch_entry, | ||
322 | |||
323 | TRACE_HW_BRANCHES, | ||
324 | |||
325 | F_STRUCT( | ||
326 | __field( u64, from ) | ||
327 | __field( u64, to ) | ||
328 | ), | ||
329 | |||
330 | F_printk("from: %llx to: %llx", __entry->from, __entry->to) | ||
331 | ); | ||
332 | |||
333 | FTRACE_ENTRY(kmem_alloc, kmemtrace_alloc_entry, | 321 | FTRACE_ENTRY(kmem_alloc, kmemtrace_alloc_entry, |
334 | 322 | ||
335 | TRACE_KMEM_ALLOC, | 323 | TRACE_KMEM_ALLOC, |
diff --git a/kernel/trace/trace_events_filter.c b/kernel/trace/trace_events_filter.c index 88c0b6dbd7fe..58092d844a1f 100644 --- a/kernel/trace/trace_events_filter.c +++ b/kernel/trace/trace_events_filter.c | |||
@@ -1398,7 +1398,7 @@ int ftrace_profile_set_filter(struct perf_event *event, int event_id, | |||
1398 | } | 1398 | } |
1399 | 1399 | ||
1400 | err = -EINVAL; | 1400 | err = -EINVAL; |
1401 | if (!call) | 1401 | if (&call->list == &ftrace_events) |
1402 | goto out_unlock; | 1402 | goto out_unlock; |
1403 | 1403 | ||
1404 | err = -EEXIST; | 1404 | err = -EEXIST; |
diff --git a/kernel/trace/trace_hw_branches.c b/kernel/trace/trace_hw_branches.c deleted file mode 100644 index 7b97000745f5..000000000000 --- a/kernel/trace/trace_hw_branches.c +++ /dev/null | |||
@@ -1,312 +0,0 @@ | |||
1 | /* | ||
2 | * h/w branch tracer for x86 based on BTS | ||
3 | * | ||
4 | * Copyright (C) 2008-2009 Intel Corporation. | ||
5 | * Markus Metzger <markus.t.metzger@gmail.com>, 2008-2009 | ||
6 | */ | ||
7 | #include <linux/kallsyms.h> | ||
8 | #include <linux/debugfs.h> | ||
9 | #include <linux/ftrace.h> | ||
10 | #include <linux/module.h> | ||
11 | #include <linux/cpu.h> | ||
12 | #include <linux/smp.h> | ||
13 | #include <linux/fs.h> | ||
14 | |||
15 | #include <asm/ds.h> | ||
16 | |||
17 | #include "trace_output.h" | ||
18 | #include "trace.h" | ||
19 | |||
20 | |||
21 | #define BTS_BUFFER_SIZE (1 << 13) | ||
22 | |||
23 | static DEFINE_PER_CPU(struct bts_tracer *, hwb_tracer); | ||
24 | static DEFINE_PER_CPU(unsigned char[BTS_BUFFER_SIZE], hwb_buffer); | ||
25 | |||
26 | #define this_tracer per_cpu(hwb_tracer, smp_processor_id()) | ||
27 | |||
28 | static int trace_hw_branches_enabled __read_mostly; | ||
29 | static int trace_hw_branches_suspended __read_mostly; | ||
30 | static struct trace_array *hw_branch_trace __read_mostly; | ||
31 | |||
32 | |||
33 | static void bts_trace_init_cpu(int cpu) | ||
34 | { | ||
35 | per_cpu(hwb_tracer, cpu) = | ||
36 | ds_request_bts_cpu(cpu, per_cpu(hwb_buffer, cpu), | ||
37 | BTS_BUFFER_SIZE, NULL, (size_t)-1, | ||
38 | BTS_KERNEL); | ||
39 | |||
40 | if (IS_ERR(per_cpu(hwb_tracer, cpu))) | ||
41 | per_cpu(hwb_tracer, cpu) = NULL; | ||
42 | } | ||
43 | |||
44 | static int bts_trace_init(struct trace_array *tr) | ||
45 | { | ||
46 | int cpu; | ||
47 | |||
48 | hw_branch_trace = tr; | ||
49 | trace_hw_branches_enabled = 0; | ||
50 | |||
51 | get_online_cpus(); | ||
52 | for_each_online_cpu(cpu) { | ||
53 | bts_trace_init_cpu(cpu); | ||
54 | |||
55 | if (likely(per_cpu(hwb_tracer, cpu))) | ||
56 | trace_hw_branches_enabled = 1; | ||
57 | } | ||
58 | trace_hw_branches_suspended = 0; | ||
59 | put_online_cpus(); | ||
60 | |||
61 | /* If we could not enable tracing on a single cpu, we fail. */ | ||
62 | return trace_hw_branches_enabled ? 0 : -EOPNOTSUPP; | ||
63 | } | ||
64 | |||
65 | static void bts_trace_reset(struct trace_array *tr) | ||
66 | { | ||
67 | int cpu; | ||
68 | |||
69 | get_online_cpus(); | ||
70 | for_each_online_cpu(cpu) { | ||
71 | if (likely(per_cpu(hwb_tracer, cpu))) { | ||
72 | ds_release_bts(per_cpu(hwb_tracer, cpu)); | ||
73 | per_cpu(hwb_tracer, cpu) = NULL; | ||
74 | } | ||
75 | } | ||
76 | trace_hw_branches_enabled = 0; | ||
77 | trace_hw_branches_suspended = 0; | ||
78 | put_online_cpus(); | ||
79 | } | ||
80 | |||
81 | static void bts_trace_start(struct trace_array *tr) | ||
82 | { | ||
83 | int cpu; | ||
84 | |||
85 | get_online_cpus(); | ||
86 | for_each_online_cpu(cpu) | ||
87 | if (likely(per_cpu(hwb_tracer, cpu))) | ||
88 | ds_resume_bts(per_cpu(hwb_tracer, cpu)); | ||
89 | trace_hw_branches_suspended = 0; | ||
90 | put_online_cpus(); | ||
91 | } | ||
92 | |||
93 | static void bts_trace_stop(struct trace_array *tr) | ||
94 | { | ||
95 | int cpu; | ||
96 | |||
97 | get_online_cpus(); | ||
98 | for_each_online_cpu(cpu) | ||
99 | if (likely(per_cpu(hwb_tracer, cpu))) | ||
100 | ds_suspend_bts(per_cpu(hwb_tracer, cpu)); | ||
101 | trace_hw_branches_suspended = 1; | ||
102 | put_online_cpus(); | ||
103 | } | ||
104 | |||
105 | static int __cpuinit bts_hotcpu_handler(struct notifier_block *nfb, | ||
106 | unsigned long action, void *hcpu) | ||
107 | { | ||
108 | int cpu = (long)hcpu; | ||
109 | |||
110 | switch (action) { | ||
111 | case CPU_ONLINE: | ||
112 | case CPU_DOWN_FAILED: | ||
113 | /* The notification is sent with interrupts enabled. */ | ||
114 | if (trace_hw_branches_enabled) { | ||
115 | bts_trace_init_cpu(cpu); | ||
116 | |||
117 | if (trace_hw_branches_suspended && | ||
118 | likely(per_cpu(hwb_tracer, cpu))) | ||
119 | ds_suspend_bts(per_cpu(hwb_tracer, cpu)); | ||
120 | } | ||
121 | break; | ||
122 | |||
123 | case CPU_DOWN_PREPARE: | ||
124 | /* The notification is sent with interrupts enabled. */ | ||
125 | if (likely(per_cpu(hwb_tracer, cpu))) { | ||
126 | ds_release_bts(per_cpu(hwb_tracer, cpu)); | ||
127 | per_cpu(hwb_tracer, cpu) = NULL; | ||
128 | } | ||
129 | } | ||
130 | |||
131 | return NOTIFY_DONE; | ||
132 | } | ||
133 | |||
134 | static struct notifier_block bts_hotcpu_notifier __cpuinitdata = { | ||
135 | .notifier_call = bts_hotcpu_handler | ||
136 | }; | ||
137 | |||
138 | static void bts_trace_print_header(struct seq_file *m) | ||
139 | { | ||
140 | seq_puts(m, "# CPU# TO <- FROM\n"); | ||
141 | } | ||
142 | |||
143 | static enum print_line_t bts_trace_print_line(struct trace_iterator *iter) | ||
144 | { | ||
145 | unsigned long symflags = TRACE_ITER_SYM_OFFSET; | ||
146 | struct trace_entry *entry = iter->ent; | ||
147 | struct trace_seq *seq = &iter->seq; | ||
148 | struct hw_branch_entry *it; | ||
149 | |||
150 | trace_assign_type(it, entry); | ||
151 | |||
152 | if (entry->type == TRACE_HW_BRANCHES) { | ||
153 | if (trace_seq_printf(seq, "%4d ", iter->cpu) && | ||
154 | seq_print_ip_sym(seq, it->to, symflags) && | ||
155 | trace_seq_printf(seq, "\t <- ") && | ||
156 | seq_print_ip_sym(seq, it->from, symflags) && | ||
157 | trace_seq_printf(seq, "\n")) | ||
158 | return TRACE_TYPE_HANDLED; | ||
159 | return TRACE_TYPE_PARTIAL_LINE; | ||
160 | } | ||
161 | return TRACE_TYPE_UNHANDLED; | ||
162 | } | ||
163 | |||
164 | void trace_hw_branch(u64 from, u64 to) | ||
165 | { | ||
166 | struct ftrace_event_call *call = &event_hw_branch; | ||
167 | struct trace_array *tr = hw_branch_trace; | ||
168 | struct ring_buffer_event *event; | ||
169 | struct ring_buffer *buf; | ||
170 | struct hw_branch_entry *entry; | ||
171 | unsigned long irq1; | ||
172 | int cpu; | ||
173 | |||
174 | if (unlikely(!tr)) | ||
175 | return; | ||
176 | |||
177 | if (unlikely(!trace_hw_branches_enabled)) | ||
178 | return; | ||
179 | |||
180 | local_irq_save(irq1); | ||
181 | cpu = raw_smp_processor_id(); | ||
182 | if (atomic_inc_return(&tr->data[cpu]->disabled) != 1) | ||
183 | goto out; | ||
184 | |||
185 | buf = tr->buffer; | ||
186 | event = trace_buffer_lock_reserve(buf, TRACE_HW_BRANCHES, | ||
187 | sizeof(*entry), 0, 0); | ||
188 | if (!event) | ||
189 | goto out; | ||
190 | entry = ring_buffer_event_data(event); | ||
191 | tracing_generic_entry_update(&entry->ent, 0, from); | ||
192 | entry->ent.type = TRACE_HW_BRANCHES; | ||
193 | entry->from = from; | ||
194 | entry->to = to; | ||
195 | if (!filter_check_discard(call, entry, buf, event)) | ||
196 | trace_buffer_unlock_commit(buf, event, 0, 0); | ||
197 | |||
198 | out: | ||
199 | atomic_dec(&tr->data[cpu]->disabled); | ||
200 | local_irq_restore(irq1); | ||
201 | } | ||
202 | |||
203 | static void trace_bts_at(const struct bts_trace *trace, void *at) | ||
204 | { | ||
205 | struct bts_struct bts; | ||
206 | int err = 0; | ||
207 | |||
208 | WARN_ON_ONCE(!trace->read); | ||
209 | if (!trace->read) | ||
210 | return; | ||
211 | |||
212 | err = trace->read(this_tracer, at, &bts); | ||
213 | if (err < 0) | ||
214 | return; | ||
215 | |||
216 | switch (bts.qualifier) { | ||
217 | case BTS_BRANCH: | ||
218 | trace_hw_branch(bts.variant.lbr.from, bts.variant.lbr.to); | ||
219 | break; | ||
220 | } | ||
221 | } | ||
222 | |||
223 | /* | ||
224 | * Collect the trace on the current cpu and write it into the ftrace buffer. | ||
225 | * | ||
226 | * pre: tracing must be suspended on the current cpu | ||
227 | */ | ||
228 | static void trace_bts_cpu(void *arg) | ||
229 | { | ||
230 | struct trace_array *tr = (struct trace_array *)arg; | ||
231 | const struct bts_trace *trace; | ||
232 | unsigned char *at; | ||
233 | |||
234 | if (unlikely(!tr)) | ||
235 | return; | ||
236 | |||
237 | if (unlikely(atomic_read(&tr->data[raw_smp_processor_id()]->disabled))) | ||
238 | return; | ||
239 | |||
240 | if (unlikely(!this_tracer)) | ||
241 | return; | ||
242 | |||
243 | trace = ds_read_bts(this_tracer); | ||
244 | if (!trace) | ||
245 | return; | ||
246 | |||
247 | for (at = trace->ds.top; (void *)at < trace->ds.end; | ||
248 | at += trace->ds.size) | ||
249 | trace_bts_at(trace, at); | ||
250 | |||
251 | for (at = trace->ds.begin; (void *)at < trace->ds.top; | ||
252 | at += trace->ds.size) | ||
253 | trace_bts_at(trace, at); | ||
254 | } | ||
255 | |||
256 | static void trace_bts_prepare(struct trace_iterator *iter) | ||
257 | { | ||
258 | int cpu; | ||
259 | |||
260 | get_online_cpus(); | ||
261 | for_each_online_cpu(cpu) | ||
262 | if (likely(per_cpu(hwb_tracer, cpu))) | ||
263 | ds_suspend_bts(per_cpu(hwb_tracer, cpu)); | ||
264 | /* | ||
265 | * We need to collect the trace on the respective cpu since ftrace | ||
266 | * implicitly adds the record for the current cpu. | ||
267 | * Once that is more flexible, we could collect the data from any cpu. | ||
268 | */ | ||
269 | on_each_cpu(trace_bts_cpu, iter->tr, 1); | ||
270 | |||
271 | for_each_online_cpu(cpu) | ||
272 | if (likely(per_cpu(hwb_tracer, cpu))) | ||
273 | ds_resume_bts(per_cpu(hwb_tracer, cpu)); | ||
274 | put_online_cpus(); | ||
275 | } | ||
276 | |||
277 | static void trace_bts_close(struct trace_iterator *iter) | ||
278 | { | ||
279 | tracing_reset_online_cpus(iter->tr); | ||
280 | } | ||
281 | |||
282 | void trace_hw_branch_oops(void) | ||
283 | { | ||
284 | if (this_tracer) { | ||
285 | ds_suspend_bts_noirq(this_tracer); | ||
286 | trace_bts_cpu(hw_branch_trace); | ||
287 | ds_resume_bts_noirq(this_tracer); | ||
288 | } | ||
289 | } | ||
290 | |||
291 | struct tracer bts_tracer __read_mostly = | ||
292 | { | ||
293 | .name = "hw-branch-tracer", | ||
294 | .init = bts_trace_init, | ||
295 | .reset = bts_trace_reset, | ||
296 | .print_header = bts_trace_print_header, | ||
297 | .print_line = bts_trace_print_line, | ||
298 | .start = bts_trace_start, | ||
299 | .stop = bts_trace_stop, | ||
300 | .open = trace_bts_prepare, | ||
301 | .close = trace_bts_close, | ||
302 | #ifdef CONFIG_FTRACE_SELFTEST | ||
303 | .selftest = trace_selftest_startup_hw_branches, | ||
304 | #endif /* CONFIG_FTRACE_SELFTEST */ | ||
305 | }; | ||
306 | |||
307 | __init static int init_bts_trace(void) | ||
308 | { | ||
309 | register_hotcpu_notifier(&bts_hotcpu_notifier); | ||
310 | return register_tracer(&bts_tracer); | ||
311 | } | ||
312 | device_initcall(init_bts_trace); | ||
diff --git a/kernel/trace/trace_kprobe.c b/kernel/trace/trace_kprobe.c index 1251e367bae9..a7514326052b 100644 --- a/kernel/trace/trace_kprobe.c +++ b/kernel/trace/trace_kprobe.c | |||
@@ -29,6 +29,8 @@ | |||
29 | #include <linux/ctype.h> | 29 | #include <linux/ctype.h> |
30 | #include <linux/ptrace.h> | 30 | #include <linux/ptrace.h> |
31 | #include <linux/perf_event.h> | 31 | #include <linux/perf_event.h> |
32 | #include <linux/stringify.h> | ||
33 | #include <asm/bitsperlong.h> | ||
32 | 34 | ||
33 | #include "trace.h" | 35 | #include "trace.h" |
34 | #include "trace_output.h" | 36 | #include "trace_output.h" |
@@ -40,7 +42,6 @@ | |||
40 | 42 | ||
41 | /* Reserved field names */ | 43 | /* Reserved field names */ |
42 | #define FIELD_STRING_IP "__probe_ip" | 44 | #define FIELD_STRING_IP "__probe_ip" |
43 | #define FIELD_STRING_NARGS "__probe_nargs" | ||
44 | #define FIELD_STRING_RETIP "__probe_ret_ip" | 45 | #define FIELD_STRING_RETIP "__probe_ret_ip" |
45 | #define FIELD_STRING_FUNC "__probe_func" | 46 | #define FIELD_STRING_FUNC "__probe_func" |
46 | 47 | ||
@@ -52,56 +53,102 @@ const char *reserved_field_names[] = { | |||
52 | "common_tgid", | 53 | "common_tgid", |
53 | "common_lock_depth", | 54 | "common_lock_depth", |
54 | FIELD_STRING_IP, | 55 | FIELD_STRING_IP, |
55 | FIELD_STRING_NARGS, | ||
56 | FIELD_STRING_RETIP, | 56 | FIELD_STRING_RETIP, |
57 | FIELD_STRING_FUNC, | 57 | FIELD_STRING_FUNC, |
58 | }; | 58 | }; |
59 | 59 | ||
60 | struct fetch_func { | 60 | /* Printing function type */ |
61 | unsigned long (*func)(struct pt_regs *, void *); | 61 | typedef int (*print_type_func_t)(struct trace_seq *, const char *, void *); |
62 | #define PRINT_TYPE_FUNC_NAME(type) print_type_##type | ||
63 | #define PRINT_TYPE_FMT_NAME(type) print_type_format_##type | ||
64 | |||
65 | /* Printing in basic type function template */ | ||
66 | #define DEFINE_BASIC_PRINT_TYPE_FUNC(type, fmt, cast) \ | ||
67 | static __kprobes int PRINT_TYPE_FUNC_NAME(type)(struct trace_seq *s, \ | ||
68 | const char *name, void *data)\ | ||
69 | { \ | ||
70 | return trace_seq_printf(s, " %s=" fmt, name, (cast)*(type *)data);\ | ||
71 | } \ | ||
72 | static const char PRINT_TYPE_FMT_NAME(type)[] = fmt; | ||
73 | |||
74 | DEFINE_BASIC_PRINT_TYPE_FUNC(u8, "%x", unsigned int) | ||
75 | DEFINE_BASIC_PRINT_TYPE_FUNC(u16, "%x", unsigned int) | ||
76 | DEFINE_BASIC_PRINT_TYPE_FUNC(u32, "%lx", unsigned long) | ||
77 | DEFINE_BASIC_PRINT_TYPE_FUNC(u64, "%llx", unsigned long long) | ||
78 | DEFINE_BASIC_PRINT_TYPE_FUNC(s8, "%d", int) | ||
79 | DEFINE_BASIC_PRINT_TYPE_FUNC(s16, "%d", int) | ||
80 | DEFINE_BASIC_PRINT_TYPE_FUNC(s32, "%ld", long) | ||
81 | DEFINE_BASIC_PRINT_TYPE_FUNC(s64, "%lld", long long) | ||
82 | |||
83 | /* Data fetch function type */ | ||
84 | typedef void (*fetch_func_t)(struct pt_regs *, void *, void *); | ||
85 | |||
86 | struct fetch_param { | ||
87 | fetch_func_t fn; | ||
62 | void *data; | 88 | void *data; |
63 | }; | 89 | }; |
64 | 90 | ||
65 | static __kprobes unsigned long call_fetch(struct fetch_func *f, | 91 | static __kprobes void call_fetch(struct fetch_param *fprm, |
66 | struct pt_regs *regs) | 92 | struct pt_regs *regs, void *dest) |
67 | { | 93 | { |
68 | return f->func(regs, f->data); | 94 | return fprm->fn(regs, fprm->data, dest); |
69 | } | 95 | } |
70 | 96 | ||
71 | /* fetch handlers */ | 97 | #define FETCH_FUNC_NAME(kind, type) fetch_##kind##_##type |
72 | static __kprobes unsigned long fetch_register(struct pt_regs *regs, | 98 | /* |
73 | void *offset) | 99 | * Define macro for basic types - we don't need to define s* types, because |
74 | { | 100 | * we have to care only about bitwidth at recording time. |
75 | return regs_get_register(regs, (unsigned int)((unsigned long)offset)); | 101 | */ |
102 | #define DEFINE_BASIC_FETCH_FUNCS(kind) \ | ||
103 | DEFINE_FETCH_##kind(u8) \ | ||
104 | DEFINE_FETCH_##kind(u16) \ | ||
105 | DEFINE_FETCH_##kind(u32) \ | ||
106 | DEFINE_FETCH_##kind(u64) | ||
107 | |||
108 | #define CHECK_BASIC_FETCH_FUNCS(kind, fn) \ | ||
109 | ((FETCH_FUNC_NAME(kind, u8) == fn) || \ | ||
110 | (FETCH_FUNC_NAME(kind, u16) == fn) || \ | ||
111 | (FETCH_FUNC_NAME(kind, u32) == fn) || \ | ||
112 | (FETCH_FUNC_NAME(kind, u64) == fn)) | ||
113 | |||
114 | /* Data fetch function templates */ | ||
115 | #define DEFINE_FETCH_reg(type) \ | ||
116 | static __kprobes void FETCH_FUNC_NAME(reg, type)(struct pt_regs *regs, \ | ||
117 | void *offset, void *dest) \ | ||
118 | { \ | ||
119 | *(type *)dest = (type)regs_get_register(regs, \ | ||
120 | (unsigned int)((unsigned long)offset)); \ | ||
76 | } | 121 | } |
77 | 122 | DEFINE_BASIC_FETCH_FUNCS(reg) | |
78 | static __kprobes unsigned long fetch_stack(struct pt_regs *regs, | 123 | |
79 | void *num) | 124 | #define DEFINE_FETCH_stack(type) \ |
80 | { | 125 | static __kprobes void FETCH_FUNC_NAME(stack, type)(struct pt_regs *regs,\ |
81 | return regs_get_kernel_stack_nth(regs, | 126 | void *offset, void *dest) \ |
82 | (unsigned int)((unsigned long)num)); | 127 | { \ |
128 | *(type *)dest = (type)regs_get_kernel_stack_nth(regs, \ | ||
129 | (unsigned int)((unsigned long)offset)); \ | ||
83 | } | 130 | } |
131 | DEFINE_BASIC_FETCH_FUNCS(stack) | ||
84 | 132 | ||
85 | static __kprobes unsigned long fetch_memory(struct pt_regs *regs, void *addr) | 133 | #define DEFINE_FETCH_retval(type) \ |
86 | { | 134 | static __kprobes void FETCH_FUNC_NAME(retval, type)(struct pt_regs *regs,\ |
87 | unsigned long retval; | 135 | void *dummy, void *dest) \ |
88 | 136 | { \ | |
89 | if (probe_kernel_address(addr, retval)) | 137 | *(type *)dest = (type)regs_return_value(regs); \ |
90 | return 0; | ||
91 | return retval; | ||
92 | } | 138 | } |
93 | 139 | DEFINE_BASIC_FETCH_FUNCS(retval) | |
94 | static __kprobes unsigned long fetch_retvalue(struct pt_regs *regs, | 140 | |
95 | void *dummy) | 141 | #define DEFINE_FETCH_memory(type) \ |
96 | { | 142 | static __kprobes void FETCH_FUNC_NAME(memory, type)(struct pt_regs *regs,\ |
97 | return regs_return_value(regs); | 143 | void *addr, void *dest) \ |
98 | } | 144 | { \ |
99 | 145 | type retval; \ | |
100 | static __kprobes unsigned long fetch_stack_address(struct pt_regs *regs, | 146 | if (probe_kernel_address(addr, retval)) \ |
101 | void *dummy) | 147 | *(type *)dest = 0; \ |
102 | { | 148 | else \ |
103 | return kernel_stack_pointer(regs); | 149 | *(type *)dest = retval; \ |
104 | } | 150 | } |
151 | DEFINE_BASIC_FETCH_FUNCS(memory) | ||
105 | 152 | ||
106 | /* Memory fetching by symbol */ | 153 | /* Memory fetching by symbol */ |
107 | struct symbol_cache { | 154 | struct symbol_cache { |
@@ -145,51 +192,126 @@ static struct symbol_cache *alloc_symbol_cache(const char *sym, long offset) | |||
145 | return sc; | 192 | return sc; |
146 | } | 193 | } |
147 | 194 | ||
148 | static __kprobes unsigned long fetch_symbol(struct pt_regs *regs, void *data) | 195 | #define DEFINE_FETCH_symbol(type) \ |
149 | { | 196 | static __kprobes void FETCH_FUNC_NAME(symbol, type)(struct pt_regs *regs,\ |
150 | struct symbol_cache *sc = data; | 197 | void *data, void *dest) \ |
151 | 198 | { \ | |
152 | if (sc->addr) | 199 | struct symbol_cache *sc = data; \ |
153 | return fetch_memory(regs, (void *)sc->addr); | 200 | if (sc->addr) \ |
154 | else | 201 | fetch_memory_##type(regs, (void *)sc->addr, dest); \ |
155 | return 0; | 202 | else \ |
203 | *(type *)dest = 0; \ | ||
156 | } | 204 | } |
205 | DEFINE_BASIC_FETCH_FUNCS(symbol) | ||
157 | 206 | ||
158 | /* Special indirect memory access interface */ | 207 | /* Dereference memory access function */ |
159 | struct indirect_fetch_data { | 208 | struct deref_fetch_param { |
160 | struct fetch_func orig; | 209 | struct fetch_param orig; |
161 | long offset; | 210 | long offset; |
162 | }; | 211 | }; |
163 | 212 | ||
164 | static __kprobes unsigned long fetch_indirect(struct pt_regs *regs, void *data) | 213 | #define DEFINE_FETCH_deref(type) \ |
165 | { | 214 | static __kprobes void FETCH_FUNC_NAME(deref, type)(struct pt_regs *regs,\ |
166 | struct indirect_fetch_data *ind = data; | 215 | void *data, void *dest) \ |
167 | unsigned long addr; | 216 | { \ |
168 | 217 | struct deref_fetch_param *dprm = data; \ | |
169 | addr = call_fetch(&ind->orig, regs); | 218 | unsigned long addr; \ |
170 | if (addr) { | 219 | call_fetch(&dprm->orig, regs, &addr); \ |
171 | addr += ind->offset; | 220 | if (addr) { \ |
172 | return fetch_memory(regs, (void *)addr); | 221 | addr += dprm->offset; \ |
173 | } else | 222 | fetch_memory_##type(regs, (void *)addr, dest); \ |
174 | return 0; | 223 | } else \ |
224 | *(type *)dest = 0; \ | ||
175 | } | 225 | } |
226 | DEFINE_BASIC_FETCH_FUNCS(deref) | ||
176 | 227 | ||
177 | static __kprobes void free_indirect_fetch_data(struct indirect_fetch_data *data) | 228 | static __kprobes void free_deref_fetch_param(struct deref_fetch_param *data) |
178 | { | 229 | { |
179 | if (data->orig.func == fetch_indirect) | 230 | if (CHECK_BASIC_FETCH_FUNCS(deref, data->orig.fn)) |
180 | free_indirect_fetch_data(data->orig.data); | 231 | free_deref_fetch_param(data->orig.data); |
181 | else if (data->orig.func == fetch_symbol) | 232 | else if (CHECK_BASIC_FETCH_FUNCS(symbol, data->orig.fn)) |
182 | free_symbol_cache(data->orig.data); | 233 | free_symbol_cache(data->orig.data); |
183 | kfree(data); | 234 | kfree(data); |
184 | } | 235 | } |
185 | 236 | ||
237 | /* Default (unsigned long) fetch type */ | ||
238 | #define __DEFAULT_FETCH_TYPE(t) u##t | ||
239 | #define _DEFAULT_FETCH_TYPE(t) __DEFAULT_FETCH_TYPE(t) | ||
240 | #define DEFAULT_FETCH_TYPE _DEFAULT_FETCH_TYPE(BITS_PER_LONG) | ||
241 | #define DEFAULT_FETCH_TYPE_STR __stringify(DEFAULT_FETCH_TYPE) | ||
242 | |||
243 | #define ASSIGN_FETCH_FUNC(kind, type) \ | ||
244 | .kind = FETCH_FUNC_NAME(kind, type) | ||
245 | |||
246 | #define ASSIGN_FETCH_TYPE(ptype, ftype, sign) \ | ||
247 | {.name = #ptype, \ | ||
248 | .size = sizeof(ftype), \ | ||
249 | .is_signed = sign, \ | ||
250 | .print = PRINT_TYPE_FUNC_NAME(ptype), \ | ||
251 | .fmt = PRINT_TYPE_FMT_NAME(ptype), \ | ||
252 | ASSIGN_FETCH_FUNC(reg, ftype), \ | ||
253 | ASSIGN_FETCH_FUNC(stack, ftype), \ | ||
254 | ASSIGN_FETCH_FUNC(retval, ftype), \ | ||
255 | ASSIGN_FETCH_FUNC(memory, ftype), \ | ||
256 | ASSIGN_FETCH_FUNC(symbol, ftype), \ | ||
257 | ASSIGN_FETCH_FUNC(deref, ftype), \ | ||
258 | } | ||
259 | |||
260 | /* Fetch type information table */ | ||
261 | static const struct fetch_type { | ||
262 | const char *name; /* Name of type */ | ||
263 | size_t size; /* Byte size of type */ | ||
264 | int is_signed; /* Signed flag */ | ||
265 | print_type_func_t print; /* Print functions */ | ||
266 | const char *fmt; /* Fromat string */ | ||
267 | /* Fetch functions */ | ||
268 | fetch_func_t reg; | ||
269 | fetch_func_t stack; | ||
270 | fetch_func_t retval; | ||
271 | fetch_func_t memory; | ||
272 | fetch_func_t symbol; | ||
273 | fetch_func_t deref; | ||
274 | } fetch_type_table[] = { | ||
275 | ASSIGN_FETCH_TYPE(u8, u8, 0), | ||
276 | ASSIGN_FETCH_TYPE(u16, u16, 0), | ||
277 | ASSIGN_FETCH_TYPE(u32, u32, 0), | ||
278 | ASSIGN_FETCH_TYPE(u64, u64, 0), | ||
279 | ASSIGN_FETCH_TYPE(s8, u8, 1), | ||
280 | ASSIGN_FETCH_TYPE(s16, u16, 1), | ||
281 | ASSIGN_FETCH_TYPE(s32, u32, 1), | ||
282 | ASSIGN_FETCH_TYPE(s64, u64, 1), | ||
283 | }; | ||
284 | |||
285 | static const struct fetch_type *find_fetch_type(const char *type) | ||
286 | { | ||
287 | int i; | ||
288 | |||
289 | if (!type) | ||
290 | type = DEFAULT_FETCH_TYPE_STR; | ||
291 | |||
292 | for (i = 0; i < ARRAY_SIZE(fetch_type_table); i++) | ||
293 | if (strcmp(type, fetch_type_table[i].name) == 0) | ||
294 | return &fetch_type_table[i]; | ||
295 | return NULL; | ||
296 | } | ||
297 | |||
298 | /* Special function : only accept unsigned long */ | ||
299 | static __kprobes void fetch_stack_address(struct pt_regs *regs, | ||
300 | void *dummy, void *dest) | ||
301 | { | ||
302 | *(unsigned long *)dest = kernel_stack_pointer(regs); | ||
303 | } | ||
304 | |||
186 | /** | 305 | /** |
187 | * Kprobe event core functions | 306 | * Kprobe event core functions |
188 | */ | 307 | */ |
189 | 308 | ||
190 | struct probe_arg { | 309 | struct probe_arg { |
191 | struct fetch_func fetch; | 310 | struct fetch_param fetch; |
192 | const char *name; | 311 | unsigned int offset; /* Offset from argument entry */ |
312 | const char *name; /* Name of this argument */ | ||
313 | const char *comm; /* Command of this argument */ | ||
314 | const struct fetch_type *type; /* Type of this argument */ | ||
193 | }; | 315 | }; |
194 | 316 | ||
195 | /* Flags for trace_probe */ | 317 | /* Flags for trace_probe */ |
@@ -204,6 +326,7 @@ struct trace_probe { | |||
204 | const char *symbol; /* symbol name */ | 326 | const char *symbol; /* symbol name */ |
205 | struct ftrace_event_call call; | 327 | struct ftrace_event_call call; |
206 | struct trace_event event; | 328 | struct trace_event event; |
329 | ssize_t size; /* trace entry size */ | ||
207 | unsigned int nr_args; | 330 | unsigned int nr_args; |
208 | struct probe_arg args[]; | 331 | struct probe_arg args[]; |
209 | }; | 332 | }; |
@@ -212,6 +335,7 @@ struct trace_probe { | |||
212 | (offsetof(struct trace_probe, args) + \ | 335 | (offsetof(struct trace_probe, args) + \ |
213 | (sizeof(struct probe_arg) * (n))) | 336 | (sizeof(struct probe_arg) * (n))) |
214 | 337 | ||
338 | |||
215 | static __kprobes int probe_is_return(struct trace_probe *tp) | 339 | static __kprobes int probe_is_return(struct trace_probe *tp) |
216 | { | 340 | { |
217 | return tp->rp.handler != NULL; | 341 | return tp->rp.handler != NULL; |
@@ -222,49 +346,6 @@ static __kprobes const char *probe_symbol(struct trace_probe *tp) | |||
222 | return tp->symbol ? tp->symbol : "unknown"; | 346 | return tp->symbol ? tp->symbol : "unknown"; |
223 | } | 347 | } |
224 | 348 | ||
225 | static int probe_arg_string(char *buf, size_t n, struct fetch_func *ff) | ||
226 | { | ||
227 | int ret = -EINVAL; | ||
228 | |||
229 | if (ff->func == fetch_register) { | ||
230 | const char *name; | ||
231 | name = regs_query_register_name((unsigned int)((long)ff->data)); | ||
232 | ret = snprintf(buf, n, "%%%s", name); | ||
233 | } else if (ff->func == fetch_stack) | ||
234 | ret = snprintf(buf, n, "$stack%lu", (unsigned long)ff->data); | ||
235 | else if (ff->func == fetch_memory) | ||
236 | ret = snprintf(buf, n, "@0x%p", ff->data); | ||
237 | else if (ff->func == fetch_symbol) { | ||
238 | struct symbol_cache *sc = ff->data; | ||
239 | if (sc->offset) | ||
240 | ret = snprintf(buf, n, "@%s%+ld", sc->symbol, | ||
241 | sc->offset); | ||
242 | else | ||
243 | ret = snprintf(buf, n, "@%s", sc->symbol); | ||
244 | } else if (ff->func == fetch_retvalue) | ||
245 | ret = snprintf(buf, n, "$retval"); | ||
246 | else if (ff->func == fetch_stack_address) | ||
247 | ret = snprintf(buf, n, "$stack"); | ||
248 | else if (ff->func == fetch_indirect) { | ||
249 | struct indirect_fetch_data *id = ff->data; | ||
250 | size_t l = 0; | ||
251 | ret = snprintf(buf, n, "%+ld(", id->offset); | ||
252 | if (ret >= n) | ||
253 | goto end; | ||
254 | l += ret; | ||
255 | ret = probe_arg_string(buf + l, n - l, &id->orig); | ||
256 | if (ret < 0) | ||
257 | goto end; | ||
258 | l += ret; | ||
259 | ret = snprintf(buf + l, n - l, ")"); | ||
260 | ret += l; | ||
261 | } | ||
262 | end: | ||
263 | if (ret >= n) | ||
264 | return -ENOSPC; | ||
265 | return ret; | ||
266 | } | ||
267 | |||
268 | static int register_probe_event(struct trace_probe *tp); | 349 | static int register_probe_event(struct trace_probe *tp); |
269 | static void unregister_probe_event(struct trace_probe *tp); | 350 | static void unregister_probe_event(struct trace_probe *tp); |
270 | 351 | ||
@@ -347,11 +428,12 @@ error: | |||
347 | 428 | ||
348 | static void free_probe_arg(struct probe_arg *arg) | 429 | static void free_probe_arg(struct probe_arg *arg) |
349 | { | 430 | { |
350 | if (arg->fetch.func == fetch_symbol) | 431 | if (CHECK_BASIC_FETCH_FUNCS(deref, arg->fetch.fn)) |
432 | free_deref_fetch_param(arg->fetch.data); | ||
433 | else if (CHECK_BASIC_FETCH_FUNCS(symbol, arg->fetch.fn)) | ||
351 | free_symbol_cache(arg->fetch.data); | 434 | free_symbol_cache(arg->fetch.data); |
352 | else if (arg->fetch.func == fetch_indirect) | ||
353 | free_indirect_fetch_data(arg->fetch.data); | ||
354 | kfree(arg->name); | 435 | kfree(arg->name); |
436 | kfree(arg->comm); | ||
355 | } | 437 | } |
356 | 438 | ||
357 | static void free_trace_probe(struct trace_probe *tp) | 439 | static void free_trace_probe(struct trace_probe *tp) |
@@ -457,28 +539,30 @@ static int split_symbol_offset(char *symbol, unsigned long *offset) | |||
457 | #define PARAM_MAX_ARGS 16 | 539 | #define PARAM_MAX_ARGS 16 |
458 | #define PARAM_MAX_STACK (THREAD_SIZE / sizeof(unsigned long)) | 540 | #define PARAM_MAX_STACK (THREAD_SIZE / sizeof(unsigned long)) |
459 | 541 | ||
460 | static int parse_probe_vars(char *arg, struct fetch_func *ff, int is_return) | 542 | static int parse_probe_vars(char *arg, const struct fetch_type *t, |
543 | struct fetch_param *f, int is_return) | ||
461 | { | 544 | { |
462 | int ret = 0; | 545 | int ret = 0; |
463 | unsigned long param; | 546 | unsigned long param; |
464 | 547 | ||
465 | if (strcmp(arg, "retval") == 0) { | 548 | if (strcmp(arg, "retval") == 0) { |
466 | if (is_return) { | 549 | if (is_return) |
467 | ff->func = fetch_retvalue; | 550 | f->fn = t->retval; |
468 | ff->data = NULL; | 551 | else |
469 | } else | ||
470 | ret = -EINVAL; | 552 | ret = -EINVAL; |
471 | } else if (strncmp(arg, "stack", 5) == 0) { | 553 | } else if (strncmp(arg, "stack", 5) == 0) { |
472 | if (arg[5] == '\0') { | 554 | if (arg[5] == '\0') { |
473 | ff->func = fetch_stack_address; | 555 | if (strcmp(t->name, DEFAULT_FETCH_TYPE_STR) == 0) |
474 | ff->data = NULL; | 556 | f->fn = fetch_stack_address; |
557 | else | ||
558 | ret = -EINVAL; | ||
475 | } else if (isdigit(arg[5])) { | 559 | } else if (isdigit(arg[5])) { |
476 | ret = strict_strtoul(arg + 5, 10, ¶m); | 560 | ret = strict_strtoul(arg + 5, 10, ¶m); |
477 | if (ret || param > PARAM_MAX_STACK) | 561 | if (ret || param > PARAM_MAX_STACK) |
478 | ret = -EINVAL; | 562 | ret = -EINVAL; |
479 | else { | 563 | else { |
480 | ff->func = fetch_stack; | 564 | f->fn = t->stack; |
481 | ff->data = (void *)param; | 565 | f->data = (void *)param; |
482 | } | 566 | } |
483 | } else | 567 | } else |
484 | ret = -EINVAL; | 568 | ret = -EINVAL; |
@@ -488,7 +572,8 @@ static int parse_probe_vars(char *arg, struct fetch_func *ff, int is_return) | |||
488 | } | 572 | } |
489 | 573 | ||
490 | /* Recursive argument parser */ | 574 | /* Recursive argument parser */ |
491 | static int __parse_probe_arg(char *arg, struct fetch_func *ff, int is_return) | 575 | static int __parse_probe_arg(char *arg, const struct fetch_type *t, |
576 | struct fetch_param *f, int is_return) | ||
492 | { | 577 | { |
493 | int ret = 0; | 578 | int ret = 0; |
494 | unsigned long param; | 579 | unsigned long param; |
@@ -497,13 +582,13 @@ static int __parse_probe_arg(char *arg, struct fetch_func *ff, int is_return) | |||
497 | 582 | ||
498 | switch (arg[0]) { | 583 | switch (arg[0]) { |
499 | case '$': | 584 | case '$': |
500 | ret = parse_probe_vars(arg + 1, ff, is_return); | 585 | ret = parse_probe_vars(arg + 1, t, f, is_return); |
501 | break; | 586 | break; |
502 | case '%': /* named register */ | 587 | case '%': /* named register */ |
503 | ret = regs_query_register_offset(arg + 1); | 588 | ret = regs_query_register_offset(arg + 1); |
504 | if (ret >= 0) { | 589 | if (ret >= 0) { |
505 | ff->func = fetch_register; | 590 | f->fn = t->reg; |
506 | ff->data = (void *)(unsigned long)ret; | 591 | f->data = (void *)(unsigned long)ret; |
507 | ret = 0; | 592 | ret = 0; |
508 | } | 593 | } |
509 | break; | 594 | break; |
@@ -512,26 +597,22 @@ static int __parse_probe_arg(char *arg, struct fetch_func *ff, int is_return) | |||
512 | ret = strict_strtoul(arg + 1, 0, ¶m); | 597 | ret = strict_strtoul(arg + 1, 0, ¶m); |
513 | if (ret) | 598 | if (ret) |
514 | break; | 599 | break; |
515 | ff->func = fetch_memory; | 600 | f->fn = t->memory; |
516 | ff->data = (void *)param; | 601 | f->data = (void *)param; |
517 | } else { | 602 | } else { |
518 | ret = split_symbol_offset(arg + 1, &offset); | 603 | ret = split_symbol_offset(arg + 1, &offset); |
519 | if (ret) | 604 | if (ret) |
520 | break; | 605 | break; |
521 | ff->data = alloc_symbol_cache(arg + 1, offset); | 606 | f->data = alloc_symbol_cache(arg + 1, offset); |
522 | if (ff->data) | 607 | if (f->data) |
523 | ff->func = fetch_symbol; | 608 | f->fn = t->symbol; |
524 | else | ||
525 | ret = -EINVAL; | ||
526 | } | 609 | } |
527 | break; | 610 | break; |
528 | case '+': /* indirect memory */ | 611 | case '+': /* deref memory */ |
529 | case '-': | 612 | case '-': |
530 | tmp = strchr(arg, '('); | 613 | tmp = strchr(arg, '('); |
531 | if (!tmp) { | 614 | if (!tmp) |
532 | ret = -EINVAL; | ||
533 | break; | 615 | break; |
534 | } | ||
535 | *tmp = '\0'; | 616 | *tmp = '\0'; |
536 | ret = strict_strtol(arg + 1, 0, &offset); | 617 | ret = strict_strtol(arg + 1, 0, &offset); |
537 | if (ret) | 618 | if (ret) |
@@ -541,38 +622,58 @@ static int __parse_probe_arg(char *arg, struct fetch_func *ff, int is_return) | |||
541 | arg = tmp + 1; | 622 | arg = tmp + 1; |
542 | tmp = strrchr(arg, ')'); | 623 | tmp = strrchr(arg, ')'); |
543 | if (tmp) { | 624 | if (tmp) { |
544 | struct indirect_fetch_data *id; | 625 | struct deref_fetch_param *dprm; |
626 | const struct fetch_type *t2 = find_fetch_type(NULL); | ||
545 | *tmp = '\0'; | 627 | *tmp = '\0'; |
546 | id = kzalloc(sizeof(struct indirect_fetch_data), | 628 | dprm = kzalloc(sizeof(struct deref_fetch_param), |
547 | GFP_KERNEL); | 629 | GFP_KERNEL); |
548 | if (!id) | 630 | if (!dprm) |
549 | return -ENOMEM; | 631 | return -ENOMEM; |
550 | id->offset = offset; | 632 | dprm->offset = offset; |
551 | ret = __parse_probe_arg(arg, &id->orig, is_return); | 633 | ret = __parse_probe_arg(arg, t2, &dprm->orig, |
634 | is_return); | ||
552 | if (ret) | 635 | if (ret) |
553 | kfree(id); | 636 | kfree(dprm); |
554 | else { | 637 | else { |
555 | ff->func = fetch_indirect; | 638 | f->fn = t->deref; |
556 | ff->data = (void *)id; | 639 | f->data = (void *)dprm; |
557 | } | 640 | } |
558 | } else | 641 | } |
559 | ret = -EINVAL; | ||
560 | break; | 642 | break; |
561 | default: | ||
562 | /* TODO: support custom handler */ | ||
563 | ret = -EINVAL; | ||
564 | } | 643 | } |
644 | if (!ret && !f->fn) | ||
645 | ret = -EINVAL; | ||
565 | return ret; | 646 | return ret; |
566 | } | 647 | } |
567 | 648 | ||
568 | /* String length checking wrapper */ | 649 | /* String length checking wrapper */ |
569 | static int parse_probe_arg(char *arg, struct fetch_func *ff, int is_return) | 650 | static int parse_probe_arg(char *arg, struct trace_probe *tp, |
651 | struct probe_arg *parg, int is_return) | ||
570 | { | 652 | { |
653 | const char *t; | ||
654 | |||
571 | if (strlen(arg) > MAX_ARGSTR_LEN) { | 655 | if (strlen(arg) > MAX_ARGSTR_LEN) { |
572 | pr_info("Argument is too long.: %s\n", arg); | 656 | pr_info("Argument is too long.: %s\n", arg); |
573 | return -ENOSPC; | 657 | return -ENOSPC; |
574 | } | 658 | } |
575 | return __parse_probe_arg(arg, ff, is_return); | 659 | parg->comm = kstrdup(arg, GFP_KERNEL); |
660 | if (!parg->comm) { | ||
661 | pr_info("Failed to allocate memory for command '%s'.\n", arg); | ||
662 | return -ENOMEM; | ||
663 | } | ||
664 | t = strchr(parg->comm, ':'); | ||
665 | if (t) { | ||
666 | arg[t - parg->comm] = '\0'; | ||
667 | t++; | ||
668 | } | ||
669 | parg->type = find_fetch_type(t); | ||
670 | if (!parg->type) { | ||
671 | pr_info("Unsupported type: %s\n", t); | ||
672 | return -EINVAL; | ||
673 | } | ||
674 | parg->offset = tp->size; | ||
675 | tp->size += parg->type->size; | ||
676 | return __parse_probe_arg(arg, parg->type, &parg->fetch, is_return); | ||
576 | } | 677 | } |
577 | 678 | ||
578 | /* Return 1 if name is reserved or already used by another argument */ | 679 | /* Return 1 if name is reserved or already used by another argument */ |
@@ -602,15 +703,18 @@ static int create_trace_probe(int argc, char **argv) | |||
602 | * @ADDR : fetch memory at ADDR (ADDR should be in kernel) | 703 | * @ADDR : fetch memory at ADDR (ADDR should be in kernel) |
603 | * @SYM[+|-offs] : fetch memory at SYM +|- offs (SYM is a data symbol) | 704 | * @SYM[+|-offs] : fetch memory at SYM +|- offs (SYM is a data symbol) |
604 | * %REG : fetch register REG | 705 | * %REG : fetch register REG |
605 | * Indirect memory fetch: | 706 | * Dereferencing memory fetch: |
606 | * +|-offs(ARG) : fetch memory at ARG +|- offs address. | 707 | * +|-offs(ARG) : fetch memory at ARG +|- offs address. |
607 | * Alias name of args: | 708 | * Alias name of args: |
608 | * NAME=FETCHARG : set NAME as alias of FETCHARG. | 709 | * NAME=FETCHARG : set NAME as alias of FETCHARG. |
710 | * Type of args: | ||
711 | * FETCHARG:TYPE : use TYPE instead of unsigned long. | ||
609 | */ | 712 | */ |
610 | struct trace_probe *tp; | 713 | struct trace_probe *tp; |
611 | int i, ret = 0; | 714 | int i, ret = 0; |
612 | int is_return = 0, is_delete = 0; | 715 | int is_return = 0, is_delete = 0; |
613 | char *symbol = NULL, *event = NULL, *arg = NULL, *group = NULL; | 716 | char *symbol = NULL, *event = NULL, *group = NULL; |
717 | char *arg, *tmp; | ||
614 | unsigned long offset = 0; | 718 | unsigned long offset = 0; |
615 | void *addr = NULL; | 719 | void *addr = NULL; |
616 | char buf[MAX_EVENT_NAME_LEN]; | 720 | char buf[MAX_EVENT_NAME_LEN]; |
@@ -723,13 +827,6 @@ static int create_trace_probe(int argc, char **argv) | |||
723 | else | 827 | else |
724 | arg = argv[i]; | 828 | arg = argv[i]; |
725 | 829 | ||
726 | if (conflict_field_name(argv[i], tp->args, i)) { | ||
727 | pr_info("Argument%d name '%s' conflicts with " | ||
728 | "another field.\n", i, argv[i]); | ||
729 | ret = -EINVAL; | ||
730 | goto error; | ||
731 | } | ||
732 | |||
733 | tp->args[i].name = kstrdup(argv[i], GFP_KERNEL); | 830 | tp->args[i].name = kstrdup(argv[i], GFP_KERNEL); |
734 | if (!tp->args[i].name) { | 831 | if (!tp->args[i].name) { |
735 | pr_info("Failed to allocate argument%d name '%s'.\n", | 832 | pr_info("Failed to allocate argument%d name '%s'.\n", |
@@ -737,9 +834,19 @@ static int create_trace_probe(int argc, char **argv) | |||
737 | ret = -ENOMEM; | 834 | ret = -ENOMEM; |
738 | goto error; | 835 | goto error; |
739 | } | 836 | } |
837 | tmp = strchr(tp->args[i].name, ':'); | ||
838 | if (tmp) | ||
839 | *tmp = '_'; /* convert : to _ */ | ||
840 | |||
841 | if (conflict_field_name(tp->args[i].name, tp->args, i)) { | ||
842 | pr_info("Argument%d name '%s' conflicts with " | ||
843 | "another field.\n", i, argv[i]); | ||
844 | ret = -EINVAL; | ||
845 | goto error; | ||
846 | } | ||
740 | 847 | ||
741 | /* Parse fetch argument */ | 848 | /* Parse fetch argument */ |
742 | ret = parse_probe_arg(arg, &tp->args[i].fetch, is_return); | 849 | ret = parse_probe_arg(arg, tp, &tp->args[i], is_return); |
743 | if (ret) { | 850 | if (ret) { |
744 | pr_info("Parse error at argument%d. (%d)\n", i, ret); | 851 | pr_info("Parse error at argument%d. (%d)\n", i, ret); |
745 | kfree(tp->args[i].name); | 852 | kfree(tp->args[i].name); |
@@ -794,8 +901,7 @@ static void probes_seq_stop(struct seq_file *m, void *v) | |||
794 | static int probes_seq_show(struct seq_file *m, void *v) | 901 | static int probes_seq_show(struct seq_file *m, void *v) |
795 | { | 902 | { |
796 | struct trace_probe *tp = v; | 903 | struct trace_probe *tp = v; |
797 | int i, ret; | 904 | int i; |
798 | char buf[MAX_ARGSTR_LEN + 1]; | ||
799 | 905 | ||
800 | seq_printf(m, "%c", probe_is_return(tp) ? 'r' : 'p'); | 906 | seq_printf(m, "%c", probe_is_return(tp) ? 'r' : 'p'); |
801 | seq_printf(m, ":%s/%s", tp->call.system, tp->call.name); | 907 | seq_printf(m, ":%s/%s", tp->call.system, tp->call.name); |
@@ -807,15 +913,10 @@ static int probes_seq_show(struct seq_file *m, void *v) | |||
807 | else | 913 | else |
808 | seq_printf(m, " %s", probe_symbol(tp)); | 914 | seq_printf(m, " %s", probe_symbol(tp)); |
809 | 915 | ||
810 | for (i = 0; i < tp->nr_args; i++) { | 916 | for (i = 0; i < tp->nr_args; i++) |
811 | ret = probe_arg_string(buf, MAX_ARGSTR_LEN, &tp->args[i].fetch); | 917 | seq_printf(m, " %s=%s", tp->args[i].name, tp->args[i].comm); |
812 | if (ret < 0) { | ||
813 | pr_warning("Argument%d decoding error(%d).\n", i, ret); | ||
814 | return ret; | ||
815 | } | ||
816 | seq_printf(m, " %s=%s", tp->args[i].name, buf); | ||
817 | } | ||
818 | seq_printf(m, "\n"); | 918 | seq_printf(m, "\n"); |
919 | |||
819 | return 0; | 920 | return 0; |
820 | } | 921 | } |
821 | 922 | ||
@@ -945,9 +1046,10 @@ static const struct file_operations kprobe_profile_ops = { | |||
945 | static __kprobes void kprobe_trace_func(struct kprobe *kp, struct pt_regs *regs) | 1046 | static __kprobes void kprobe_trace_func(struct kprobe *kp, struct pt_regs *regs) |
946 | { | 1047 | { |
947 | struct trace_probe *tp = container_of(kp, struct trace_probe, rp.kp); | 1048 | struct trace_probe *tp = container_of(kp, struct trace_probe, rp.kp); |
948 | struct kprobe_trace_entry *entry; | 1049 | struct kprobe_trace_entry_head *entry; |
949 | struct ring_buffer_event *event; | 1050 | struct ring_buffer_event *event; |
950 | struct ring_buffer *buffer; | 1051 | struct ring_buffer *buffer; |
1052 | u8 *data; | ||
951 | int size, i, pc; | 1053 | int size, i, pc; |
952 | unsigned long irq_flags; | 1054 | unsigned long irq_flags; |
953 | struct ftrace_event_call *call = &tp->call; | 1055 | struct ftrace_event_call *call = &tp->call; |
@@ -957,7 +1059,7 @@ static __kprobes void kprobe_trace_func(struct kprobe *kp, struct pt_regs *regs) | |||
957 | local_save_flags(irq_flags); | 1059 | local_save_flags(irq_flags); |
958 | pc = preempt_count(); | 1060 | pc = preempt_count(); |
959 | 1061 | ||
960 | size = SIZEOF_KPROBE_TRACE_ENTRY(tp->nr_args); | 1062 | size = sizeof(*entry) + tp->size; |
961 | 1063 | ||
962 | event = trace_current_buffer_lock_reserve(&buffer, call->id, size, | 1064 | event = trace_current_buffer_lock_reserve(&buffer, call->id, size, |
963 | irq_flags, pc); | 1065 | irq_flags, pc); |
@@ -965,10 +1067,10 @@ static __kprobes void kprobe_trace_func(struct kprobe *kp, struct pt_regs *regs) | |||
965 | return; | 1067 | return; |
966 | 1068 | ||
967 | entry = ring_buffer_event_data(event); | 1069 | entry = ring_buffer_event_data(event); |
968 | entry->nargs = tp->nr_args; | ||
969 | entry->ip = (unsigned long)kp->addr; | 1070 | entry->ip = (unsigned long)kp->addr; |
1071 | data = (u8 *)&entry[1]; | ||
970 | for (i = 0; i < tp->nr_args; i++) | 1072 | for (i = 0; i < tp->nr_args; i++) |
971 | entry->args[i] = call_fetch(&tp->args[i].fetch, regs); | 1073 | call_fetch(&tp->args[i].fetch, regs, data + tp->args[i].offset); |
972 | 1074 | ||
973 | if (!filter_current_check_discard(buffer, call, entry, event)) | 1075 | if (!filter_current_check_discard(buffer, call, entry, event)) |
974 | trace_nowake_buffer_unlock_commit(buffer, event, irq_flags, pc); | 1076 | trace_nowake_buffer_unlock_commit(buffer, event, irq_flags, pc); |
@@ -979,9 +1081,10 @@ static __kprobes void kretprobe_trace_func(struct kretprobe_instance *ri, | |||
979 | struct pt_regs *regs) | 1081 | struct pt_regs *regs) |
980 | { | 1082 | { |
981 | struct trace_probe *tp = container_of(ri->rp, struct trace_probe, rp); | 1083 | struct trace_probe *tp = container_of(ri->rp, struct trace_probe, rp); |
982 | struct kretprobe_trace_entry *entry; | 1084 | struct kretprobe_trace_entry_head *entry; |
983 | struct ring_buffer_event *event; | 1085 | struct ring_buffer_event *event; |
984 | struct ring_buffer *buffer; | 1086 | struct ring_buffer *buffer; |
1087 | u8 *data; | ||
985 | int size, i, pc; | 1088 | int size, i, pc; |
986 | unsigned long irq_flags; | 1089 | unsigned long irq_flags; |
987 | struct ftrace_event_call *call = &tp->call; | 1090 | struct ftrace_event_call *call = &tp->call; |
@@ -989,7 +1092,7 @@ static __kprobes void kretprobe_trace_func(struct kretprobe_instance *ri, | |||
989 | local_save_flags(irq_flags); | 1092 | local_save_flags(irq_flags); |
990 | pc = preempt_count(); | 1093 | pc = preempt_count(); |
991 | 1094 | ||
992 | size = SIZEOF_KRETPROBE_TRACE_ENTRY(tp->nr_args); | 1095 | size = sizeof(*entry) + tp->size; |
993 | 1096 | ||
994 | event = trace_current_buffer_lock_reserve(&buffer, call->id, size, | 1097 | event = trace_current_buffer_lock_reserve(&buffer, call->id, size, |
995 | irq_flags, pc); | 1098 | irq_flags, pc); |
@@ -997,11 +1100,11 @@ static __kprobes void kretprobe_trace_func(struct kretprobe_instance *ri, | |||
997 | return; | 1100 | return; |
998 | 1101 | ||
999 | entry = ring_buffer_event_data(event); | 1102 | entry = ring_buffer_event_data(event); |
1000 | entry->nargs = tp->nr_args; | ||
1001 | entry->func = (unsigned long)tp->rp.kp.addr; | 1103 | entry->func = (unsigned long)tp->rp.kp.addr; |
1002 | entry->ret_ip = (unsigned long)ri->ret_addr; | 1104 | entry->ret_ip = (unsigned long)ri->ret_addr; |
1105 | data = (u8 *)&entry[1]; | ||
1003 | for (i = 0; i < tp->nr_args; i++) | 1106 | for (i = 0; i < tp->nr_args; i++) |
1004 | entry->args[i] = call_fetch(&tp->args[i].fetch, regs); | 1107 | call_fetch(&tp->args[i].fetch, regs, data + tp->args[i].offset); |
1005 | 1108 | ||
1006 | if (!filter_current_check_discard(buffer, call, entry, event)) | 1109 | if (!filter_current_check_discard(buffer, call, entry, event)) |
1007 | trace_nowake_buffer_unlock_commit(buffer, event, irq_flags, pc); | 1110 | trace_nowake_buffer_unlock_commit(buffer, event, irq_flags, pc); |
@@ -1011,13 +1114,14 @@ static __kprobes void kretprobe_trace_func(struct kretprobe_instance *ri, | |||
1011 | enum print_line_t | 1114 | enum print_line_t |
1012 | print_kprobe_event(struct trace_iterator *iter, int flags) | 1115 | print_kprobe_event(struct trace_iterator *iter, int flags) |
1013 | { | 1116 | { |
1014 | struct kprobe_trace_entry *field; | 1117 | struct kprobe_trace_entry_head *field; |
1015 | struct trace_seq *s = &iter->seq; | 1118 | struct trace_seq *s = &iter->seq; |
1016 | struct trace_event *event; | 1119 | struct trace_event *event; |
1017 | struct trace_probe *tp; | 1120 | struct trace_probe *tp; |
1121 | u8 *data; | ||
1018 | int i; | 1122 | int i; |
1019 | 1123 | ||
1020 | field = (struct kprobe_trace_entry *)iter->ent; | 1124 | field = (struct kprobe_trace_entry_head *)iter->ent; |
1021 | event = ftrace_find_event(field->ent.type); | 1125 | event = ftrace_find_event(field->ent.type); |
1022 | tp = container_of(event, struct trace_probe, event); | 1126 | tp = container_of(event, struct trace_probe, event); |
1023 | 1127 | ||
@@ -1030,9 +1134,10 @@ print_kprobe_event(struct trace_iterator *iter, int flags) | |||
1030 | if (!trace_seq_puts(s, ")")) | 1134 | if (!trace_seq_puts(s, ")")) |
1031 | goto partial; | 1135 | goto partial; |
1032 | 1136 | ||
1033 | for (i = 0; i < field->nargs; i++) | 1137 | data = (u8 *)&field[1]; |
1034 | if (!trace_seq_printf(s, " %s=%lx", | 1138 | for (i = 0; i < tp->nr_args; i++) |
1035 | tp->args[i].name, field->args[i])) | 1139 | if (!tp->args[i].type->print(s, tp->args[i].name, |
1140 | data + tp->args[i].offset)) | ||
1036 | goto partial; | 1141 | goto partial; |
1037 | 1142 | ||
1038 | if (!trace_seq_puts(s, "\n")) | 1143 | if (!trace_seq_puts(s, "\n")) |
@@ -1046,13 +1151,14 @@ partial: | |||
1046 | enum print_line_t | 1151 | enum print_line_t |
1047 | print_kretprobe_event(struct trace_iterator *iter, int flags) | 1152 | print_kretprobe_event(struct trace_iterator *iter, int flags) |
1048 | { | 1153 | { |
1049 | struct kretprobe_trace_entry *field; | 1154 | struct kretprobe_trace_entry_head *field; |
1050 | struct trace_seq *s = &iter->seq; | 1155 | struct trace_seq *s = &iter->seq; |
1051 | struct trace_event *event; | 1156 | struct trace_event *event; |
1052 | struct trace_probe *tp; | 1157 | struct trace_probe *tp; |
1158 | u8 *data; | ||
1053 | int i; | 1159 | int i; |
1054 | 1160 | ||
1055 | field = (struct kretprobe_trace_entry *)iter->ent; | 1161 | field = (struct kretprobe_trace_entry_head *)iter->ent; |
1056 | event = ftrace_find_event(field->ent.type); | 1162 | event = ftrace_find_event(field->ent.type); |
1057 | tp = container_of(event, struct trace_probe, event); | 1163 | tp = container_of(event, struct trace_probe, event); |
1058 | 1164 | ||
@@ -1071,9 +1177,10 @@ print_kretprobe_event(struct trace_iterator *iter, int flags) | |||
1071 | if (!trace_seq_puts(s, ")")) | 1177 | if (!trace_seq_puts(s, ")")) |
1072 | goto partial; | 1178 | goto partial; |
1073 | 1179 | ||
1074 | for (i = 0; i < field->nargs; i++) | 1180 | data = (u8 *)&field[1]; |
1075 | if (!trace_seq_printf(s, " %s=%lx", | 1181 | for (i = 0; i < tp->nr_args; i++) |
1076 | tp->args[i].name, field->args[i])) | 1182 | if (!tp->args[i].type->print(s, tp->args[i].name, |
1183 | data + tp->args[i].offset)) | ||
1077 | goto partial; | 1184 | goto partial; |
1078 | 1185 | ||
1079 | if (!trace_seq_puts(s, "\n")) | 1186 | if (!trace_seq_puts(s, "\n")) |
@@ -1129,29 +1236,43 @@ static int probe_event_raw_init(struct ftrace_event_call *event_call) | |||
1129 | static int kprobe_event_define_fields(struct ftrace_event_call *event_call) | 1236 | static int kprobe_event_define_fields(struct ftrace_event_call *event_call) |
1130 | { | 1237 | { |
1131 | int ret, i; | 1238 | int ret, i; |
1132 | struct kprobe_trace_entry field; | 1239 | struct kprobe_trace_entry_head field; |
1133 | struct trace_probe *tp = (struct trace_probe *)event_call->data; | 1240 | struct trace_probe *tp = (struct trace_probe *)event_call->data; |
1134 | 1241 | ||
1135 | DEFINE_FIELD(unsigned long, ip, FIELD_STRING_IP, 0); | 1242 | DEFINE_FIELD(unsigned long, ip, FIELD_STRING_IP, 0); |
1136 | DEFINE_FIELD(int, nargs, FIELD_STRING_NARGS, 1); | ||
1137 | /* Set argument names as fields */ | 1243 | /* Set argument names as fields */ |
1138 | for (i = 0; i < tp->nr_args; i++) | 1244 | for (i = 0; i < tp->nr_args; i++) { |
1139 | DEFINE_FIELD(unsigned long, args[i], tp->args[i].name, 0); | 1245 | ret = trace_define_field(event_call, tp->args[i].type->name, |
1246 | tp->args[i].name, | ||
1247 | sizeof(field) + tp->args[i].offset, | ||
1248 | tp->args[i].type->size, | ||
1249 | tp->args[i].type->is_signed, | ||
1250 | FILTER_OTHER); | ||
1251 | if (ret) | ||
1252 | return ret; | ||
1253 | } | ||
1140 | return 0; | 1254 | return 0; |
1141 | } | 1255 | } |
1142 | 1256 | ||
1143 | static int kretprobe_event_define_fields(struct ftrace_event_call *event_call) | 1257 | static int kretprobe_event_define_fields(struct ftrace_event_call *event_call) |
1144 | { | 1258 | { |
1145 | int ret, i; | 1259 | int ret, i; |
1146 | struct kretprobe_trace_entry field; | 1260 | struct kretprobe_trace_entry_head field; |
1147 | struct trace_probe *tp = (struct trace_probe *)event_call->data; | 1261 | struct trace_probe *tp = (struct trace_probe *)event_call->data; |
1148 | 1262 | ||
1149 | DEFINE_FIELD(unsigned long, func, FIELD_STRING_FUNC, 0); | 1263 | DEFINE_FIELD(unsigned long, func, FIELD_STRING_FUNC, 0); |
1150 | DEFINE_FIELD(unsigned long, ret_ip, FIELD_STRING_RETIP, 0); | 1264 | DEFINE_FIELD(unsigned long, ret_ip, FIELD_STRING_RETIP, 0); |
1151 | DEFINE_FIELD(int, nargs, FIELD_STRING_NARGS, 1); | ||
1152 | /* Set argument names as fields */ | 1265 | /* Set argument names as fields */ |
1153 | for (i = 0; i < tp->nr_args; i++) | 1266 | for (i = 0; i < tp->nr_args; i++) { |
1154 | DEFINE_FIELD(unsigned long, args[i], tp->args[i].name, 0); | 1267 | ret = trace_define_field(event_call, tp->args[i].type->name, |
1268 | tp->args[i].name, | ||
1269 | sizeof(field) + tp->args[i].offset, | ||
1270 | tp->args[i].type->size, | ||
1271 | tp->args[i].type->is_signed, | ||
1272 | FILTER_OTHER); | ||
1273 | if (ret) | ||
1274 | return ret; | ||
1275 | } | ||
1155 | return 0; | 1276 | return 0; |
1156 | } | 1277 | } |
1157 | 1278 | ||
@@ -1176,8 +1297,8 @@ static int __set_print_fmt(struct trace_probe *tp, char *buf, int len) | |||
1176 | pos += snprintf(buf + pos, LEN_OR_ZERO, "\"%s", fmt); | 1297 | pos += snprintf(buf + pos, LEN_OR_ZERO, "\"%s", fmt); |
1177 | 1298 | ||
1178 | for (i = 0; i < tp->nr_args; i++) { | 1299 | for (i = 0; i < tp->nr_args; i++) { |
1179 | pos += snprintf(buf + pos, LEN_OR_ZERO, " %s=%%lx", | 1300 | pos += snprintf(buf + pos, LEN_OR_ZERO, " %s=%s", |
1180 | tp->args[i].name); | 1301 | tp->args[i].name, tp->args[i].type->fmt); |
1181 | } | 1302 | } |
1182 | 1303 | ||
1183 | pos += snprintf(buf + pos, LEN_OR_ZERO, "\", %s", arg); | 1304 | pos += snprintf(buf + pos, LEN_OR_ZERO, "\", %s", arg); |
@@ -1219,12 +1340,13 @@ static __kprobes void kprobe_perf_func(struct kprobe *kp, | |||
1219 | { | 1340 | { |
1220 | struct trace_probe *tp = container_of(kp, struct trace_probe, rp.kp); | 1341 | struct trace_probe *tp = container_of(kp, struct trace_probe, rp.kp); |
1221 | struct ftrace_event_call *call = &tp->call; | 1342 | struct ftrace_event_call *call = &tp->call; |
1222 | struct kprobe_trace_entry *entry; | 1343 | struct kprobe_trace_entry_head *entry; |
1344 | u8 *data; | ||
1223 | int size, __size, i; | 1345 | int size, __size, i; |
1224 | unsigned long irq_flags; | 1346 | unsigned long irq_flags; |
1225 | int rctx; | 1347 | int rctx; |
1226 | 1348 | ||
1227 | __size = SIZEOF_KPROBE_TRACE_ENTRY(tp->nr_args); | 1349 | __size = sizeof(*entry) + tp->size; |
1228 | size = ALIGN(__size + sizeof(u32), sizeof(u64)); | 1350 | size = ALIGN(__size + sizeof(u32), sizeof(u64)); |
1229 | size -= sizeof(u32); | 1351 | size -= sizeof(u32); |
1230 | if (WARN_ONCE(size > PERF_MAX_TRACE_SIZE, | 1352 | if (WARN_ONCE(size > PERF_MAX_TRACE_SIZE, |
@@ -1235,10 +1357,10 @@ static __kprobes void kprobe_perf_func(struct kprobe *kp, | |||
1235 | if (!entry) | 1357 | if (!entry) |
1236 | return; | 1358 | return; |
1237 | 1359 | ||
1238 | entry->nargs = tp->nr_args; | ||
1239 | entry->ip = (unsigned long)kp->addr; | 1360 | entry->ip = (unsigned long)kp->addr; |
1361 | data = (u8 *)&entry[1]; | ||
1240 | for (i = 0; i < tp->nr_args; i++) | 1362 | for (i = 0; i < tp->nr_args; i++) |
1241 | entry->args[i] = call_fetch(&tp->args[i].fetch, regs); | 1363 | call_fetch(&tp->args[i].fetch, regs, data + tp->args[i].offset); |
1242 | 1364 | ||
1243 | perf_trace_buf_submit(entry, size, rctx, entry->ip, 1, irq_flags, regs); | 1365 | perf_trace_buf_submit(entry, size, rctx, entry->ip, 1, irq_flags, regs); |
1244 | } | 1366 | } |
@@ -1249,12 +1371,13 @@ static __kprobes void kretprobe_perf_func(struct kretprobe_instance *ri, | |||
1249 | { | 1371 | { |
1250 | struct trace_probe *tp = container_of(ri->rp, struct trace_probe, rp); | 1372 | struct trace_probe *tp = container_of(ri->rp, struct trace_probe, rp); |
1251 | struct ftrace_event_call *call = &tp->call; | 1373 | struct ftrace_event_call *call = &tp->call; |
1252 | struct kretprobe_trace_entry *entry; | 1374 | struct kretprobe_trace_entry_head *entry; |
1375 | u8 *data; | ||
1253 | int size, __size, i; | 1376 | int size, __size, i; |
1254 | unsigned long irq_flags; | 1377 | unsigned long irq_flags; |
1255 | int rctx; | 1378 | int rctx; |
1256 | 1379 | ||
1257 | __size = SIZEOF_KRETPROBE_TRACE_ENTRY(tp->nr_args); | 1380 | __size = sizeof(*entry) + tp->size; |
1258 | size = ALIGN(__size + sizeof(u32), sizeof(u64)); | 1381 | size = ALIGN(__size + sizeof(u32), sizeof(u64)); |
1259 | size -= sizeof(u32); | 1382 | size -= sizeof(u32); |
1260 | if (WARN_ONCE(size > PERF_MAX_TRACE_SIZE, | 1383 | if (WARN_ONCE(size > PERF_MAX_TRACE_SIZE, |
@@ -1265,11 +1388,11 @@ static __kprobes void kretprobe_perf_func(struct kretprobe_instance *ri, | |||
1265 | if (!entry) | 1388 | if (!entry) |
1266 | return; | 1389 | return; |
1267 | 1390 | ||
1268 | entry->nargs = tp->nr_args; | ||
1269 | entry->func = (unsigned long)tp->rp.kp.addr; | 1391 | entry->func = (unsigned long)tp->rp.kp.addr; |
1270 | entry->ret_ip = (unsigned long)ri->ret_addr; | 1392 | entry->ret_ip = (unsigned long)ri->ret_addr; |
1393 | data = (u8 *)&entry[1]; | ||
1271 | for (i = 0; i < tp->nr_args; i++) | 1394 | for (i = 0; i < tp->nr_args; i++) |
1272 | entry->args[i] = call_fetch(&tp->args[i].fetch, regs); | 1395 | call_fetch(&tp->args[i].fetch, regs, data + tp->args[i].offset); |
1273 | 1396 | ||
1274 | perf_trace_buf_submit(entry, size, rctx, entry->ret_ip, 1, | 1397 | perf_trace_buf_submit(entry, size, rctx, entry->ret_ip, 1, |
1275 | irq_flags, regs); | 1398 | irq_flags, regs); |
diff --git a/kernel/trace/trace_ksym.c b/kernel/trace/trace_ksym.c index d59cd6879477..8eaf00749b65 100644 --- a/kernel/trace/trace_ksym.c +++ b/kernel/trace/trace_ksym.c | |||
@@ -34,12 +34,6 @@ | |||
34 | 34 | ||
35 | #include <asm/atomic.h> | 35 | #include <asm/atomic.h> |
36 | 36 | ||
37 | /* | ||
38 | * For now, let us restrict the no. of symbols traced simultaneously to number | ||
39 | * of available hardware breakpoint registers. | ||
40 | */ | ||
41 | #define KSYM_TRACER_MAX HBP_NUM | ||
42 | |||
43 | #define KSYM_TRACER_OP_LEN 3 /* rw- */ | 37 | #define KSYM_TRACER_OP_LEN 3 /* rw- */ |
44 | 38 | ||
45 | struct trace_ksym { | 39 | struct trace_ksym { |
@@ -53,7 +47,6 @@ struct trace_ksym { | |||
53 | 47 | ||
54 | static struct trace_array *ksym_trace_array; | 48 | static struct trace_array *ksym_trace_array; |
55 | 49 | ||
56 | static unsigned int ksym_filter_entry_count; | ||
57 | static unsigned int ksym_tracing_enabled; | 50 | static unsigned int ksym_tracing_enabled; |
58 | 51 | ||
59 | static HLIST_HEAD(ksym_filter_head); | 52 | static HLIST_HEAD(ksym_filter_head); |
@@ -181,13 +174,6 @@ int process_new_ksym_entry(char *ksymname, int op, unsigned long addr) | |||
181 | struct trace_ksym *entry; | 174 | struct trace_ksym *entry; |
182 | int ret = -ENOMEM; | 175 | int ret = -ENOMEM; |
183 | 176 | ||
184 | if (ksym_filter_entry_count >= KSYM_TRACER_MAX) { | ||
185 | printk(KERN_ERR "ksym_tracer: Maximum limit:(%d) reached. No" | ||
186 | " new requests for tracing can be accepted now.\n", | ||
187 | KSYM_TRACER_MAX); | ||
188 | return -ENOSPC; | ||
189 | } | ||
190 | |||
191 | entry = kzalloc(sizeof(struct trace_ksym), GFP_KERNEL); | 177 | entry = kzalloc(sizeof(struct trace_ksym), GFP_KERNEL); |
192 | if (!entry) | 178 | if (!entry) |
193 | return -ENOMEM; | 179 | return -ENOMEM; |
@@ -203,13 +189,17 @@ int process_new_ksym_entry(char *ksymname, int op, unsigned long addr) | |||
203 | 189 | ||
204 | if (IS_ERR(entry->ksym_hbp)) { | 190 | if (IS_ERR(entry->ksym_hbp)) { |
205 | ret = PTR_ERR(entry->ksym_hbp); | 191 | ret = PTR_ERR(entry->ksym_hbp); |
206 | printk(KERN_INFO "ksym_tracer request failed. Try again" | 192 | if (ret == -ENOSPC) { |
207 | " later!!\n"); | 193 | printk(KERN_ERR "ksym_tracer: Maximum limit reached." |
194 | " No new requests for tracing can be accepted now.\n"); | ||
195 | } else { | ||
196 | printk(KERN_INFO "ksym_tracer request failed. Try again" | ||
197 | " later!!\n"); | ||
198 | } | ||
208 | goto err; | 199 | goto err; |
209 | } | 200 | } |
210 | 201 | ||
211 | hlist_add_head_rcu(&(entry->ksym_hlist), &ksym_filter_head); | 202 | hlist_add_head_rcu(&(entry->ksym_hlist), &ksym_filter_head); |
212 | ksym_filter_entry_count++; | ||
213 | 203 | ||
214 | return 0; | 204 | return 0; |
215 | 205 | ||
@@ -265,7 +255,6 @@ static void __ksym_trace_reset(void) | |||
265 | hlist_for_each_entry_safe(entry, node, node1, &ksym_filter_head, | 255 | hlist_for_each_entry_safe(entry, node, node1, &ksym_filter_head, |
266 | ksym_hlist) { | 256 | ksym_hlist) { |
267 | unregister_wide_hw_breakpoint(entry->ksym_hbp); | 257 | unregister_wide_hw_breakpoint(entry->ksym_hbp); |
268 | ksym_filter_entry_count--; | ||
269 | hlist_del_rcu(&(entry->ksym_hlist)); | 258 | hlist_del_rcu(&(entry->ksym_hlist)); |
270 | synchronize_rcu(); | 259 | synchronize_rcu(); |
271 | kfree(entry); | 260 | kfree(entry); |
@@ -338,7 +327,6 @@ static ssize_t ksym_trace_filter_write(struct file *file, | |||
338 | goto out_unlock; | 327 | goto out_unlock; |
339 | } | 328 | } |
340 | /* Error or "symbol:---" case: drop it */ | 329 | /* Error or "symbol:---" case: drop it */ |
341 | ksym_filter_entry_count--; | ||
342 | hlist_del_rcu(&(entry->ksym_hlist)); | 330 | hlist_del_rcu(&(entry->ksym_hlist)); |
343 | synchronize_rcu(); | 331 | synchronize_rcu(); |
344 | kfree(entry); | 332 | kfree(entry); |
diff --git a/kernel/trace/trace_selftest.c b/kernel/trace/trace_selftest.c index 9398034f814a..71fa771ee4d7 100644 --- a/kernel/trace/trace_selftest.c +++ b/kernel/trace/trace_selftest.c | |||
@@ -17,7 +17,6 @@ static inline int trace_valid_entry(struct trace_entry *entry) | |||
17 | case TRACE_BRANCH: | 17 | case TRACE_BRANCH: |
18 | case TRACE_GRAPH_ENT: | 18 | case TRACE_GRAPH_ENT: |
19 | case TRACE_GRAPH_RET: | 19 | case TRACE_GRAPH_RET: |
20 | case TRACE_HW_BRANCHES: | ||
21 | case TRACE_KSYM: | 20 | case TRACE_KSYM: |
22 | return 1; | 21 | return 1; |
23 | } | 22 | } |
@@ -755,62 +754,6 @@ trace_selftest_startup_branch(struct tracer *trace, struct trace_array *tr) | |||
755 | } | 754 | } |
756 | #endif /* CONFIG_BRANCH_TRACER */ | 755 | #endif /* CONFIG_BRANCH_TRACER */ |
757 | 756 | ||
758 | #ifdef CONFIG_HW_BRANCH_TRACER | ||
759 | int | ||
760 | trace_selftest_startup_hw_branches(struct tracer *trace, | ||
761 | struct trace_array *tr) | ||
762 | { | ||
763 | struct trace_iterator *iter; | ||
764 | struct tracer tracer; | ||
765 | unsigned long count; | ||
766 | int ret; | ||
767 | |||
768 | if (!trace->open) { | ||
769 | printk(KERN_CONT "missing open function..."); | ||
770 | return -1; | ||
771 | } | ||
772 | |||
773 | ret = tracer_init(trace, tr); | ||
774 | if (ret) { | ||
775 | warn_failed_init_tracer(trace, ret); | ||
776 | return ret; | ||
777 | } | ||
778 | |||
779 | /* | ||
780 | * The hw-branch tracer needs to collect the trace from the various | ||
781 | * cpu trace buffers - before tracing is stopped. | ||
782 | */ | ||
783 | iter = kzalloc(sizeof(*iter), GFP_KERNEL); | ||
784 | if (!iter) | ||
785 | return -ENOMEM; | ||
786 | |||
787 | memcpy(&tracer, trace, sizeof(tracer)); | ||
788 | |||
789 | iter->trace = &tracer; | ||
790 | iter->tr = tr; | ||
791 | iter->pos = -1; | ||
792 | mutex_init(&iter->mutex); | ||
793 | |||
794 | trace->open(iter); | ||
795 | |||
796 | mutex_destroy(&iter->mutex); | ||
797 | kfree(iter); | ||
798 | |||
799 | tracing_stop(); | ||
800 | |||
801 | ret = trace_test_buffer(tr, &count); | ||
802 | trace->reset(tr); | ||
803 | tracing_start(); | ||
804 | |||
805 | if (!ret && !count) { | ||
806 | printk(KERN_CONT "no entries found.."); | ||
807 | ret = -1; | ||
808 | } | ||
809 | |||
810 | return ret; | ||
811 | } | ||
812 | #endif /* CONFIG_HW_BRANCH_TRACER */ | ||
813 | |||
814 | #ifdef CONFIG_KSYM_TRACER | 757 | #ifdef CONFIG_KSYM_TRACER |
815 | static int ksym_selftest_dummy; | 758 | static int ksym_selftest_dummy; |
816 | 759 | ||
diff --git a/mm/mlock.c b/mm/mlock.c index 8f4e2dfceec1..3f82720e0515 100644 --- a/mm/mlock.c +++ b/mm/mlock.c | |||
@@ -607,44 +607,3 @@ void user_shm_unlock(size_t size, struct user_struct *user) | |||
607 | spin_unlock(&shmlock_user_lock); | 607 | spin_unlock(&shmlock_user_lock); |
608 | free_uid(user); | 608 | free_uid(user); |
609 | } | 609 | } |
610 | |||
611 | int account_locked_memory(struct mm_struct *mm, struct rlimit *rlim, | ||
612 | size_t size) | ||
613 | { | ||
614 | unsigned long lim, vm, pgsz; | ||
615 | int error = -ENOMEM; | ||
616 | |||
617 | pgsz = PAGE_ALIGN(size) >> PAGE_SHIFT; | ||
618 | |||
619 | down_write(&mm->mmap_sem); | ||
620 | |||
621 | lim = ACCESS_ONCE(rlim[RLIMIT_AS].rlim_cur) >> PAGE_SHIFT; | ||
622 | vm = mm->total_vm + pgsz; | ||
623 | if (lim < vm) | ||
624 | goto out; | ||
625 | |||
626 | lim = ACCESS_ONCE(rlim[RLIMIT_MEMLOCK].rlim_cur) >> PAGE_SHIFT; | ||
627 | vm = mm->locked_vm + pgsz; | ||
628 | if (lim < vm) | ||
629 | goto out; | ||
630 | |||
631 | mm->total_vm += pgsz; | ||
632 | mm->locked_vm += pgsz; | ||
633 | |||
634 | error = 0; | ||
635 | out: | ||
636 | up_write(&mm->mmap_sem); | ||
637 | return error; | ||
638 | } | ||
639 | |||
640 | void refund_locked_memory(struct mm_struct *mm, size_t size) | ||
641 | { | ||
642 | unsigned long pgsz = PAGE_ALIGN(size) >> PAGE_SHIFT; | ||
643 | |||
644 | down_write(&mm->mmap_sem); | ||
645 | |||
646 | mm->total_vm -= pgsz; | ||
647 | mm->locked_vm -= pgsz; | ||
648 | |||
649 | up_write(&mm->mmap_sem); | ||
650 | } | ||
diff --git a/tools/perf/Documentation/perf-annotate.txt b/tools/perf/Documentation/perf-annotate.txt index c9dcade06831..5164a655c39f 100644 --- a/tools/perf/Documentation/perf-annotate.txt +++ b/tools/perf/Documentation/perf-annotate.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-annotate(1) | 1 | perf-annotate(1) |
2 | ============== | 2 | ================ |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
diff --git a/tools/perf/Documentation/perf-bench.txt b/tools/perf/Documentation/perf-bench.txt index ae525ac5a2ce..a3dbadb26ef5 100644 --- a/tools/perf/Documentation/perf-bench.txt +++ b/tools/perf/Documentation/perf-bench.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-bench(1) | 1 | perf-bench(1) |
2 | ============ | 2 | ============= |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
@@ -19,12 +19,12 @@ COMMON OPTIONS | |||
19 | -f:: | 19 | -f:: |
20 | --format=:: | 20 | --format=:: |
21 | Specify format style. | 21 | Specify format style. |
22 | Current available format styles are, | 22 | Current available format styles are: |
23 | 23 | ||
24 | 'default':: | 24 | 'default':: |
25 | Default style. This is mainly for human reading. | 25 | Default style. This is mainly for human reading. |
26 | --------------------- | 26 | --------------------- |
27 | % perf bench sched pipe # with no style specify | 27 | % perf bench sched pipe # with no style specified |
28 | (executing 1000000 pipe operations between two tasks) | 28 | (executing 1000000 pipe operations between two tasks) |
29 | Total time:5.855 sec | 29 | Total time:5.855 sec |
30 | 5.855061 usecs/op | 30 | 5.855061 usecs/op |
@@ -79,7 +79,7 @@ options (20 sender and receiver processes per group) | |||
79 | 79 | ||
80 | Total time:0.308 sec | 80 | Total time:0.308 sec |
81 | 81 | ||
82 | % perf bench sched messaging -t -g 20 # be multi-thread,with 20 groups | 82 | % perf bench sched messaging -t -g 20 # be multi-thread, with 20 groups |
83 | (20 sender and receiver threads per group) | 83 | (20 sender and receiver threads per group) |
84 | (20 groups == 800 threads run) | 84 | (20 groups == 800 threads run) |
85 | 85 | ||
diff --git a/tools/perf/Documentation/perf-buildid-cache.txt b/tools/perf/Documentation/perf-buildid-cache.txt index 88bc3b519746..5d1a9500277f 100644 --- a/tools/perf/Documentation/perf-buildid-cache.txt +++ b/tools/perf/Documentation/perf-buildid-cache.txt | |||
@@ -8,7 +8,7 @@ perf-buildid-cache - Manage build-id cache. | |||
8 | SYNOPSIS | 8 | SYNOPSIS |
9 | -------- | 9 | -------- |
10 | [verse] | 10 | [verse] |
11 | 'perf buildid-list <options>' | 11 | 'perf buildid-cache <options>' |
12 | 12 | ||
13 | DESCRIPTION | 13 | DESCRIPTION |
14 | ----------- | 14 | ----------- |
@@ -30,4 +30,4 @@ OPTIONS | |||
30 | 30 | ||
31 | SEE ALSO | 31 | SEE ALSO |
32 | -------- | 32 | -------- |
33 | linkperf:perf-record[1], linkperf:perf-report[1] | 33 | linkperf:perf-record[1], linkperf:perf-report[1], linkperf:perf-buildid-list[1] |
diff --git a/tools/perf/Documentation/perf-diff.txt b/tools/perf/Documentation/perf-diff.txt index 8974e208cba6..20d97d84ea1c 100644 --- a/tools/perf/Documentation/perf-diff.txt +++ b/tools/perf/Documentation/perf-diff.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-diff(1) | 1 | perf-diff(1) |
2 | ============== | 2 | ============ |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
diff --git a/tools/perf/Documentation/perf-inject.txt b/tools/perf/Documentation/perf-inject.txt new file mode 100644 index 000000000000..025630d43cd2 --- /dev/null +++ b/tools/perf/Documentation/perf-inject.txt | |||
@@ -0,0 +1,35 @@ | |||
1 | perf-inject(1) | ||
2 | ============== | ||
3 | |||
4 | NAME | ||
5 | ---- | ||
6 | perf-inject - Filter to augment the events stream with additional information | ||
7 | |||
8 | SYNOPSIS | ||
9 | -------- | ||
10 | [verse] | ||
11 | 'perf inject <options>' | ||
12 | |||
13 | DESCRIPTION | ||
14 | ----------- | ||
15 | perf-inject reads a perf-record event stream and repipes it to stdout. At any | ||
16 | point the processing code can inject other events into the event stream - in | ||
17 | this case build-ids (-b option) are read and injected as needed into the event | ||
18 | stream. | ||
19 | |||
20 | Build-ids are just the first user of perf-inject - potentially anything that | ||
21 | needs userspace processing to augment the events stream with additional | ||
22 | information could make use of this facility. | ||
23 | |||
24 | OPTIONS | ||
25 | ------- | ||
26 | -b:: | ||
27 | --build-ids=:: | ||
28 | Inject build-ids into the output stream | ||
29 | -v:: | ||
30 | --verbose:: | ||
31 | Be more verbose. | ||
32 | |||
33 | SEE ALSO | ||
34 | -------- | ||
35 | linkperf:perf-record[1], linkperf:perf-report[1], linkperf:perf-archive[1] | ||
diff --git a/tools/perf/Documentation/perf-kmem.txt b/tools/perf/Documentation/perf-kmem.txt index eac4d852e7cd..a52fcde894c7 100644 --- a/tools/perf/Documentation/perf-kmem.txt +++ b/tools/perf/Documentation/perf-kmem.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-kmem(1) | 1 | perf-kmem(1) |
2 | ============== | 2 | ============ |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
diff --git a/tools/perf/Documentation/perf-kvm.txt b/tools/perf/Documentation/perf-kvm.txt new file mode 100644 index 000000000000..d004e19fe6d6 --- /dev/null +++ b/tools/perf/Documentation/perf-kvm.txt | |||
@@ -0,0 +1,68 @@ | |||
1 | perf-kvm(1) | ||
2 | =========== | ||
3 | |||
4 | NAME | ||
5 | ---- | ||
6 | perf-kvm - Tool to trace/measure kvm guest os | ||
7 | |||
8 | SYNOPSIS | ||
9 | -------- | ||
10 | [verse] | ||
11 | 'perf kvm' [--host] [--guest] [--guestmount=<path> | ||
12 | [--guestkallsyms=<path> --guestmodules=<path> | --guestvmlinux=<path>]] | ||
13 | {top|record|report|diff|buildid-list} | ||
14 | 'perf kvm' [--host] [--guest] [--guestkallsyms=<path> --guestmodules=<path> | ||
15 | | --guestvmlinux=<path>] {top|record|report|diff|buildid-list} | ||
16 | |||
17 | DESCRIPTION | ||
18 | ----------- | ||
19 | There are a couple of variants of perf kvm: | ||
20 | |||
21 | 'perf kvm [options] top <command>' to generates and displays | ||
22 | a performance counter profile of guest os in realtime | ||
23 | of an arbitrary workload. | ||
24 | |||
25 | 'perf kvm record <command>' to record the performance couinter profile | ||
26 | of an arbitrary workload and save it into a perf data file. If both | ||
27 | --host and --guest are input, the perf data file name is perf.data.kvm. | ||
28 | If there is no --host but --guest, the file name is perf.data.guest. | ||
29 | If there is no --guest but --host, the file name is perf.data.host. | ||
30 | |||
31 | 'perf kvm report' to display the performance counter profile information | ||
32 | recorded via perf kvm record. | ||
33 | |||
34 | 'perf kvm diff' to displays the performance difference amongst two perf.data | ||
35 | files captured via perf record. | ||
36 | |||
37 | 'perf kvm buildid-list' to display the buildids found in a perf data file, | ||
38 | so that other tools can be used to fetch packages with matching symbol tables | ||
39 | for use by perf report. | ||
40 | |||
41 | OPTIONS | ||
42 | ------- | ||
43 | --host=:: | ||
44 | Collect host side performance profile. | ||
45 | --guest=:: | ||
46 | Collect guest side performance profile. | ||
47 | --guestmount=<path>:: | ||
48 | Guest os root file system mount directory. Users mounts guest os | ||
49 | root directories under <path> by a specific filesystem access method, | ||
50 | typically, sshfs. For example, start 2 guest os. The one's pid is 8888 | ||
51 | and the other's is 9999. | ||
52 | #mkdir ~/guestmount; cd ~/guestmount | ||
53 | #sshfs -o allow_other,direct_io -p 5551 localhost:/ 8888/ | ||
54 | #sshfs -o allow_other,direct_io -p 5552 localhost:/ 9999/ | ||
55 | #perf kvm --host --guest --guestmount=~/guestmount top | ||
56 | --guestkallsyms=<path>:: | ||
57 | Guest os /proc/kallsyms file copy. 'perf' kvm' reads it to get guest | ||
58 | kernel symbols. Users copy it out from guest os. | ||
59 | --guestmodules=<path>:: | ||
60 | Guest os /proc/modules file copy. 'perf' kvm' reads it to get guest | ||
61 | kernel module information. Users copy it out from guest os. | ||
62 | --guestvmlinux=<path>:: | ||
63 | Guest os kernel vmlinux. | ||
64 | |||
65 | SEE ALSO | ||
66 | -------- | ||
67 | linkperf:perf-top[1], linkperf:perf-record[1], linkperf:perf-report[1], | ||
68 | linkperf:perf-diff[1], linkperf:perf-buildid-list[1] | ||
diff --git a/tools/perf/Documentation/perf-list.txt b/tools/perf/Documentation/perf-list.txt index 8290b9422668..43e3dd284b90 100644 --- a/tools/perf/Documentation/perf-list.txt +++ b/tools/perf/Documentation/perf-list.txt | |||
@@ -15,6 +15,35 @@ DESCRIPTION | |||
15 | This command displays the symbolic event types which can be selected in the | 15 | This command displays the symbolic event types which can be selected in the |
16 | various perf commands with the -e option. | 16 | various perf commands with the -e option. |
17 | 17 | ||
18 | RAW HARDWARE EVENT DESCRIPTOR | ||
19 | ----------------------------- | ||
20 | Even when an event is not available in a symbolic form within perf right now, | ||
21 | it can be encoded in a per processor specific way. | ||
22 | |||
23 | For instance For x86 CPUs NNN represents the raw register encoding with the | ||
24 | layout of IA32_PERFEVTSELx MSRs (see [Intel® 64 and IA-32 Architectures Software Developer's Manual Volume 3B: System Programming Guide] Figure 30-1 Layout | ||
25 | of IA32_PERFEVTSELx MSRs) or AMD's PerfEvtSeln (see [AMD64 Architecture Programmer’s Manual Volume 2: System Programming], Page 344, | ||
26 | Figure 13-7 Performance Event-Select Register (PerfEvtSeln)). | ||
27 | |||
28 | Example: | ||
29 | |||
30 | If the Intel docs for a QM720 Core i7 describe an event as: | ||
31 | |||
32 | Event Umask Event Mask | ||
33 | Num. Value Mnemonic Description Comment | ||
34 | |||
35 | A8H 01H LSD.UOPS Counts the number of micro-ops Use cmask=1 and | ||
36 | delivered by loop stream detector invert to count | ||
37 | cycles | ||
38 | |||
39 | raw encoding of 0x1A8 can be used: | ||
40 | |||
41 | perf stat -e r1a8 -a sleep 1 | ||
42 | perf record -e r1a8 ... | ||
43 | |||
44 | You should refer to the processor specific documentation for getting these | ||
45 | details. Some of them are referenced in the SEE ALSO section below. | ||
46 | |||
18 | OPTIONS | 47 | OPTIONS |
19 | ------- | 48 | ------- |
20 | None | 49 | None |
@@ -22,4 +51,6 @@ None | |||
22 | SEE ALSO | 51 | SEE ALSO |
23 | -------- | 52 | -------- |
24 | linkperf:perf-stat[1], linkperf:perf-top[1], | 53 | linkperf:perf-stat[1], linkperf:perf-top[1], |
25 | linkperf:perf-record[1] | 54 | linkperf:perf-record[1], |
55 | http://www.intel.com/Assets/PDF/manual/253669.pdf[Intel® 64 and IA-32 Architectures Software Developer's Manual Volume 3B: System Programming Guide], | ||
56 | http://support.amd.com/us/Processor_TechDocs/24593.pdf[AMD64 Architecture Programmer’s Manual Volume 2: System Programming] | ||
diff --git a/tools/perf/Documentation/perf-probe.txt b/tools/perf/Documentation/perf-probe.txt index 34202b1be0bb..94a258c96a44 100644 --- a/tools/perf/Documentation/perf-probe.txt +++ b/tools/perf/Documentation/perf-probe.txt | |||
@@ -57,6 +57,14 @@ OPTIONS | |||
57 | --force:: | 57 | --force:: |
58 | Forcibly add events with existing name. | 58 | Forcibly add events with existing name. |
59 | 59 | ||
60 | -n:: | ||
61 | --dry-run:: | ||
62 | Dry run. With this option, --add and --del doesn't execute actual | ||
63 | adding and removal operations. | ||
64 | |||
65 | --max-probes:: | ||
66 | Set the maximum number of probe points for an event. Default is 128. | ||
67 | |||
60 | PROBE SYNTAX | 68 | PROBE SYNTAX |
61 | ------------ | 69 | ------------ |
62 | Probe points are defined by following syntax. | 70 | Probe points are defined by following syntax. |
@@ -74,13 +82,22 @@ Probe points are defined by following syntax. | |||
74 | 'EVENT' specifies the name of new event, if omitted, it will be set the name of the probed function. Currently, event group name is set as 'probe'. | 82 | 'EVENT' specifies the name of new event, if omitted, it will be set the name of the probed function. Currently, event group name is set as 'probe'. |
75 | 'FUNC' specifies a probed function name, and it may have one of the following options; '+OFFS' is the offset from function entry address in bytes, ':RLN' is the relative-line number from function entry line, and '%return' means that it probes function return. And ';PTN' means lazy matching pattern (see LAZY MATCHING). Note that ';PTN' must be the end of the probe point definition. In addition, '@SRC' specifies a source file which has that function. | 83 | 'FUNC' specifies a probed function name, and it may have one of the following options; '+OFFS' is the offset from function entry address in bytes, ':RLN' is the relative-line number from function entry line, and '%return' means that it probes function return. And ';PTN' means lazy matching pattern (see LAZY MATCHING). Note that ';PTN' must be the end of the probe point definition. In addition, '@SRC' specifies a source file which has that function. |
76 | It is also possible to specify a probe point by the source line number or lazy matching by using 'SRC:ALN' or 'SRC;PTN' syntax, where 'SRC' is the source file path, ':ALN' is the line number and ';PTN' is the lazy matching pattern. | 84 | It is also possible to specify a probe point by the source line number or lazy matching by using 'SRC:ALN' or 'SRC;PTN' syntax, where 'SRC' is the source file path, ':ALN' is the line number and ';PTN' is the lazy matching pattern. |
77 | 'ARG' specifies the arguments of this probe point. You can use the name of local variable, or kprobe-tracer argument format (e.g. $retval, %ax, etc). | 85 | 'ARG' specifies the arguments of this probe point, (see PROBE ARGUMENT). |
86 | |||
87 | PROBE ARGUMENT | ||
88 | -------------- | ||
89 | Each probe argument follows below syntax. | ||
90 | |||
91 | [NAME=]LOCALVAR|$retval|%REG|@SYMBOL[:TYPE] | ||
92 | |||
93 | 'NAME' specifies the name of this argument (optional). You can use the name of local variable, local data structure member (e.g. var->field, var.field2), or kprobe-tracer argument format (e.g. $retval, %ax, etc). Note that the name of this argument will be set as the last member name if you specify a local data structure member (e.g. field2 for 'var->field1.field2'.) | ||
94 | 'TYPE' casts the type of this argument (optional). If omitted, perf probe automatically set the type based on debuginfo. | ||
78 | 95 | ||
79 | LINE SYNTAX | 96 | LINE SYNTAX |
80 | ----------- | 97 | ----------- |
81 | Line range is descripted by following syntax. | 98 | Line range is descripted by following syntax. |
82 | 99 | ||
83 | "FUNC[:RLN[+NUM|:RLN2]]|SRC:ALN[+NUM|:ALN2]" | 100 | "FUNC[:RLN[+NUM|-RLN2]]|SRC:ALN[+NUM|-ALN2]" |
84 | 101 | ||
85 | FUNC specifies the function name of showing lines. 'RLN' is the start line | 102 | FUNC specifies the function name of showing lines. 'RLN' is the start line |
86 | number from function entry line, and 'RLN2' is the end line number. As same as | 103 | number from function entry line, and 'RLN2' is the end line number. As same as |
diff --git a/tools/perf/Documentation/perf-record.txt b/tools/perf/Documentation/perf-record.txt index fc46c0b40f6e..34e255fc3e2f 100644 --- a/tools/perf/Documentation/perf-record.txt +++ b/tools/perf/Documentation/perf-record.txt | |||
@@ -58,7 +58,7 @@ OPTIONS | |||
58 | 58 | ||
59 | -f:: | 59 | -f:: |
60 | --force:: | 60 | --force:: |
61 | Overwrite existing data file. | 61 | Overwrite existing data file. (deprecated) |
62 | 62 | ||
63 | -c:: | 63 | -c:: |
64 | --count=:: | 64 | --count=:: |
@@ -69,8 +69,8 @@ OPTIONS | |||
69 | Output file name. | 69 | Output file name. |
70 | 70 | ||
71 | -i:: | 71 | -i:: |
72 | --inherit:: | 72 | --no-inherit:: |
73 | Child tasks inherit counters. | 73 | Child tasks do not inherit counters. |
74 | -F:: | 74 | -F:: |
75 | --freq=:: | 75 | --freq=:: |
76 | Profile at this frequency. | 76 | Profile at this frequency. |
@@ -101,7 +101,7 @@ OPTIONS | |||
101 | 101 | ||
102 | -R:: | 102 | -R:: |
103 | --raw-samples:: | 103 | --raw-samples:: |
104 | Collect raw sample records from all opened counters (typically for tracepoint counters). | 104 | Collect raw sample records from all opened counters (default for tracepoint counters). |
105 | 105 | ||
106 | SEE ALSO | 106 | SEE ALSO |
107 | -------- | 107 | -------- |
diff --git a/tools/perf/Documentation/perf-sched.txt b/tools/perf/Documentation/perf-sched.txt index 1ce79198997b..8417644a6166 100644 --- a/tools/perf/Documentation/perf-sched.txt +++ b/tools/perf/Documentation/perf-sched.txt | |||
@@ -12,7 +12,7 @@ SYNOPSIS | |||
12 | 12 | ||
13 | DESCRIPTION | 13 | DESCRIPTION |
14 | ----------- | 14 | ----------- |
15 | There's four variants of perf sched: | 15 | There are four variants of perf sched: |
16 | 16 | ||
17 | 'perf sched record <command>' to record the scheduling events | 17 | 'perf sched record <command>' to record the scheduling events |
18 | of an arbitrary workload. | 18 | of an arbitrary workload. |
@@ -27,7 +27,7 @@ There's four variants of perf sched: | |||
27 | via perf sched record. (this is done by starting up mockup threads | 27 | via perf sched record. (this is done by starting up mockup threads |
28 | that mimic the workload based on the events in the trace. These | 28 | that mimic the workload based on the events in the trace. These |
29 | threads can then replay the timings (CPU runtime and sleep patterns) | 29 | threads can then replay the timings (CPU runtime and sleep patterns) |
30 | of the workload as it occured when it was recorded - and can repeat | 30 | of the workload as it occurred when it was recorded - and can repeat |
31 | it a number of times, measuring its performance.) | 31 | it a number of times, measuring its performance.) |
32 | 32 | ||
33 | OPTIONS | 33 | OPTIONS |
diff --git a/tools/perf/Documentation/perf-stat.txt b/tools/perf/Documentation/perf-stat.txt index 484080dd5b6f..2cab8e8c33d0 100644 --- a/tools/perf/Documentation/perf-stat.txt +++ b/tools/perf/Documentation/perf-stat.txt | |||
@@ -31,8 +31,8 @@ OPTIONS | |||
31 | hexadecimal event descriptor. | 31 | hexadecimal event descriptor. |
32 | 32 | ||
33 | -i:: | 33 | -i:: |
34 | --inherit:: | 34 | --no-inherit:: |
35 | child tasks inherit counters | 35 | child tasks do not inherit counters |
36 | -p:: | 36 | -p:: |
37 | --pid=<pid>:: | 37 | --pid=<pid>:: |
38 | stat events on existing pid | 38 | stat events on existing pid |
diff --git a/tools/perf/Documentation/perf-test.txt b/tools/perf/Documentation/perf-test.txt new file mode 100644 index 000000000000..1c4b5f5b7f71 --- /dev/null +++ b/tools/perf/Documentation/perf-test.txt | |||
@@ -0,0 +1,22 @@ | |||
1 | perf-test(1) | ||
2 | ============ | ||
3 | |||
4 | NAME | ||
5 | ---- | ||
6 | perf-test - Runs sanity tests. | ||
7 | |||
8 | SYNOPSIS | ||
9 | -------- | ||
10 | [verse] | ||
11 | 'perf test <options>' | ||
12 | |||
13 | DESCRIPTION | ||
14 | ----------- | ||
15 | This command does assorted sanity tests, initially thru linked routines but | ||
16 | also will look for a directory with more tests in the form of scripts. | ||
17 | |||
18 | OPTIONS | ||
19 | ------- | ||
20 | -v:: | ||
21 | --verbose:: | ||
22 | Be more verbose. | ||
diff --git a/tools/perf/Documentation/perf-trace-perl.txt b/tools/perf/Documentation/perf-trace-perl.txt index d729cee8d987..ee6525ee6d69 100644 --- a/tools/perf/Documentation/perf-trace-perl.txt +++ b/tools/perf/Documentation/perf-trace-perl.txt | |||
@@ -49,12 +49,10 @@ available as calls back into the perf executable (see below). | |||
49 | As an example, the following perf record command can be used to record | 49 | As an example, the following perf record command can be used to record |
50 | all sched_wakeup events in the system: | 50 | all sched_wakeup events in the system: |
51 | 51 | ||
52 | # perf record -c 1 -f -a -M -R -e sched:sched_wakeup | 52 | # perf record -a -e sched:sched_wakeup |
53 | 53 | ||
54 | Traces meant to be processed using a script should be recorded with | 54 | Traces meant to be processed using a script should be recorded with |
55 | the above options: -c 1 says to sample every event, -a to enable | 55 | the above option: -a to enable system-wide collection. |
56 | system-wide collection, -M to multiplex the output, and -R to collect | ||
57 | raw samples. | ||
58 | 56 | ||
59 | The format file for the sched_wakep event defines the following fields | 57 | The format file for the sched_wakep event defines the following fields |
60 | (see /sys/kernel/debug/tracing/events/sched/sched_wakeup/format): | 58 | (see /sys/kernel/debug/tracing/events/sched/sched_wakeup/format): |
diff --git a/tools/perf/Documentation/perf-trace-python.txt b/tools/perf/Documentation/perf-trace-python.txt index a241aca77184..693be804dd3d 100644 --- a/tools/perf/Documentation/perf-trace-python.txt +++ b/tools/perf/Documentation/perf-trace-python.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-trace-python(1) | 1 | perf-trace-python(1) |
2 | ================== | 2 | ==================== |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
@@ -93,7 +93,7 @@ don't care how it exited, so we'll use 'perf record' to record only | |||
93 | the sys_enter events: | 93 | the sys_enter events: |
94 | 94 | ||
95 | ---- | 95 | ---- |
96 | # perf record -c 1 -f -a -M -R -e raw_syscalls:sys_enter | 96 | # perf record -a -e raw_syscalls:sys_enter |
97 | 97 | ||
98 | ^C[ perf record: Woken up 1 times to write data ] | 98 | ^C[ perf record: Woken up 1 times to write data ] |
99 | [ perf record: Captured and wrote 56.545 MB perf.data (~2470503 samples) ] | 99 | [ perf record: Captured and wrote 56.545 MB perf.data (~2470503 samples) ] |
@@ -182,7 +182,7 @@ mean either that the record step recorded event types that it wasn't | |||
182 | really interested in, or the script was run against a trace file that | 182 | really interested in, or the script was run against a trace file that |
183 | doesn't correspond to the script. | 183 | doesn't correspond to the script. |
184 | 184 | ||
185 | The script generated by -g option option simply prints a line for each | 185 | The script generated by -g option simply prints a line for each |
186 | event found in the trace stream i.e. it basically just dumps the event | 186 | event found in the trace stream i.e. it basically just dumps the event |
187 | and its parameter values to stdout. The print_header() function is | 187 | and its parameter values to stdout. The print_header() function is |
188 | simply a utility function used for that purpose. Let's rename the | 188 | simply a utility function used for that purpose. Let's rename the |
@@ -359,7 +359,7 @@ your script: | |||
359 | # cat kernel-source/tools/perf/scripts/python/bin/syscall-counts-record | 359 | # cat kernel-source/tools/perf/scripts/python/bin/syscall-counts-record |
360 | 360 | ||
361 | #!/bin/bash | 361 | #!/bin/bash |
362 | perf record -c 1 -f -a -M -R -e raw_syscalls:sys_enter | 362 | perf record -a -e raw_syscalls:sys_enter |
363 | ---- | 363 | ---- |
364 | 364 | ||
365 | The 'report' script is also a shell script with the same base name as | 365 | The 'report' script is also a shell script with the same base name as |
@@ -449,12 +449,10 @@ available as calls back into the perf executable (see below). | |||
449 | As an example, the following perf record command can be used to record | 449 | As an example, the following perf record command can be used to record |
450 | all sched_wakeup events in the system: | 450 | all sched_wakeup events in the system: |
451 | 451 | ||
452 | # perf record -c 1 -f -a -M -R -e sched:sched_wakeup | 452 | # perf record -a -e sched:sched_wakeup |
453 | 453 | ||
454 | Traces meant to be processed using a script should be recorded with | 454 | Traces meant to be processed using a script should be recorded with |
455 | the above options: -c 1 says to sample every event, -a to enable | 455 | the above option: -a to enable system-wide collection. |
456 | system-wide collection, -M to multiplex the output, and -R to collect | ||
457 | raw samples. | ||
458 | 456 | ||
459 | The format file for the sched_wakep event defines the following fields | 457 | The format file for the sched_wakep event defines the following fields |
460 | (see /sys/kernel/debug/tracing/events/sched/sched_wakeup/format): | 458 | (see /sys/kernel/debug/tracing/events/sched/sched_wakeup/format): |
@@ -584,7 +582,7 @@ files: | |||
584 | flag_str(event_name, field_name, field_value) - returns the string represention corresponding to field_value for the flag field field_name of event event_name | 582 | flag_str(event_name, field_name, field_value) - returns the string represention corresponding to field_value for the flag field field_name of event event_name |
585 | symbol_str(event_name, field_name, field_value) - returns the string represention corresponding to field_value for the symbolic field field_name of event event_name | 583 | symbol_str(event_name, field_name, field_value) - returns the string represention corresponding to field_value for the symbolic field field_name of event event_name |
586 | 584 | ||
587 | The *autodict* function returns a special special kind of Python | 585 | The *autodict* function returns a special kind of Python |
588 | dictionary that implements Perl's 'autovivifying' hashes in Python | 586 | dictionary that implements Perl's 'autovivifying' hashes in Python |
589 | i.e. with autovivifying hashes, you can assign nested hash values | 587 | i.e. with autovivifying hashes, you can assign nested hash values |
590 | without having to go to the trouble of creating intermediate levels if | 588 | without having to go to the trouble of creating intermediate levels if |
diff --git a/tools/perf/Documentation/perf-trace.txt b/tools/perf/Documentation/perf-trace.txt index 8879299cd9df..122ec9dc4853 100644 --- a/tools/perf/Documentation/perf-trace.txt +++ b/tools/perf/Documentation/perf-trace.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-trace(1) | 1 | perf-trace(1) |
2 | ============== | 2 | ============= |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
diff --git a/tools/perf/Makefile b/tools/perf/Makefile index bc0f670a8338..3d8f31ed771d 100644 --- a/tools/perf/Makefile +++ b/tools/perf/Makefile | |||
@@ -1,3 +1,7 @@ | |||
1 | ifeq ("$(origin O)", "command line") | ||
2 | OUTPUT := $(O)/ | ||
3 | endif | ||
4 | |||
1 | # The default target of this Makefile is... | 5 | # The default target of this Makefile is... |
2 | all:: | 6 | all:: |
3 | 7 | ||
@@ -150,10 +154,17 @@ all:: | |||
150 | # Define LDFLAGS=-static to build a static binary. | 154 | # Define LDFLAGS=-static to build a static binary. |
151 | # | 155 | # |
152 | # Define EXTRA_CFLAGS=-m64 or EXTRA_CFLAGS=-m32 as appropriate for cross-builds. | 156 | # Define EXTRA_CFLAGS=-m64 or EXTRA_CFLAGS=-m32 as appropriate for cross-builds. |
157 | # | ||
158 | # Define NO_DWARF if you do not want debug-info analysis feature at all. | ||
153 | 159 | ||
154 | PERF-VERSION-FILE: .FORCE-PERF-VERSION-FILE | 160 | $(shell sh -c 'mkdir -p $(OUTPUT)scripts/python/Perf-Trace-Util/' 2> /dev/null) |
155 | @$(SHELL_PATH) util/PERF-VERSION-GEN | 161 | $(shell sh -c 'mkdir -p $(OUTPUT)scripts/perl/Perf-Trace-Util/' 2> /dev/null) |
156 | -include PERF-VERSION-FILE | 162 | $(shell sh -c 'mkdir -p $(OUTPUT)util/scripting-engines/' 2> /dev/null) |
163 | $(shell sh -c 'mkdir $(OUTPUT)bench' 2> /dev/null) | ||
164 | |||
165 | $(OUTPUT)PERF-VERSION-FILE: .FORCE-PERF-VERSION-FILE | ||
166 | @$(SHELL_PATH) util/PERF-VERSION-GEN $(OUTPUT) | ||
167 | -include $(OUTPUT)PERF-VERSION-FILE | ||
157 | 168 | ||
158 | uname_S := $(shell sh -c 'uname -s 2>/dev/null || echo not') | 169 | uname_S := $(shell sh -c 'uname -s 2>/dev/null || echo not') |
159 | uname_M := $(shell sh -c 'uname -m 2>/dev/null || echo not') | 170 | uname_M := $(shell sh -c 'uname -m 2>/dev/null || echo not') |
@@ -162,6 +173,22 @@ uname_R := $(shell sh -c 'uname -r 2>/dev/null || echo not') | |||
162 | uname_P := $(shell sh -c 'uname -p 2>/dev/null || echo not') | 173 | uname_P := $(shell sh -c 'uname -p 2>/dev/null || echo not') |
163 | uname_V := $(shell sh -c 'uname -v 2>/dev/null || echo not') | 174 | uname_V := $(shell sh -c 'uname -v 2>/dev/null || echo not') |
164 | 175 | ||
176 | ARCH ?= $(shell echo $(uname_M) | sed -e s/i.86/i386/ -e s/sun4u/sparc64/ \ | ||
177 | -e s/arm.*/arm/ -e s/sa110/arm/ \ | ||
178 | -e s/s390x/s390/ -e s/parisc64/parisc/ \ | ||
179 | -e s/ppc.*/powerpc/ -e s/mips.*/mips/ \ | ||
180 | -e s/sh[234].*/sh/ ) | ||
181 | |||
182 | # Additional ARCH settings for x86 | ||
183 | ifeq ($(ARCH),i386) | ||
184 | ARCH := x86 | ||
185 | endif | ||
186 | ifeq ($(ARCH),x86_64) | ||
187 | ARCH := x86 | ||
188 | endif | ||
189 | |||
190 | $(shell sh -c 'mkdir -p $(OUTPUT)arch/$(ARCH)/util/' 2> /dev/null) | ||
191 | |||
165 | # CFLAGS and LDFLAGS are for the users to override from the command line. | 192 | # CFLAGS and LDFLAGS are for the users to override from the command line. |
166 | 193 | ||
167 | # | 194 | # |
@@ -274,7 +301,7 @@ endif | |||
274 | # Those must not be GNU-specific; they are shared with perl/ which may | 301 | # Those must not be GNU-specific; they are shared with perl/ which may |
275 | # be built by a different compiler. (Note that this is an artifact now | 302 | # be built by a different compiler. (Note that this is an artifact now |
276 | # but it still might be nice to keep that distinction.) | 303 | # but it still might be nice to keep that distinction.) |
277 | BASIC_CFLAGS = -Iutil/include | 304 | BASIC_CFLAGS = -Iutil/include -Iarch/$(ARCH)/include |
278 | BASIC_LDFLAGS = | 305 | BASIC_LDFLAGS = |
279 | 306 | ||
280 | # Guard against environment variables | 307 | # Guard against environment variables |
@@ -308,7 +335,7 @@ PROGRAMS += $(EXTRA_PROGRAMS) | |||
308 | # | 335 | # |
309 | # Single 'perf' binary right now: | 336 | # Single 'perf' binary right now: |
310 | # | 337 | # |
311 | PROGRAMS += perf | 338 | PROGRAMS += $(OUTPUT)perf |
312 | 339 | ||
313 | # List built-in command $C whose implementation cmd_$C() is not in | 340 | # List built-in command $C whose implementation cmd_$C() is not in |
314 | # builtin-$C.o but is linked in as part of some other command. | 341 | # builtin-$C.o but is linked in as part of some other command. |
@@ -318,7 +345,7 @@ PROGRAMS += perf | |||
318 | ALL_PROGRAMS = $(PROGRAMS) $(SCRIPTS) | 345 | ALL_PROGRAMS = $(PROGRAMS) $(SCRIPTS) |
319 | 346 | ||
320 | # what 'all' will build but not install in perfexecdir | 347 | # what 'all' will build but not install in perfexecdir |
321 | OTHER_PROGRAMS = perf$X | 348 | OTHER_PROGRAMS = $(OUTPUT)perf$X |
322 | 349 | ||
323 | # Set paths to tools early so that they can be used for version tests. | 350 | # Set paths to tools early so that they can be used for version tests. |
324 | ifndef SHELL_PATH | 351 | ifndef SHELL_PATH |
@@ -330,7 +357,7 @@ endif | |||
330 | 357 | ||
331 | export PERL_PATH | 358 | export PERL_PATH |
332 | 359 | ||
333 | LIB_FILE=libperf.a | 360 | LIB_FILE=$(OUTPUT)libperf.a |
334 | 361 | ||
335 | LIB_H += ../../include/linux/perf_event.h | 362 | LIB_H += ../../include/linux/perf_event.h |
336 | LIB_H += ../../include/linux/rbtree.h | 363 | LIB_H += ../../include/linux/rbtree.h |
@@ -350,12 +377,13 @@ LIB_H += util/include/linux/rbtree.h | |||
350 | LIB_H += util/include/linux/string.h | 377 | LIB_H += util/include/linux/string.h |
351 | LIB_H += util/include/linux/types.h | 378 | LIB_H += util/include/linux/types.h |
352 | LIB_H += util/include/asm/asm-offsets.h | 379 | LIB_H += util/include/asm/asm-offsets.h |
353 | LIB_H += util/include/asm/bitops.h | ||
354 | LIB_H += util/include/asm/bug.h | 380 | LIB_H += util/include/asm/bug.h |
355 | LIB_H += util/include/asm/byteorder.h | 381 | LIB_H += util/include/asm/byteorder.h |
382 | LIB_H += util/include/asm/hweight.h | ||
356 | LIB_H += util/include/asm/swab.h | 383 | LIB_H += util/include/asm/swab.h |
357 | LIB_H += util/include/asm/system.h | 384 | LIB_H += util/include/asm/system.h |
358 | LIB_H += util/include/asm/uaccess.h | 385 | LIB_H += util/include/asm/uaccess.h |
386 | LIB_H += util/include/dwarf-regs.h | ||
359 | LIB_H += perf.h | 387 | LIB_H += perf.h |
360 | LIB_H += util/cache.h | 388 | LIB_H += util/cache.h |
361 | LIB_H += util/callchain.h | 389 | LIB_H += util/callchain.h |
@@ -375,7 +403,6 @@ LIB_H += util/header.h | |||
375 | LIB_H += util/help.h | 403 | LIB_H += util/help.h |
376 | LIB_H += util/session.h | 404 | LIB_H += util/session.h |
377 | LIB_H += util/strbuf.h | 405 | LIB_H += util/strbuf.h |
378 | LIB_H += util/string.h | ||
379 | LIB_H += util/strlist.h | 406 | LIB_H += util/strlist.h |
380 | LIB_H += util/svghelper.h | 407 | LIB_H += util/svghelper.h |
381 | LIB_H += util/run-command.h | 408 | LIB_H += util/run-command.h |
@@ -389,79 +416,83 @@ LIB_H += util/thread.h | |||
389 | LIB_H += util/trace-event.h | 416 | LIB_H += util/trace-event.h |
390 | LIB_H += util/probe-finder.h | 417 | LIB_H += util/probe-finder.h |
391 | LIB_H += util/probe-event.h | 418 | LIB_H += util/probe-event.h |
419 | LIB_H += util/pstack.h | ||
392 | LIB_H += util/cpumap.h | 420 | LIB_H += util/cpumap.h |
393 | 421 | ||
394 | LIB_OBJS += util/abspath.o | 422 | LIB_OBJS += $(OUTPUT)util/abspath.o |
395 | LIB_OBJS += util/alias.o | 423 | LIB_OBJS += $(OUTPUT)util/alias.o |
396 | LIB_OBJS += util/build-id.o | 424 | LIB_OBJS += $(OUTPUT)util/build-id.o |
397 | LIB_OBJS += util/config.o | 425 | LIB_OBJS += $(OUTPUT)util/config.o |
398 | LIB_OBJS += util/ctype.o | 426 | LIB_OBJS += $(OUTPUT)util/ctype.o |
399 | LIB_OBJS += util/debugfs.o | 427 | LIB_OBJS += $(OUTPUT)util/debugfs.o |
400 | LIB_OBJS += util/environment.o | 428 | LIB_OBJS += $(OUTPUT)util/environment.o |
401 | LIB_OBJS += util/event.o | 429 | LIB_OBJS += $(OUTPUT)util/event.o |
402 | LIB_OBJS += util/exec_cmd.o | 430 | LIB_OBJS += $(OUTPUT)util/exec_cmd.o |
403 | LIB_OBJS += util/help.o | 431 | LIB_OBJS += $(OUTPUT)util/help.o |
404 | LIB_OBJS += util/levenshtein.o | 432 | LIB_OBJS += $(OUTPUT)util/levenshtein.o |
405 | LIB_OBJS += util/parse-options.o | 433 | LIB_OBJS += $(OUTPUT)util/parse-options.o |
406 | LIB_OBJS += util/parse-events.o | 434 | LIB_OBJS += $(OUTPUT)util/parse-events.o |
407 | LIB_OBJS += util/path.o | 435 | LIB_OBJS += $(OUTPUT)util/path.o |
408 | LIB_OBJS += util/rbtree.o | 436 | LIB_OBJS += $(OUTPUT)util/rbtree.o |
409 | LIB_OBJS += util/bitmap.o | 437 | LIB_OBJS += $(OUTPUT)util/bitmap.o |
410 | LIB_OBJS += util/hweight.o | 438 | LIB_OBJS += $(OUTPUT)util/hweight.o |
411 | LIB_OBJS += util/find_next_bit.o | 439 | LIB_OBJS += $(OUTPUT)util/run-command.o |
412 | LIB_OBJS += util/run-command.o | 440 | LIB_OBJS += $(OUTPUT)util/quote.o |
413 | LIB_OBJS += util/quote.o | 441 | LIB_OBJS += $(OUTPUT)util/strbuf.o |
414 | LIB_OBJS += util/strbuf.o | 442 | LIB_OBJS += $(OUTPUT)util/string.o |
415 | LIB_OBJS += util/string.o | 443 | LIB_OBJS += $(OUTPUT)util/strlist.o |
416 | LIB_OBJS += util/strlist.o | 444 | LIB_OBJS += $(OUTPUT)util/usage.o |
417 | LIB_OBJS += util/usage.o | 445 | LIB_OBJS += $(OUTPUT)util/wrapper.o |
418 | LIB_OBJS += util/wrapper.o | 446 | LIB_OBJS += $(OUTPUT)util/sigchain.o |
419 | LIB_OBJS += util/sigchain.o | 447 | LIB_OBJS += $(OUTPUT)util/symbol.o |
420 | LIB_OBJS += util/symbol.o | 448 | LIB_OBJS += $(OUTPUT)util/color.o |
421 | LIB_OBJS += util/color.o | 449 | LIB_OBJS += $(OUTPUT)util/pager.o |
422 | LIB_OBJS += util/pager.o | 450 | LIB_OBJS += $(OUTPUT)util/header.o |
423 | LIB_OBJS += util/header.o | 451 | LIB_OBJS += $(OUTPUT)util/callchain.o |
424 | LIB_OBJS += util/callchain.o | 452 | LIB_OBJS += $(OUTPUT)util/values.o |
425 | LIB_OBJS += util/values.o | 453 | LIB_OBJS += $(OUTPUT)util/debug.o |
426 | LIB_OBJS += util/debug.o | 454 | LIB_OBJS += $(OUTPUT)util/map.o |
427 | LIB_OBJS += util/map.o | 455 | LIB_OBJS += $(OUTPUT)util/pstack.o |
428 | LIB_OBJS += util/session.o | 456 | LIB_OBJS += $(OUTPUT)util/session.o |
429 | LIB_OBJS += util/thread.o | 457 | LIB_OBJS += $(OUTPUT)util/thread.o |
430 | LIB_OBJS += util/trace-event-parse.o | 458 | LIB_OBJS += $(OUTPUT)util/trace-event-parse.o |
431 | LIB_OBJS += util/trace-event-read.o | 459 | LIB_OBJS += $(OUTPUT)util/trace-event-read.o |
432 | LIB_OBJS += util/trace-event-info.o | 460 | LIB_OBJS += $(OUTPUT)util/trace-event-info.o |
433 | LIB_OBJS += util/trace-event-scripting.o | 461 | LIB_OBJS += $(OUTPUT)util/trace-event-scripting.o |
434 | LIB_OBJS += util/svghelper.o | 462 | LIB_OBJS += $(OUTPUT)util/svghelper.o |
435 | LIB_OBJS += util/sort.o | 463 | LIB_OBJS += $(OUTPUT)util/sort.o |
436 | LIB_OBJS += util/hist.o | 464 | LIB_OBJS += $(OUTPUT)util/hist.o |
437 | LIB_OBJS += util/probe-event.o | 465 | LIB_OBJS += $(OUTPUT)util/probe-event.o |
438 | LIB_OBJS += util/util.o | 466 | LIB_OBJS += $(OUTPUT)util/util.o |
439 | LIB_OBJS += util/cpumap.o | 467 | LIB_OBJS += $(OUTPUT)util/cpumap.o |
440 | 468 | ||
441 | BUILTIN_OBJS += builtin-annotate.o | 469 | BUILTIN_OBJS += $(OUTPUT)builtin-annotate.o |
442 | 470 | ||
443 | BUILTIN_OBJS += builtin-bench.o | 471 | BUILTIN_OBJS += $(OUTPUT)builtin-bench.o |
444 | 472 | ||
445 | # Benchmark modules | 473 | # Benchmark modules |
446 | BUILTIN_OBJS += bench/sched-messaging.o | 474 | BUILTIN_OBJS += $(OUTPUT)bench/sched-messaging.o |
447 | BUILTIN_OBJS += bench/sched-pipe.o | 475 | BUILTIN_OBJS += $(OUTPUT)bench/sched-pipe.o |
448 | BUILTIN_OBJS += bench/mem-memcpy.o | 476 | BUILTIN_OBJS += $(OUTPUT)bench/mem-memcpy.o |
449 | 477 | ||
450 | BUILTIN_OBJS += builtin-diff.o | 478 | BUILTIN_OBJS += $(OUTPUT)builtin-diff.o |
451 | BUILTIN_OBJS += builtin-help.o | 479 | BUILTIN_OBJS += $(OUTPUT)builtin-help.o |
452 | BUILTIN_OBJS += builtin-sched.o | 480 | BUILTIN_OBJS += $(OUTPUT)builtin-sched.o |
453 | BUILTIN_OBJS += builtin-buildid-list.o | 481 | BUILTIN_OBJS += $(OUTPUT)builtin-buildid-list.o |
454 | BUILTIN_OBJS += builtin-buildid-cache.o | 482 | BUILTIN_OBJS += $(OUTPUT)builtin-buildid-cache.o |
455 | BUILTIN_OBJS += builtin-list.o | 483 | BUILTIN_OBJS += $(OUTPUT)builtin-list.o |
456 | BUILTIN_OBJS += builtin-record.o | 484 | BUILTIN_OBJS += $(OUTPUT)builtin-record.o |
457 | BUILTIN_OBJS += builtin-report.o | 485 | BUILTIN_OBJS += $(OUTPUT)builtin-report.o |
458 | BUILTIN_OBJS += builtin-stat.o | 486 | BUILTIN_OBJS += $(OUTPUT)builtin-stat.o |
459 | BUILTIN_OBJS += builtin-timechart.o | 487 | BUILTIN_OBJS += $(OUTPUT)builtin-timechart.o |
460 | BUILTIN_OBJS += builtin-top.o | 488 | BUILTIN_OBJS += $(OUTPUT)builtin-top.o |
461 | BUILTIN_OBJS += builtin-trace.o | 489 | BUILTIN_OBJS += $(OUTPUT)builtin-trace.o |
462 | BUILTIN_OBJS += builtin-probe.o | 490 | BUILTIN_OBJS += $(OUTPUT)builtin-probe.o |
463 | BUILTIN_OBJS += builtin-kmem.o | 491 | BUILTIN_OBJS += $(OUTPUT)builtin-kmem.o |
464 | BUILTIN_OBJS += builtin-lock.o | 492 | BUILTIN_OBJS += $(OUTPUT)builtin-lock.o |
493 | BUILTIN_OBJS += $(OUTPUT)builtin-kvm.o | ||
494 | BUILTIN_OBJS += $(OUTPUT)builtin-test.o | ||
495 | BUILTIN_OBJS += $(OUTPUT)builtin-inject.o | ||
465 | 496 | ||
466 | PERFLIBS = $(LIB_FILE) | 497 | PERFLIBS = $(LIB_FILE) |
467 | 498 | ||
@@ -476,6 +507,15 @@ PERFLIBS = $(LIB_FILE) | |||
476 | -include config.mak.autogen | 507 | -include config.mak.autogen |
477 | -include config.mak | 508 | -include config.mak |
478 | 509 | ||
510 | ifndef NO_DWARF | ||
511 | ifneq ($(shell sh -c "(echo '\#include <dwarf.h>'; echo '\#include <libdw.h>'; echo '\#include <version.h>'; echo '\#ifndef _ELFUTILS_PREREQ'; echo '\#error'; echo '\#endif'; echo 'int main(void) { Dwarf *dbg; dbg = dwarf_begin(0, DWARF_C_READ); return (long)dbg; }') | $(CC) -x c - $(ALL_CFLAGS) -I/usr/include/elfutils -ldw -lelf -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) | ||
512 | msg := $(warning No libdw.h found or old libdw.h found or elfutils is older than 0.138, disables dwarf support. Please install new elfutils-devel/libdw-dev); | ||
513 | NO_DWARF := 1 | ||
514 | endif # Dwarf support | ||
515 | endif # NO_DWARF | ||
516 | |||
517 | -include arch/$(ARCH)/Makefile | ||
518 | |||
479 | ifeq ($(uname_S),Darwin) | 519 | ifeq ($(uname_S),Darwin) |
480 | ifndef NO_FINK | 520 | ifndef NO_FINK |
481 | ifeq ($(shell test -d /sw/lib && echo y),y) | 521 | ifeq ($(shell test -d /sw/lib && echo y),y) |
@@ -492,6 +532,10 @@ ifeq ($(uname_S),Darwin) | |||
492 | PTHREAD_LIBS = | 532 | PTHREAD_LIBS = |
493 | endif | 533 | endif |
494 | 534 | ||
535 | ifneq ($(OUTPUT),) | ||
536 | BASIC_CFLAGS += -I$(OUTPUT) | ||
537 | endif | ||
538 | |||
495 | ifeq ($(shell sh -c "(echo '\#include <libelf.h>'; echo 'int main(void) { Elf * elf = elf_begin(0, ELF_C_READ, 0); return (long)elf; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) | 539 | ifeq ($(shell sh -c "(echo '\#include <libelf.h>'; echo 'int main(void) { Elf * elf = elf_begin(0, ELF_C_READ, 0); return (long)elf; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) |
496 | ifneq ($(shell sh -c "(echo '\#include <gnu/libc-version.h>'; echo 'int main(void) { const char * version = gnu_get_libc_version(); return (long)version; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) | 540 | ifneq ($(shell sh -c "(echo '\#include <gnu/libc-version.h>'; echo 'int main(void) { const char * version = gnu_get_libc_version(); return (long)version; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) |
497 | msg := $(error No gnu/libc-version.h found, please install glibc-dev[el]/glibc-static); | 541 | msg := $(error No gnu/libc-version.h found, please install glibc-dev[el]/glibc-static); |
@@ -504,14 +548,29 @@ else | |||
504 | msg := $(error No libelf.h/libelf found, please install libelf-dev/elfutils-libelf-devel and glibc-dev[el]); | 548 | msg := $(error No libelf.h/libelf found, please install libelf-dev/elfutils-libelf-devel and glibc-dev[el]); |
505 | endif | 549 | endif |
506 | 550 | ||
507 | ifneq ($(shell sh -c "(echo '\#include <dwarf.h>'; echo '\#include <libdw.h>'; echo 'int main(void) { Dwarf *dbg; dbg = dwarf_begin(0, DWARF_C_READ); return (long)dbg; }') | $(CC) -x c - $(ALL_CFLAGS) -I/usr/include/elfutils -ldw -lelf -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) | 551 | ifndef NO_DWARF |
508 | msg := $(warning No libdw.h found or old libdw.h found, disables dwarf support. Please install elfutils-devel/elfutils-dev); | 552 | ifeq ($(origin PERF_HAVE_DWARF_REGS), undefined) |
509 | BASIC_CFLAGS += -DNO_DWARF_SUPPORT | 553 | msg := $(warning DWARF register mappings have not been defined for architecture $(ARCH), DWARF support disabled); |
510 | else | 554 | else |
511 | BASIC_CFLAGS += -I/usr/include/elfutils | 555 | BASIC_CFLAGS += -I/usr/include/elfutils -DDWARF_SUPPORT |
512 | EXTLIBS += -lelf -ldw | 556 | EXTLIBS += -lelf -ldw |
513 | LIB_OBJS += util/probe-finder.o | 557 | LIB_OBJS += $(OUTPUT)util/probe-finder.o |
558 | endif # PERF_HAVE_DWARF_REGS | ||
559 | endif # NO_DWARF | ||
560 | |||
561 | ifdef NO_NEWT | ||
562 | BASIC_CFLAGS += -DNO_NEWT_SUPPORT | ||
563 | else | ||
564 | ifneq ($(shell sh -c "(echo '\#include <newt.h>'; echo 'int main(void) { newtInit(); newtCls(); return newtFinished(); }') | $(CC) -x c - $(ALL_CFLAGS) -D_LARGEFILE64_SOURCE -D_FILE_OFFSET_BITS=64 -lnewt -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) | ||
565 | msg := $(warning newt not found, disables TUI support. Please install newt-devel or libnewt-dev); | ||
566 | BASIC_CFLAGS += -DNO_NEWT_SUPPORT | ||
567 | else | ||
568 | # Fedora has /usr/include/slang/slang.h, but ubuntu /usr/include/slang.h | ||
569 | BASIC_CFLAGS += -I/usr/include/slang | ||
570 | EXTLIBS += -lnewt -lslang | ||
571 | LIB_OBJS += $(OUTPUT)util/newt.o | ||
514 | endif | 572 | endif |
573 | endif # NO_NEWT | ||
515 | 574 | ||
516 | ifndef NO_LIBPERL | 575 | ifndef NO_LIBPERL |
517 | PERL_EMBED_LDOPTS = `perl -MExtUtils::Embed -e ldopts 2>/dev/null` | 576 | PERL_EMBED_LDOPTS = `perl -MExtUtils::Embed -e ldopts 2>/dev/null` |
@@ -522,8 +581,8 @@ ifneq ($(shell sh -c "(echo '\#include <EXTERN.h>'; echo '\#include <perl.h>'; e | |||
522 | BASIC_CFLAGS += -DNO_LIBPERL | 581 | BASIC_CFLAGS += -DNO_LIBPERL |
523 | else | 582 | else |
524 | ALL_LDFLAGS += $(PERL_EMBED_LDOPTS) | 583 | ALL_LDFLAGS += $(PERL_EMBED_LDOPTS) |
525 | LIB_OBJS += util/scripting-engines/trace-event-perl.o | 584 | LIB_OBJS += $(OUTPUT)util/scripting-engines/trace-event-perl.o |
526 | LIB_OBJS += scripts/perl/Perf-Trace-Util/Context.o | 585 | LIB_OBJS += $(OUTPUT)scripts/perl/Perf-Trace-Util/Context.o |
527 | endif | 586 | endif |
528 | 587 | ||
529 | ifndef NO_LIBPYTHON | 588 | ifndef NO_LIBPYTHON |
@@ -531,16 +590,19 @@ PYTHON_EMBED_LDOPTS = `python-config --ldflags 2>/dev/null` | |||
531 | PYTHON_EMBED_CCOPTS = `python-config --cflags 2>/dev/null` | 590 | PYTHON_EMBED_CCOPTS = `python-config --cflags 2>/dev/null` |
532 | endif | 591 | endif |
533 | 592 | ||
534 | ifneq ($(shell sh -c "(echo '\#include <Python.h>'; echo 'int main(void) { Py_Initialize(); return 0; }') | $(CC) -x c - $(PYTHON_EMBED_CCOPTS) -o /dev/null $(PYTHON_EMBED_LDOPTS) > /dev/null 2>&1 && echo y"), y) | 593 | ifneq ($(shell sh -c "(echo '\#include <Python.h>'; echo 'int main(void) { Py_Initialize(); return 0; }') | $(CC) -x c - $(PYTHON_EMBED_CCOPTS) -o $(BITBUCKET) $(PYTHON_EMBED_LDOPTS) > /dev/null 2>&1 && echo y"), y) |
535 | BASIC_CFLAGS += -DNO_LIBPYTHON | 594 | BASIC_CFLAGS += -DNO_LIBPYTHON |
536 | else | 595 | else |
537 | ALL_LDFLAGS += $(PYTHON_EMBED_LDOPTS) | 596 | ALL_LDFLAGS += $(PYTHON_EMBED_LDOPTS) |
538 | LIB_OBJS += util/scripting-engines/trace-event-python.o | 597 | LIB_OBJS += $(OUTPUT)util/scripting-engines/trace-event-python.o |
539 | LIB_OBJS += scripts/python/Perf-Trace-Util/Context.o | 598 | LIB_OBJS += $(OUTPUT)scripts/python/Perf-Trace-Util/Context.o |
540 | endif | 599 | endif |
541 | 600 | ||
542 | ifdef NO_DEMANGLE | 601 | ifdef NO_DEMANGLE |
543 | BASIC_CFLAGS += -DNO_DEMANGLE | 602 | BASIC_CFLAGS += -DNO_DEMANGLE |
603 | else ifdef HAVE_CPLUS_DEMANGLE | ||
604 | EXTLIBS += -liberty | ||
605 | BASIC_CFLAGS += -DHAVE_CPLUS_DEMANGLE | ||
544 | else | 606 | else |
545 | has_bfd := $(shell sh -c "(echo '\#include <bfd.h>'; echo 'int main(void) { bfd_demangle(0, 0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -lbfd "$(QUIET_STDERR)" && echo y") | 607 | has_bfd := $(shell sh -c "(echo '\#include <bfd.h>'; echo 'int main(void) { bfd_demangle(0, 0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -lbfd "$(QUIET_STDERR)" && echo y") |
546 | 608 | ||
@@ -607,53 +669,53 @@ ifdef NO_C99_FORMAT | |||
607 | endif | 669 | endif |
608 | ifdef SNPRINTF_RETURNS_BOGUS | 670 | ifdef SNPRINTF_RETURNS_BOGUS |
609 | COMPAT_CFLAGS += -DSNPRINTF_RETURNS_BOGUS | 671 | COMPAT_CFLAGS += -DSNPRINTF_RETURNS_BOGUS |
610 | COMPAT_OBJS += compat/snprintf.o | 672 | COMPAT_OBJS += $(OUTPUT)compat/snprintf.o |
611 | endif | 673 | endif |
612 | ifdef FREAD_READS_DIRECTORIES | 674 | ifdef FREAD_READS_DIRECTORIES |
613 | COMPAT_CFLAGS += -DFREAD_READS_DIRECTORIES | 675 | COMPAT_CFLAGS += -DFREAD_READS_DIRECTORIES |
614 | COMPAT_OBJS += compat/fopen.o | 676 | COMPAT_OBJS += $(OUTPUT)compat/fopen.o |
615 | endif | 677 | endif |
616 | ifdef NO_SYMLINK_HEAD | 678 | ifdef NO_SYMLINK_HEAD |
617 | BASIC_CFLAGS += -DNO_SYMLINK_HEAD | 679 | BASIC_CFLAGS += -DNO_SYMLINK_HEAD |
618 | endif | 680 | endif |
619 | ifdef NO_STRCASESTR | 681 | ifdef NO_STRCASESTR |
620 | COMPAT_CFLAGS += -DNO_STRCASESTR | 682 | COMPAT_CFLAGS += -DNO_STRCASESTR |
621 | COMPAT_OBJS += compat/strcasestr.o | 683 | COMPAT_OBJS += $(OUTPUT)compat/strcasestr.o |
622 | endif | 684 | endif |
623 | ifdef NO_STRTOUMAX | 685 | ifdef NO_STRTOUMAX |
624 | COMPAT_CFLAGS += -DNO_STRTOUMAX | 686 | COMPAT_CFLAGS += -DNO_STRTOUMAX |
625 | COMPAT_OBJS += compat/strtoumax.o | 687 | COMPAT_OBJS += $(OUTPUT)compat/strtoumax.o |
626 | endif | 688 | endif |
627 | ifdef NO_STRTOULL | 689 | ifdef NO_STRTOULL |
628 | COMPAT_CFLAGS += -DNO_STRTOULL | 690 | COMPAT_CFLAGS += -DNO_STRTOULL |
629 | endif | 691 | endif |
630 | ifdef NO_SETENV | 692 | ifdef NO_SETENV |
631 | COMPAT_CFLAGS += -DNO_SETENV | 693 | COMPAT_CFLAGS += -DNO_SETENV |
632 | COMPAT_OBJS += compat/setenv.o | 694 | COMPAT_OBJS += $(OUTPUT)compat/setenv.o |
633 | endif | 695 | endif |
634 | ifdef NO_MKDTEMP | 696 | ifdef NO_MKDTEMP |
635 | COMPAT_CFLAGS += -DNO_MKDTEMP | 697 | COMPAT_CFLAGS += -DNO_MKDTEMP |
636 | COMPAT_OBJS += compat/mkdtemp.o | 698 | COMPAT_OBJS += $(OUTPUT)compat/mkdtemp.o |
637 | endif | 699 | endif |
638 | ifdef NO_UNSETENV | 700 | ifdef NO_UNSETENV |
639 | COMPAT_CFLAGS += -DNO_UNSETENV | 701 | COMPAT_CFLAGS += -DNO_UNSETENV |
640 | COMPAT_OBJS += compat/unsetenv.o | 702 | COMPAT_OBJS += $(OUTPUT)compat/unsetenv.o |
641 | endif | 703 | endif |
642 | ifdef NO_SYS_SELECT_H | 704 | ifdef NO_SYS_SELECT_H |
643 | BASIC_CFLAGS += -DNO_SYS_SELECT_H | 705 | BASIC_CFLAGS += -DNO_SYS_SELECT_H |
644 | endif | 706 | endif |
645 | ifdef NO_MMAP | 707 | ifdef NO_MMAP |
646 | COMPAT_CFLAGS += -DNO_MMAP | 708 | COMPAT_CFLAGS += -DNO_MMAP |
647 | COMPAT_OBJS += compat/mmap.o | 709 | COMPAT_OBJS += $(OUTPUT)compat/mmap.o |
648 | else | 710 | else |
649 | ifdef USE_WIN32_MMAP | 711 | ifdef USE_WIN32_MMAP |
650 | COMPAT_CFLAGS += -DUSE_WIN32_MMAP | 712 | COMPAT_CFLAGS += -DUSE_WIN32_MMAP |
651 | COMPAT_OBJS += compat/win32mmap.o | 713 | COMPAT_OBJS += $(OUTPUT)compat/win32mmap.o |
652 | endif | 714 | endif |
653 | endif | 715 | endif |
654 | ifdef NO_PREAD | 716 | ifdef NO_PREAD |
655 | COMPAT_CFLAGS += -DNO_PREAD | 717 | COMPAT_CFLAGS += -DNO_PREAD |
656 | COMPAT_OBJS += compat/pread.o | 718 | COMPAT_OBJS += $(OUTPUT)compat/pread.o |
657 | endif | 719 | endif |
658 | ifdef NO_FAST_WORKING_DIRECTORY | 720 | ifdef NO_FAST_WORKING_DIRECTORY |
659 | BASIC_CFLAGS += -DNO_FAST_WORKING_DIRECTORY | 721 | BASIC_CFLAGS += -DNO_FAST_WORKING_DIRECTORY |
@@ -675,10 +737,10 @@ else | |||
675 | endif | 737 | endif |
676 | endif | 738 | endif |
677 | ifdef NO_INET_NTOP | 739 | ifdef NO_INET_NTOP |
678 | LIB_OBJS += compat/inet_ntop.o | 740 | LIB_OBJS += $(OUTPUT)compat/inet_ntop.o |
679 | endif | 741 | endif |
680 | ifdef NO_INET_PTON | 742 | ifdef NO_INET_PTON |
681 | LIB_OBJS += compat/inet_pton.o | 743 | LIB_OBJS += $(OUTPUT)compat/inet_pton.o |
682 | endif | 744 | endif |
683 | 745 | ||
684 | ifdef NO_ICONV | 746 | ifdef NO_ICONV |
@@ -695,15 +757,15 @@ endif | |||
695 | 757 | ||
696 | ifdef PPC_SHA1 | 758 | ifdef PPC_SHA1 |
697 | SHA1_HEADER = "ppc/sha1.h" | 759 | SHA1_HEADER = "ppc/sha1.h" |
698 | LIB_OBJS += ppc/sha1.o ppc/sha1ppc.o | 760 | LIB_OBJS += $(OUTPUT)ppc/sha1.o ppc/sha1ppc.o |
699 | else | 761 | else |
700 | ifdef ARM_SHA1 | 762 | ifdef ARM_SHA1 |
701 | SHA1_HEADER = "arm/sha1.h" | 763 | SHA1_HEADER = "arm/sha1.h" |
702 | LIB_OBJS += arm/sha1.o arm/sha1_arm.o | 764 | LIB_OBJS += $(OUTPUT)arm/sha1.o $(OUTPUT)arm/sha1_arm.o |
703 | else | 765 | else |
704 | ifdef MOZILLA_SHA1 | 766 | ifdef MOZILLA_SHA1 |
705 | SHA1_HEADER = "mozilla-sha1/sha1.h" | 767 | SHA1_HEADER = "mozilla-sha1/sha1.h" |
706 | LIB_OBJS += mozilla-sha1/sha1.o | 768 | LIB_OBJS += $(OUTPUT)mozilla-sha1/sha1.o |
707 | else | 769 | else |
708 | SHA1_HEADER = <openssl/sha.h> | 770 | SHA1_HEADER = <openssl/sha.h> |
709 | EXTLIBS += $(LIB_4_CRYPTO) | 771 | EXTLIBS += $(LIB_4_CRYPTO) |
@@ -715,15 +777,15 @@ ifdef NO_PERL_MAKEMAKER | |||
715 | endif | 777 | endif |
716 | ifdef NO_HSTRERROR | 778 | ifdef NO_HSTRERROR |
717 | COMPAT_CFLAGS += -DNO_HSTRERROR | 779 | COMPAT_CFLAGS += -DNO_HSTRERROR |
718 | COMPAT_OBJS += compat/hstrerror.o | 780 | COMPAT_OBJS += $(OUTPUT)compat/hstrerror.o |
719 | endif | 781 | endif |
720 | ifdef NO_MEMMEM | 782 | ifdef NO_MEMMEM |
721 | COMPAT_CFLAGS += -DNO_MEMMEM | 783 | COMPAT_CFLAGS += -DNO_MEMMEM |
722 | COMPAT_OBJS += compat/memmem.o | 784 | COMPAT_OBJS += $(OUTPUT)compat/memmem.o |
723 | endif | 785 | endif |
724 | ifdef INTERNAL_QSORT | 786 | ifdef INTERNAL_QSORT |
725 | COMPAT_CFLAGS += -DINTERNAL_QSORT | 787 | COMPAT_CFLAGS += -DINTERNAL_QSORT |
726 | COMPAT_OBJS += compat/qsort.o | 788 | COMPAT_OBJS += $(OUTPUT)compat/qsort.o |
727 | endif | 789 | endif |
728 | ifdef RUNTIME_PREFIX | 790 | ifdef RUNTIME_PREFIX |
729 | COMPAT_CFLAGS += -DRUNTIME_PREFIX | 791 | COMPAT_CFLAGS += -DRUNTIME_PREFIX |
@@ -803,7 +865,7 @@ export TAR INSTALL DESTDIR SHELL_PATH | |||
803 | 865 | ||
804 | SHELL = $(SHELL_PATH) | 866 | SHELL = $(SHELL_PATH) |
805 | 867 | ||
806 | all:: .perf.dev.null shell_compatibility_test $(ALL_PROGRAMS) $(BUILT_INS) $(OTHER_PROGRAMS) PERF-BUILD-OPTIONS | 868 | all:: .perf.dev.null shell_compatibility_test $(ALL_PROGRAMS) $(BUILT_INS) $(OTHER_PROGRAMS) $(OUTPUT)PERF-BUILD-OPTIONS |
807 | ifneq (,$X) | 869 | ifneq (,$X) |
808 | $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) perf$X)), test '$p' -ef '$p$X' || $(RM) '$p';) | 870 | $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) perf$X)), test '$p' -ef '$p$X' || $(RM) '$p';) |
809 | endif | 871 | endif |
@@ -815,39 +877,39 @@ please_set_SHELL_PATH_to_a_more_modern_shell: | |||
815 | 877 | ||
816 | shell_compatibility_test: please_set_SHELL_PATH_to_a_more_modern_shell | 878 | shell_compatibility_test: please_set_SHELL_PATH_to_a_more_modern_shell |
817 | 879 | ||
818 | strip: $(PROGRAMS) perf$X | 880 | strip: $(PROGRAMS) $(OUTPUT)perf$X |
819 | $(STRIP) $(STRIP_OPTS) $(PROGRAMS) perf$X | 881 | $(STRIP) $(STRIP_OPTS) $(PROGRAMS) $(OUTPUT)perf$X |
820 | 882 | ||
821 | perf.o: perf.c common-cmds.h PERF-CFLAGS | 883 | $(OUTPUT)perf.o: perf.c $(OUTPUT)common-cmds.h $(OUTPUT)PERF-CFLAGS |
822 | $(QUIET_CC)$(CC) -DPERF_VERSION='"$(PERF_VERSION)"' \ | 884 | $(QUIET_CC)$(CC) -DPERF_VERSION='"$(PERF_VERSION)"' \ |
823 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ | 885 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ |
824 | $(ALL_CFLAGS) -c $(filter %.c,$^) | 886 | $(ALL_CFLAGS) -c $(filter %.c,$^) -o $@ |
825 | 887 | ||
826 | perf$X: perf.o $(BUILTIN_OBJS) $(PERFLIBS) | 888 | $(OUTPUT)perf$X: $(OUTPUT)perf.o $(BUILTIN_OBJS) $(PERFLIBS) |
827 | $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ perf.o \ | 889 | $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ $(OUTPUT)perf.o \ |
828 | $(BUILTIN_OBJS) $(ALL_LDFLAGS) $(LIBS) | 890 | $(BUILTIN_OBJS) $(ALL_LDFLAGS) $(LIBS) |
829 | 891 | ||
830 | builtin-help.o: builtin-help.c common-cmds.h PERF-CFLAGS | 892 | $(OUTPUT)builtin-help.o: builtin-help.c $(OUTPUT)common-cmds.h $(OUTPUT)PERF-CFLAGS |
831 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) \ | 893 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) \ |
832 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ | 894 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ |
833 | '-DPERF_MAN_PATH="$(mandir_SQ)"' \ | 895 | '-DPERF_MAN_PATH="$(mandir_SQ)"' \ |
834 | '-DPERF_INFO_PATH="$(infodir_SQ)"' $< | 896 | '-DPERF_INFO_PATH="$(infodir_SQ)"' $< |
835 | 897 | ||
836 | builtin-timechart.o: builtin-timechart.c common-cmds.h PERF-CFLAGS | 898 | $(OUTPUT)builtin-timechart.o: builtin-timechart.c $(OUTPUT)common-cmds.h $(OUTPUT)PERF-CFLAGS |
837 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) \ | 899 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) \ |
838 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ | 900 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ |
839 | '-DPERF_MAN_PATH="$(mandir_SQ)"' \ | 901 | '-DPERF_MAN_PATH="$(mandir_SQ)"' \ |
840 | '-DPERF_INFO_PATH="$(infodir_SQ)"' $< | 902 | '-DPERF_INFO_PATH="$(infodir_SQ)"' $< |
841 | 903 | ||
842 | $(BUILT_INS): perf$X | 904 | $(BUILT_INS): $(OUTPUT)perf$X |
843 | $(QUIET_BUILT_IN)$(RM) $@ && \ | 905 | $(QUIET_BUILT_IN)$(RM) $@ && \ |
844 | ln perf$X $@ 2>/dev/null || \ | 906 | ln perf$X $@ 2>/dev/null || \ |
845 | ln -s perf$X $@ 2>/dev/null || \ | 907 | ln -s perf$X $@ 2>/dev/null || \ |
846 | cp perf$X $@ | 908 | cp perf$X $@ |
847 | 909 | ||
848 | common-cmds.h: util/generate-cmdlist.sh command-list.txt | 910 | $(OUTPUT)common-cmds.h: util/generate-cmdlist.sh command-list.txt |
849 | 911 | ||
850 | common-cmds.h: $(wildcard Documentation/perf-*.txt) | 912 | $(OUTPUT)common-cmds.h: $(wildcard Documentation/perf-*.txt) |
851 | $(QUIET_GEN). util/generate-cmdlist.sh > $@+ && mv $@+ $@ | 913 | $(QUIET_GEN). util/generate-cmdlist.sh > $@+ && mv $@+ $@ |
852 | 914 | ||
853 | $(patsubst %.sh,%,$(SCRIPT_SH)) : % : %.sh | 915 | $(patsubst %.sh,%,$(SCRIPT_SH)) : % : %.sh |
@@ -859,7 +921,7 @@ $(patsubst %.sh,%,$(SCRIPT_SH)) : % : %.sh | |||
859 | -e 's/@@NO_CURL@@/$(NO_CURL)/g' \ | 921 | -e 's/@@NO_CURL@@/$(NO_CURL)/g' \ |
860 | $@.sh >$@+ && \ | 922 | $@.sh >$@+ && \ |
861 | chmod +x $@+ && \ | 923 | chmod +x $@+ && \ |
862 | mv $@+ $@ | 924 | mv $@+ $(OUTPUT)$@ |
863 | 925 | ||
864 | configure: configure.ac | 926 | configure: configure.ac |
865 | $(QUIET_GEN)$(RM) $@ $<+ && \ | 927 | $(QUIET_GEN)$(RM) $@ $<+ && \ |
@@ -869,60 +931,50 @@ configure: configure.ac | |||
869 | $(RM) $<+ | 931 | $(RM) $<+ |
870 | 932 | ||
871 | # These can record PERF_VERSION | 933 | # These can record PERF_VERSION |
872 | perf.o perf.spec \ | 934 | $(OUTPUT)perf.o perf.spec \ |
873 | $(patsubst %.sh,%,$(SCRIPT_SH)) \ | 935 | $(patsubst %.sh,%,$(SCRIPT_SH)) \ |
874 | $(patsubst %.perl,%,$(SCRIPT_PERL)) \ | 936 | $(patsubst %.perl,%,$(SCRIPT_PERL)) \ |
875 | : PERF-VERSION-FILE | 937 | : $(OUTPUT)PERF-VERSION-FILE |
876 | 938 | ||
877 | %.o: %.c PERF-CFLAGS | 939 | $(OUTPUT)%.o: %.c $(OUTPUT)PERF-CFLAGS |
878 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) $< | 940 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $< |
879 | %.s: %.c PERF-CFLAGS | 941 | $(OUTPUT)%.s: %.c $(OUTPUT)PERF-CFLAGS |
880 | $(QUIET_CC)$(CC) -S $(ALL_CFLAGS) $< | 942 | $(QUIET_CC)$(CC) -S $(ALL_CFLAGS) $< |
881 | %.o: %.S | 943 | $(OUTPUT)%.o: %.S |
882 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) $< | 944 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $< |
883 | 945 | ||
884 | util/exec_cmd.o: util/exec_cmd.c PERF-CFLAGS | 946 | $(OUTPUT)util/exec_cmd.o: util/exec_cmd.c $(OUTPUT)PERF-CFLAGS |
885 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) \ | 947 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) \ |
886 | '-DPERF_EXEC_PATH="$(perfexecdir_SQ)"' \ | 948 | '-DPERF_EXEC_PATH="$(perfexecdir_SQ)"' \ |
887 | '-DBINDIR="$(bindir_relative_SQ)"' \ | 949 | '-DBINDIR="$(bindir_relative_SQ)"' \ |
888 | '-DPREFIX="$(prefix_SQ)"' \ | 950 | '-DPREFIX="$(prefix_SQ)"' \ |
889 | $< | 951 | $< |
890 | 952 | ||
891 | builtin-init-db.o: builtin-init-db.c PERF-CFLAGS | 953 | $(OUTPUT)builtin-init-db.o: builtin-init-db.c $(OUTPUT)PERF-CFLAGS |
892 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) -DDEFAULT_PERF_TEMPLATE_DIR='"$(template_dir_SQ)"' $< | 954 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DDEFAULT_PERF_TEMPLATE_DIR='"$(template_dir_SQ)"' $< |
893 | |||
894 | util/config.o: util/config.c PERF-CFLAGS | ||
895 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< | ||
896 | |||
897 | util/rbtree.o: ../../lib/rbtree.c PERF-CFLAGS | ||
898 | $(QUIET_CC)$(CC) -o util/rbtree.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< | ||
899 | |||
900 | # some perf warning policies can't fit to lib/bitmap.c, eg: it warns about variable shadowing | ||
901 | # from <string.h> that comes from kernel headers wrapping. | ||
902 | KBITMAP_FLAGS=`echo $(ALL_CFLAGS) | sed s/-Wshadow// | sed s/-Wswitch-default// | sed s/-Wextra//` | ||
903 | 955 | ||
904 | util/bitmap.o: ../../lib/bitmap.c PERF-CFLAGS | 956 | $(OUTPUT)util/config.o: util/config.c $(OUTPUT)PERF-CFLAGS |
905 | $(QUIET_CC)$(CC) -o util/bitmap.o -c $(KBITMAP_FLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< | 957 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< |
906 | 958 | ||
907 | util/hweight.o: ../../lib/hweight.c PERF-CFLAGS | 959 | $(OUTPUT)util/newt.o: util/newt.c $(OUTPUT)PERF-CFLAGS |
908 | $(QUIET_CC)$(CC) -o util/hweight.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< | 960 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DENABLE_SLFUTURE_CONST $< |
909 | 961 | ||
910 | util/find_next_bit.o: ../../lib/find_next_bit.c PERF-CFLAGS | 962 | $(OUTPUT)util/rbtree.o: ../../lib/rbtree.c $(OUTPUT)PERF-CFLAGS |
911 | $(QUIET_CC)$(CC) -o util/find_next_bit.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< | 963 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< |
912 | 964 | ||
913 | util/scripting-engines/trace-event-perl.o: util/scripting-engines/trace-event-perl.c PERF-CFLAGS | 965 | $(OUTPUT)util/scripting-engines/trace-event-perl.o: util/scripting-engines/trace-event-perl.c $(OUTPUT)PERF-CFLAGS |
914 | $(QUIET_CC)$(CC) -o util/scripting-engines/trace-event-perl.o -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-shadow $< | 966 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-shadow $< |
915 | 967 | ||
916 | scripts/perl/Perf-Trace-Util/Context.o: scripts/perl/Perf-Trace-Util/Context.c PERF-CFLAGS | 968 | $(OUTPUT)scripts/perl/Perf-Trace-Util/Context.o: scripts/perl/Perf-Trace-Util/Context.c $(OUTPUT)PERF-CFLAGS |
917 | $(QUIET_CC)$(CC) -o scripts/perl/Perf-Trace-Util/Context.o -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs $< | 969 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs $< |
918 | 970 | ||
919 | util/scripting-engines/trace-event-python.o: util/scripting-engines/trace-event-python.c PERF-CFLAGS | 971 | $(OUTPUT)util/scripting-engines/trace-event-python.o: util/scripting-engines/trace-event-python.c $(OUTPUT)PERF-CFLAGS |
920 | $(QUIET_CC)$(CC) -o util/scripting-engines/trace-event-python.o -c $(ALL_CFLAGS) $(PYTHON_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-shadow $< | 972 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PYTHON_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-shadow $< |
921 | 973 | ||
922 | scripts/python/Perf-Trace-Util/Context.o: scripts/python/Perf-Trace-Util/Context.c PERF-CFLAGS | 974 | $(OUTPUT)scripts/python/Perf-Trace-Util/Context.o: scripts/python/Perf-Trace-Util/Context.c $(OUTPUT)PERF-CFLAGS |
923 | $(QUIET_CC)$(CC) -o scripts/python/Perf-Trace-Util/Context.o -c $(ALL_CFLAGS) $(PYTHON_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs $< | 975 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PYTHON_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs $< |
924 | 976 | ||
925 | perf-%$X: %.o $(PERFLIBS) | 977 | $(OUTPUT)perf-%$X: %.o $(PERFLIBS) |
926 | $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ $(ALL_LDFLAGS) $(filter %.o,$^) $(LIBS) | 978 | $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ $(ALL_LDFLAGS) $(filter %.o,$^) $(LIBS) |
927 | 979 | ||
928 | $(LIB_OBJS) $(BUILTIN_OBJS): $(LIB_H) | 980 | $(LIB_OBJS) $(BUILTIN_OBJS): $(LIB_H) |
@@ -963,17 +1015,17 @@ cscope: | |||
963 | TRACK_CFLAGS = $(subst ','\'',$(ALL_CFLAGS)):\ | 1015 | TRACK_CFLAGS = $(subst ','\'',$(ALL_CFLAGS)):\ |
964 | $(bindir_SQ):$(perfexecdir_SQ):$(template_dir_SQ):$(prefix_SQ) | 1016 | $(bindir_SQ):$(perfexecdir_SQ):$(template_dir_SQ):$(prefix_SQ) |
965 | 1017 | ||
966 | PERF-CFLAGS: .FORCE-PERF-CFLAGS | 1018 | $(OUTPUT)PERF-CFLAGS: .FORCE-PERF-CFLAGS |
967 | @FLAGS='$(TRACK_CFLAGS)'; \ | 1019 | @FLAGS='$(TRACK_CFLAGS)'; \ |
968 | if test x"$$FLAGS" != x"`cat PERF-CFLAGS 2>/dev/null`" ; then \ | 1020 | if test x"$$FLAGS" != x"`cat $(OUTPUT)PERF-CFLAGS 2>/dev/null`" ; then \ |
969 | echo 1>&2 " * new build flags or prefix"; \ | 1021 | echo 1>&2 " * new build flags or prefix"; \ |
970 | echo "$$FLAGS" >PERF-CFLAGS; \ | 1022 | echo "$$FLAGS" >$(OUTPUT)PERF-CFLAGS; \ |
971 | fi | 1023 | fi |
972 | 1024 | ||
973 | # We need to apply sq twice, once to protect from the shell | 1025 | # We need to apply sq twice, once to protect from the shell |
974 | # that runs PERF-BUILD-OPTIONS, and then again to protect it | 1026 | # that runs $(OUTPUT)PERF-BUILD-OPTIONS, and then again to protect it |
975 | # and the first level quoting from the shell that runs "echo". | 1027 | # and the first level quoting from the shell that runs "echo". |
976 | PERF-BUILD-OPTIONS: .FORCE-PERF-BUILD-OPTIONS | 1028 | $(OUTPUT)PERF-BUILD-OPTIONS: .FORCE-PERF-BUILD-OPTIONS |
977 | @echo SHELL_PATH=\''$(subst ','\'',$(SHELL_PATH_SQ))'\' >$@ | 1029 | @echo SHELL_PATH=\''$(subst ','\'',$(SHELL_PATH_SQ))'\' >$@ |
978 | @echo TAR=\''$(subst ','\'',$(subst ','\'',$(TAR)))'\' >>$@ | 1030 | @echo TAR=\''$(subst ','\'',$(subst ','\'',$(TAR)))'\' >>$@ |
979 | @echo NO_CURL=\''$(subst ','\'',$(subst ','\'',$(NO_CURL)))'\' >>$@ | 1031 | @echo NO_CURL=\''$(subst ','\'',$(subst ','\'',$(NO_CURL)))'\' >>$@ |
@@ -994,7 +1046,7 @@ all:: $(TEST_PROGRAMS) | |||
994 | 1046 | ||
995 | export NO_SVN_TESTS | 1047 | export NO_SVN_TESTS |
996 | 1048 | ||
997 | check: common-cmds.h | 1049 | check: $(OUTPUT)common-cmds.h |
998 | if sparse; \ | 1050 | if sparse; \ |
999 | then \ | 1051 | then \ |
1000 | for i in *.c */*.c; \ | 1052 | for i in *.c */*.c; \ |
@@ -1028,10 +1080,10 @@ export perfexec_instdir | |||
1028 | 1080 | ||
1029 | install: all | 1081 | install: all |
1030 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(bindir_SQ)' | 1082 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(bindir_SQ)' |
1031 | $(INSTALL) perf$X '$(DESTDIR_SQ)$(bindir_SQ)' | 1083 | $(INSTALL) $(OUTPUT)perf$X '$(DESTDIR_SQ)$(bindir_SQ)' |
1032 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace' | 1084 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace' |
1033 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin' | 1085 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin' |
1034 | $(INSTALL) perf-archive -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' | 1086 | $(INSTALL) $(OUTPUT)perf-archive -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' |
1035 | $(INSTALL) scripts/perl/Perf-Trace-Util/lib/Perf/Trace/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace' | 1087 | $(INSTALL) scripts/perl/Perf-Trace-Util/lib/Perf/Trace/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace' |
1036 | $(INSTALL) scripts/perl/*.pl -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl' | 1088 | $(INSTALL) scripts/perl/*.pl -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl' |
1037 | $(INSTALL) scripts/perl/bin/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin' | 1089 | $(INSTALL) scripts/perl/bin/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin' |
@@ -1045,7 +1097,7 @@ ifdef BUILT_INS | |||
1045 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' | 1097 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' |
1046 | $(INSTALL) $(BUILT_INS) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' | 1098 | $(INSTALL) $(BUILT_INS) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' |
1047 | ifneq (,$X) | 1099 | ifneq (,$X) |
1048 | $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) perf$X)), $(RM) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/$p';) | 1100 | $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) $(OUTPUT)perf$X)), $(RM) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/$p';) |
1049 | endif | 1101 | endif |
1050 | endif | 1102 | endif |
1051 | 1103 | ||
@@ -1129,14 +1181,14 @@ clean: | |||
1129 | $(RM) *.o */*.o */*/*.o */*/*/*.o $(LIB_FILE) | 1181 | $(RM) *.o */*.o */*/*.o */*/*/*.o $(LIB_FILE) |
1130 | $(RM) $(ALL_PROGRAMS) $(BUILT_INS) perf$X | 1182 | $(RM) $(ALL_PROGRAMS) $(BUILT_INS) perf$X |
1131 | $(RM) $(TEST_PROGRAMS) | 1183 | $(RM) $(TEST_PROGRAMS) |
1132 | $(RM) *.spec *.pyc *.pyo */*.pyc */*.pyo common-cmds.h TAGS tags cscope* | 1184 | $(RM) *.spec *.pyc *.pyo */*.pyc */*.pyo $(OUTPUT)common-cmds.h TAGS tags cscope* |
1133 | $(RM) -r autom4te.cache | 1185 | $(RM) -r autom4te.cache |
1134 | $(RM) config.log config.mak.autogen config.mak.append config.status config.cache | 1186 | $(RM) config.log config.mak.autogen config.mak.append config.status config.cache |
1135 | $(RM) -r $(PERF_TARNAME) .doc-tmp-dir | 1187 | $(RM) -r $(PERF_TARNAME) .doc-tmp-dir |
1136 | $(RM) $(PERF_TARNAME).tar.gz perf-core_$(PERF_VERSION)-*.tar.gz | 1188 | $(RM) $(PERF_TARNAME).tar.gz perf-core_$(PERF_VERSION)-*.tar.gz |
1137 | $(RM) $(htmldocs).tar.gz $(manpages).tar.gz | 1189 | $(RM) $(htmldocs).tar.gz $(manpages).tar.gz |
1138 | $(MAKE) -C Documentation/ clean | 1190 | $(MAKE) -C Documentation/ clean |
1139 | $(RM) PERF-VERSION-FILE PERF-CFLAGS PERF-BUILD-OPTIONS | 1191 | $(RM) $(OUTPUT)PERF-VERSION-FILE $(OUTPUT)PERF-CFLAGS $(OUTPUT)PERF-BUILD-OPTIONS |
1140 | 1192 | ||
1141 | .PHONY: all install clean strip | 1193 | .PHONY: all install clean strip |
1142 | .PHONY: shell_compatibility_test please_set_SHELL_PATH_to_a_more_modern_shell | 1194 | .PHONY: shell_compatibility_test please_set_SHELL_PATH_to_a_more_modern_shell |
diff --git a/tools/perf/arch/powerpc/Makefile b/tools/perf/arch/powerpc/Makefile new file mode 100644 index 000000000000..15130b50dfe3 --- /dev/null +++ b/tools/perf/arch/powerpc/Makefile | |||
@@ -0,0 +1,4 @@ | |||
1 | ifndef NO_DWARF | ||
2 | PERF_HAVE_DWARF_REGS := 1 | ||
3 | LIB_OBJS += $(OUTPUT)arch/$(ARCH)/util/dwarf-regs.o | ||
4 | endif | ||
diff --git a/tools/perf/arch/powerpc/util/dwarf-regs.c b/tools/perf/arch/powerpc/util/dwarf-regs.c new file mode 100644 index 000000000000..48ae0c5e3f73 --- /dev/null +++ b/tools/perf/arch/powerpc/util/dwarf-regs.c | |||
@@ -0,0 +1,88 @@ | |||
1 | /* | ||
2 | * Mapping of DWARF debug register numbers into register names. | ||
3 | * | ||
4 | * Copyright (C) 2010 Ian Munsie, IBM Corporation. | ||
5 | * | ||
6 | * This program is free software; you can redistribute it and/or | ||
7 | * modify it under the terms of the GNU General Public License | ||
8 | * as published by the Free Software Foundation; either version | ||
9 | * 2 of the License, or (at your option) any later version. | ||
10 | */ | ||
11 | |||
12 | #include <libio.h> | ||
13 | #include <dwarf-regs.h> | ||
14 | |||
15 | |||
16 | struct pt_regs_dwarfnum { | ||
17 | const char *name; | ||
18 | unsigned int dwarfnum; | ||
19 | }; | ||
20 | |||
21 | #define STR(s) #s | ||
22 | #define REG_DWARFNUM_NAME(r, num) {.name = r, .dwarfnum = num} | ||
23 | #define GPR_DWARFNUM_NAME(num) \ | ||
24 | {.name = STR(%gpr##num), .dwarfnum = num} | ||
25 | #define REG_DWARFNUM_END {.name = NULL, .dwarfnum = 0} | ||
26 | |||
27 | /* | ||
28 | * Reference: | ||
29 | * http://refspecs.linuxfoundation.org/ELF/ppc64/PPC-elf64abi-1.9.html | ||
30 | */ | ||
31 | static const struct pt_regs_dwarfnum regdwarfnum_table[] = { | ||
32 | GPR_DWARFNUM_NAME(0), | ||
33 | GPR_DWARFNUM_NAME(1), | ||
34 | GPR_DWARFNUM_NAME(2), | ||
35 | GPR_DWARFNUM_NAME(3), | ||
36 | GPR_DWARFNUM_NAME(4), | ||
37 | GPR_DWARFNUM_NAME(5), | ||
38 | GPR_DWARFNUM_NAME(6), | ||
39 | GPR_DWARFNUM_NAME(7), | ||
40 | GPR_DWARFNUM_NAME(8), | ||
41 | GPR_DWARFNUM_NAME(9), | ||
42 | GPR_DWARFNUM_NAME(10), | ||
43 | GPR_DWARFNUM_NAME(11), | ||
44 | GPR_DWARFNUM_NAME(12), | ||
45 | GPR_DWARFNUM_NAME(13), | ||
46 | GPR_DWARFNUM_NAME(14), | ||
47 | GPR_DWARFNUM_NAME(15), | ||
48 | GPR_DWARFNUM_NAME(16), | ||
49 | GPR_DWARFNUM_NAME(17), | ||
50 | GPR_DWARFNUM_NAME(18), | ||
51 | GPR_DWARFNUM_NAME(19), | ||
52 | GPR_DWARFNUM_NAME(20), | ||
53 | GPR_DWARFNUM_NAME(21), | ||
54 | GPR_DWARFNUM_NAME(22), | ||
55 | GPR_DWARFNUM_NAME(23), | ||
56 | GPR_DWARFNUM_NAME(24), | ||
57 | GPR_DWARFNUM_NAME(25), | ||
58 | GPR_DWARFNUM_NAME(26), | ||
59 | GPR_DWARFNUM_NAME(27), | ||
60 | GPR_DWARFNUM_NAME(28), | ||
61 | GPR_DWARFNUM_NAME(29), | ||
62 | GPR_DWARFNUM_NAME(30), | ||
63 | GPR_DWARFNUM_NAME(31), | ||
64 | REG_DWARFNUM_NAME("%msr", 66), | ||
65 | REG_DWARFNUM_NAME("%ctr", 109), | ||
66 | REG_DWARFNUM_NAME("%link", 108), | ||
67 | REG_DWARFNUM_NAME("%xer", 101), | ||
68 | REG_DWARFNUM_NAME("%dar", 119), | ||
69 | REG_DWARFNUM_NAME("%dsisr", 118), | ||
70 | REG_DWARFNUM_END, | ||
71 | }; | ||
72 | |||
73 | /** | ||
74 | * get_arch_regstr() - lookup register name from it's DWARF register number | ||
75 | * @n: the DWARF register number | ||
76 | * | ||
77 | * get_arch_regstr() returns the name of the register in struct | ||
78 | * regdwarfnum_table from it's DWARF register number. If the register is not | ||
79 | * found in the table, this returns NULL; | ||
80 | */ | ||
81 | const char *get_arch_regstr(unsigned int n) | ||
82 | { | ||
83 | const struct pt_regs_dwarfnum *roff; | ||
84 | for (roff = regdwarfnum_table; roff->name != NULL; roff++) | ||
85 | if (roff->dwarfnum == n) | ||
86 | return roff->name; | ||
87 | return NULL; | ||
88 | } | ||
diff --git a/tools/perf/arch/x86/Makefile b/tools/perf/arch/x86/Makefile new file mode 100644 index 000000000000..15130b50dfe3 --- /dev/null +++ b/tools/perf/arch/x86/Makefile | |||
@@ -0,0 +1,4 @@ | |||
1 | ifndef NO_DWARF | ||
2 | PERF_HAVE_DWARF_REGS := 1 | ||
3 | LIB_OBJS += $(OUTPUT)arch/$(ARCH)/util/dwarf-regs.o | ||
4 | endif | ||
diff --git a/tools/perf/arch/x86/util/dwarf-regs.c b/tools/perf/arch/x86/util/dwarf-regs.c new file mode 100644 index 000000000000..a794d3081928 --- /dev/null +++ b/tools/perf/arch/x86/util/dwarf-regs.c | |||
@@ -0,0 +1,75 @@ | |||
1 | /* | ||
2 | * dwarf-regs.c : Mapping of DWARF debug register numbers into register names. | ||
3 | * Extracted from probe-finder.c | ||
4 | * | ||
5 | * Written by Masami Hiramatsu <mhiramat@redhat.com> | ||
6 | * | ||
7 | * This program is free software; you can redistribute it and/or modify | ||
8 | * it under the terms of the GNU General Public License as published by | ||
9 | * the Free Software Foundation; either version 2 of the License, or | ||
10 | * (at your option) any later version. | ||
11 | * | ||
12 | * This program is distributed in the hope that it will be useful, | ||
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
15 | * GNU General Public License for more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU General Public License | ||
18 | * along with this program; if not, write to the Free Software | ||
19 | * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. | ||
20 | * | ||
21 | */ | ||
22 | |||
23 | #include <libio.h> | ||
24 | #include <dwarf-regs.h> | ||
25 | |||
26 | /* | ||
27 | * Generic dwarf analysis helpers | ||
28 | */ | ||
29 | |||
30 | #define X86_32_MAX_REGS 8 | ||
31 | const char *x86_32_regs_table[X86_32_MAX_REGS] = { | ||
32 | "%ax", | ||
33 | "%cx", | ||
34 | "%dx", | ||
35 | "%bx", | ||
36 | "$stack", /* Stack address instead of %sp */ | ||
37 | "%bp", | ||
38 | "%si", | ||
39 | "%di", | ||
40 | }; | ||
41 | |||
42 | #define X86_64_MAX_REGS 16 | ||
43 | const char *x86_64_regs_table[X86_64_MAX_REGS] = { | ||
44 | "%ax", | ||
45 | "%dx", | ||
46 | "%cx", | ||
47 | "%bx", | ||
48 | "%si", | ||
49 | "%di", | ||
50 | "%bp", | ||
51 | "%sp", | ||
52 | "%r8", | ||
53 | "%r9", | ||
54 | "%r10", | ||
55 | "%r11", | ||
56 | "%r12", | ||
57 | "%r13", | ||
58 | "%r14", | ||
59 | "%r15", | ||
60 | }; | ||
61 | |||
62 | /* TODO: switching by dwarf address size */ | ||
63 | #ifdef __x86_64__ | ||
64 | #define ARCH_MAX_REGS X86_64_MAX_REGS | ||
65 | #define arch_regs_table x86_64_regs_table | ||
66 | #else | ||
67 | #define ARCH_MAX_REGS X86_32_MAX_REGS | ||
68 | #define arch_regs_table x86_32_regs_table | ||
69 | #endif | ||
70 | |||
71 | /* Return architecture dependent register string (for kprobe-tracer) */ | ||
72 | const char *get_arch_regstr(unsigned int n) | ||
73 | { | ||
74 | return (n <= ARCH_MAX_REGS) ? arch_regs_table[n] : NULL; | ||
75 | } | ||
diff --git a/tools/perf/bench/mem-memcpy.c b/tools/perf/bench/mem-memcpy.c index 89773178e894..38dae7465142 100644 --- a/tools/perf/bench/mem-memcpy.c +++ b/tools/perf/bench/mem-memcpy.c | |||
@@ -10,7 +10,6 @@ | |||
10 | #include "../perf.h" | 10 | #include "../perf.h" |
11 | #include "../util/util.h" | 11 | #include "../util/util.h" |
12 | #include "../util/parse-options.h" | 12 | #include "../util/parse-options.h" |
13 | #include "../util/string.h" | ||
14 | #include "../util/header.h" | 13 | #include "../util/header.h" |
15 | #include "bench.h" | 14 | #include "bench.h" |
16 | 15 | ||
@@ -24,7 +23,7 @@ | |||
24 | 23 | ||
25 | static const char *length_str = "1MB"; | 24 | static const char *length_str = "1MB"; |
26 | static const char *routine = "default"; | 25 | static const char *routine = "default"; |
27 | static int use_clock = 0; | 26 | static bool use_clock = false; |
28 | static int clock_fd; | 27 | static int clock_fd; |
29 | 28 | ||
30 | static const struct option options[] = { | 29 | static const struct option options[] = { |
diff --git a/tools/perf/bench/sched-messaging.c b/tools/perf/bench/sched-messaging.c index 81cee78181fa..d1d1b30f99c1 100644 --- a/tools/perf/bench/sched-messaging.c +++ b/tools/perf/bench/sched-messaging.c | |||
@@ -31,9 +31,9 @@ | |||
31 | 31 | ||
32 | #define DATASIZE 100 | 32 | #define DATASIZE 100 |
33 | 33 | ||
34 | static int use_pipes = 0; | 34 | static bool use_pipes = false; |
35 | static unsigned int loops = 100; | 35 | static unsigned int loops = 100; |
36 | static unsigned int thread_mode = 0; | 36 | static bool thread_mode = false; |
37 | static unsigned int num_groups = 10; | 37 | static unsigned int num_groups = 10; |
38 | 38 | ||
39 | struct sender_context { | 39 | struct sender_context { |
@@ -256,10 +256,8 @@ static const struct option options[] = { | |||
256 | "Use pipe() instead of socketpair()"), | 256 | "Use pipe() instead of socketpair()"), |
257 | OPT_BOOLEAN('t', "thread", &thread_mode, | 257 | OPT_BOOLEAN('t', "thread", &thread_mode, |
258 | "Be multi thread instead of multi process"), | 258 | "Be multi thread instead of multi process"), |
259 | OPT_INTEGER('g', "group", &num_groups, | 259 | OPT_UINTEGER('g', "group", &num_groups, "Specify number of groups"), |
260 | "Specify number of groups"), | 260 | OPT_UINTEGER('l', "loop", &loops, "Specify number of loops"), |
261 | OPT_INTEGER('l', "loop", &loops, | ||
262 | "Specify number of loops"), | ||
263 | OPT_END() | 261 | OPT_END() |
264 | }; | 262 | }; |
265 | 263 | ||
diff --git a/tools/perf/bench/sched-pipe.c b/tools/perf/bench/sched-pipe.c index 4f77c7c27640..d9ab3ce446ac 100644 --- a/tools/perf/bench/sched-pipe.c +++ b/tools/perf/bench/sched-pipe.c | |||
@@ -93,7 +93,7 @@ int bench_sched_pipe(int argc, const char **argv, | |||
93 | 93 | ||
94 | switch (bench_format) { | 94 | switch (bench_format) { |
95 | case BENCH_FORMAT_DEFAULT: | 95 | case BENCH_FORMAT_DEFAULT: |
96 | printf("# Extecuted %d pipe operations between two tasks\n\n", | 96 | printf("# Executed %d pipe operations between two tasks\n\n", |
97 | loops); | 97 | loops); |
98 | 98 | ||
99 | result_usec = diff.tv_sec * 1000000; | 99 | result_usec = diff.tv_sec * 1000000; |
diff --git a/tools/perf/builtin-annotate.c b/tools/perf/builtin-annotate.c index 6ad7148451c5..77bcc9b130f5 100644 --- a/tools/perf/builtin-annotate.c +++ b/tools/perf/builtin-annotate.c | |||
@@ -14,7 +14,6 @@ | |||
14 | #include "util/cache.h" | 14 | #include "util/cache.h" |
15 | #include <linux/rbtree.h> | 15 | #include <linux/rbtree.h> |
16 | #include "util/symbol.h" | 16 | #include "util/symbol.h" |
17 | #include "util/string.h" | ||
18 | 17 | ||
19 | #include "perf.h" | 18 | #include "perf.h" |
20 | #include "util/debug.h" | 19 | #include "util/debug.h" |
@@ -29,80 +28,16 @@ | |||
29 | 28 | ||
30 | static char const *input_name = "perf.data"; | 29 | static char const *input_name = "perf.data"; |
31 | 30 | ||
32 | static int force; | 31 | static bool force; |
33 | 32 | ||
34 | static int full_paths; | 33 | static bool full_paths; |
35 | 34 | ||
36 | static int print_line; | 35 | static bool print_line; |
37 | |||
38 | struct sym_hist { | ||
39 | u64 sum; | ||
40 | u64 ip[0]; | ||
41 | }; | ||
42 | |||
43 | struct sym_ext { | ||
44 | struct rb_node node; | ||
45 | double percent; | ||
46 | char *path; | ||
47 | }; | ||
48 | |||
49 | struct sym_priv { | ||
50 | struct sym_hist *hist; | ||
51 | struct sym_ext *ext; | ||
52 | }; | ||
53 | 36 | ||
54 | static const char *sym_hist_filter; | 37 | static const char *sym_hist_filter; |
55 | 38 | ||
56 | static int sym__alloc_hist(struct symbol *self) | 39 | static int hists__add_entry(struct hists *self, struct addr_location *al) |
57 | { | ||
58 | struct sym_priv *priv = symbol__priv(self); | ||
59 | const int size = (sizeof(*priv->hist) + | ||
60 | (self->end - self->start) * sizeof(u64)); | ||
61 | |||
62 | priv->hist = zalloc(size); | ||
63 | return priv->hist == NULL ? -1 : 0; | ||
64 | } | ||
65 | |||
66 | /* | ||
67 | * collect histogram counts | ||
68 | */ | ||
69 | static int annotate__hist_hit(struct hist_entry *he, u64 ip) | ||
70 | { | ||
71 | unsigned int sym_size, offset; | ||
72 | struct symbol *sym = he->sym; | ||
73 | struct sym_priv *priv; | ||
74 | struct sym_hist *h; | ||
75 | |||
76 | he->count++; | ||
77 | |||
78 | if (!sym || !he->map) | ||
79 | return 0; | ||
80 | |||
81 | priv = symbol__priv(sym); | ||
82 | if (priv->hist == NULL && sym__alloc_hist(sym) < 0) | ||
83 | return -ENOMEM; | ||
84 | |||
85 | sym_size = sym->end - sym->start; | ||
86 | offset = ip - sym->start; | ||
87 | |||
88 | pr_debug3("%s: ip=%#Lx\n", __func__, he->map->unmap_ip(he->map, ip)); | ||
89 | |||
90 | if (offset >= sym_size) | ||
91 | return 0; | ||
92 | |||
93 | h = priv->hist; | ||
94 | h->sum++; | ||
95 | h->ip[offset]++; | ||
96 | |||
97 | pr_debug3("%#Lx %s: count++ [ip: %#Lx, %#Lx] => %Ld\n", he->sym->start, | ||
98 | he->sym->name, ip, ip - he->sym->start, h->ip[offset]); | ||
99 | return 0; | ||
100 | } | ||
101 | |||
102 | static int perf_session__add_hist_entry(struct perf_session *self, | ||
103 | struct addr_location *al, u64 count) | ||
104 | { | 40 | { |
105 | bool hit; | ||
106 | struct hist_entry *he; | 41 | struct hist_entry *he; |
107 | 42 | ||
108 | if (sym_hist_filter != NULL && | 43 | if (sym_hist_filter != NULL && |
@@ -116,11 +51,11 @@ static int perf_session__add_hist_entry(struct perf_session *self, | |||
116 | return 0; | 51 | return 0; |
117 | } | 52 | } |
118 | 53 | ||
119 | he = __perf_session__add_hist_entry(&self->hists, al, NULL, count, &hit); | 54 | he = __hists__add_entry(self, al, NULL, 1); |
120 | if (he == NULL) | 55 | if (he == NULL) |
121 | return -ENOMEM; | 56 | return -ENOMEM; |
122 | 57 | ||
123 | return annotate__hist_hit(he, al->addr); | 58 | return hist_entry__inc_addr_samples(he, al->addr); |
124 | } | 59 | } |
125 | 60 | ||
126 | static int process_sample_event(event_t *event, struct perf_session *session) | 61 | static int process_sample_event(event_t *event, struct perf_session *session) |
@@ -136,7 +71,7 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
136 | return -1; | 71 | return -1; |
137 | } | 72 | } |
138 | 73 | ||
139 | if (!al.filtered && perf_session__add_hist_entry(session, &al, 1)) { | 74 | if (!al.filtered && hists__add_entry(&session->hists, &al)) { |
140 | pr_warning("problem incrementing symbol count, " | 75 | pr_warning("problem incrementing symbol count, " |
141 | "skipping event\n"); | 76 | "skipping event\n"); |
142 | return -1; | 77 | return -1; |
@@ -145,106 +80,11 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
145 | return 0; | 80 | return 0; |
146 | } | 81 | } |
147 | 82 | ||
148 | struct objdump_line { | ||
149 | struct list_head node; | ||
150 | s64 offset; | ||
151 | char *line; | ||
152 | }; | ||
153 | |||
154 | static struct objdump_line *objdump_line__new(s64 offset, char *line) | ||
155 | { | ||
156 | struct objdump_line *self = malloc(sizeof(*self)); | ||
157 | |||
158 | if (self != NULL) { | ||
159 | self->offset = offset; | ||
160 | self->line = line; | ||
161 | } | ||
162 | |||
163 | return self; | ||
164 | } | ||
165 | |||
166 | static void objdump_line__free(struct objdump_line *self) | ||
167 | { | ||
168 | free(self->line); | ||
169 | free(self); | ||
170 | } | ||
171 | |||
172 | static void objdump__add_line(struct list_head *head, struct objdump_line *line) | ||
173 | { | ||
174 | list_add_tail(&line->node, head); | ||
175 | } | ||
176 | |||
177 | static struct objdump_line *objdump__get_next_ip_line(struct list_head *head, | ||
178 | struct objdump_line *pos) | ||
179 | { | ||
180 | list_for_each_entry_continue(pos, head, node) | ||
181 | if (pos->offset >= 0) | ||
182 | return pos; | ||
183 | |||
184 | return NULL; | ||
185 | } | ||
186 | |||
187 | static int parse_line(FILE *file, struct hist_entry *he, | ||
188 | struct list_head *head) | ||
189 | { | ||
190 | struct symbol *sym = he->sym; | ||
191 | struct objdump_line *objdump_line; | ||
192 | char *line = NULL, *tmp, *tmp2; | ||
193 | size_t line_len; | ||
194 | s64 line_ip, offset = -1; | ||
195 | char *c; | ||
196 | |||
197 | if (getline(&line, &line_len, file) < 0) | ||
198 | return -1; | ||
199 | |||
200 | if (!line) | ||
201 | return -1; | ||
202 | |||
203 | c = strchr(line, '\n'); | ||
204 | if (c) | ||
205 | *c = 0; | ||
206 | |||
207 | line_ip = -1; | ||
208 | |||
209 | /* | ||
210 | * Strip leading spaces: | ||
211 | */ | ||
212 | tmp = line; | ||
213 | while (*tmp) { | ||
214 | if (*tmp != ' ') | ||
215 | break; | ||
216 | tmp++; | ||
217 | } | ||
218 | |||
219 | if (*tmp) { | ||
220 | /* | ||
221 | * Parse hexa addresses followed by ':' | ||
222 | */ | ||
223 | line_ip = strtoull(tmp, &tmp2, 16); | ||
224 | if (*tmp2 != ':') | ||
225 | line_ip = -1; | ||
226 | } | ||
227 | |||
228 | if (line_ip != -1) { | ||
229 | u64 start = map__rip_2objdump(he->map, sym->start); | ||
230 | offset = line_ip - start; | ||
231 | } | ||
232 | |||
233 | objdump_line = objdump_line__new(offset, line); | ||
234 | if (objdump_line == NULL) { | ||
235 | free(line); | ||
236 | return -1; | ||
237 | } | ||
238 | objdump__add_line(head, objdump_line); | ||
239 | |||
240 | return 0; | ||
241 | } | ||
242 | |||
243 | static int objdump_line__print(struct objdump_line *self, | 83 | static int objdump_line__print(struct objdump_line *self, |
244 | struct list_head *head, | 84 | struct list_head *head, |
245 | struct hist_entry *he, u64 len) | 85 | struct hist_entry *he, u64 len) |
246 | { | 86 | { |
247 | struct symbol *sym = he->sym; | 87 | struct symbol *sym = he->ms.sym; |
248 | static const char *prev_line; | 88 | static const char *prev_line; |
249 | static const char *prev_color; | 89 | static const char *prev_color; |
250 | 90 | ||
@@ -327,7 +167,7 @@ static void insert_source_line(struct sym_ext *sym_ext) | |||
327 | 167 | ||
328 | static void free_source_line(struct hist_entry *he, int len) | 168 | static void free_source_line(struct hist_entry *he, int len) |
329 | { | 169 | { |
330 | struct sym_priv *priv = symbol__priv(he->sym); | 170 | struct sym_priv *priv = symbol__priv(he->ms.sym); |
331 | struct sym_ext *sym_ext = priv->ext; | 171 | struct sym_ext *sym_ext = priv->ext; |
332 | int i; | 172 | int i; |
333 | 173 | ||
@@ -346,7 +186,7 @@ static void free_source_line(struct hist_entry *he, int len) | |||
346 | static void | 186 | static void |
347 | get_source_line(struct hist_entry *he, int len, const char *filename) | 187 | get_source_line(struct hist_entry *he, int len, const char *filename) |
348 | { | 188 | { |
349 | struct symbol *sym = he->sym; | 189 | struct symbol *sym = he->ms.sym; |
350 | u64 start; | 190 | u64 start; |
351 | int i; | 191 | int i; |
352 | char cmd[PATH_MAX * 2]; | 192 | char cmd[PATH_MAX * 2]; |
@@ -361,7 +201,7 @@ get_source_line(struct hist_entry *he, int len, const char *filename) | |||
361 | if (!priv->ext) | 201 | if (!priv->ext) |
362 | return; | 202 | return; |
363 | 203 | ||
364 | start = he->map->unmap_ip(he->map, sym->start); | 204 | start = he->ms.map->unmap_ip(he->ms.map, sym->start); |
365 | 205 | ||
366 | for (i = 0; i < len; i++) { | 206 | for (i = 0; i < len; i++) { |
367 | char *path = NULL; | 207 | char *path = NULL; |
@@ -425,7 +265,7 @@ static void print_summary(const char *filename) | |||
425 | 265 | ||
426 | static void hist_entry__print_hits(struct hist_entry *self) | 266 | static void hist_entry__print_hits(struct hist_entry *self) |
427 | { | 267 | { |
428 | struct symbol *sym = self->sym; | 268 | struct symbol *sym = self->ms.sym; |
429 | struct sym_priv *priv = symbol__priv(sym); | 269 | struct sym_priv *priv = symbol__priv(sym); |
430 | struct sym_hist *h = priv->hist; | 270 | struct sym_hist *h = priv->hist; |
431 | u64 len = sym->end - sym->start, offset; | 271 | u64 len = sym->end - sym->start, offset; |
@@ -439,23 +279,17 @@ static void hist_entry__print_hits(struct hist_entry *self) | |||
439 | 279 | ||
440 | static void annotate_sym(struct hist_entry *he) | 280 | static void annotate_sym(struct hist_entry *he) |
441 | { | 281 | { |
442 | struct map *map = he->map; | 282 | struct map *map = he->ms.map; |
443 | struct dso *dso = map->dso; | 283 | struct dso *dso = map->dso; |
444 | struct symbol *sym = he->sym; | 284 | struct symbol *sym = he->ms.sym; |
445 | const char *filename = dso->long_name, *d_filename; | 285 | const char *filename = dso->long_name, *d_filename; |
446 | u64 len; | 286 | u64 len; |
447 | char command[PATH_MAX*2]; | ||
448 | FILE *file; | ||
449 | LIST_HEAD(head); | 287 | LIST_HEAD(head); |
450 | struct objdump_line *pos, *n; | 288 | struct objdump_line *pos, *n; |
451 | 289 | ||
452 | if (!filename) | 290 | if (hist_entry__annotate(he, &head) < 0) |
453 | return; | 291 | return; |
454 | 292 | ||
455 | pr_debug("%s: filename=%s, sym=%s, start=%#Lx, end=%#Lx\n", __func__, | ||
456 | filename, sym->name, map->unmap_ip(map, sym->start), | ||
457 | map->unmap_ip(map, sym->end)); | ||
458 | |||
459 | if (full_paths) | 293 | if (full_paths) |
460 | d_filename = filename; | 294 | d_filename = filename; |
461 | else | 295 | else |
@@ -472,29 +306,6 @@ static void annotate_sym(struct hist_entry *he) | |||
472 | printf(" Percent | Source code & Disassembly of %s\n", d_filename); | 306 | printf(" Percent | Source code & Disassembly of %s\n", d_filename); |
473 | printf("------------------------------------------------\n"); | 307 | printf("------------------------------------------------\n"); |
474 | 308 | ||
475 | if (verbose >= 2) | ||
476 | printf("annotating [%p] %30s : [%p] %30s\n", | ||
477 | dso, dso->long_name, sym, sym->name); | ||
478 | |||
479 | sprintf(command, "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s", | ||
480 | map__rip_2objdump(map, sym->start), | ||
481 | map__rip_2objdump(map, sym->end), | ||
482 | filename, filename); | ||
483 | |||
484 | if (verbose >= 3) | ||
485 | printf("doing: %s\n", command); | ||
486 | |||
487 | file = popen(command, "r"); | ||
488 | if (!file) | ||
489 | return; | ||
490 | |||
491 | while (!feof(file)) { | ||
492 | if (parse_line(file, he, &head) < 0) | ||
493 | break; | ||
494 | } | ||
495 | |||
496 | pclose(file); | ||
497 | |||
498 | if (verbose) | 309 | if (verbose) |
499 | hist_entry__print_hits(he); | 310 | hist_entry__print_hits(he); |
500 | 311 | ||
@@ -508,25 +319,25 @@ static void annotate_sym(struct hist_entry *he) | |||
508 | free_source_line(he, len); | 319 | free_source_line(he, len); |
509 | } | 320 | } |
510 | 321 | ||
511 | static void perf_session__find_annotations(struct perf_session *self) | 322 | static void hists__find_annotations(struct hists *self) |
512 | { | 323 | { |
513 | struct rb_node *nd; | 324 | struct rb_node *nd; |
514 | 325 | ||
515 | for (nd = rb_first(&self->hists); nd; nd = rb_next(nd)) { | 326 | for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) { |
516 | struct hist_entry *he = rb_entry(nd, struct hist_entry, rb_node); | 327 | struct hist_entry *he = rb_entry(nd, struct hist_entry, rb_node); |
517 | struct sym_priv *priv; | 328 | struct sym_priv *priv; |
518 | 329 | ||
519 | if (he->sym == NULL) | 330 | if (he->ms.sym == NULL) |
520 | continue; | 331 | continue; |
521 | 332 | ||
522 | priv = symbol__priv(he->sym); | 333 | priv = symbol__priv(he->ms.sym); |
523 | if (priv->hist == NULL) | 334 | if (priv->hist == NULL) |
524 | continue; | 335 | continue; |
525 | 336 | ||
526 | annotate_sym(he); | 337 | annotate_sym(he); |
527 | /* | 338 | /* |
528 | * Since we have a hist_entry per IP for the same symbol, free | 339 | * Since we have a hist_entry per IP for the same symbol, free |
529 | * he->sym->hist to signal we already processed this symbol. | 340 | * he->ms.sym->hist to signal we already processed this symbol. |
530 | */ | 341 | */ |
531 | free(priv->hist); | 342 | free(priv->hist); |
532 | priv->hist = NULL; | 343 | priv->hist = NULL; |
@@ -545,7 +356,7 @@ static int __cmd_annotate(void) | |||
545 | int ret; | 356 | int ret; |
546 | struct perf_session *session; | 357 | struct perf_session *session; |
547 | 358 | ||
548 | session = perf_session__new(input_name, O_RDONLY, force); | 359 | session = perf_session__new(input_name, O_RDONLY, force, false); |
549 | if (session == NULL) | 360 | if (session == NULL) |
550 | return -ENOMEM; | 361 | return -ENOMEM; |
551 | 362 | ||
@@ -554,7 +365,7 @@ static int __cmd_annotate(void) | |||
554 | goto out_delete; | 365 | goto out_delete; |
555 | 366 | ||
556 | if (dump_trace) { | 367 | if (dump_trace) { |
557 | event__print_totals(); | 368 | perf_session__fprintf_nr_events(session, stdout); |
558 | goto out_delete; | 369 | goto out_delete; |
559 | } | 370 | } |
560 | 371 | ||
@@ -562,11 +373,11 @@ static int __cmd_annotate(void) | |||
562 | perf_session__fprintf(session, stdout); | 373 | perf_session__fprintf(session, stdout); |
563 | 374 | ||
564 | if (verbose > 2) | 375 | if (verbose > 2) |
565 | dsos__fprintf(stdout); | 376 | perf_session__fprintf_dsos(session, stdout); |
566 | 377 | ||
567 | perf_session__collapse_resort(&session->hists); | 378 | hists__collapse_resort(&session->hists); |
568 | perf_session__output_resort(&session->hists, session->event_total[0]); | 379 | hists__output_resort(&session->hists); |
569 | perf_session__find_annotations(session); | 380 | hists__find_annotations(&session->hists); |
570 | out_delete: | 381 | out_delete: |
571 | perf_session__delete(session); | 382 | perf_session__delete(session); |
572 | 383 | ||
@@ -581,10 +392,12 @@ static const char * const annotate_usage[] = { | |||
581 | static const struct option options[] = { | 392 | static const struct option options[] = { |
582 | OPT_STRING('i', "input", &input_name, "file", | 393 | OPT_STRING('i', "input", &input_name, "file", |
583 | "input file name"), | 394 | "input file name"), |
395 | OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]", | ||
396 | "only consider symbols in these dsos"), | ||
584 | OPT_STRING('s', "symbol", &sym_hist_filter, "symbol", | 397 | OPT_STRING('s', "symbol", &sym_hist_filter, "symbol", |
585 | "symbol to annotate"), | 398 | "symbol to annotate"), |
586 | OPT_BOOLEAN('f', "force", &force, "don't complain, do it"), | 399 | OPT_BOOLEAN('f', "force", &force, "don't complain, do it"), |
587 | OPT_BOOLEAN('v', "verbose", &verbose, | 400 | OPT_INCR('v', "verbose", &verbose, |
588 | "be more verbose (show symbol address, etc)"), | 401 | "be more verbose (show symbol address, etc)"), |
589 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, | 402 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, |
590 | "dump raw trace in ASCII"), | 403 | "dump raw trace in ASCII"), |
diff --git a/tools/perf/builtin-bench.c b/tools/perf/builtin-bench.c index 46996774e559..fcb96269852a 100644 --- a/tools/perf/builtin-bench.c +++ b/tools/perf/builtin-bench.c | |||
@@ -95,7 +95,7 @@ static void dump_suites(int subsys_index) | |||
95 | return; | 95 | return; |
96 | } | 96 | } |
97 | 97 | ||
98 | static char *bench_format_str; | 98 | static const char *bench_format_str; |
99 | int bench_format = BENCH_FORMAT_DEFAULT; | 99 | int bench_format = BENCH_FORMAT_DEFAULT; |
100 | 100 | ||
101 | static const struct option bench_options[] = { | 101 | static const struct option bench_options[] = { |
@@ -126,7 +126,7 @@ static void print_usage(void) | |||
126 | printf("\n"); | 126 | printf("\n"); |
127 | } | 127 | } |
128 | 128 | ||
129 | static int bench_str2int(char *str) | 129 | static int bench_str2int(const char *str) |
130 | { | 130 | { |
131 | if (!str) | 131 | if (!str) |
132 | return BENCH_FORMAT_DEFAULT; | 132 | return BENCH_FORMAT_DEFAULT; |
diff --git a/tools/perf/builtin-buildid-cache.c b/tools/perf/builtin-buildid-cache.c index 30a05f552c96..f8e3d1852029 100644 --- a/tools/perf/builtin-buildid-cache.c +++ b/tools/perf/builtin-buildid-cache.c | |||
@@ -27,7 +27,7 @@ static const struct option buildid_cache_options[] = { | |||
27 | "file list", "file(s) to add"), | 27 | "file list", "file(s) to add"), |
28 | OPT_STRING('r', "remove", &remove_name_list_str, "file list", | 28 | OPT_STRING('r', "remove", &remove_name_list_str, "file list", |
29 | "file(s) to remove"), | 29 | "file(s) to remove"), |
30 | OPT_BOOLEAN('v', "verbose", &verbose, "be more verbose"), | 30 | OPT_INCR('v', "verbose", &verbose, "be more verbose"), |
31 | OPT_END() | 31 | OPT_END() |
32 | }; | 32 | }; |
33 | 33 | ||
diff --git a/tools/perf/builtin-buildid-list.c b/tools/perf/builtin-buildid-list.c index d0675c02f81e..44a47e13bd67 100644 --- a/tools/perf/builtin-buildid-list.c +++ b/tools/perf/builtin-buildid-list.c | |||
@@ -16,7 +16,7 @@ | |||
16 | #include "util/symbol.h" | 16 | #include "util/symbol.h" |
17 | 17 | ||
18 | static char const *input_name = "perf.data"; | 18 | static char const *input_name = "perf.data"; |
19 | static int force; | 19 | static bool force; |
20 | static bool with_hits; | 20 | static bool with_hits; |
21 | 21 | ||
22 | static const char * const buildid_list_usage[] = { | 22 | static const char * const buildid_list_usage[] = { |
@@ -29,7 +29,7 @@ static const struct option options[] = { | |||
29 | OPT_STRING('i', "input", &input_name, "file", | 29 | OPT_STRING('i', "input", &input_name, "file", |
30 | "input file name"), | 30 | "input file name"), |
31 | OPT_BOOLEAN('f', "force", &force, "don't complain, do it"), | 31 | OPT_BOOLEAN('f', "force", &force, "don't complain, do it"), |
32 | OPT_BOOLEAN('v', "verbose", &verbose, | 32 | OPT_INCR('v', "verbose", &verbose, |
33 | "be more verbose"), | 33 | "be more verbose"), |
34 | OPT_END() | 34 | OPT_END() |
35 | }; | 35 | }; |
@@ -39,14 +39,14 @@ static int __cmd_buildid_list(void) | |||
39 | int err = -1; | 39 | int err = -1; |
40 | struct perf_session *session; | 40 | struct perf_session *session; |
41 | 41 | ||
42 | session = perf_session__new(input_name, O_RDONLY, force); | 42 | session = perf_session__new(input_name, O_RDONLY, force, false); |
43 | if (session == NULL) | 43 | if (session == NULL) |
44 | return -1; | 44 | return -1; |
45 | 45 | ||
46 | if (with_hits) | 46 | if (with_hits) |
47 | perf_session__process_events(session, &build_id__mark_dso_hit_ops); | 47 | perf_session__process_events(session, &build_id__mark_dso_hit_ops); |
48 | 48 | ||
49 | dsos__fprintf_buildid(stdout, with_hits); | 49 | perf_session__fprintf_dsos_buildid(session, stdout, with_hits); |
50 | 50 | ||
51 | perf_session__delete(session); | 51 | perf_session__delete(session); |
52 | return err; | 52 | return err; |
diff --git a/tools/perf/builtin-diff.c b/tools/perf/builtin-diff.c index 1ea15d8aeed1..a6e2fdc7a04e 100644 --- a/tools/perf/builtin-diff.c +++ b/tools/perf/builtin-diff.c | |||
@@ -19,23 +19,15 @@ | |||
19 | static char const *input_old = "perf.data.old", | 19 | static char const *input_old = "perf.data.old", |
20 | *input_new = "perf.data"; | 20 | *input_new = "perf.data"; |
21 | static char diff__default_sort_order[] = "dso,symbol"; | 21 | static char diff__default_sort_order[] = "dso,symbol"; |
22 | static int force; | 22 | static bool force; |
23 | static bool show_displacement; | 23 | static bool show_displacement; |
24 | 24 | ||
25 | static int perf_session__add_hist_entry(struct perf_session *self, | 25 | static int hists__add_entry(struct hists *self, |
26 | struct addr_location *al, u64 count) | 26 | struct addr_location *al, u64 period) |
27 | { | 27 | { |
28 | bool hit; | 28 | if (__hists__add_entry(self, al, NULL, period) != NULL) |
29 | struct hist_entry *he = __perf_session__add_hist_entry(&self->hists, | 29 | return 0; |
30 | al, NULL, | 30 | return -ENOMEM; |
31 | count, &hit); | ||
32 | if (he == NULL) | ||
33 | return -ENOMEM; | ||
34 | |||
35 | if (hit) | ||
36 | he->count += count; | ||
37 | |||
38 | return 0; | ||
39 | } | 31 | } |
40 | 32 | ||
41 | static int diff__process_sample_event(event_t *event, struct perf_session *session) | 33 | static int diff__process_sample_event(event_t *event, struct perf_session *session) |
@@ -57,12 +49,12 @@ static int diff__process_sample_event(event_t *event, struct perf_session *sessi | |||
57 | 49 | ||
58 | event__parse_sample(event, session->sample_type, &data); | 50 | event__parse_sample(event, session->sample_type, &data); |
59 | 51 | ||
60 | if (perf_session__add_hist_entry(session, &al, data.period)) { | 52 | if (hists__add_entry(&session->hists, &al, data.period)) { |
61 | pr_warning("problem incrementing symbol count, skipping event\n"); | 53 | pr_warning("problem incrementing symbol period, skipping event\n"); |
62 | return -1; | 54 | return -1; |
63 | } | 55 | } |
64 | 56 | ||
65 | session->events_stats.total += data.period; | 57 | session->hists.stats.total_period += data.period; |
66 | return 0; | 58 | return 0; |
67 | } | 59 | } |
68 | 60 | ||
@@ -95,35 +87,34 @@ static void perf_session__insert_hist_entry_by_name(struct rb_root *root, | |||
95 | rb_insert_color(&he->rb_node, root); | 87 | rb_insert_color(&he->rb_node, root); |
96 | } | 88 | } |
97 | 89 | ||
98 | static void perf_session__resort_hist_entries(struct perf_session *self) | 90 | static void hists__resort_entries(struct hists *self) |
99 | { | 91 | { |
100 | unsigned long position = 1; | 92 | unsigned long position = 1; |
101 | struct rb_root tmp = RB_ROOT; | 93 | struct rb_root tmp = RB_ROOT; |
102 | struct rb_node *next = rb_first(&self->hists); | 94 | struct rb_node *next = rb_first(&self->entries); |
103 | 95 | ||
104 | while (next != NULL) { | 96 | while (next != NULL) { |
105 | struct hist_entry *n = rb_entry(next, struct hist_entry, rb_node); | 97 | struct hist_entry *n = rb_entry(next, struct hist_entry, rb_node); |
106 | 98 | ||
107 | next = rb_next(&n->rb_node); | 99 | next = rb_next(&n->rb_node); |
108 | rb_erase(&n->rb_node, &self->hists); | 100 | rb_erase(&n->rb_node, &self->entries); |
109 | n->position = position++; | 101 | n->position = position++; |
110 | perf_session__insert_hist_entry_by_name(&tmp, n); | 102 | perf_session__insert_hist_entry_by_name(&tmp, n); |
111 | } | 103 | } |
112 | 104 | ||
113 | self->hists = tmp; | 105 | self->entries = tmp; |
114 | } | 106 | } |
115 | 107 | ||
116 | static void perf_session__set_hist_entries_positions(struct perf_session *self) | 108 | static void hists__set_positions(struct hists *self) |
117 | { | 109 | { |
118 | perf_session__output_resort(&self->hists, self->events_stats.total); | 110 | hists__output_resort(self); |
119 | perf_session__resort_hist_entries(self); | 111 | hists__resort_entries(self); |
120 | } | 112 | } |
121 | 113 | ||
122 | static struct hist_entry * | 114 | static struct hist_entry *hists__find_entry(struct hists *self, |
123 | perf_session__find_hist_entry(struct perf_session *self, | 115 | struct hist_entry *he) |
124 | struct hist_entry *he) | ||
125 | { | 116 | { |
126 | struct rb_node *n = self->hists.rb_node; | 117 | struct rb_node *n = self->entries.rb_node; |
127 | 118 | ||
128 | while (n) { | 119 | while (n) { |
129 | struct hist_entry *iter = rb_entry(n, struct hist_entry, rb_node); | 120 | struct hist_entry *iter = rb_entry(n, struct hist_entry, rb_node); |
@@ -140,14 +131,13 @@ perf_session__find_hist_entry(struct perf_session *self, | |||
140 | return NULL; | 131 | return NULL; |
141 | } | 132 | } |
142 | 133 | ||
143 | static void perf_session__match_hists(struct perf_session *old_session, | 134 | static void hists__match(struct hists *older, struct hists *newer) |
144 | struct perf_session *new_session) | ||
145 | { | 135 | { |
146 | struct rb_node *nd; | 136 | struct rb_node *nd; |
147 | 137 | ||
148 | for (nd = rb_first(&new_session->hists); nd; nd = rb_next(nd)) { | 138 | for (nd = rb_first(&newer->entries); nd; nd = rb_next(nd)) { |
149 | struct hist_entry *pos = rb_entry(nd, struct hist_entry, rb_node); | 139 | struct hist_entry *pos = rb_entry(nd, struct hist_entry, rb_node); |
150 | pos->pair = perf_session__find_hist_entry(old_session, pos); | 140 | pos->pair = hists__find_entry(older, pos); |
151 | } | 141 | } |
152 | } | 142 | } |
153 | 143 | ||
@@ -156,8 +146,8 @@ static int __cmd_diff(void) | |||
156 | int ret, i; | 146 | int ret, i; |
157 | struct perf_session *session[2]; | 147 | struct perf_session *session[2]; |
158 | 148 | ||
159 | session[0] = perf_session__new(input_old, O_RDONLY, force); | 149 | session[0] = perf_session__new(input_old, O_RDONLY, force, false); |
160 | session[1] = perf_session__new(input_new, O_RDONLY, force); | 150 | session[1] = perf_session__new(input_new, O_RDONLY, force, false); |
161 | if (session[0] == NULL || session[1] == NULL) | 151 | if (session[0] == NULL || session[1] == NULL) |
162 | return -ENOMEM; | 152 | return -ENOMEM; |
163 | 153 | ||
@@ -167,15 +157,13 @@ static int __cmd_diff(void) | |||
167 | goto out_delete; | 157 | goto out_delete; |
168 | } | 158 | } |
169 | 159 | ||
170 | perf_session__output_resort(&session[1]->hists, | 160 | hists__output_resort(&session[1]->hists); |
171 | session[1]->events_stats.total); | ||
172 | if (show_displacement) | 161 | if (show_displacement) |
173 | perf_session__set_hist_entries_positions(session[0]); | 162 | hists__set_positions(&session[0]->hists); |
174 | 163 | ||
175 | perf_session__match_hists(session[0], session[1]); | 164 | hists__match(&session[0]->hists, &session[1]->hists); |
176 | perf_session__fprintf_hists(&session[1]->hists, session[0], | 165 | hists__fprintf(&session[1]->hists, &session[0]->hists, |
177 | show_displacement, stdout, | 166 | show_displacement, stdout); |
178 | session[1]->events_stats.total); | ||
179 | out_delete: | 167 | out_delete: |
180 | for (i = 0; i < 2; ++i) | 168 | for (i = 0; i < 2; ++i) |
181 | perf_session__delete(session[i]); | 169 | perf_session__delete(session[i]); |
@@ -188,7 +176,7 @@ static const char * const diff_usage[] = { | |||
188 | }; | 176 | }; |
189 | 177 | ||
190 | static const struct option options[] = { | 178 | static const struct option options[] = { |
191 | OPT_BOOLEAN('v', "verbose", &verbose, | 179 | OPT_INCR('v', "verbose", &verbose, |
192 | "be more verbose (show symbol address, etc)"), | 180 | "be more verbose (show symbol address, etc)"), |
193 | OPT_BOOLEAN('m', "displacement", &show_displacement, | 181 | OPT_BOOLEAN('m', "displacement", &show_displacement, |
194 | "Show position displacement relative to baseline"), | 182 | "Show position displacement relative to baseline"), |
@@ -225,6 +213,10 @@ int cmd_diff(int argc, const char **argv, const char *prefix __used) | |||
225 | input_new = argv[1]; | 213 | input_new = argv[1]; |
226 | } else | 214 | } else |
227 | input_new = argv[0]; | 215 | input_new = argv[0]; |
216 | } else if (symbol_conf.default_guest_vmlinux_name || | ||
217 | symbol_conf.default_guest_kallsyms) { | ||
218 | input_old = "perf.data.host"; | ||
219 | input_new = "perf.data.guest"; | ||
228 | } | 220 | } |
229 | 221 | ||
230 | symbol_conf.exclude_other = false; | 222 | symbol_conf.exclude_other = false; |
diff --git a/tools/perf/builtin-help.c b/tools/perf/builtin-help.c index 215b584007b1..6d5a8a7faf48 100644 --- a/tools/perf/builtin-help.c +++ b/tools/perf/builtin-help.c | |||
@@ -29,14 +29,14 @@ enum help_format { | |||
29 | HELP_FORMAT_WEB, | 29 | HELP_FORMAT_WEB, |
30 | }; | 30 | }; |
31 | 31 | ||
32 | static int show_all = 0; | 32 | static bool show_all = false; |
33 | static enum help_format help_format = HELP_FORMAT_MAN; | 33 | static enum help_format help_format = HELP_FORMAT_MAN; |
34 | static struct option builtin_help_options[] = { | 34 | static struct option builtin_help_options[] = { |
35 | OPT_BOOLEAN('a', "all", &show_all, "print all available commands"), | 35 | OPT_BOOLEAN('a', "all", &show_all, "print all available commands"), |
36 | OPT_SET_INT('m', "man", &help_format, "show man page", HELP_FORMAT_MAN), | 36 | OPT_SET_UINT('m', "man", &help_format, "show man page", HELP_FORMAT_MAN), |
37 | OPT_SET_INT('w', "web", &help_format, "show manual in web browser", | 37 | OPT_SET_UINT('w', "web", &help_format, "show manual in web browser", |
38 | HELP_FORMAT_WEB), | 38 | HELP_FORMAT_WEB), |
39 | OPT_SET_INT('i', "info", &help_format, "show info page", | 39 | OPT_SET_UINT('i', "info", &help_format, "show info page", |
40 | HELP_FORMAT_INFO), | 40 | HELP_FORMAT_INFO), |
41 | OPT_END(), | 41 | OPT_END(), |
42 | }; | 42 | }; |
diff --git a/tools/perf/builtin-inject.c b/tools/perf/builtin-inject.c new file mode 100644 index 000000000000..8e3e47b064ce --- /dev/null +++ b/tools/perf/builtin-inject.c | |||
@@ -0,0 +1,228 @@ | |||
1 | /* | ||
2 | * builtin-inject.c | ||
3 | * | ||
4 | * Builtin inject command: Examine the live mode (stdin) event stream | ||
5 | * and repipe it to stdout while optionally injecting additional | ||
6 | * events into it. | ||
7 | */ | ||
8 | #include "builtin.h" | ||
9 | |||
10 | #include "perf.h" | ||
11 | #include "util/session.h" | ||
12 | #include "util/debug.h" | ||
13 | |||
14 | #include "util/parse-options.h" | ||
15 | |||
16 | static char const *input_name = "-"; | ||
17 | static bool inject_build_ids; | ||
18 | |||
19 | static int event__repipe(event_t *event __used, | ||
20 | struct perf_session *session __used) | ||
21 | { | ||
22 | uint32_t size; | ||
23 | void *buf = event; | ||
24 | |||
25 | size = event->header.size; | ||
26 | |||
27 | while (size) { | ||
28 | int ret = write(STDOUT_FILENO, buf, size); | ||
29 | if (ret < 0) | ||
30 | return -errno; | ||
31 | |||
32 | size -= ret; | ||
33 | buf += ret; | ||
34 | } | ||
35 | |||
36 | return 0; | ||
37 | } | ||
38 | |||
39 | static int event__repipe_mmap(event_t *self, struct perf_session *session) | ||
40 | { | ||
41 | int err; | ||
42 | |||
43 | err = event__process_mmap(self, session); | ||
44 | event__repipe(self, session); | ||
45 | |||
46 | return err; | ||
47 | } | ||
48 | |||
49 | static int event__repipe_task(event_t *self, struct perf_session *session) | ||
50 | { | ||
51 | int err; | ||
52 | |||
53 | err = event__process_task(self, session); | ||
54 | event__repipe(self, session); | ||
55 | |||
56 | return err; | ||
57 | } | ||
58 | |||
59 | static int event__repipe_tracing_data(event_t *self, | ||
60 | struct perf_session *session) | ||
61 | { | ||
62 | int err; | ||
63 | |||
64 | event__repipe(self, session); | ||
65 | err = event__process_tracing_data(self, session); | ||
66 | |||
67 | return err; | ||
68 | } | ||
69 | |||
70 | static int dso__read_build_id(struct dso *self) | ||
71 | { | ||
72 | if (self->has_build_id) | ||
73 | return 0; | ||
74 | |||
75 | if (filename__read_build_id(self->long_name, self->build_id, | ||
76 | sizeof(self->build_id)) > 0) { | ||
77 | self->has_build_id = true; | ||
78 | return 0; | ||
79 | } | ||
80 | |||
81 | return -1; | ||
82 | } | ||
83 | |||
84 | static int dso__inject_build_id(struct dso *self, struct perf_session *session) | ||
85 | { | ||
86 | u16 misc = PERF_RECORD_MISC_USER; | ||
87 | struct machine *machine; | ||
88 | int err; | ||
89 | |||
90 | if (dso__read_build_id(self) < 0) { | ||
91 | pr_debug("no build_id found for %s\n", self->long_name); | ||
92 | return -1; | ||
93 | } | ||
94 | |||
95 | machine = perf_session__find_host_machine(session); | ||
96 | if (machine == NULL) { | ||
97 | pr_err("Can't find machine for session\n"); | ||
98 | return -1; | ||
99 | } | ||
100 | |||
101 | if (self->kernel) | ||
102 | misc = PERF_RECORD_MISC_KERNEL; | ||
103 | |||
104 | err = event__synthesize_build_id(self, misc, event__repipe, | ||
105 | machine, session); | ||
106 | if (err) { | ||
107 | pr_err("Can't synthesize build_id event for %s\n", self->long_name); | ||
108 | return -1; | ||
109 | } | ||
110 | |||
111 | return 0; | ||
112 | } | ||
113 | |||
114 | static int event__inject_buildid(event_t *event, struct perf_session *session) | ||
115 | { | ||
116 | struct addr_location al; | ||
117 | struct thread *thread; | ||
118 | u8 cpumode; | ||
119 | |||
120 | cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK; | ||
121 | |||
122 | thread = perf_session__findnew(session, event->ip.pid); | ||
123 | if (thread == NULL) { | ||
124 | pr_err("problem processing %d event, skipping it.\n", | ||
125 | event->header.type); | ||
126 | goto repipe; | ||
127 | } | ||
128 | |||
129 | thread__find_addr_map(thread, session, cpumode, MAP__FUNCTION, | ||
130 | event->ip.pid, event->ip.ip, &al); | ||
131 | |||
132 | if (al.map != NULL) { | ||
133 | if (!al.map->dso->hit) { | ||
134 | al.map->dso->hit = 1; | ||
135 | if (map__load(al.map, NULL) >= 0) { | ||
136 | dso__inject_build_id(al.map->dso, session); | ||
137 | /* | ||
138 | * If this fails, too bad, let the other side | ||
139 | * account this as unresolved. | ||
140 | */ | ||
141 | } else | ||
142 | pr_warning("no symbols found in %s, maybe " | ||
143 | "install a debug package?\n", | ||
144 | al.map->dso->long_name); | ||
145 | } | ||
146 | } | ||
147 | |||
148 | repipe: | ||
149 | event__repipe(event, session); | ||
150 | return 0; | ||
151 | } | ||
152 | |||
153 | struct perf_event_ops inject_ops = { | ||
154 | .sample = event__repipe, | ||
155 | .mmap = event__repipe, | ||
156 | .comm = event__repipe, | ||
157 | .fork = event__repipe, | ||
158 | .exit = event__repipe, | ||
159 | .lost = event__repipe, | ||
160 | .read = event__repipe, | ||
161 | .throttle = event__repipe, | ||
162 | .unthrottle = event__repipe, | ||
163 | .attr = event__repipe, | ||
164 | .event_type = event__repipe, | ||
165 | .tracing_data = event__repipe, | ||
166 | .build_id = event__repipe, | ||
167 | }; | ||
168 | |||
169 | extern volatile int session_done; | ||
170 | |||
171 | static void sig_handler(int sig __attribute__((__unused__))) | ||
172 | { | ||
173 | session_done = 1; | ||
174 | } | ||
175 | |||
176 | static int __cmd_inject(void) | ||
177 | { | ||
178 | struct perf_session *session; | ||
179 | int ret = -EINVAL; | ||
180 | |||
181 | signal(SIGINT, sig_handler); | ||
182 | |||
183 | if (inject_build_ids) { | ||
184 | inject_ops.sample = event__inject_buildid; | ||
185 | inject_ops.mmap = event__repipe_mmap; | ||
186 | inject_ops.fork = event__repipe_task; | ||
187 | inject_ops.tracing_data = event__repipe_tracing_data; | ||
188 | } | ||
189 | |||
190 | session = perf_session__new(input_name, O_RDONLY, false, true); | ||
191 | if (session == NULL) | ||
192 | return -ENOMEM; | ||
193 | |||
194 | ret = perf_session__process_events(session, &inject_ops); | ||
195 | |||
196 | perf_session__delete(session); | ||
197 | |||
198 | return ret; | ||
199 | } | ||
200 | |||
201 | static const char * const report_usage[] = { | ||
202 | "perf inject [<options>]", | ||
203 | NULL | ||
204 | }; | ||
205 | |||
206 | static const struct option options[] = { | ||
207 | OPT_BOOLEAN('b', "build-ids", &inject_build_ids, | ||
208 | "Inject build-ids into the output stream"), | ||
209 | OPT_INCR('v', "verbose", &verbose, | ||
210 | "be more verbose (show build ids, etc)"), | ||
211 | OPT_END() | ||
212 | }; | ||
213 | |||
214 | int cmd_inject(int argc, const char **argv, const char *prefix __used) | ||
215 | { | ||
216 | argc = parse_options(argc, argv, options, report_usage, 0); | ||
217 | |||
218 | /* | ||
219 | * Any (unrecognized) arguments left? | ||
220 | */ | ||
221 | if (argc) | ||
222 | usage_with_options(report_usage, options); | ||
223 | |||
224 | if (symbol__init() < 0) | ||
225 | return -1; | ||
226 | |||
227 | return __cmd_inject(); | ||
228 | } | ||
diff --git a/tools/perf/builtin-kmem.c b/tools/perf/builtin-kmem.c index 924a9518931a..31f60a2535e0 100644 --- a/tools/perf/builtin-kmem.c +++ b/tools/perf/builtin-kmem.c | |||
@@ -335,8 +335,9 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
335 | } | 335 | } |
336 | 336 | ||
337 | static struct perf_event_ops event_ops = { | 337 | static struct perf_event_ops event_ops = { |
338 | .sample = process_sample_event, | 338 | .sample = process_sample_event, |
339 | .comm = event__process_comm, | 339 | .comm = event__process_comm, |
340 | .ordered_samples = true, | ||
340 | }; | 341 | }; |
341 | 342 | ||
342 | static double fragmentation(unsigned long n_req, unsigned long n_alloc) | 343 | static double fragmentation(unsigned long n_req, unsigned long n_alloc) |
@@ -351,6 +352,7 @@ static void __print_result(struct rb_root *root, struct perf_session *session, | |||
351 | int n_lines, int is_caller) | 352 | int n_lines, int is_caller) |
352 | { | 353 | { |
353 | struct rb_node *next; | 354 | struct rb_node *next; |
355 | struct machine *machine; | ||
354 | 356 | ||
355 | printf("%.102s\n", graph_dotted_line); | 357 | printf("%.102s\n", graph_dotted_line); |
356 | printf(" %-34s |", is_caller ? "Callsite": "Alloc Ptr"); | 358 | printf(" %-34s |", is_caller ? "Callsite": "Alloc Ptr"); |
@@ -359,23 +361,29 @@ static void __print_result(struct rb_root *root, struct perf_session *session, | |||
359 | 361 | ||
360 | next = rb_first(root); | 362 | next = rb_first(root); |
361 | 363 | ||
364 | machine = perf_session__find_host_machine(session); | ||
365 | if (!machine) { | ||
366 | pr_err("__print_result: couldn't find kernel information\n"); | ||
367 | return; | ||
368 | } | ||
362 | while (next && n_lines--) { | 369 | while (next && n_lines--) { |
363 | struct alloc_stat *data = rb_entry(next, struct alloc_stat, | 370 | struct alloc_stat *data = rb_entry(next, struct alloc_stat, |
364 | node); | 371 | node); |
365 | struct symbol *sym = NULL; | 372 | struct symbol *sym = NULL; |
373 | struct map *map; | ||
366 | char buf[BUFSIZ]; | 374 | char buf[BUFSIZ]; |
367 | u64 addr; | 375 | u64 addr; |
368 | 376 | ||
369 | if (is_caller) { | 377 | if (is_caller) { |
370 | addr = data->call_site; | 378 | addr = data->call_site; |
371 | if (!raw_ip) | 379 | if (!raw_ip) |
372 | sym = map_groups__find_function(&session->kmaps, addr, NULL); | 380 | sym = machine__find_kernel_function(machine, addr, &map, NULL); |
373 | } else | 381 | } else |
374 | addr = data->ptr; | 382 | addr = data->ptr; |
375 | 383 | ||
376 | if (sym != NULL) | 384 | if (sym != NULL) |
377 | snprintf(buf, sizeof(buf), "%s+%Lx", sym->name, | 385 | snprintf(buf, sizeof(buf), "%s+%Lx", sym->name, |
378 | addr - sym->start); | 386 | addr - map->unmap_ip(map, sym->start)); |
379 | else | 387 | else |
380 | snprintf(buf, sizeof(buf), "%#Lx", addr); | 388 | snprintf(buf, sizeof(buf), "%#Lx", addr); |
381 | printf(" %-34s |", buf); | 389 | printf(" %-34s |", buf); |
@@ -484,10 +492,13 @@ static void sort_result(void) | |||
484 | static int __cmd_kmem(void) | 492 | static int __cmd_kmem(void) |
485 | { | 493 | { |
486 | int err = -EINVAL; | 494 | int err = -EINVAL; |
487 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0); | 495 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0, false); |
488 | if (session == NULL) | 496 | if (session == NULL) |
489 | return -ENOMEM; | 497 | return -ENOMEM; |
490 | 498 | ||
499 | if (perf_session__create_kernel_maps(session) < 0) | ||
500 | goto out_delete; | ||
501 | |||
491 | if (!perf_session__has_traces(session, "kmem record")) | 502 | if (!perf_session__has_traces(session, "kmem record")) |
492 | goto out_delete; | 503 | goto out_delete; |
493 | 504 | ||
@@ -718,7 +729,6 @@ static const char *record_args[] = { | |||
718 | "record", | 729 | "record", |
719 | "-a", | 730 | "-a", |
720 | "-R", | 731 | "-R", |
721 | "-M", | ||
722 | "-f", | 732 | "-f", |
723 | "-c", "1", | 733 | "-c", "1", |
724 | "-e", "kmem:kmalloc", | 734 | "-e", "kmem:kmalloc", |
diff --git a/tools/perf/builtin-kvm.c b/tools/perf/builtin-kvm.c new file mode 100644 index 000000000000..34d1e853829d --- /dev/null +++ b/tools/perf/builtin-kvm.c | |||
@@ -0,0 +1,144 @@ | |||
1 | #include "builtin.h" | ||
2 | #include "perf.h" | ||
3 | |||
4 | #include "util/util.h" | ||
5 | #include "util/cache.h" | ||
6 | #include "util/symbol.h" | ||
7 | #include "util/thread.h" | ||
8 | #include "util/header.h" | ||
9 | #include "util/session.h" | ||
10 | |||
11 | #include "util/parse-options.h" | ||
12 | #include "util/trace-event.h" | ||
13 | |||
14 | #include "util/debug.h" | ||
15 | |||
16 | #include <sys/prctl.h> | ||
17 | |||
18 | #include <semaphore.h> | ||
19 | #include <pthread.h> | ||
20 | #include <math.h> | ||
21 | |||
22 | static const char *file_name; | ||
23 | static char name_buffer[256]; | ||
24 | |||
25 | bool perf_host = 1; | ||
26 | bool perf_guest; | ||
27 | |||
28 | static const char * const kvm_usage[] = { | ||
29 | "perf kvm [<options>] {top|record|report|diff|buildid-list}", | ||
30 | NULL | ||
31 | }; | ||
32 | |||
33 | static const struct option kvm_options[] = { | ||
34 | OPT_STRING('i', "input", &file_name, "file", | ||
35 | "Input file name"), | ||
36 | OPT_STRING('o', "output", &file_name, "file", | ||
37 | "Output file name"), | ||
38 | OPT_BOOLEAN(0, "guest", &perf_guest, | ||
39 | "Collect guest os data"), | ||
40 | OPT_BOOLEAN(0, "host", &perf_host, | ||
41 | "Collect guest os data"), | ||
42 | OPT_STRING(0, "guestmount", &symbol_conf.guestmount, "directory", | ||
43 | "guest mount directory under which every guest os" | ||
44 | " instance has a subdir"), | ||
45 | OPT_STRING(0, "guestvmlinux", &symbol_conf.default_guest_vmlinux_name, | ||
46 | "file", "file saving guest os vmlinux"), | ||
47 | OPT_STRING(0, "guestkallsyms", &symbol_conf.default_guest_kallsyms, | ||
48 | "file", "file saving guest os /proc/kallsyms"), | ||
49 | OPT_STRING(0, "guestmodules", &symbol_conf.default_guest_modules, | ||
50 | "file", "file saving guest os /proc/modules"), | ||
51 | OPT_END() | ||
52 | }; | ||
53 | |||
54 | static int __cmd_record(int argc, const char **argv) | ||
55 | { | ||
56 | int rec_argc, i = 0, j; | ||
57 | const char **rec_argv; | ||
58 | |||
59 | rec_argc = argc + 2; | ||
60 | rec_argv = calloc(rec_argc + 1, sizeof(char *)); | ||
61 | rec_argv[i++] = strdup("record"); | ||
62 | rec_argv[i++] = strdup("-o"); | ||
63 | rec_argv[i++] = strdup(file_name); | ||
64 | for (j = 1; j < argc; j++, i++) | ||
65 | rec_argv[i] = argv[j]; | ||
66 | |||
67 | BUG_ON(i != rec_argc); | ||
68 | |||
69 | return cmd_record(i, rec_argv, NULL); | ||
70 | } | ||
71 | |||
72 | static int __cmd_report(int argc, const char **argv) | ||
73 | { | ||
74 | int rec_argc, i = 0, j; | ||
75 | const char **rec_argv; | ||
76 | |||
77 | rec_argc = argc + 2; | ||
78 | rec_argv = calloc(rec_argc + 1, sizeof(char *)); | ||
79 | rec_argv[i++] = strdup("report"); | ||
80 | rec_argv[i++] = strdup("-i"); | ||
81 | rec_argv[i++] = strdup(file_name); | ||
82 | for (j = 1; j < argc; j++, i++) | ||
83 | rec_argv[i] = argv[j]; | ||
84 | |||
85 | BUG_ON(i != rec_argc); | ||
86 | |||
87 | return cmd_report(i, rec_argv, NULL); | ||
88 | } | ||
89 | |||
90 | static int __cmd_buildid_list(int argc, const char **argv) | ||
91 | { | ||
92 | int rec_argc, i = 0, j; | ||
93 | const char **rec_argv; | ||
94 | |||
95 | rec_argc = argc + 2; | ||
96 | rec_argv = calloc(rec_argc + 1, sizeof(char *)); | ||
97 | rec_argv[i++] = strdup("buildid-list"); | ||
98 | rec_argv[i++] = strdup("-i"); | ||
99 | rec_argv[i++] = strdup(file_name); | ||
100 | for (j = 1; j < argc; j++, i++) | ||
101 | rec_argv[i] = argv[j]; | ||
102 | |||
103 | BUG_ON(i != rec_argc); | ||
104 | |||
105 | return cmd_buildid_list(i, rec_argv, NULL); | ||
106 | } | ||
107 | |||
108 | int cmd_kvm(int argc, const char **argv, const char *prefix __used) | ||
109 | { | ||
110 | perf_host = perf_guest = 0; | ||
111 | |||
112 | argc = parse_options(argc, argv, kvm_options, kvm_usage, | ||
113 | PARSE_OPT_STOP_AT_NON_OPTION); | ||
114 | if (!argc) | ||
115 | usage_with_options(kvm_usage, kvm_options); | ||
116 | |||
117 | if (!perf_host) | ||
118 | perf_guest = 1; | ||
119 | |||
120 | if (!file_name) { | ||
121 | if (perf_host && !perf_guest) | ||
122 | sprintf(name_buffer, "perf.data.host"); | ||
123 | else if (!perf_host && perf_guest) | ||
124 | sprintf(name_buffer, "perf.data.guest"); | ||
125 | else | ||
126 | sprintf(name_buffer, "perf.data.kvm"); | ||
127 | file_name = name_buffer; | ||
128 | } | ||
129 | |||
130 | if (!strncmp(argv[0], "rec", 3)) | ||
131 | return __cmd_record(argc, argv); | ||
132 | else if (!strncmp(argv[0], "rep", 3)) | ||
133 | return __cmd_report(argc, argv); | ||
134 | else if (!strncmp(argv[0], "diff", 4)) | ||
135 | return cmd_diff(argc, argv, NULL); | ||
136 | else if (!strncmp(argv[0], "top", 3)) | ||
137 | return cmd_top(argc, argv, NULL); | ||
138 | else if (!strncmp(argv[0], "buildid-list", 12)) | ||
139 | return __cmd_buildid_list(argc, argv); | ||
140 | else | ||
141 | usage_with_options(kvm_usage, kvm_options); | ||
142 | |||
143 | return 0; | ||
144 | } | ||
diff --git a/tools/perf/builtin-lock.c b/tools/perf/builtin-lock.c index e12c844df1e2..821c1586a22b 100644 --- a/tools/perf/builtin-lock.c +++ b/tools/perf/builtin-lock.c | |||
@@ -23,6 +23,8 @@ | |||
23 | #include <linux/list.h> | 23 | #include <linux/list.h> |
24 | #include <linux/hash.h> | 24 | #include <linux/hash.h> |
25 | 25 | ||
26 | static struct perf_session *session; | ||
27 | |||
26 | /* based on kernel/lockdep.c */ | 28 | /* based on kernel/lockdep.c */ |
27 | #define LOCKHASH_BITS 12 | 29 | #define LOCKHASH_BITS 12 |
28 | #define LOCKHASH_SIZE (1UL << LOCKHASH_BITS) | 30 | #define LOCKHASH_SIZE (1UL << LOCKHASH_BITS) |
@@ -32,9 +34,6 @@ static struct list_head lockhash_table[LOCKHASH_SIZE]; | |||
32 | #define __lockhashfn(key) hash_long((unsigned long)key, LOCKHASH_BITS) | 34 | #define __lockhashfn(key) hash_long((unsigned long)key, LOCKHASH_BITS) |
33 | #define lockhashentry(key) (lockhash_table + __lockhashfn((key))) | 35 | #define lockhashentry(key) (lockhash_table + __lockhashfn((key))) |
34 | 36 | ||
35 | #define LOCK_STATE_UNLOCKED 0 /* initial state */ | ||
36 | #define LOCK_STATE_LOCKED 1 | ||
37 | |||
38 | struct lock_stat { | 37 | struct lock_stat { |
39 | struct list_head hash_entry; | 38 | struct list_head hash_entry; |
40 | struct rb_node rb; /* used for sorting */ | 39 | struct rb_node rb; /* used for sorting */ |
@@ -47,20 +46,151 @@ struct lock_stat { | |||
47 | void *addr; /* address of lockdep_map, used as ID */ | 46 | void *addr; /* address of lockdep_map, used as ID */ |
48 | char *name; /* for strcpy(), we cannot use const */ | 47 | char *name; /* for strcpy(), we cannot use const */ |
49 | 48 | ||
50 | int state; | ||
51 | u64 prev_event_time; /* timestamp of previous event */ | ||
52 | |||
53 | unsigned int nr_acquired; | ||
54 | unsigned int nr_acquire; | 49 | unsigned int nr_acquire; |
50 | unsigned int nr_acquired; | ||
55 | unsigned int nr_contended; | 51 | unsigned int nr_contended; |
56 | unsigned int nr_release; | 52 | unsigned int nr_release; |
57 | 53 | ||
54 | unsigned int nr_readlock; | ||
55 | unsigned int nr_trylock; | ||
58 | /* these times are in nano sec. */ | 56 | /* these times are in nano sec. */ |
59 | u64 wait_time_total; | 57 | u64 wait_time_total; |
60 | u64 wait_time_min; | 58 | u64 wait_time_min; |
61 | u64 wait_time_max; | 59 | u64 wait_time_max; |
60 | |||
61 | int discard; /* flag of blacklist */ | ||
62 | }; | 62 | }; |
63 | 63 | ||
64 | /* | ||
65 | * States of lock_seq_stat | ||
66 | * | ||
67 | * UNINITIALIZED is required for detecting first event of acquire. | ||
68 | * As the nature of lock events, there is no guarantee | ||
69 | * that the first event for the locks are acquire, | ||
70 | * it can be acquired, contended or release. | ||
71 | */ | ||
72 | #define SEQ_STATE_UNINITIALIZED 0 /* initial state */ | ||
73 | #define SEQ_STATE_RELEASED 1 | ||
74 | #define SEQ_STATE_ACQUIRING 2 | ||
75 | #define SEQ_STATE_ACQUIRED 3 | ||
76 | #define SEQ_STATE_READ_ACQUIRED 4 | ||
77 | #define SEQ_STATE_CONTENDED 5 | ||
78 | |||
79 | /* | ||
80 | * MAX_LOCK_DEPTH | ||
81 | * Imported from include/linux/sched.h. | ||
82 | * Should this be synchronized? | ||
83 | */ | ||
84 | #define MAX_LOCK_DEPTH 48 | ||
85 | |||
86 | /* | ||
87 | * struct lock_seq_stat: | ||
88 | * Place to put on state of one lock sequence | ||
89 | * 1) acquire -> acquired -> release | ||
90 | * 2) acquire -> contended -> acquired -> release | ||
91 | * 3) acquire (with read or try) -> release | ||
92 | * 4) Are there other patterns? | ||
93 | */ | ||
94 | struct lock_seq_stat { | ||
95 | struct list_head list; | ||
96 | int state; | ||
97 | u64 prev_event_time; | ||
98 | void *addr; | ||
99 | |||
100 | int read_count; | ||
101 | }; | ||
102 | |||
103 | struct thread_stat { | ||
104 | struct rb_node rb; | ||
105 | |||
106 | u32 tid; | ||
107 | struct list_head seq_list; | ||
108 | }; | ||
109 | |||
110 | static struct rb_root thread_stats; | ||
111 | |||
112 | static struct thread_stat *thread_stat_find(u32 tid) | ||
113 | { | ||
114 | struct rb_node *node; | ||
115 | struct thread_stat *st; | ||
116 | |||
117 | node = thread_stats.rb_node; | ||
118 | while (node) { | ||
119 | st = container_of(node, struct thread_stat, rb); | ||
120 | if (st->tid == tid) | ||
121 | return st; | ||
122 | else if (tid < st->tid) | ||
123 | node = node->rb_left; | ||
124 | else | ||
125 | node = node->rb_right; | ||
126 | } | ||
127 | |||
128 | return NULL; | ||
129 | } | ||
130 | |||
131 | static void thread_stat_insert(struct thread_stat *new) | ||
132 | { | ||
133 | struct rb_node **rb = &thread_stats.rb_node; | ||
134 | struct rb_node *parent = NULL; | ||
135 | struct thread_stat *p; | ||
136 | |||
137 | while (*rb) { | ||
138 | p = container_of(*rb, struct thread_stat, rb); | ||
139 | parent = *rb; | ||
140 | |||
141 | if (new->tid < p->tid) | ||
142 | rb = &(*rb)->rb_left; | ||
143 | else if (new->tid > p->tid) | ||
144 | rb = &(*rb)->rb_right; | ||
145 | else | ||
146 | BUG_ON("inserting invalid thread_stat\n"); | ||
147 | } | ||
148 | |||
149 | rb_link_node(&new->rb, parent, rb); | ||
150 | rb_insert_color(&new->rb, &thread_stats); | ||
151 | } | ||
152 | |||
153 | static struct thread_stat *thread_stat_findnew_after_first(u32 tid) | ||
154 | { | ||
155 | struct thread_stat *st; | ||
156 | |||
157 | st = thread_stat_find(tid); | ||
158 | if (st) | ||
159 | return st; | ||
160 | |||
161 | st = zalloc(sizeof(struct thread_stat)); | ||
162 | if (!st) | ||
163 | die("memory allocation failed\n"); | ||
164 | |||
165 | st->tid = tid; | ||
166 | INIT_LIST_HEAD(&st->seq_list); | ||
167 | |||
168 | thread_stat_insert(st); | ||
169 | |||
170 | return st; | ||
171 | } | ||
172 | |||
173 | static struct thread_stat *thread_stat_findnew_first(u32 tid); | ||
174 | static struct thread_stat *(*thread_stat_findnew)(u32 tid) = | ||
175 | thread_stat_findnew_first; | ||
176 | |||
177 | static struct thread_stat *thread_stat_findnew_first(u32 tid) | ||
178 | { | ||
179 | struct thread_stat *st; | ||
180 | |||
181 | st = zalloc(sizeof(struct thread_stat)); | ||
182 | if (!st) | ||
183 | die("memory allocation failed\n"); | ||
184 | st->tid = tid; | ||
185 | INIT_LIST_HEAD(&st->seq_list); | ||
186 | |||
187 | rb_link_node(&st->rb, NULL, &thread_stats.rb_node); | ||
188 | rb_insert_color(&st->rb, &thread_stats); | ||
189 | |||
190 | thread_stat_findnew = thread_stat_findnew_after_first; | ||
191 | return st; | ||
192 | } | ||
193 | |||
64 | /* build simple key function one is bigger than two */ | 194 | /* build simple key function one is bigger than two */ |
65 | #define SINGLE_KEY(member) \ | 195 | #define SINGLE_KEY(member) \ |
66 | static int lock_stat_key_ ## member(struct lock_stat *one, \ | 196 | static int lock_stat_key_ ## member(struct lock_stat *one, \ |
@@ -175,8 +305,6 @@ static struct lock_stat *lock_stat_findnew(void *addr, const char *name) | |||
175 | goto alloc_failed; | 305 | goto alloc_failed; |
176 | strcpy(new->name, name); | 306 | strcpy(new->name, name); |
177 | 307 | ||
178 | /* LOCK_STATE_UNLOCKED == 0 isn't guaranteed forever */ | ||
179 | new->state = LOCK_STATE_UNLOCKED; | ||
180 | new->wait_time_min = ULLONG_MAX; | 308 | new->wait_time_min = ULLONG_MAX; |
181 | 309 | ||
182 | list_add(&new->hash_entry, entry); | 310 | list_add(&new->hash_entry, entry); |
@@ -188,8 +316,6 @@ alloc_failed: | |||
188 | 316 | ||
189 | static char const *input_name = "perf.data"; | 317 | static char const *input_name = "perf.data"; |
190 | 318 | ||
191 | static int profile_cpu = -1; | ||
192 | |||
193 | struct raw_event_sample { | 319 | struct raw_event_sample { |
194 | u32 size; | 320 | u32 size; |
195 | char data[0]; | 321 | char data[0]; |
@@ -198,6 +324,7 @@ struct raw_event_sample { | |||
198 | struct trace_acquire_event { | 324 | struct trace_acquire_event { |
199 | void *addr; | 325 | void *addr; |
200 | const char *name; | 326 | const char *name; |
327 | int flag; | ||
201 | }; | 328 | }; |
202 | 329 | ||
203 | struct trace_acquired_event { | 330 | struct trace_acquired_event { |
@@ -241,120 +368,258 @@ struct trace_lock_handler { | |||
241 | struct thread *thread); | 368 | struct thread *thread); |
242 | }; | 369 | }; |
243 | 370 | ||
371 | static struct lock_seq_stat *get_seq(struct thread_stat *ts, void *addr) | ||
372 | { | ||
373 | struct lock_seq_stat *seq; | ||
374 | |||
375 | list_for_each_entry(seq, &ts->seq_list, list) { | ||
376 | if (seq->addr == addr) | ||
377 | return seq; | ||
378 | } | ||
379 | |||
380 | seq = zalloc(sizeof(struct lock_seq_stat)); | ||
381 | if (!seq) | ||
382 | die("Not enough memory\n"); | ||
383 | seq->state = SEQ_STATE_UNINITIALIZED; | ||
384 | seq->addr = addr; | ||
385 | |||
386 | list_add(&seq->list, &ts->seq_list); | ||
387 | return seq; | ||
388 | } | ||
389 | |||
390 | enum broken_state { | ||
391 | BROKEN_ACQUIRE, | ||
392 | BROKEN_ACQUIRED, | ||
393 | BROKEN_CONTENDED, | ||
394 | BROKEN_RELEASE, | ||
395 | BROKEN_MAX, | ||
396 | }; | ||
397 | |||
398 | static int bad_hist[BROKEN_MAX]; | ||
399 | |||
400 | enum acquire_flags { | ||
401 | TRY_LOCK = 1, | ||
402 | READ_LOCK = 2, | ||
403 | }; | ||
404 | |||
244 | static void | 405 | static void |
245 | report_lock_acquire_event(struct trace_acquire_event *acquire_event, | 406 | report_lock_acquire_event(struct trace_acquire_event *acquire_event, |
246 | struct event *__event __used, | 407 | struct event *__event __used, |
247 | int cpu __used, | 408 | int cpu __used, |
248 | u64 timestamp, | 409 | u64 timestamp __used, |
249 | struct thread *thread __used) | 410 | struct thread *thread __used) |
250 | { | 411 | { |
251 | struct lock_stat *st; | 412 | struct lock_stat *ls; |
413 | struct thread_stat *ts; | ||
414 | struct lock_seq_stat *seq; | ||
415 | |||
416 | ls = lock_stat_findnew(acquire_event->addr, acquire_event->name); | ||
417 | if (ls->discard) | ||
418 | return; | ||
252 | 419 | ||
253 | st = lock_stat_findnew(acquire_event->addr, acquire_event->name); | 420 | ts = thread_stat_findnew(thread->pid); |
421 | seq = get_seq(ts, acquire_event->addr); | ||
254 | 422 | ||
255 | switch (st->state) { | 423 | switch (seq->state) { |
256 | case LOCK_STATE_UNLOCKED: | 424 | case SEQ_STATE_UNINITIALIZED: |
425 | case SEQ_STATE_RELEASED: | ||
426 | if (!acquire_event->flag) { | ||
427 | seq->state = SEQ_STATE_ACQUIRING; | ||
428 | } else { | ||
429 | if (acquire_event->flag & TRY_LOCK) | ||
430 | ls->nr_trylock++; | ||
431 | if (acquire_event->flag & READ_LOCK) | ||
432 | ls->nr_readlock++; | ||
433 | seq->state = SEQ_STATE_READ_ACQUIRED; | ||
434 | seq->read_count = 1; | ||
435 | ls->nr_acquired++; | ||
436 | } | ||
437 | break; | ||
438 | case SEQ_STATE_READ_ACQUIRED: | ||
439 | if (acquire_event->flag & READ_LOCK) { | ||
440 | seq->read_count++; | ||
441 | ls->nr_acquired++; | ||
442 | goto end; | ||
443 | } else { | ||
444 | goto broken; | ||
445 | } | ||
257 | break; | 446 | break; |
258 | case LOCK_STATE_LOCKED: | 447 | case SEQ_STATE_ACQUIRED: |
448 | case SEQ_STATE_ACQUIRING: | ||
449 | case SEQ_STATE_CONTENDED: | ||
450 | broken: | ||
451 | /* broken lock sequence, discard it */ | ||
452 | ls->discard = 1; | ||
453 | bad_hist[BROKEN_ACQUIRE]++; | ||
454 | list_del(&seq->list); | ||
455 | free(seq); | ||
456 | goto end; | ||
259 | break; | 457 | break; |
260 | default: | 458 | default: |
261 | BUG_ON(1); | 459 | BUG_ON("Unknown state of lock sequence found!\n"); |
262 | break; | 460 | break; |
263 | } | 461 | } |
264 | 462 | ||
265 | st->prev_event_time = timestamp; | 463 | ls->nr_acquire++; |
464 | seq->prev_event_time = timestamp; | ||
465 | end: | ||
466 | return; | ||
266 | } | 467 | } |
267 | 468 | ||
268 | static void | 469 | static void |
269 | report_lock_acquired_event(struct trace_acquired_event *acquired_event, | 470 | report_lock_acquired_event(struct trace_acquired_event *acquired_event, |
270 | struct event *__event __used, | 471 | struct event *__event __used, |
271 | int cpu __used, | 472 | int cpu __used, |
272 | u64 timestamp, | 473 | u64 timestamp __used, |
273 | struct thread *thread __used) | 474 | struct thread *thread __used) |
274 | { | 475 | { |
275 | struct lock_stat *st; | 476 | struct lock_stat *ls; |
477 | struct thread_stat *ts; | ||
478 | struct lock_seq_stat *seq; | ||
479 | u64 contended_term; | ||
480 | |||
481 | ls = lock_stat_findnew(acquired_event->addr, acquired_event->name); | ||
482 | if (ls->discard) | ||
483 | return; | ||
276 | 484 | ||
277 | st = lock_stat_findnew(acquired_event->addr, acquired_event->name); | 485 | ts = thread_stat_findnew(thread->pid); |
486 | seq = get_seq(ts, acquired_event->addr); | ||
278 | 487 | ||
279 | switch (st->state) { | 488 | switch (seq->state) { |
280 | case LOCK_STATE_UNLOCKED: | 489 | case SEQ_STATE_UNINITIALIZED: |
281 | st->state = LOCK_STATE_LOCKED; | 490 | /* orphan event, do nothing */ |
282 | st->nr_acquired++; | 491 | return; |
492 | case SEQ_STATE_ACQUIRING: | ||
493 | break; | ||
494 | case SEQ_STATE_CONTENDED: | ||
495 | contended_term = timestamp - seq->prev_event_time; | ||
496 | ls->wait_time_total += contended_term; | ||
497 | if (contended_term < ls->wait_time_min) | ||
498 | ls->wait_time_min = contended_term; | ||
499 | if (ls->wait_time_max < contended_term) | ||
500 | ls->wait_time_max = contended_term; | ||
283 | break; | 501 | break; |
284 | case LOCK_STATE_LOCKED: | 502 | case SEQ_STATE_RELEASED: |
503 | case SEQ_STATE_ACQUIRED: | ||
504 | case SEQ_STATE_READ_ACQUIRED: | ||
505 | /* broken lock sequence, discard it */ | ||
506 | ls->discard = 1; | ||
507 | bad_hist[BROKEN_ACQUIRED]++; | ||
508 | list_del(&seq->list); | ||
509 | free(seq); | ||
510 | goto end; | ||
285 | break; | 511 | break; |
512 | |||
286 | default: | 513 | default: |
287 | BUG_ON(1); | 514 | BUG_ON("Unknown state of lock sequence found!\n"); |
288 | break; | 515 | break; |
289 | } | 516 | } |
290 | 517 | ||
291 | st->prev_event_time = timestamp; | 518 | seq->state = SEQ_STATE_ACQUIRED; |
519 | ls->nr_acquired++; | ||
520 | seq->prev_event_time = timestamp; | ||
521 | end: | ||
522 | return; | ||
292 | } | 523 | } |
293 | 524 | ||
294 | static void | 525 | static void |
295 | report_lock_contended_event(struct trace_contended_event *contended_event, | 526 | report_lock_contended_event(struct trace_contended_event *contended_event, |
296 | struct event *__event __used, | 527 | struct event *__event __used, |
297 | int cpu __used, | 528 | int cpu __used, |
298 | u64 timestamp, | 529 | u64 timestamp __used, |
299 | struct thread *thread __used) | 530 | struct thread *thread __used) |
300 | { | 531 | { |
301 | struct lock_stat *st; | 532 | struct lock_stat *ls; |
533 | struct thread_stat *ts; | ||
534 | struct lock_seq_stat *seq; | ||
302 | 535 | ||
303 | st = lock_stat_findnew(contended_event->addr, contended_event->name); | 536 | ls = lock_stat_findnew(contended_event->addr, contended_event->name); |
537 | if (ls->discard) | ||
538 | return; | ||
304 | 539 | ||
305 | switch (st->state) { | 540 | ts = thread_stat_findnew(thread->pid); |
306 | case LOCK_STATE_UNLOCKED: | 541 | seq = get_seq(ts, contended_event->addr); |
542 | |||
543 | switch (seq->state) { | ||
544 | case SEQ_STATE_UNINITIALIZED: | ||
545 | /* orphan event, do nothing */ | ||
546 | return; | ||
547 | case SEQ_STATE_ACQUIRING: | ||
307 | break; | 548 | break; |
308 | case LOCK_STATE_LOCKED: | 549 | case SEQ_STATE_RELEASED: |
309 | st->nr_contended++; | 550 | case SEQ_STATE_ACQUIRED: |
551 | case SEQ_STATE_READ_ACQUIRED: | ||
552 | case SEQ_STATE_CONTENDED: | ||
553 | /* broken lock sequence, discard it */ | ||
554 | ls->discard = 1; | ||
555 | bad_hist[BROKEN_CONTENDED]++; | ||
556 | list_del(&seq->list); | ||
557 | free(seq); | ||
558 | goto end; | ||
310 | break; | 559 | break; |
311 | default: | 560 | default: |
312 | BUG_ON(1); | 561 | BUG_ON("Unknown state of lock sequence found!\n"); |
313 | break; | 562 | break; |
314 | } | 563 | } |
315 | 564 | ||
316 | st->prev_event_time = timestamp; | 565 | seq->state = SEQ_STATE_CONTENDED; |
566 | ls->nr_contended++; | ||
567 | seq->prev_event_time = timestamp; | ||
568 | end: | ||
569 | return; | ||
317 | } | 570 | } |
318 | 571 | ||
319 | static void | 572 | static void |
320 | report_lock_release_event(struct trace_release_event *release_event, | 573 | report_lock_release_event(struct trace_release_event *release_event, |
321 | struct event *__event __used, | 574 | struct event *__event __used, |
322 | int cpu __used, | 575 | int cpu __used, |
323 | u64 timestamp, | 576 | u64 timestamp __used, |
324 | struct thread *thread __used) | 577 | struct thread *thread __used) |
325 | { | 578 | { |
326 | struct lock_stat *st; | 579 | struct lock_stat *ls; |
327 | u64 hold_time; | 580 | struct thread_stat *ts; |
581 | struct lock_seq_stat *seq; | ||
328 | 582 | ||
329 | st = lock_stat_findnew(release_event->addr, release_event->name); | 583 | ls = lock_stat_findnew(release_event->addr, release_event->name); |
584 | if (ls->discard) | ||
585 | return; | ||
330 | 586 | ||
331 | switch (st->state) { | 587 | ts = thread_stat_findnew(thread->pid); |
332 | case LOCK_STATE_UNLOCKED: | 588 | seq = get_seq(ts, release_event->addr); |
333 | break; | ||
334 | case LOCK_STATE_LOCKED: | ||
335 | st->state = LOCK_STATE_UNLOCKED; | ||
336 | hold_time = timestamp - st->prev_event_time; | ||
337 | 589 | ||
338 | if (timestamp < st->prev_event_time) { | 590 | switch (seq->state) { |
339 | /* terribly, this can happen... */ | 591 | case SEQ_STATE_UNINITIALIZED: |
592 | goto end; | ||
593 | break; | ||
594 | case SEQ_STATE_ACQUIRED: | ||
595 | break; | ||
596 | case SEQ_STATE_READ_ACQUIRED: | ||
597 | seq->read_count--; | ||
598 | BUG_ON(seq->read_count < 0); | ||
599 | if (!seq->read_count) { | ||
600 | ls->nr_release++; | ||
340 | goto end; | 601 | goto end; |
341 | } | 602 | } |
342 | 603 | break; | |
343 | if (st->wait_time_min > hold_time) | 604 | case SEQ_STATE_ACQUIRING: |
344 | st->wait_time_min = hold_time; | 605 | case SEQ_STATE_CONTENDED: |
345 | if (st->wait_time_max < hold_time) | 606 | case SEQ_STATE_RELEASED: |
346 | st->wait_time_max = hold_time; | 607 | /* broken lock sequence, discard it */ |
347 | st->wait_time_total += hold_time; | 608 | ls->discard = 1; |
348 | 609 | bad_hist[BROKEN_RELEASE]++; | |
349 | st->nr_release++; | 610 | goto free_seq; |
350 | break; | 611 | break; |
351 | default: | 612 | default: |
352 | BUG_ON(1); | 613 | BUG_ON("Unknown state of lock sequence found!\n"); |
353 | break; | 614 | break; |
354 | } | 615 | } |
355 | 616 | ||
617 | ls->nr_release++; | ||
618 | free_seq: | ||
619 | list_del(&seq->list); | ||
620 | free(seq); | ||
356 | end: | 621 | end: |
357 | st->prev_event_time = timestamp; | 622 | return; |
358 | } | 623 | } |
359 | 624 | ||
360 | /* lock oriented handlers */ | 625 | /* lock oriented handlers */ |
@@ -381,6 +646,7 @@ process_lock_acquire_event(void *data, | |||
381 | tmp = raw_field_value(event, "lockdep_addr", data); | 646 | tmp = raw_field_value(event, "lockdep_addr", data); |
382 | memcpy(&acquire_event.addr, &tmp, sizeof(void *)); | 647 | memcpy(&acquire_event.addr, &tmp, sizeof(void *)); |
383 | acquire_event.name = (char *)raw_field_ptr(event, "name", data); | 648 | acquire_event.name = (char *)raw_field_ptr(event, "name", data); |
649 | acquire_event.flag = (int)raw_field_value(event, "flag", data); | ||
384 | 650 | ||
385 | if (trace_handler->acquire_event) | 651 | if (trace_handler->acquire_event) |
386 | trace_handler->acquire_event(&acquire_event, event, cpu, timestamp, thread); | 652 | trace_handler->acquire_event(&acquire_event, event, cpu, timestamp, thread); |
@@ -441,8 +707,7 @@ process_lock_release_event(void *data, | |||
441 | } | 707 | } |
442 | 708 | ||
443 | static void | 709 | static void |
444 | process_raw_event(void *data, int cpu, | 710 | process_raw_event(void *data, int cpu, u64 timestamp, struct thread *thread) |
445 | u64 timestamp, struct thread *thread) | ||
446 | { | 711 | { |
447 | struct event *event; | 712 | struct event *event; |
448 | int type; | 713 | int type; |
@@ -460,173 +725,19 @@ process_raw_event(void *data, int cpu, | |||
460 | process_lock_release_event(data, event, cpu, timestamp, thread); | 725 | process_lock_release_event(data, event, cpu, timestamp, thread); |
461 | } | 726 | } |
462 | 727 | ||
463 | struct raw_event_queue { | 728 | static void print_bad_events(int bad, int total) |
464 | u64 timestamp; | ||
465 | int cpu; | ||
466 | void *data; | ||
467 | struct thread *thread; | ||
468 | struct list_head list; | ||
469 | }; | ||
470 | |||
471 | static LIST_HEAD(raw_event_head); | ||
472 | |||
473 | #define FLUSH_PERIOD (5 * NSEC_PER_SEC) | ||
474 | |||
475 | static u64 flush_limit = ULLONG_MAX; | ||
476 | static u64 last_flush = 0; | ||
477 | struct raw_event_queue *last_inserted; | ||
478 | |||
479 | static void flush_raw_event_queue(u64 limit) | ||
480 | { | ||
481 | struct raw_event_queue *tmp, *iter; | ||
482 | |||
483 | list_for_each_entry_safe(iter, tmp, &raw_event_head, list) { | ||
484 | if (iter->timestamp > limit) | ||
485 | return; | ||
486 | |||
487 | if (iter == last_inserted) | ||
488 | last_inserted = NULL; | ||
489 | |||
490 | process_raw_event(iter->data, iter->cpu, iter->timestamp, | ||
491 | iter->thread); | ||
492 | |||
493 | last_flush = iter->timestamp; | ||
494 | list_del(&iter->list); | ||
495 | free(iter->data); | ||
496 | free(iter); | ||
497 | } | ||
498 | } | ||
499 | |||
500 | static void __queue_raw_event_end(struct raw_event_queue *new) | ||
501 | { | ||
502 | struct raw_event_queue *iter; | ||
503 | |||
504 | list_for_each_entry_reverse(iter, &raw_event_head, list) { | ||
505 | if (iter->timestamp < new->timestamp) { | ||
506 | list_add(&new->list, &iter->list); | ||
507 | return; | ||
508 | } | ||
509 | } | ||
510 | |||
511 | list_add(&new->list, &raw_event_head); | ||
512 | } | ||
513 | |||
514 | static void __queue_raw_event_before(struct raw_event_queue *new, | ||
515 | struct raw_event_queue *iter) | ||
516 | { | 729 | { |
517 | list_for_each_entry_continue_reverse(iter, &raw_event_head, list) { | 730 | /* Output for debug, this have to be removed */ |
518 | if (iter->timestamp < new->timestamp) { | 731 | int i; |
519 | list_add(&new->list, &iter->list); | 732 | const char *name[4] = |
520 | return; | 733 | { "acquire", "acquired", "contended", "release" }; |
521 | } | 734 | |
522 | } | 735 | pr_info("\n=== output for debug===\n\n"); |
523 | 736 | pr_info("bad: %d, total: %d\n", bad, total); | |
524 | list_add(&new->list, &raw_event_head); | 737 | pr_info("bad rate: %f %%\n", (double)bad / (double)total * 100); |
525 | } | 738 | pr_info("histogram of events caused bad sequence\n"); |
526 | 739 | for (i = 0; i < BROKEN_MAX; i++) | |
527 | static void __queue_raw_event_after(struct raw_event_queue *new, | 740 | pr_info(" %10s: %d\n", name[i], bad_hist[i]); |
528 | struct raw_event_queue *iter) | ||
529 | { | ||
530 | list_for_each_entry_continue(iter, &raw_event_head, list) { | ||
531 | if (iter->timestamp > new->timestamp) { | ||
532 | list_add_tail(&new->list, &iter->list); | ||
533 | return; | ||
534 | } | ||
535 | } | ||
536 | list_add_tail(&new->list, &raw_event_head); | ||
537 | } | ||
538 | |||
539 | /* The queue is ordered by time */ | ||
540 | static void __queue_raw_event(struct raw_event_queue *new) | ||
541 | { | ||
542 | if (!last_inserted) { | ||
543 | __queue_raw_event_end(new); | ||
544 | return; | ||
545 | } | ||
546 | |||
547 | /* | ||
548 | * Most of the time the current event has a timestamp | ||
549 | * very close to the last event inserted, unless we just switched | ||
550 | * to another event buffer. Having a sorting based on a list and | ||
551 | * on the last inserted event that is close to the current one is | ||
552 | * probably more efficient than an rbtree based sorting. | ||
553 | */ | ||
554 | if (last_inserted->timestamp >= new->timestamp) | ||
555 | __queue_raw_event_before(new, last_inserted); | ||
556 | else | ||
557 | __queue_raw_event_after(new, last_inserted); | ||
558 | } | ||
559 | |||
560 | static void queue_raw_event(void *data, int raw_size, int cpu, | ||
561 | u64 timestamp, struct thread *thread) | ||
562 | { | ||
563 | struct raw_event_queue *new; | ||
564 | |||
565 | if (flush_limit == ULLONG_MAX) | ||
566 | flush_limit = timestamp + FLUSH_PERIOD; | ||
567 | |||
568 | if (timestamp < last_flush) { | ||
569 | printf("Warning: Timestamp below last timeslice flush\n"); | ||
570 | return; | ||
571 | } | ||
572 | |||
573 | new = malloc(sizeof(*new)); | ||
574 | if (!new) | ||
575 | die("Not enough memory\n"); | ||
576 | |||
577 | new->timestamp = timestamp; | ||
578 | new->cpu = cpu; | ||
579 | new->thread = thread; | ||
580 | |||
581 | new->data = malloc(raw_size); | ||
582 | if (!new->data) | ||
583 | die("Not enough memory\n"); | ||
584 | |||
585 | memcpy(new->data, data, raw_size); | ||
586 | |||
587 | __queue_raw_event(new); | ||
588 | last_inserted = new; | ||
589 | |||
590 | /* | ||
591 | * We want to have a slice of events covering 2 * FLUSH_PERIOD | ||
592 | * If FLUSH_PERIOD is big enough, it ensures every events that occured | ||
593 | * in the first half of the timeslice have all been buffered and there | ||
594 | * are none remaining (we need that because of the weakly ordered | ||
595 | * event recording we have). Then once we reach the 2 * FLUSH_PERIOD | ||
596 | * timeslice, we flush the first half to be gentle with the memory | ||
597 | * (the second half can still get new events in the middle, so wait | ||
598 | * another period to flush it) | ||
599 | */ | ||
600 | if (new->timestamp > flush_limit && | ||
601 | new->timestamp - flush_limit > FLUSH_PERIOD) { | ||
602 | flush_limit += FLUSH_PERIOD; | ||
603 | flush_raw_event_queue(flush_limit); | ||
604 | } | ||
605 | } | ||
606 | |||
607 | static int process_sample_event(event_t *event, struct perf_session *session) | ||
608 | { | ||
609 | struct thread *thread; | ||
610 | struct sample_data data; | ||
611 | |||
612 | bzero(&data, sizeof(struct sample_data)); | ||
613 | event__parse_sample(event, session->sample_type, &data); | ||
614 | thread = perf_session__findnew(session, data.pid); | ||
615 | |||
616 | if (thread == NULL) { | ||
617 | pr_debug("problem processing %d event, skipping it.\n", | ||
618 | event->header.type); | ||
619 | return -1; | ||
620 | } | ||
621 | |||
622 | dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid); | ||
623 | |||
624 | if (profile_cpu != -1 && profile_cpu != (int) data.cpu) | ||
625 | return 0; | ||
626 | |||
627 | queue_raw_event(data.raw_data, data.raw_size, data.cpu, data.time, thread); | ||
628 | |||
629 | return 0; | ||
630 | } | 741 | } |
631 | 742 | ||
632 | /* TODO: various way to print, coloring, nano or milli sec */ | 743 | /* TODO: various way to print, coloring, nano or milli sec */ |
@@ -634,26 +745,30 @@ static void print_result(void) | |||
634 | { | 745 | { |
635 | struct lock_stat *st; | 746 | struct lock_stat *st; |
636 | char cut_name[20]; | 747 | char cut_name[20]; |
748 | int bad, total; | ||
637 | 749 | ||
638 | printf("%18s ", "ID"); | 750 | pr_info("%20s ", "Name"); |
639 | printf("%20s ", "Name"); | 751 | pr_info("%10s ", "acquired"); |
640 | printf("%10s ", "acquired"); | 752 | pr_info("%10s ", "contended"); |
641 | printf("%10s ", "contended"); | ||
642 | 753 | ||
643 | printf("%15s ", "total wait (ns)"); | 754 | pr_info("%15s ", "total wait (ns)"); |
644 | printf("%15s ", "max wait (ns)"); | 755 | pr_info("%15s ", "max wait (ns)"); |
645 | printf("%15s ", "min wait (ns)"); | 756 | pr_info("%15s ", "min wait (ns)"); |
646 | 757 | ||
647 | printf("\n\n"); | 758 | pr_info("\n\n"); |
648 | 759 | ||
760 | bad = total = 0; | ||
649 | while ((st = pop_from_result())) { | 761 | while ((st = pop_from_result())) { |
762 | total++; | ||
763 | if (st->discard) { | ||
764 | bad++; | ||
765 | continue; | ||
766 | } | ||
650 | bzero(cut_name, 20); | 767 | bzero(cut_name, 20); |
651 | 768 | ||
652 | printf("%p ", st->addr); | ||
653 | |||
654 | if (strlen(st->name) < 16) { | 769 | if (strlen(st->name) < 16) { |
655 | /* output raw name */ | 770 | /* output raw name */ |
656 | printf("%20s ", st->name); | 771 | pr_info("%20s ", st->name); |
657 | } else { | 772 | } else { |
658 | strncpy(cut_name, st->name, 16); | 773 | strncpy(cut_name, st->name, 16); |
659 | cut_name[16] = '.'; | 774 | cut_name[16] = '.'; |
@@ -661,18 +776,39 @@ static void print_result(void) | |||
661 | cut_name[18] = '.'; | 776 | cut_name[18] = '.'; |
662 | cut_name[19] = '\0'; | 777 | cut_name[19] = '\0'; |
663 | /* cut off name for saving output style */ | 778 | /* cut off name for saving output style */ |
664 | printf("%20s ", cut_name); | 779 | pr_info("%20s ", cut_name); |
665 | } | 780 | } |
666 | 781 | ||
667 | printf("%10u ", st->nr_acquired); | 782 | pr_info("%10u ", st->nr_acquired); |
668 | printf("%10u ", st->nr_contended); | 783 | pr_info("%10u ", st->nr_contended); |
669 | 784 | ||
670 | printf("%15llu ", st->wait_time_total); | 785 | pr_info("%15llu ", st->wait_time_total); |
671 | printf("%15llu ", st->wait_time_max); | 786 | pr_info("%15llu ", st->wait_time_max); |
672 | printf("%15llu ", st->wait_time_min == ULLONG_MAX ? | 787 | pr_info("%15llu ", st->wait_time_min == ULLONG_MAX ? |
673 | 0 : st->wait_time_min); | 788 | 0 : st->wait_time_min); |
674 | printf("\n"); | 789 | pr_info("\n"); |
675 | } | 790 | } |
791 | |||
792 | print_bad_events(bad, total); | ||
793 | } | ||
794 | |||
795 | static bool info_threads, info_map; | ||
796 | |||
797 | static void dump_threads(void) | ||
798 | { | ||
799 | struct thread_stat *st; | ||
800 | struct rb_node *node; | ||
801 | struct thread *t; | ||
802 | |||
803 | pr_info("%10s: comm\n", "Thread ID"); | ||
804 | |||
805 | node = rb_first(&thread_stats); | ||
806 | while (node) { | ||
807 | st = container_of(node, struct thread_stat, rb); | ||
808 | t = perf_session__findnew(session, st->tid); | ||
809 | pr_info("%10d: %s\n", st->tid, t->comm); | ||
810 | node = rb_next(node); | ||
811 | }; | ||
676 | } | 812 | } |
677 | 813 | ||
678 | static void dump_map(void) | 814 | static void dump_map(void) |
@@ -680,23 +816,53 @@ static void dump_map(void) | |||
680 | unsigned int i; | 816 | unsigned int i; |
681 | struct lock_stat *st; | 817 | struct lock_stat *st; |
682 | 818 | ||
819 | pr_info("Address of instance: name of class\n"); | ||
683 | for (i = 0; i < LOCKHASH_SIZE; i++) { | 820 | for (i = 0; i < LOCKHASH_SIZE; i++) { |
684 | list_for_each_entry(st, &lockhash_table[i], hash_entry) { | 821 | list_for_each_entry(st, &lockhash_table[i], hash_entry) { |
685 | printf("%p: %s\n", st->addr, st->name); | 822 | pr_info(" %p: %s\n", st->addr, st->name); |
686 | } | 823 | } |
687 | } | 824 | } |
688 | } | 825 | } |
689 | 826 | ||
827 | static void dump_info(void) | ||
828 | { | ||
829 | if (info_threads) | ||
830 | dump_threads(); | ||
831 | else if (info_map) | ||
832 | dump_map(); | ||
833 | else | ||
834 | die("Unknown type of information\n"); | ||
835 | } | ||
836 | |||
837 | static int process_sample_event(event_t *self, struct perf_session *s) | ||
838 | { | ||
839 | struct sample_data data; | ||
840 | struct thread *thread; | ||
841 | |||
842 | bzero(&data, sizeof(data)); | ||
843 | event__parse_sample(self, s->sample_type, &data); | ||
844 | |||
845 | thread = perf_session__findnew(s, data.tid); | ||
846 | if (thread == NULL) { | ||
847 | pr_debug("problem processing %d event, skipping it.\n", | ||
848 | self->header.type); | ||
849 | return -1; | ||
850 | } | ||
851 | |||
852 | process_raw_event(data.raw_data, data.cpu, data.time, thread); | ||
853 | |||
854 | return 0; | ||
855 | } | ||
856 | |||
690 | static struct perf_event_ops eops = { | 857 | static struct perf_event_ops eops = { |
691 | .sample = process_sample_event, | 858 | .sample = process_sample_event, |
692 | .comm = event__process_comm, | 859 | .comm = event__process_comm, |
860 | .ordered_samples = true, | ||
693 | }; | 861 | }; |
694 | 862 | ||
695 | static struct perf_session *session; | ||
696 | |||
697 | static int read_events(void) | 863 | static int read_events(void) |
698 | { | 864 | { |
699 | session = perf_session__new(input_name, O_RDONLY, 0); | 865 | session = perf_session__new(input_name, O_RDONLY, 0, false); |
700 | if (!session) | 866 | if (!session) |
701 | die("Initializing perf session failed\n"); | 867 | die("Initializing perf session failed\n"); |
702 | 868 | ||
@@ -720,7 +886,6 @@ static void __cmd_report(void) | |||
720 | setup_pager(); | 886 | setup_pager(); |
721 | select_key(); | 887 | select_key(); |
722 | read_events(); | 888 | read_events(); |
723 | flush_raw_event_queue(ULLONG_MAX); | ||
724 | sort_result(); | 889 | sort_result(); |
725 | print_result(); | 890 | print_result(); |
726 | } | 891 | } |
@@ -737,6 +902,19 @@ static const struct option report_options[] = { | |||
737 | OPT_END() | 902 | OPT_END() |
738 | }; | 903 | }; |
739 | 904 | ||
905 | static const char * const info_usage[] = { | ||
906 | "perf lock info [<options>]", | ||
907 | NULL | ||
908 | }; | ||
909 | |||
910 | static const struct option info_options[] = { | ||
911 | OPT_BOOLEAN('t', "threads", &info_threads, | ||
912 | "dump thread list in perf.data"), | ||
913 | OPT_BOOLEAN('m', "map", &info_map, | ||
914 | "map of lock instances (name:address table)"), | ||
915 | OPT_END() | ||
916 | }; | ||
917 | |||
740 | static const char * const lock_usage[] = { | 918 | static const char * const lock_usage[] = { |
741 | "perf lock [<options>] {record|trace|report}", | 919 | "perf lock [<options>] {record|trace|report}", |
742 | NULL | 920 | NULL |
@@ -744,14 +922,13 @@ static const char * const lock_usage[] = { | |||
744 | 922 | ||
745 | static const struct option lock_options[] = { | 923 | static const struct option lock_options[] = { |
746 | OPT_STRING('i', "input", &input_name, "file", "input file name"), | 924 | OPT_STRING('i', "input", &input_name, "file", "input file name"), |
747 | OPT_BOOLEAN('v', "verbose", &verbose, "be more verbose (show symbol address, etc)"), | 925 | OPT_INCR('v', "verbose", &verbose, "be more verbose (show symbol address, etc)"), |
748 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, "dump raw trace in ASCII"), | 926 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, "dump raw trace in ASCII"), |
749 | OPT_END() | 927 | OPT_END() |
750 | }; | 928 | }; |
751 | 929 | ||
752 | static const char *record_args[] = { | 930 | static const char *record_args[] = { |
753 | "record", | 931 | "record", |
754 | "-a", | ||
755 | "-R", | 932 | "-R", |
756 | "-f", | 933 | "-f", |
757 | "-m", "1024", | 934 | "-m", "1024", |
@@ -808,12 +985,18 @@ int cmd_lock(int argc, const char **argv, const char *prefix __used) | |||
808 | } else if (!strcmp(argv[0], "trace")) { | 985 | } else if (!strcmp(argv[0], "trace")) { |
809 | /* Aliased to 'perf trace' */ | 986 | /* Aliased to 'perf trace' */ |
810 | return cmd_trace(argc, argv, prefix); | 987 | return cmd_trace(argc, argv, prefix); |
811 | } else if (!strcmp(argv[0], "map")) { | 988 | } else if (!strcmp(argv[0], "info")) { |
989 | if (argc) { | ||
990 | argc = parse_options(argc, argv, | ||
991 | info_options, info_usage, 0); | ||
992 | if (argc) | ||
993 | usage_with_options(info_usage, info_options); | ||
994 | } | ||
812 | /* recycling report_lock_ops */ | 995 | /* recycling report_lock_ops */ |
813 | trace_handler = &report_lock_ops; | 996 | trace_handler = &report_lock_ops; |
814 | setup_pager(); | 997 | setup_pager(); |
815 | read_events(); | 998 | read_events(); |
816 | dump_map(); | 999 | dump_info(); |
817 | } else { | 1000 | } else { |
818 | usage_with_options(lock_usage, lock_options); | 1001 | usage_with_options(lock_usage, lock_options); |
819 | } | 1002 | } |
diff --git a/tools/perf/builtin-probe.c b/tools/perf/builtin-probe.c index 152d6c9b1fa4..61c6d70732c9 100644 --- a/tools/perf/builtin-probe.c +++ b/tools/perf/builtin-probe.c | |||
@@ -36,13 +36,10 @@ | |||
36 | #include "builtin.h" | 36 | #include "builtin.h" |
37 | #include "util/util.h" | 37 | #include "util/util.h" |
38 | #include "util/strlist.h" | 38 | #include "util/strlist.h" |
39 | #include "util/event.h" | 39 | #include "util/symbol.h" |
40 | #include "util/debug.h" | 40 | #include "util/debug.h" |
41 | #include "util/debugfs.h" | 41 | #include "util/debugfs.h" |
42 | #include "util/symbol.h" | ||
43 | #include "util/thread.h" | ||
44 | #include "util/parse-options.h" | 42 | #include "util/parse-options.h" |
45 | #include "util/parse-events.h" /* For debugfs_path */ | ||
46 | #include "util/probe-finder.h" | 43 | #include "util/probe-finder.h" |
47 | #include "util/probe-event.h" | 44 | #include "util/probe-event.h" |
48 | 45 | ||
@@ -50,103 +47,84 @@ | |||
50 | 47 | ||
51 | /* Session management structure */ | 48 | /* Session management structure */ |
52 | static struct { | 49 | static struct { |
53 | bool need_dwarf; | ||
54 | bool list_events; | 50 | bool list_events; |
55 | bool force_add; | 51 | bool force_add; |
56 | bool show_lines; | 52 | bool show_lines; |
57 | int nr_probe; | 53 | int nevents; |
58 | struct probe_point probes[MAX_PROBES]; | 54 | struct perf_probe_event events[MAX_PROBES]; |
59 | struct strlist *dellist; | 55 | struct strlist *dellist; |
60 | struct map_groups kmap_groups; | ||
61 | struct map *kmaps[MAP__NR_TYPES]; | ||
62 | struct line_range line_range; | 56 | struct line_range line_range; |
63 | } session; | 57 | int max_probe_points; |
58 | } params; | ||
64 | 59 | ||
65 | 60 | ||
66 | /* Parse an event definition. Note that any error must die. */ | 61 | /* Parse an event definition. Note that any error must die. */ |
67 | static void parse_probe_event(const char *str) | 62 | static int parse_probe_event(const char *str) |
68 | { | 63 | { |
69 | struct probe_point *pp = &session.probes[session.nr_probe]; | 64 | struct perf_probe_event *pev = ¶ms.events[params.nevents]; |
65 | int ret; | ||
70 | 66 | ||
71 | pr_debug("probe-definition(%d): %s\n", session.nr_probe, str); | 67 | pr_debug("probe-definition(%d): %s\n", params.nevents, str); |
72 | if (++session.nr_probe == MAX_PROBES) | 68 | if (++params.nevents == MAX_PROBES) |
73 | die("Too many probes (> %d) are specified.", MAX_PROBES); | 69 | die("Too many probes (> %d) are specified.", MAX_PROBES); |
74 | 70 | ||
75 | /* Parse perf-probe event into probe_point */ | 71 | /* Parse a perf-probe command into event */ |
76 | parse_perf_probe_event(str, pp, &session.need_dwarf); | 72 | ret = parse_perf_probe_command(str, pev); |
73 | pr_debug("%d arguments\n", pev->nargs); | ||
77 | 74 | ||
78 | pr_debug("%d arguments\n", pp->nr_args); | 75 | return ret; |
79 | } | 76 | } |
80 | 77 | ||
81 | static void parse_probe_event_argv(int argc, const char **argv) | 78 | static int parse_probe_event_argv(int argc, const char **argv) |
82 | { | 79 | { |
83 | int i, len; | 80 | int i, len, ret; |
84 | char *buf; | 81 | char *buf; |
85 | 82 | ||
86 | /* Bind up rest arguments */ | 83 | /* Bind up rest arguments */ |
87 | len = 0; | 84 | len = 0; |
88 | for (i = 0; i < argc; i++) | 85 | for (i = 0; i < argc; i++) |
89 | len += strlen(argv[i]) + 1; | 86 | len += strlen(argv[i]) + 1; |
90 | buf = zalloc(len + 1); | 87 | buf = xzalloc(len + 1); |
91 | if (!buf) | ||
92 | die("Failed to allocate memory for binding arguments."); | ||
93 | len = 0; | 88 | len = 0; |
94 | for (i = 0; i < argc; i++) | 89 | for (i = 0; i < argc; i++) |
95 | len += sprintf(&buf[len], "%s ", argv[i]); | 90 | len += sprintf(&buf[len], "%s ", argv[i]); |
96 | parse_probe_event(buf); | 91 | ret = parse_probe_event(buf); |
97 | free(buf); | 92 | free(buf); |
93 | return ret; | ||
98 | } | 94 | } |
99 | 95 | ||
100 | static int opt_add_probe_event(const struct option *opt __used, | 96 | static int opt_add_probe_event(const struct option *opt __used, |
101 | const char *str, int unset __used) | 97 | const char *str, int unset __used) |
102 | { | 98 | { |
103 | if (str) | 99 | if (str) |
104 | parse_probe_event(str); | 100 | return parse_probe_event(str); |
105 | return 0; | 101 | else |
102 | return 0; | ||
106 | } | 103 | } |
107 | 104 | ||
108 | static int opt_del_probe_event(const struct option *opt __used, | 105 | static int opt_del_probe_event(const struct option *opt __used, |
109 | const char *str, int unset __used) | 106 | const char *str, int unset __used) |
110 | { | 107 | { |
111 | if (str) { | 108 | if (str) { |
112 | if (!session.dellist) | 109 | if (!params.dellist) |
113 | session.dellist = strlist__new(true, NULL); | 110 | params.dellist = strlist__new(true, NULL); |
114 | strlist__add(session.dellist, str); | 111 | strlist__add(params.dellist, str); |
115 | } | 112 | } |
116 | return 0; | 113 | return 0; |
117 | } | 114 | } |
118 | 115 | ||
119 | /* Currently just checking function name from symbol map */ | 116 | #ifdef DWARF_SUPPORT |
120 | static void evaluate_probe_point(struct probe_point *pp) | ||
121 | { | ||
122 | struct symbol *sym; | ||
123 | sym = map__find_symbol_by_name(session.kmaps[MAP__FUNCTION], | ||
124 | pp->function, NULL); | ||
125 | if (!sym) | ||
126 | die("Kernel symbol \'%s\' not found - probe not added.", | ||
127 | pp->function); | ||
128 | } | ||
129 | |||
130 | #ifndef NO_DWARF_SUPPORT | ||
131 | static int open_vmlinux(void) | ||
132 | { | ||
133 | if (map__load(session.kmaps[MAP__FUNCTION], NULL) < 0) { | ||
134 | pr_debug("Failed to load kernel map.\n"); | ||
135 | return -EINVAL; | ||
136 | } | ||
137 | pr_debug("Try to open %s\n", | ||
138 | session.kmaps[MAP__FUNCTION]->dso->long_name); | ||
139 | return open(session.kmaps[MAP__FUNCTION]->dso->long_name, O_RDONLY); | ||
140 | } | ||
141 | |||
142 | static int opt_show_lines(const struct option *opt __used, | 117 | static int opt_show_lines(const struct option *opt __used, |
143 | const char *str, int unset __used) | 118 | const char *str, int unset __used) |
144 | { | 119 | { |
120 | int ret = 0; | ||
121 | |||
145 | if (str) | 122 | if (str) |
146 | parse_line_range_desc(str, &session.line_range); | 123 | ret = parse_line_range_desc(str, ¶ms.line_range); |
147 | INIT_LIST_HEAD(&session.line_range.line_list); | 124 | INIT_LIST_HEAD(¶ms.line_range.line_list); |
148 | session.show_lines = true; | 125 | params.show_lines = true; |
149 | return 0; | 126 | |
127 | return ret; | ||
150 | } | 128 | } |
151 | #endif | 129 | #endif |
152 | 130 | ||
@@ -155,29 +133,25 @@ static const char * const probe_usage[] = { | |||
155 | "perf probe [<options>] --add 'PROBEDEF' [--add 'PROBEDEF' ...]", | 133 | "perf probe [<options>] --add 'PROBEDEF' [--add 'PROBEDEF' ...]", |
156 | "perf probe [<options>] --del '[GROUP:]EVENT' ...", | 134 | "perf probe [<options>] --del '[GROUP:]EVENT' ...", |
157 | "perf probe --list", | 135 | "perf probe --list", |
158 | #ifndef NO_DWARF_SUPPORT | 136 | #ifdef DWARF_SUPPORT |
159 | "perf probe --line 'LINEDESC'", | 137 | "perf probe --line 'LINEDESC'", |
160 | #endif | 138 | #endif |
161 | NULL | 139 | NULL |
162 | }; | 140 | }; |
163 | 141 | ||
164 | static const struct option options[] = { | 142 | static const struct option options[] = { |
165 | OPT_BOOLEAN('v', "verbose", &verbose, | 143 | OPT_INCR('v', "verbose", &verbose, |
166 | "be more verbose (show parsed arguments, etc)"), | 144 | "be more verbose (show parsed arguments, etc)"), |
167 | #ifndef NO_DWARF_SUPPORT | 145 | OPT_BOOLEAN('l', "list", ¶ms.list_events, |
168 | OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name, | ||
169 | "file", "vmlinux pathname"), | ||
170 | #endif | ||
171 | OPT_BOOLEAN('l', "list", &session.list_events, | ||
172 | "list up current probe events"), | 146 | "list up current probe events"), |
173 | OPT_CALLBACK('d', "del", NULL, "[GROUP:]EVENT", "delete a probe event.", | 147 | OPT_CALLBACK('d', "del", NULL, "[GROUP:]EVENT", "delete a probe event.", |
174 | opt_del_probe_event), | 148 | opt_del_probe_event), |
175 | OPT_CALLBACK('a', "add", NULL, | 149 | OPT_CALLBACK('a', "add", NULL, |
176 | #ifdef NO_DWARF_SUPPORT | 150 | #ifdef DWARF_SUPPORT |
177 | "[EVENT=]FUNC[+OFF|%return] [ARG ...]", | ||
178 | #else | ||
179 | "[EVENT=]FUNC[@SRC][+OFF|%return|:RL|;PT]|SRC:AL|SRC;PT" | 151 | "[EVENT=]FUNC[@SRC][+OFF|%return|:RL|;PT]|SRC:AL|SRC;PT" |
180 | " [ARG ...]", | 152 | " [[NAME=]ARG ...]", |
153 | #else | ||
154 | "[EVENT=]FUNC[+OFF|%return] [[NAME=]ARG ...]", | ||
181 | #endif | 155 | #endif |
182 | "probe point definition, where\n" | 156 | "probe point definition, where\n" |
183 | "\t\tGROUP:\tGroup name (optional)\n" | 157 | "\t\tGROUP:\tGroup name (optional)\n" |
@@ -185,51 +159,35 @@ static const struct option options[] = { | |||
185 | "\t\tFUNC:\tFunction name\n" | 159 | "\t\tFUNC:\tFunction name\n" |
186 | "\t\tOFF:\tOffset from function entry (in byte)\n" | 160 | "\t\tOFF:\tOffset from function entry (in byte)\n" |
187 | "\t\t%return:\tPut the probe at function return\n" | 161 | "\t\t%return:\tPut the probe at function return\n" |
188 | #ifdef NO_DWARF_SUPPORT | 162 | #ifdef DWARF_SUPPORT |
189 | "\t\tARG:\tProbe argument (only \n" | ||
190 | #else | ||
191 | "\t\tSRC:\tSource code path\n" | 163 | "\t\tSRC:\tSource code path\n" |
192 | "\t\tRL:\tRelative line number from function entry.\n" | 164 | "\t\tRL:\tRelative line number from function entry.\n" |
193 | "\t\tAL:\tAbsolute line number in file.\n" | 165 | "\t\tAL:\tAbsolute line number in file.\n" |
194 | "\t\tPT:\tLazy expression of line code.\n" | 166 | "\t\tPT:\tLazy expression of line code.\n" |
195 | "\t\tARG:\tProbe argument (local variable name or\n" | 167 | "\t\tARG:\tProbe argument (local variable name or\n" |
196 | #endif | ||
197 | "\t\t\tkprobe-tracer argument format.)\n", | 168 | "\t\t\tkprobe-tracer argument format.)\n", |
169 | #else | ||
170 | "\t\tARG:\tProbe argument (kprobe-tracer argument format.)\n", | ||
171 | #endif | ||
198 | opt_add_probe_event), | 172 | opt_add_probe_event), |
199 | OPT_BOOLEAN('f', "force", &session.force_add, "forcibly add events" | 173 | OPT_BOOLEAN('f', "force", ¶ms.force_add, "forcibly add events" |
200 | " with existing name"), | 174 | " with existing name"), |
201 | #ifndef NO_DWARF_SUPPORT | 175 | #ifdef DWARF_SUPPORT |
202 | OPT_CALLBACK('L', "line", NULL, | 176 | OPT_CALLBACK('L', "line", NULL, |
203 | "FUNC[:RLN[+NUM|:RLN2]]|SRC:ALN[+NUM|:ALN2]", | 177 | "FUNC[:RLN[+NUM|-RLN2]]|SRC:ALN[+NUM|-ALN2]", |
204 | "Show source code lines.", opt_show_lines), | 178 | "Show source code lines.", opt_show_lines), |
179 | OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name, | ||
180 | "file", "vmlinux pathname"), | ||
205 | #endif | 181 | #endif |
182 | OPT__DRY_RUN(&probe_event_dry_run), | ||
183 | OPT_INTEGER('\0', "max-probes", ¶ms.max_probe_points, | ||
184 | "Set how many probe points can be found for a probe."), | ||
206 | OPT_END() | 185 | OPT_END() |
207 | }; | 186 | }; |
208 | 187 | ||
209 | /* Initialize symbol maps for vmlinux */ | ||
210 | static void init_vmlinux(void) | ||
211 | { | ||
212 | symbol_conf.sort_by_name = true; | ||
213 | if (symbol_conf.vmlinux_name == NULL) | ||
214 | symbol_conf.try_vmlinux_path = true; | ||
215 | else | ||
216 | pr_debug("Use vmlinux: %s\n", symbol_conf.vmlinux_name); | ||
217 | if (symbol__init() < 0) | ||
218 | die("Failed to init symbol map."); | ||
219 | |||
220 | map_groups__init(&session.kmap_groups); | ||
221 | if (map_groups__create_kernel_maps(&session.kmap_groups, | ||
222 | session.kmaps) < 0) | ||
223 | die("Failed to create kernel maps."); | ||
224 | } | ||
225 | |||
226 | int cmd_probe(int argc, const char **argv, const char *prefix __used) | 188 | int cmd_probe(int argc, const char **argv, const char *prefix __used) |
227 | { | 189 | { |
228 | int i, ret; | 190 | int ret; |
229 | #ifndef NO_DWARF_SUPPORT | ||
230 | int fd; | ||
231 | #endif | ||
232 | struct probe_point *pp; | ||
233 | 191 | ||
234 | argc = parse_options(argc, argv, options, probe_usage, | 192 | argc = parse_options(argc, argv, options, probe_usage, |
235 | PARSE_OPT_STOP_AT_NON_OPTION); | 193 | PARSE_OPT_STOP_AT_NON_OPTION); |
@@ -238,123 +196,69 @@ int cmd_probe(int argc, const char **argv, const char *prefix __used) | |||
238 | pr_warning(" Error: '-' is not supported.\n"); | 196 | pr_warning(" Error: '-' is not supported.\n"); |
239 | usage_with_options(probe_usage, options); | 197 | usage_with_options(probe_usage, options); |
240 | } | 198 | } |
241 | parse_probe_event_argv(argc, argv); | 199 | ret = parse_probe_event_argv(argc, argv); |
200 | if (ret < 0) { | ||
201 | pr_err(" Error: Parse Error. (%d)\n", ret); | ||
202 | return ret; | ||
203 | } | ||
242 | } | 204 | } |
243 | 205 | ||
244 | if ((!session.nr_probe && !session.dellist && !session.list_events && | 206 | if (params.max_probe_points == 0) |
245 | !session.show_lines)) | 207 | params.max_probe_points = MAX_PROBES; |
246 | usage_with_options(probe_usage, options); | ||
247 | 208 | ||
248 | if (debugfs_valid_mountpoint(debugfs_path) < 0) | 209 | if ((!params.nevents && !params.dellist && !params.list_events && |
249 | die("Failed to find debugfs path."); | 210 | !params.show_lines)) |
211 | usage_with_options(probe_usage, options); | ||
250 | 212 | ||
251 | if (session.list_events) { | 213 | if (params.list_events) { |
252 | if (session.nr_probe != 0 || session.dellist) { | 214 | if (params.nevents != 0 || params.dellist) { |
253 | pr_warning(" Error: Don't use --list with" | 215 | pr_err(" Error: Don't use --list with --add/--del.\n"); |
254 | " --add/--del.\n"); | ||
255 | usage_with_options(probe_usage, options); | 216 | usage_with_options(probe_usage, options); |
256 | } | 217 | } |
257 | if (session.show_lines) { | 218 | if (params.show_lines) { |
258 | pr_warning(" Error: Don't use --list with --line.\n"); | 219 | pr_err(" Error: Don't use --list with --line.\n"); |
259 | usage_with_options(probe_usage, options); | 220 | usage_with_options(probe_usage, options); |
260 | } | 221 | } |
261 | show_perf_probe_events(); | 222 | ret = show_perf_probe_events(); |
262 | return 0; | 223 | if (ret < 0) |
224 | pr_err(" Error: Failed to show event list. (%d)\n", | ||
225 | ret); | ||
226 | return ret; | ||
263 | } | 227 | } |
264 | 228 | ||
265 | #ifndef NO_DWARF_SUPPORT | 229 | #ifdef DWARF_SUPPORT |
266 | if (session.show_lines) { | 230 | if (params.show_lines) { |
267 | if (session.nr_probe != 0 || session.dellist) { | 231 | if (params.nevents != 0 || params.dellist) { |
268 | pr_warning(" Error: Don't use --line with" | 232 | pr_warning(" Error: Don't use --line with" |
269 | " --add/--del.\n"); | 233 | " --add/--del.\n"); |
270 | usage_with_options(probe_usage, options); | 234 | usage_with_options(probe_usage, options); |
271 | } | 235 | } |
272 | init_vmlinux(); | ||
273 | fd = open_vmlinux(); | ||
274 | if (fd < 0) | ||
275 | die("Could not open debuginfo file."); | ||
276 | ret = find_line_range(fd, &session.line_range); | ||
277 | if (ret <= 0) | ||
278 | die("Source line is not found.\n"); | ||
279 | close(fd); | ||
280 | show_line_range(&session.line_range); | ||
281 | return 0; | ||
282 | } | ||
283 | #endif | ||
284 | 236 | ||
285 | if (session.dellist) { | 237 | ret = show_line_range(¶ms.line_range); |
286 | del_trace_kprobe_events(session.dellist); | 238 | if (ret < 0) |
287 | strlist__delete(session.dellist); | 239 | pr_err(" Error: Failed to show lines. (%d)\n", ret); |
288 | if (session.nr_probe == 0) | 240 | return ret; |
289 | return 0; | ||
290 | } | 241 | } |
242 | #endif | ||
291 | 243 | ||
292 | /* Add probes */ | 244 | if (params.dellist) { |
293 | init_vmlinux(); | 245 | ret = del_perf_probe_events(params.dellist); |
294 | 246 | strlist__delete(params.dellist); | |
295 | if (session.need_dwarf) | 247 | if (ret < 0) { |
296 | #ifdef NO_DWARF_SUPPORT | 248 | pr_err(" Error: Failed to delete events. (%d)\n", ret); |
297 | die("Debuginfo-analysis is not supported"); | 249 | return ret; |
298 | #else /* !NO_DWARF_SUPPORT */ | ||
299 | pr_debug("Some probes require debuginfo.\n"); | ||
300 | |||
301 | fd = open_vmlinux(); | ||
302 | if (fd < 0) { | ||
303 | if (session.need_dwarf) | ||
304 | die("Could not open debuginfo file."); | ||
305 | |||
306 | pr_debug("Could not open vmlinux/module file." | ||
307 | " Try to use symbols.\n"); | ||
308 | goto end_dwarf; | ||
309 | } | ||
310 | |||
311 | /* Searching probe points */ | ||
312 | for (i = 0; i < session.nr_probe; i++) { | ||
313 | pp = &session.probes[i]; | ||
314 | if (pp->found) | ||
315 | continue; | ||
316 | |||
317 | lseek(fd, SEEK_SET, 0); | ||
318 | ret = find_probe_point(fd, pp); | ||
319 | if (ret > 0) | ||
320 | continue; | ||
321 | if (ret == 0) { /* No error but failed to find probe point. */ | ||
322 | synthesize_perf_probe_point(pp); | ||
323 | die("Probe point '%s' not found. - probe not added.", | ||
324 | pp->probes[0]); | ||
325 | } | ||
326 | /* Error path */ | ||
327 | if (session.need_dwarf) { | ||
328 | if (ret == -ENOENT) | ||
329 | pr_warning("No dwarf info found in the vmlinux - please rebuild with CONFIG_DEBUG_INFO=y.\n"); | ||
330 | die("Could not analyze debuginfo."); | ||
331 | } | 250 | } |
332 | pr_debug("An error occurred in debuginfo analysis." | ||
333 | " Try to use symbols.\n"); | ||
334 | break; | ||
335 | } | 251 | } |
336 | close(fd); | ||
337 | |||
338 | end_dwarf: | ||
339 | #endif /* !NO_DWARF_SUPPORT */ | ||
340 | 252 | ||
341 | /* Synthesize probes without dwarf */ | 253 | if (params.nevents) { |
342 | for (i = 0; i < session.nr_probe; i++) { | 254 | ret = add_perf_probe_events(params.events, params.nevents, |
343 | pp = &session.probes[i]; | 255 | params.force_add, |
344 | if (pp->found) /* This probe is already found. */ | 256 | params.max_probe_points); |
345 | continue; | 257 | if (ret < 0) { |
346 | 258 | pr_err(" Error: Failed to add events. (%d)\n", ret); | |
347 | evaluate_probe_point(pp); | 259 | return ret; |
348 | ret = synthesize_trace_kprobe_event(pp); | 260 | } |
349 | if (ret == -E2BIG) | ||
350 | die("probe point definition becomes too long."); | ||
351 | else if (ret < 0) | ||
352 | die("Failed to synthesize a probe point."); | ||
353 | } | 261 | } |
354 | |||
355 | /* Settng up probe points */ | ||
356 | add_trace_kprobe_events(session.probes, session.nr_probe, | ||
357 | session.force_add); | ||
358 | return 0; | 262 | return 0; |
359 | } | 263 | } |
360 | 264 | ||
diff --git a/tools/perf/builtin-record.c b/tools/perf/builtin-record.c index f1411e9cdf47..cb46c7d0ea99 100644 --- a/tools/perf/builtin-record.c +++ b/tools/perf/builtin-record.c | |||
@@ -15,7 +15,6 @@ | |||
15 | #include "util/util.h" | 15 | #include "util/util.h" |
16 | #include "util/parse-options.h" | 16 | #include "util/parse-options.h" |
17 | #include "util/parse-events.h" | 17 | #include "util/parse-events.h" |
18 | #include "util/string.h" | ||
19 | 18 | ||
20 | #include "util/header.h" | 19 | #include "util/header.h" |
21 | #include "util/event.h" | 20 | #include "util/event.h" |
@@ -27,31 +26,41 @@ | |||
27 | #include <unistd.h> | 26 | #include <unistd.h> |
28 | #include <sched.h> | 27 | #include <sched.h> |
29 | 28 | ||
30 | static int fd[MAX_NR_CPUS][MAX_COUNTERS]; | 29 | enum write_mode_t { |
30 | WRITE_FORCE, | ||
31 | WRITE_APPEND | ||
32 | }; | ||
33 | |||
34 | static int *fd[MAX_NR_CPUS][MAX_COUNTERS]; | ||
31 | 35 | ||
32 | static long default_interval = 0; | 36 | static u64 user_interval = ULLONG_MAX; |
37 | static u64 default_interval = 0; | ||
33 | 38 | ||
34 | static int nr_cpus = 0; | 39 | static int nr_cpus = 0; |
35 | static unsigned int page_size; | 40 | static unsigned int page_size; |
36 | static unsigned int mmap_pages = 128; | 41 | static unsigned int mmap_pages = 128; |
42 | static unsigned int user_freq = UINT_MAX; | ||
37 | static int freq = 1000; | 43 | static int freq = 1000; |
38 | static int output; | 44 | static int output; |
45 | static int pipe_output = 0; | ||
39 | static const char *output_name = "perf.data"; | 46 | static const char *output_name = "perf.data"; |
40 | static int group = 0; | 47 | static int group = 0; |
41 | static unsigned int realtime_prio = 0; | 48 | static int realtime_prio = 0; |
42 | static int raw_samples = 0; | 49 | static bool raw_samples = false; |
43 | static int system_wide = 0; | 50 | static bool system_wide = false; |
44 | static int profile_cpu = -1; | 51 | static int profile_cpu = -1; |
45 | static pid_t target_pid = -1; | 52 | static pid_t target_pid = -1; |
53 | static pid_t target_tid = -1; | ||
54 | static pid_t *all_tids = NULL; | ||
55 | static int thread_num = 0; | ||
46 | static pid_t child_pid = -1; | 56 | static pid_t child_pid = -1; |
47 | static int inherit = 1; | 57 | static bool no_inherit = false; |
48 | static int force = 0; | 58 | static enum write_mode_t write_mode = WRITE_FORCE; |
49 | static int append_file = 0; | 59 | static bool call_graph = false; |
50 | static int call_graph = 0; | 60 | static bool inherit_stat = false; |
51 | static int inherit_stat = 0; | 61 | static bool no_samples = false; |
52 | static int no_samples = 0; | 62 | static bool sample_address = false; |
53 | static int sample_address = 0; | 63 | static bool multiplex = false; |
54 | static int multiplex = 0; | ||
55 | static int multiplex_fd = -1; | 64 | static int multiplex_fd = -1; |
56 | 65 | ||
57 | static long samples = 0; | 66 | static long samples = 0; |
@@ -60,7 +69,7 @@ static struct timeval this_read; | |||
60 | 69 | ||
61 | static u64 bytes_written = 0; | 70 | static u64 bytes_written = 0; |
62 | 71 | ||
63 | static struct pollfd event_array[MAX_NR_CPUS * MAX_COUNTERS]; | 72 | static struct pollfd *event_array; |
64 | 73 | ||
65 | static int nr_poll = 0; | 74 | static int nr_poll = 0; |
66 | static int nr_cpu = 0; | 75 | static int nr_cpu = 0; |
@@ -77,7 +86,7 @@ struct mmap_data { | |||
77 | unsigned int prev; | 86 | unsigned int prev; |
78 | }; | 87 | }; |
79 | 88 | ||
80 | static struct mmap_data mmap_array[MAX_NR_CPUS][MAX_COUNTERS]; | 89 | static struct mmap_data *mmap_array[MAX_NR_CPUS][MAX_COUNTERS]; |
81 | 90 | ||
82 | static unsigned long mmap_read_head(struct mmap_data *md) | 91 | static unsigned long mmap_read_head(struct mmap_data *md) |
83 | { | 92 | { |
@@ -101,6 +110,11 @@ static void mmap_write_tail(struct mmap_data *md, unsigned long tail) | |||
101 | pc->data_tail = tail; | 110 | pc->data_tail = tail; |
102 | } | 111 | } |
103 | 112 | ||
113 | static void advance_output(size_t size) | ||
114 | { | ||
115 | bytes_written += size; | ||
116 | } | ||
117 | |||
104 | static void write_output(void *buf, size_t size) | 118 | static void write_output(void *buf, size_t size) |
105 | { | 119 | { |
106 | while (size) { | 120 | while (size) { |
@@ -225,12 +239,13 @@ static struct perf_header_attr *get_header_attr(struct perf_event_attr *a, int n | |||
225 | return h_attr; | 239 | return h_attr; |
226 | } | 240 | } |
227 | 241 | ||
228 | static void create_counter(int counter, int cpu, pid_t pid) | 242 | static void create_counter(int counter, int cpu) |
229 | { | 243 | { |
230 | char *filter = filters[counter]; | 244 | char *filter = filters[counter]; |
231 | struct perf_event_attr *attr = attrs + counter; | 245 | struct perf_event_attr *attr = attrs + counter; |
232 | struct perf_header_attr *h_attr; | 246 | struct perf_header_attr *h_attr; |
233 | int track = !counter; /* only the first counter needs these */ | 247 | int track = !counter; /* only the first counter needs these */ |
248 | int thread_index; | ||
234 | int ret; | 249 | int ret; |
235 | struct { | 250 | struct { |
236 | u64 count; | 251 | u64 count; |
@@ -248,10 +263,19 @@ static void create_counter(int counter, int cpu, pid_t pid) | |||
248 | if (nr_counters > 1) | 263 | if (nr_counters > 1) |
249 | attr->sample_type |= PERF_SAMPLE_ID; | 264 | attr->sample_type |= PERF_SAMPLE_ID; |
250 | 265 | ||
251 | if (freq) { | 266 | /* |
252 | attr->sample_type |= PERF_SAMPLE_PERIOD; | 267 | * We default some events to a 1 default interval. But keep |
253 | attr->freq = 1; | 268 | * it a weak assumption overridable by the user. |
254 | attr->sample_freq = freq; | 269 | */ |
270 | if (!attr->sample_period || (user_freq != UINT_MAX && | ||
271 | user_interval != ULLONG_MAX)) { | ||
272 | if (freq) { | ||
273 | attr->sample_type |= PERF_SAMPLE_PERIOD; | ||
274 | attr->freq = 1; | ||
275 | attr->sample_freq = freq; | ||
276 | } else { | ||
277 | attr->sample_period = default_interval; | ||
278 | } | ||
255 | } | 279 | } |
256 | 280 | ||
257 | if (no_samples) | 281 | if (no_samples) |
@@ -274,119 +298,130 @@ static void create_counter(int counter, int cpu, pid_t pid) | |||
274 | 298 | ||
275 | attr->mmap = track; | 299 | attr->mmap = track; |
276 | attr->comm = track; | 300 | attr->comm = track; |
277 | attr->inherit = inherit; | 301 | attr->inherit = !no_inherit; |
278 | attr->disabled = 1; | 302 | if (target_pid == -1 && target_tid == -1 && !system_wide) { |
303 | attr->disabled = 1; | ||
304 | attr->enable_on_exec = 1; | ||
305 | } | ||
279 | 306 | ||
307 | for (thread_index = 0; thread_index < thread_num; thread_index++) { | ||
280 | try_again: | 308 | try_again: |
281 | fd[nr_cpu][counter] = sys_perf_event_open(attr, pid, cpu, group_fd, 0); | 309 | fd[nr_cpu][counter][thread_index] = sys_perf_event_open(attr, |
282 | 310 | all_tids[thread_index], cpu, group_fd, 0); | |
283 | if (fd[nr_cpu][counter] < 0) { | 311 | |
284 | int err = errno; | 312 | if (fd[nr_cpu][counter][thread_index] < 0) { |
285 | 313 | int err = errno; | |
286 | if (err == EPERM || err == EACCES) | 314 | |
287 | die("Permission error - are you root?\n"); | 315 | if (err == EPERM || err == EACCES) |
288 | else if (err == ENODEV && profile_cpu != -1) | 316 | die("Permission error - are you root?\n" |
289 | die("No such device - did you specify an out-of-range profile CPU?\n"); | 317 | "\t Consider tweaking" |
318 | " /proc/sys/kernel/perf_event_paranoid.\n"); | ||
319 | else if (err == ENODEV && profile_cpu != -1) { | ||
320 | die("No such device - did you specify" | ||
321 | " an out-of-range profile CPU?\n"); | ||
322 | } | ||
290 | 323 | ||
291 | /* | 324 | /* |
292 | * If it's cycles then fall back to hrtimer | 325 | * If it's cycles then fall back to hrtimer |
293 | * based cpu-clock-tick sw counter, which | 326 | * based cpu-clock-tick sw counter, which |
294 | * is always available even if no PMU support: | 327 | * is always available even if no PMU support: |
295 | */ | 328 | */ |
296 | if (attr->type == PERF_TYPE_HARDWARE | 329 | if (attr->type == PERF_TYPE_HARDWARE |
297 | && attr->config == PERF_COUNT_HW_CPU_CYCLES) { | 330 | && attr->config == PERF_COUNT_HW_CPU_CYCLES) { |
298 | 331 | ||
299 | if (verbose) | 332 | if (verbose) |
300 | warning(" ... trying to fall back to cpu-clock-ticks\n"); | 333 | warning(" ... trying to fall back to cpu-clock-ticks\n"); |
301 | attr->type = PERF_TYPE_SOFTWARE; | 334 | attr->type = PERF_TYPE_SOFTWARE; |
302 | attr->config = PERF_COUNT_SW_CPU_CLOCK; | 335 | attr->config = PERF_COUNT_SW_CPU_CLOCK; |
303 | goto try_again; | 336 | goto try_again; |
304 | } | 337 | } |
305 | printf("\n"); | 338 | printf("\n"); |
306 | error("perfcounter syscall returned with %d (%s)\n", | 339 | error("perfcounter syscall returned with %d (%s)\n", |
307 | fd[nr_cpu][counter], strerror(err)); | 340 | fd[nr_cpu][counter][thread_index], strerror(err)); |
308 | 341 | ||
309 | #if defined(__i386__) || defined(__x86_64__) | 342 | #if defined(__i386__) || defined(__x86_64__) |
310 | if (attr->type == PERF_TYPE_HARDWARE && err == EOPNOTSUPP) | 343 | if (attr->type == PERF_TYPE_HARDWARE && err == EOPNOTSUPP) |
311 | die("No hardware sampling interrupt available. No APIC? If so then you can boot the kernel with the \"lapic\" boot parameter to force-enable it.\n"); | 344 | die("No hardware sampling interrupt available." |
345 | " No APIC? If so then you can boot the kernel" | ||
346 | " with the \"lapic\" boot parameter to" | ||
347 | " force-enable it.\n"); | ||
312 | #endif | 348 | #endif |
313 | 349 | ||
314 | die("No CONFIG_PERF_EVENTS=y kernel support configured?\n"); | 350 | die("No CONFIG_PERF_EVENTS=y kernel support configured?\n"); |
315 | exit(-1); | 351 | exit(-1); |
316 | } | 352 | } |
317 | 353 | ||
318 | h_attr = get_header_attr(attr, counter); | 354 | h_attr = get_header_attr(attr, counter); |
319 | if (h_attr == NULL) | 355 | if (h_attr == NULL) |
320 | die("nomem\n"); | 356 | die("nomem\n"); |
321 | 357 | ||
322 | if (!file_new) { | 358 | if (!file_new) { |
323 | if (memcmp(&h_attr->attr, attr, sizeof(*attr))) { | 359 | if (memcmp(&h_attr->attr, attr, sizeof(*attr))) { |
324 | fprintf(stderr, "incompatible append\n"); | 360 | fprintf(stderr, "incompatible append\n"); |
325 | exit(-1); | 361 | exit(-1); |
362 | } | ||
326 | } | 363 | } |
327 | } | ||
328 | 364 | ||
329 | if (read(fd[nr_cpu][counter], &read_data, sizeof(read_data)) == -1) { | 365 | if (read(fd[nr_cpu][counter][thread_index], &read_data, sizeof(read_data)) == -1) { |
330 | perror("Unable to read perf file descriptor\n"); | 366 | perror("Unable to read perf file descriptor\n"); |
331 | exit(-1); | 367 | exit(-1); |
332 | } | 368 | } |
333 | 369 | ||
334 | if (perf_header_attr__add_id(h_attr, read_data.id) < 0) { | 370 | if (perf_header_attr__add_id(h_attr, read_data.id) < 0) { |
335 | pr_warning("Not enough memory to add id\n"); | 371 | pr_warning("Not enough memory to add id\n"); |
336 | exit(-1); | 372 | exit(-1); |
337 | } | 373 | } |
338 | 374 | ||
339 | assert(fd[nr_cpu][counter] >= 0); | 375 | assert(fd[nr_cpu][counter][thread_index] >= 0); |
340 | fcntl(fd[nr_cpu][counter], F_SETFL, O_NONBLOCK); | 376 | fcntl(fd[nr_cpu][counter][thread_index], F_SETFL, O_NONBLOCK); |
341 | 377 | ||
342 | /* | 378 | /* |
343 | * First counter acts as the group leader: | 379 | * First counter acts as the group leader: |
344 | */ | 380 | */ |
345 | if (group && group_fd == -1) | 381 | if (group && group_fd == -1) |
346 | group_fd = fd[nr_cpu][counter]; | 382 | group_fd = fd[nr_cpu][counter][thread_index]; |
347 | if (multiplex && multiplex_fd == -1) | 383 | if (multiplex && multiplex_fd == -1) |
348 | multiplex_fd = fd[nr_cpu][counter]; | 384 | multiplex_fd = fd[nr_cpu][counter][thread_index]; |
349 | 385 | ||
350 | if (multiplex && fd[nr_cpu][counter] != multiplex_fd) { | 386 | if (multiplex && fd[nr_cpu][counter][thread_index] != multiplex_fd) { |
351 | 387 | ||
352 | ret = ioctl(fd[nr_cpu][counter], PERF_EVENT_IOC_SET_OUTPUT, multiplex_fd); | 388 | ret = ioctl(fd[nr_cpu][counter][thread_index], PERF_EVENT_IOC_SET_OUTPUT, multiplex_fd); |
353 | assert(ret != -1); | 389 | assert(ret != -1); |
354 | } else { | 390 | } else { |
355 | event_array[nr_poll].fd = fd[nr_cpu][counter]; | 391 | event_array[nr_poll].fd = fd[nr_cpu][counter][thread_index]; |
356 | event_array[nr_poll].events = POLLIN; | 392 | event_array[nr_poll].events = POLLIN; |
357 | nr_poll++; | 393 | nr_poll++; |
358 | 394 | ||
359 | mmap_array[nr_cpu][counter].counter = counter; | 395 | mmap_array[nr_cpu][counter][thread_index].counter = counter; |
360 | mmap_array[nr_cpu][counter].prev = 0; | 396 | mmap_array[nr_cpu][counter][thread_index].prev = 0; |
361 | mmap_array[nr_cpu][counter].mask = mmap_pages*page_size - 1; | 397 | mmap_array[nr_cpu][counter][thread_index].mask = mmap_pages*page_size - 1; |
362 | mmap_array[nr_cpu][counter].base = mmap(NULL, (mmap_pages+1)*page_size, | 398 | mmap_array[nr_cpu][counter][thread_index].base = mmap(NULL, (mmap_pages+1)*page_size, |
363 | PROT_READ|PROT_WRITE, MAP_SHARED, fd[nr_cpu][counter], 0); | 399 | PROT_READ|PROT_WRITE, MAP_SHARED, fd[nr_cpu][counter][thread_index], 0); |
364 | if (mmap_array[nr_cpu][counter].base == MAP_FAILED) { | 400 | if (mmap_array[nr_cpu][counter][thread_index].base == MAP_FAILED) { |
365 | error("failed to mmap with %d (%s)\n", errno, strerror(errno)); | 401 | error("failed to mmap with %d (%s)\n", errno, strerror(errno)); |
366 | exit(-1); | 402 | exit(-1); |
403 | } | ||
367 | } | 404 | } |
368 | } | ||
369 | 405 | ||
370 | if (filter != NULL) { | 406 | if (filter != NULL) { |
371 | ret = ioctl(fd[nr_cpu][counter], | 407 | ret = ioctl(fd[nr_cpu][counter][thread_index], |
372 | PERF_EVENT_IOC_SET_FILTER, filter); | 408 | PERF_EVENT_IOC_SET_FILTER, filter); |
373 | if (ret) { | 409 | if (ret) { |
374 | error("failed to set filter with %d (%s)\n", errno, | 410 | error("failed to set filter with %d (%s)\n", errno, |
375 | strerror(errno)); | 411 | strerror(errno)); |
376 | exit(-1); | 412 | exit(-1); |
413 | } | ||
377 | } | 414 | } |
378 | } | 415 | } |
379 | |||
380 | ioctl(fd[nr_cpu][counter], PERF_EVENT_IOC_ENABLE); | ||
381 | } | 416 | } |
382 | 417 | ||
383 | static void open_counters(int cpu, pid_t pid) | 418 | static void open_counters(int cpu) |
384 | { | 419 | { |
385 | int counter; | 420 | int counter; |
386 | 421 | ||
387 | group_fd = -1; | 422 | group_fd = -1; |
388 | for (counter = 0; counter < nr_counters; counter++) | 423 | for (counter = 0; counter < nr_counters; counter++) |
389 | create_counter(counter, cpu, pid); | 424 | create_counter(counter, cpu); |
390 | 425 | ||
391 | nr_cpu++; | 426 | nr_cpu++; |
392 | } | 427 | } |
@@ -406,10 +441,80 @@ static int process_buildids(void) | |||
406 | 441 | ||
407 | static void atexit_header(void) | 442 | static void atexit_header(void) |
408 | { | 443 | { |
409 | session->header.data_size += bytes_written; | 444 | if (!pipe_output) { |
445 | session->header.data_size += bytes_written; | ||
446 | |||
447 | process_buildids(); | ||
448 | perf_header__write(&session->header, output, true); | ||
449 | } | ||
450 | } | ||
451 | |||
452 | static void event__synthesize_guest_os(struct machine *machine, void *data) | ||
453 | { | ||
454 | int err; | ||
455 | char *guest_kallsyms; | ||
456 | char path[PATH_MAX]; | ||
457 | struct perf_session *psession = data; | ||
458 | |||
459 | if (machine__is_host(machine)) | ||
460 | return; | ||
461 | |||
462 | /* | ||
463 | *As for guest kernel when processing subcommand record&report, | ||
464 | *we arrange module mmap prior to guest kernel mmap and trigger | ||
465 | *a preload dso because default guest module symbols are loaded | ||
466 | *from guest kallsyms instead of /lib/modules/XXX/XXX. This | ||
467 | *method is used to avoid symbol missing when the first addr is | ||
468 | *in module instead of in guest kernel. | ||
469 | */ | ||
470 | err = event__synthesize_modules(process_synthesized_event, | ||
471 | psession, machine); | ||
472 | if (err < 0) | ||
473 | pr_err("Couldn't record guest kernel [%d]'s reference" | ||
474 | " relocation symbol.\n", machine->pid); | ||
475 | |||
476 | if (machine__is_default_guest(machine)) | ||
477 | guest_kallsyms = (char *) symbol_conf.default_guest_kallsyms; | ||
478 | else { | ||
479 | sprintf(path, "%s/proc/kallsyms", machine->root_dir); | ||
480 | guest_kallsyms = path; | ||
481 | } | ||
482 | |||
483 | /* | ||
484 | * We use _stext for guest kernel because guest kernel's /proc/kallsyms | ||
485 | * have no _text sometimes. | ||
486 | */ | ||
487 | err = event__synthesize_kernel_mmap(process_synthesized_event, | ||
488 | psession, machine, "_text"); | ||
489 | if (err < 0) | ||
490 | err = event__synthesize_kernel_mmap(process_synthesized_event, | ||
491 | psession, machine, "_stext"); | ||
492 | if (err < 0) | ||
493 | pr_err("Couldn't record guest kernel [%d]'s reference" | ||
494 | " relocation symbol.\n", machine->pid); | ||
495 | } | ||
496 | |||
497 | static struct perf_event_header finished_round_event = { | ||
498 | .size = sizeof(struct perf_event_header), | ||
499 | .type = PERF_RECORD_FINISHED_ROUND, | ||
500 | }; | ||
501 | |||
502 | static void mmap_read_all(void) | ||
503 | { | ||
504 | int i, counter, thread; | ||
505 | |||
506 | for (i = 0; i < nr_cpu; i++) { | ||
507 | for (counter = 0; counter < nr_counters; counter++) { | ||
508 | for (thread = 0; thread < thread_num; thread++) { | ||
509 | if (mmap_array[i][counter][thread].base) | ||
510 | mmap_read(&mmap_array[i][counter][thread]); | ||
511 | } | ||
512 | |||
513 | } | ||
514 | } | ||
410 | 515 | ||
411 | process_buildids(); | 516 | if (perf_header__has_feat(&session->header, HEADER_TRACE_INFO)) |
412 | perf_header__write(&session->header, output, true); | 517 | write_output(&finished_round_event, sizeof(finished_round_event)); |
413 | } | 518 | } |
414 | 519 | ||
415 | static int __cmd_record(int argc, const char **argv) | 520 | static int __cmd_record(int argc, const char **argv) |
@@ -421,8 +526,9 @@ static int __cmd_record(int argc, const char **argv) | |||
421 | int err; | 526 | int err; |
422 | unsigned long waking = 0; | 527 | unsigned long waking = 0; |
423 | int child_ready_pipe[2], go_pipe[2]; | 528 | int child_ready_pipe[2], go_pipe[2]; |
424 | const bool forks = target_pid == -1 && argc > 0; | 529 | const bool forks = argc > 0; |
425 | char buf; | 530 | char buf; |
531 | struct machine *machine; | ||
426 | 532 | ||
427 | page_size = sysconf(_SC_PAGE_SIZE); | 533 | page_size = sysconf(_SC_PAGE_SIZE); |
428 | 534 | ||
@@ -435,70 +541,63 @@ static int __cmd_record(int argc, const char **argv) | |||
435 | exit(-1); | 541 | exit(-1); |
436 | } | 542 | } |
437 | 543 | ||
438 | if (!stat(output_name, &st) && st.st_size) { | 544 | if (!strcmp(output_name, "-")) |
439 | if (!force) { | 545 | pipe_output = 1; |
440 | if (!append_file) { | 546 | else if (!stat(output_name, &st) && st.st_size) { |
441 | pr_err("Error, output file %s exists, use -A " | 547 | if (write_mode == WRITE_FORCE) { |
442 | "to append or -f to overwrite.\n", | ||
443 | output_name); | ||
444 | exit(-1); | ||
445 | } | ||
446 | } else { | ||
447 | char oldname[PATH_MAX]; | 548 | char oldname[PATH_MAX]; |
448 | snprintf(oldname, sizeof(oldname), "%s.old", | 549 | snprintf(oldname, sizeof(oldname), "%s.old", |
449 | output_name); | 550 | output_name); |
450 | unlink(oldname); | 551 | unlink(oldname); |
451 | rename(output_name, oldname); | 552 | rename(output_name, oldname); |
452 | } | 553 | } |
453 | } else { | 554 | } else if (write_mode == WRITE_APPEND) { |
454 | append_file = 0; | 555 | write_mode = WRITE_FORCE; |
455 | } | 556 | } |
456 | 557 | ||
457 | flags = O_CREAT|O_RDWR; | 558 | flags = O_CREAT|O_RDWR; |
458 | if (append_file) | 559 | if (write_mode == WRITE_APPEND) |
459 | file_new = 0; | 560 | file_new = 0; |
460 | else | 561 | else |
461 | flags |= O_TRUNC; | 562 | flags |= O_TRUNC; |
462 | 563 | ||
463 | output = open(output_name, flags, S_IRUSR|S_IWUSR); | 564 | if (pipe_output) |
565 | output = STDOUT_FILENO; | ||
566 | else | ||
567 | output = open(output_name, flags, S_IRUSR | S_IWUSR); | ||
464 | if (output < 0) { | 568 | if (output < 0) { |
465 | perror("failed to create output file"); | 569 | perror("failed to create output file"); |
466 | exit(-1); | 570 | exit(-1); |
467 | } | 571 | } |
468 | 572 | ||
469 | session = perf_session__new(output_name, O_WRONLY, force); | 573 | session = perf_session__new(output_name, O_WRONLY, |
574 | write_mode == WRITE_FORCE, false); | ||
470 | if (session == NULL) { | 575 | if (session == NULL) { |
471 | pr_err("Not enough memory for reading perf file header\n"); | 576 | pr_err("Not enough memory for reading perf file header\n"); |
472 | return -1; | 577 | return -1; |
473 | } | 578 | } |
474 | 579 | ||
475 | if (!file_new) { | 580 | if (!file_new) { |
476 | err = perf_header__read(&session->header, output); | 581 | err = perf_header__read(session, output); |
477 | if (err < 0) | 582 | if (err < 0) |
478 | return err; | 583 | return err; |
479 | } | 584 | } |
480 | 585 | ||
481 | if (raw_samples) { | 586 | if (have_tracepoints(attrs, nr_counters)) |
482 | perf_header__set_feat(&session->header, HEADER_TRACE_INFO); | 587 | perf_header__set_feat(&session->header, HEADER_TRACE_INFO); |
483 | } else { | ||
484 | for (i = 0; i < nr_counters; i++) { | ||
485 | if (attrs[i].sample_type & PERF_SAMPLE_RAW) { | ||
486 | perf_header__set_feat(&session->header, HEADER_TRACE_INFO); | ||
487 | break; | ||
488 | } | ||
489 | } | ||
490 | } | ||
491 | 588 | ||
492 | atexit(atexit_header); | 589 | atexit(atexit_header); |
493 | 590 | ||
494 | if (forks) { | 591 | if (forks) { |
495 | pid = fork(); | 592 | child_pid = fork(); |
496 | if (pid < 0) { | 593 | if (pid < 0) { |
497 | perror("failed to fork"); | 594 | perror("failed to fork"); |
498 | exit(-1); | 595 | exit(-1); |
499 | } | 596 | } |
500 | 597 | ||
501 | if (!pid) { | 598 | if (!child_pid) { |
599 | if (pipe_output) | ||
600 | dup2(2, 1); | ||
502 | close(child_ready_pipe[0]); | 601 | close(child_ready_pipe[0]); |
503 | close(go_pipe[1]); | 602 | close(go_pipe[1]); |
504 | fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC); | 603 | fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC); |
@@ -527,10 +626,8 @@ static int __cmd_record(int argc, const char **argv) | |||
527 | exit(-1); | 626 | exit(-1); |
528 | } | 627 | } |
529 | 628 | ||
530 | child_pid = pid; | 629 | if (!system_wide && target_tid == -1 && target_pid == -1) |
531 | 630 | all_tids[0] = child_pid; | |
532 | if (!system_wide) | ||
533 | target_pid = pid; | ||
534 | 631 | ||
535 | close(child_ready_pipe[1]); | 632 | close(child_ready_pipe[1]); |
536 | close(go_pipe[0]); | 633 | close(go_pipe[0]); |
@@ -544,16 +641,19 @@ static int __cmd_record(int argc, const char **argv) | |||
544 | close(child_ready_pipe[0]); | 641 | close(child_ready_pipe[0]); |
545 | } | 642 | } |
546 | 643 | ||
547 | 644 | if ((!system_wide && no_inherit) || profile_cpu != -1) { | |
548 | if ((!system_wide && !inherit) || profile_cpu != -1) { | 645 | open_counters(profile_cpu); |
549 | open_counters(profile_cpu, target_pid); | ||
550 | } else { | 646 | } else { |
551 | nr_cpus = read_cpu_map(); | 647 | nr_cpus = read_cpu_map(); |
552 | for (i = 0; i < nr_cpus; i++) | 648 | for (i = 0; i < nr_cpus; i++) |
553 | open_counters(cpumap[i], target_pid); | 649 | open_counters(cpumap[i]); |
554 | } | 650 | } |
555 | 651 | ||
556 | if (file_new) { | 652 | if (pipe_output) { |
653 | err = perf_header__write_pipe(output); | ||
654 | if (err < 0) | ||
655 | return err; | ||
656 | } else if (file_new) { | ||
557 | err = perf_header__write(&session->header, output, false); | 657 | err = perf_header__write(&session->header, output, false); |
558 | if (err < 0) | 658 | if (err < 0) |
559 | return err; | 659 | return err; |
@@ -561,24 +661,70 @@ static int __cmd_record(int argc, const char **argv) | |||
561 | 661 | ||
562 | post_processing_offset = lseek(output, 0, SEEK_CUR); | 662 | post_processing_offset = lseek(output, 0, SEEK_CUR); |
563 | 663 | ||
664 | if (pipe_output) { | ||
665 | err = event__synthesize_attrs(&session->header, | ||
666 | process_synthesized_event, | ||
667 | session); | ||
668 | if (err < 0) { | ||
669 | pr_err("Couldn't synthesize attrs.\n"); | ||
670 | return err; | ||
671 | } | ||
672 | |||
673 | err = event__synthesize_event_types(process_synthesized_event, | ||
674 | session); | ||
675 | if (err < 0) { | ||
676 | pr_err("Couldn't synthesize event_types.\n"); | ||
677 | return err; | ||
678 | } | ||
679 | |||
680 | if (have_tracepoints(attrs, nr_counters)) { | ||
681 | /* | ||
682 | * FIXME err <= 0 here actually means that | ||
683 | * there were no tracepoints so its not really | ||
684 | * an error, just that we don't need to | ||
685 | * synthesize anything. We really have to | ||
686 | * return this more properly and also | ||
687 | * propagate errors that now are calling die() | ||
688 | */ | ||
689 | err = event__synthesize_tracing_data(output, attrs, | ||
690 | nr_counters, | ||
691 | process_synthesized_event, | ||
692 | session); | ||
693 | if (err <= 0) { | ||
694 | pr_err("Couldn't record tracing data.\n"); | ||
695 | return err; | ||
696 | } | ||
697 | advance_output(err); | ||
698 | } | ||
699 | } | ||
700 | |||
701 | machine = perf_session__find_host_machine(session); | ||
702 | if (!machine) { | ||
703 | pr_err("Couldn't find native kernel information.\n"); | ||
704 | return -1; | ||
705 | } | ||
706 | |||
564 | err = event__synthesize_kernel_mmap(process_synthesized_event, | 707 | err = event__synthesize_kernel_mmap(process_synthesized_event, |
565 | session, "_text"); | 708 | session, machine, "_text"); |
566 | if (err < 0) | 709 | if (err < 0) |
567 | err = event__synthesize_kernel_mmap(process_synthesized_event, | 710 | err = event__synthesize_kernel_mmap(process_synthesized_event, |
568 | session, "_stext"); | 711 | session, machine, "_stext"); |
569 | if (err < 0) { | 712 | if (err < 0) { |
570 | pr_err("Couldn't record kernel reference relocation symbol.\n"); | 713 | pr_err("Couldn't record kernel reference relocation symbol.\n"); |
571 | return err; | 714 | return err; |
572 | } | 715 | } |
573 | 716 | ||
574 | err = event__synthesize_modules(process_synthesized_event, session); | 717 | err = event__synthesize_modules(process_synthesized_event, |
718 | session, machine); | ||
575 | if (err < 0) { | 719 | if (err < 0) { |
576 | pr_err("Couldn't record kernel reference relocation symbol.\n"); | 720 | pr_err("Couldn't record kernel reference relocation symbol.\n"); |
577 | return err; | 721 | return err; |
578 | } | 722 | } |
723 | if (perf_guest) | ||
724 | perf_session__process_machines(session, event__synthesize_guest_os); | ||
579 | 725 | ||
580 | if (!system_wide && profile_cpu == -1) | 726 | if (!system_wide && profile_cpu == -1) |
581 | event__synthesize_thread(target_pid, process_synthesized_event, | 727 | event__synthesize_thread(target_tid, process_synthesized_event, |
582 | session); | 728 | session); |
583 | else | 729 | else |
584 | event__synthesize_threads(process_synthesized_event, session); | 730 | event__synthesize_threads(process_synthesized_event, session); |
@@ -601,13 +747,9 @@ static int __cmd_record(int argc, const char **argv) | |||
601 | 747 | ||
602 | for (;;) { | 748 | for (;;) { |
603 | int hits = samples; | 749 | int hits = samples; |
750 | int thread; | ||
604 | 751 | ||
605 | for (i = 0; i < nr_cpu; i++) { | 752 | mmap_read_all(); |
606 | for (counter = 0; counter < nr_counters; counter++) { | ||
607 | if (mmap_array[i][counter].base) | ||
608 | mmap_read(&mmap_array[i][counter]); | ||
609 | } | ||
610 | } | ||
611 | 753 | ||
612 | if (hits == samples) { | 754 | if (hits == samples) { |
613 | if (done) | 755 | if (done) |
@@ -618,8 +760,15 @@ static int __cmd_record(int argc, const char **argv) | |||
618 | 760 | ||
619 | if (done) { | 761 | if (done) { |
620 | for (i = 0; i < nr_cpu; i++) { | 762 | for (i = 0; i < nr_cpu; i++) { |
621 | for (counter = 0; counter < nr_counters; counter++) | 763 | for (counter = 0; |
622 | ioctl(fd[i][counter], PERF_EVENT_IOC_DISABLE); | 764 | counter < nr_counters; |
765 | counter++) { | ||
766 | for (thread = 0; | ||
767 | thread < thread_num; | ||
768 | thread++) | ||
769 | ioctl(fd[i][counter][thread], | ||
770 | PERF_EVENT_IOC_DISABLE); | ||
771 | } | ||
623 | } | 772 | } |
624 | } | 773 | } |
625 | } | 774 | } |
@@ -644,6 +793,8 @@ static const char * const record_usage[] = { | |||
644 | NULL | 793 | NULL |
645 | }; | 794 | }; |
646 | 795 | ||
796 | static bool force, append_file; | ||
797 | |||
647 | static const struct option options[] = { | 798 | static const struct option options[] = { |
648 | OPT_CALLBACK('e', "event", NULL, "event", | 799 | OPT_CALLBACK('e', "event", NULL, "event", |
649 | "event selector. use 'perf list' to list available events", | 800 | "event selector. use 'perf list' to list available events", |
@@ -651,7 +802,9 @@ static const struct option options[] = { | |||
651 | OPT_CALLBACK(0, "filter", NULL, "filter", | 802 | OPT_CALLBACK(0, "filter", NULL, "filter", |
652 | "event filter", parse_filter), | 803 | "event filter", parse_filter), |
653 | OPT_INTEGER('p', "pid", &target_pid, | 804 | OPT_INTEGER('p', "pid", &target_pid, |
654 | "record events on existing pid"), | 805 | "record events on existing process id"), |
806 | OPT_INTEGER('t', "tid", &target_tid, | ||
807 | "record events on existing thread id"), | ||
655 | OPT_INTEGER('r', "realtime", &realtime_prio, | 808 | OPT_INTEGER('r', "realtime", &realtime_prio, |
656 | "collect data with this RT SCHED_FIFO priority"), | 809 | "collect data with this RT SCHED_FIFO priority"), |
657 | OPT_BOOLEAN('R', "raw-samples", &raw_samples, | 810 | OPT_BOOLEAN('R', "raw-samples", &raw_samples, |
@@ -663,20 +816,17 @@ static const struct option options[] = { | |||
663 | OPT_INTEGER('C', "profile_cpu", &profile_cpu, | 816 | OPT_INTEGER('C', "profile_cpu", &profile_cpu, |
664 | "CPU to profile on"), | 817 | "CPU to profile on"), |
665 | OPT_BOOLEAN('f', "force", &force, | 818 | OPT_BOOLEAN('f', "force", &force, |
666 | "overwrite existing data file"), | 819 | "overwrite existing data file (deprecated)"), |
667 | OPT_LONG('c', "count", &default_interval, | 820 | OPT_U64('c', "count", &user_interval, "event period to sample"), |
668 | "event period to sample"), | ||
669 | OPT_STRING('o', "output", &output_name, "file", | 821 | OPT_STRING('o', "output", &output_name, "file", |
670 | "output file name"), | 822 | "output file name"), |
671 | OPT_BOOLEAN('i', "inherit", &inherit, | 823 | OPT_BOOLEAN('i', "no-inherit", &no_inherit, |
672 | "child tasks inherit counters"), | 824 | "child tasks do not inherit counters"), |
673 | OPT_INTEGER('F', "freq", &freq, | 825 | OPT_UINTEGER('F', "freq", &user_freq, "profile at this frequency"), |
674 | "profile at this frequency"), | 826 | OPT_UINTEGER('m', "mmap-pages", &mmap_pages, "number of mmap data pages"), |
675 | OPT_INTEGER('m', "mmap-pages", &mmap_pages, | ||
676 | "number of mmap data pages"), | ||
677 | OPT_BOOLEAN('g', "call-graph", &call_graph, | 827 | OPT_BOOLEAN('g', "call-graph", &call_graph, |
678 | "do call-graph (stack chain/backtrace) recording"), | 828 | "do call-graph (stack chain/backtrace) recording"), |
679 | OPT_BOOLEAN('v', "verbose", &verbose, | 829 | OPT_INCR('v', "verbose", &verbose, |
680 | "be more verbose (show counter open errors, etc)"), | 830 | "be more verbose (show counter open errors, etc)"), |
681 | OPT_BOOLEAN('s', "stat", &inherit_stat, | 831 | OPT_BOOLEAN('s', "stat", &inherit_stat, |
682 | "per thread counts"), | 832 | "per thread counts"), |
@@ -691,13 +841,24 @@ static const struct option options[] = { | |||
691 | 841 | ||
692 | int cmd_record(int argc, const char **argv, const char *prefix __used) | 842 | int cmd_record(int argc, const char **argv, const char *prefix __used) |
693 | { | 843 | { |
694 | int counter; | 844 | int i,j; |
695 | 845 | ||
696 | argc = parse_options(argc, argv, options, record_usage, | 846 | argc = parse_options(argc, argv, options, record_usage, |
697 | PARSE_OPT_STOP_AT_NON_OPTION); | 847 | PARSE_OPT_STOP_AT_NON_OPTION); |
698 | if (!argc && target_pid == -1 && !system_wide && profile_cpu == -1) | 848 | if (!argc && target_pid == -1 && target_tid == -1 && |
849 | !system_wide && profile_cpu == -1) | ||
699 | usage_with_options(record_usage, options); | 850 | usage_with_options(record_usage, options); |
700 | 851 | ||
852 | if (force && append_file) { | ||
853 | fprintf(stderr, "Can't overwrite and append at the same time." | ||
854 | " You need to choose between -f and -A"); | ||
855 | usage_with_options(record_usage, options); | ||
856 | } else if (append_file) { | ||
857 | write_mode = WRITE_APPEND; | ||
858 | } else { | ||
859 | write_mode = WRITE_FORCE; | ||
860 | } | ||
861 | |||
701 | symbol__init(); | 862 | symbol__init(); |
702 | 863 | ||
703 | if (!nr_counters) { | 864 | if (!nr_counters) { |
@@ -706,6 +867,42 @@ int cmd_record(int argc, const char **argv, const char *prefix __used) | |||
706 | attrs[0].config = PERF_COUNT_HW_CPU_CYCLES; | 867 | attrs[0].config = PERF_COUNT_HW_CPU_CYCLES; |
707 | } | 868 | } |
708 | 869 | ||
870 | if (target_pid != -1) { | ||
871 | target_tid = target_pid; | ||
872 | thread_num = find_all_tid(target_pid, &all_tids); | ||
873 | if (thread_num <= 0) { | ||
874 | fprintf(stderr, "Can't find all threads of pid %d\n", | ||
875 | target_pid); | ||
876 | usage_with_options(record_usage, options); | ||
877 | } | ||
878 | } else { | ||
879 | all_tids=malloc(sizeof(pid_t)); | ||
880 | if (!all_tids) | ||
881 | return -ENOMEM; | ||
882 | |||
883 | all_tids[0] = target_tid; | ||
884 | thread_num = 1; | ||
885 | } | ||
886 | |||
887 | for (i = 0; i < MAX_NR_CPUS; i++) { | ||
888 | for (j = 0; j < MAX_COUNTERS; j++) { | ||
889 | fd[i][j] = malloc(sizeof(int)*thread_num); | ||
890 | mmap_array[i][j] = zalloc( | ||
891 | sizeof(struct mmap_data)*thread_num); | ||
892 | if (!fd[i][j] || !mmap_array[i][j]) | ||
893 | return -ENOMEM; | ||
894 | } | ||
895 | } | ||
896 | event_array = malloc( | ||
897 | sizeof(struct pollfd)*MAX_NR_CPUS*MAX_COUNTERS*thread_num); | ||
898 | if (!event_array) | ||
899 | return -ENOMEM; | ||
900 | |||
901 | if (user_interval != ULLONG_MAX) | ||
902 | default_interval = user_interval; | ||
903 | if (user_freq != UINT_MAX) | ||
904 | freq = user_freq; | ||
905 | |||
709 | /* | 906 | /* |
710 | * User specified count overrides default frequency. | 907 | * User specified count overrides default frequency. |
711 | */ | 908 | */ |
@@ -718,12 +915,5 @@ int cmd_record(int argc, const char **argv, const char *prefix __used) | |||
718 | exit(EXIT_FAILURE); | 915 | exit(EXIT_FAILURE); |
719 | } | 916 | } |
720 | 917 | ||
721 | for (counter = 0; counter < nr_counters; counter++) { | ||
722 | if (attrs[counter].sample_period) | ||
723 | continue; | ||
724 | |||
725 | attrs[counter].sample_period = default_interval; | ||
726 | } | ||
727 | |||
728 | return __cmd_record(argc, argv); | 918 | return __cmd_record(argc, argv); |
729 | } | 919 | } |
diff --git a/tools/perf/builtin-report.c b/tools/perf/builtin-report.c index f815de25d0fc..1d3c1003b43a 100644 --- a/tools/perf/builtin-report.c +++ b/tools/perf/builtin-report.c | |||
@@ -14,7 +14,6 @@ | |||
14 | #include "util/cache.h" | 14 | #include "util/cache.h" |
15 | #include <linux/rbtree.h> | 15 | #include <linux/rbtree.h> |
16 | #include "util/symbol.h" | 16 | #include "util/symbol.h" |
17 | #include "util/string.h" | ||
18 | #include "util/callchain.h" | 17 | #include "util/callchain.h" |
19 | #include "util/strlist.h" | 18 | #include "util/strlist.h" |
20 | #include "util/values.h" | 19 | #include "util/values.h" |
@@ -33,28 +32,29 @@ | |||
33 | 32 | ||
34 | static char const *input_name = "perf.data"; | 33 | static char const *input_name = "perf.data"; |
35 | 34 | ||
36 | static int force; | 35 | static bool force; |
37 | static bool hide_unresolved; | 36 | static bool hide_unresolved; |
38 | static bool dont_use_callchains; | 37 | static bool dont_use_callchains; |
39 | 38 | ||
40 | static int show_threads; | 39 | static bool show_threads; |
41 | static struct perf_read_values show_threads_values; | 40 | static struct perf_read_values show_threads_values; |
42 | 41 | ||
43 | static char default_pretty_printing_style[] = "normal"; | 42 | static const char default_pretty_printing_style[] = "normal"; |
44 | static char *pretty_printing_style = default_pretty_printing_style; | 43 | static const char *pretty_printing_style = default_pretty_printing_style; |
45 | 44 | ||
46 | static char callchain_default_opt[] = "fractal,0.5"; | 45 | static char callchain_default_opt[] = "fractal,0.5"; |
47 | 46 | ||
48 | static struct event_stat_id *get_stats(struct perf_session *self, | 47 | static struct hists *perf_session__hists_findnew(struct perf_session *self, |
49 | u64 event_stream, u32 type, u64 config) | 48 | u64 event_stream, u32 type, |
49 | u64 config) | ||
50 | { | 50 | { |
51 | struct rb_node **p = &self->stats_by_id.rb_node; | 51 | struct rb_node **p = &self->hists_tree.rb_node; |
52 | struct rb_node *parent = NULL; | 52 | struct rb_node *parent = NULL; |
53 | struct event_stat_id *iter, *new; | 53 | struct hists *iter, *new; |
54 | 54 | ||
55 | while (*p != NULL) { | 55 | while (*p != NULL) { |
56 | parent = *p; | 56 | parent = *p; |
57 | iter = rb_entry(parent, struct event_stat_id, rb_node); | 57 | iter = rb_entry(parent, struct hists, rb_node); |
58 | if (iter->config == config) | 58 | if (iter->config == config) |
59 | return iter; | 59 | return iter; |
60 | 60 | ||
@@ -65,15 +65,15 @@ static struct event_stat_id *get_stats(struct perf_session *self, | |||
65 | p = &(*p)->rb_left; | 65 | p = &(*p)->rb_left; |
66 | } | 66 | } |
67 | 67 | ||
68 | new = malloc(sizeof(struct event_stat_id)); | 68 | new = malloc(sizeof(struct hists)); |
69 | if (new == NULL) | 69 | if (new == NULL) |
70 | return NULL; | 70 | return NULL; |
71 | memset(new, 0, sizeof(struct event_stat_id)); | 71 | memset(new, 0, sizeof(struct hists)); |
72 | new->event_stream = event_stream; | 72 | new->event_stream = event_stream; |
73 | new->config = config; | 73 | new->config = config; |
74 | new->type = type; | 74 | new->type = type; |
75 | rb_link_node(&new->rb_node, parent, p); | 75 | rb_link_node(&new->rb_node, parent, p); |
76 | rb_insert_color(&new->rb_node, &self->stats_by_id); | 76 | rb_insert_color(&new->rb_node, &self->hists_tree); |
77 | return new; | 77 | return new; |
78 | } | 78 | } |
79 | 79 | ||
@@ -81,70 +81,71 @@ static int perf_session__add_hist_entry(struct perf_session *self, | |||
81 | struct addr_location *al, | 81 | struct addr_location *al, |
82 | struct sample_data *data) | 82 | struct sample_data *data) |
83 | { | 83 | { |
84 | struct symbol **syms = NULL, *parent = NULL; | 84 | struct map_symbol *syms = NULL; |
85 | bool hit; | 85 | struct symbol *parent = NULL; |
86 | int err = -ENOMEM; | ||
86 | struct hist_entry *he; | 87 | struct hist_entry *he; |
87 | struct event_stat_id *stats; | 88 | struct hists *hists; |
88 | struct perf_event_attr *attr; | 89 | struct perf_event_attr *attr; |
89 | 90 | ||
90 | if ((sort__has_parent || symbol_conf.use_callchain) && data->callchain) | 91 | if ((sort__has_parent || symbol_conf.use_callchain) && data->callchain) { |
91 | syms = perf_session__resolve_callchain(self, al->thread, | 92 | syms = perf_session__resolve_callchain(self, al->thread, |
92 | data->callchain, &parent); | 93 | data->callchain, &parent); |
94 | if (syms == NULL) | ||
95 | return -ENOMEM; | ||
96 | } | ||
93 | 97 | ||
94 | attr = perf_header__find_attr(data->id, &self->header); | 98 | attr = perf_header__find_attr(data->id, &self->header); |
95 | if (attr) | 99 | if (attr) |
96 | stats = get_stats(self, data->id, attr->type, attr->config); | 100 | hists = perf_session__hists_findnew(self, data->id, attr->type, attr->config); |
97 | else | 101 | else |
98 | stats = get_stats(self, data->id, 0, 0); | 102 | hists = perf_session__hists_findnew(self, data->id, 0, 0); |
99 | if (stats == NULL) | 103 | if (hists == NULL) |
100 | return -ENOMEM; | 104 | goto out_free_syms; |
101 | he = __perf_session__add_hist_entry(&stats->hists, al, parent, | 105 | he = __hists__add_entry(hists, al, parent, data->period); |
102 | data->period, &hit); | ||
103 | if (he == NULL) | 106 | if (he == NULL) |
104 | return -ENOMEM; | 107 | goto out_free_syms; |
105 | 108 | err = 0; | |
106 | if (hit) | ||
107 | he->count += data->period; | ||
108 | |||
109 | if (symbol_conf.use_callchain) { | 109 | if (symbol_conf.use_callchain) { |
110 | if (!hit) | 110 | err = append_chain(he->callchain, data->callchain, syms); |
111 | callchain_init(&he->callchain); | 111 | if (err) |
112 | append_chain(&he->callchain, data->callchain, syms); | 112 | goto out_free_syms; |
113 | free(syms); | ||
114 | } | 113 | } |
115 | 114 | /* | |
116 | return 0; | 115 | * Only in the newt browser we are doing integrated annotation, |
117 | } | 116 | * so we don't allocated the extra space needed because the stdio |
118 | 117 | * code will not use it. | |
119 | static int validate_chain(struct ip_callchain *chain, event_t *event) | 118 | */ |
120 | { | 119 | if (use_browser) |
121 | unsigned int chain_size; | 120 | err = hist_entry__inc_addr_samples(he, al->addr); |
122 | 121 | out_free_syms: | |
123 | chain_size = event->header.size; | 122 | free(syms); |
124 | chain_size -= (unsigned long)&event->ip.__more_data - (unsigned long)event; | 123 | return err; |
125 | |||
126 | if (chain->nr*sizeof(u64) > chain_size) | ||
127 | return -1; | ||
128 | |||
129 | return 0; | ||
130 | } | 124 | } |
131 | 125 | ||
132 | static int add_event_total(struct perf_session *session, | 126 | static int add_event_total(struct perf_session *session, |
133 | struct sample_data *data, | 127 | struct sample_data *data, |
134 | struct perf_event_attr *attr) | 128 | struct perf_event_attr *attr) |
135 | { | 129 | { |
136 | struct event_stat_id *stats; | 130 | struct hists *hists; |
137 | 131 | ||
138 | if (attr) | 132 | if (attr) |
139 | stats = get_stats(session, data->id, attr->type, attr->config); | 133 | hists = perf_session__hists_findnew(session, data->id, |
134 | attr->type, attr->config); | ||
140 | else | 135 | else |
141 | stats = get_stats(session, data->id, 0, 0); | 136 | hists = perf_session__hists_findnew(session, data->id, 0, 0); |
142 | 137 | ||
143 | if (!stats) | 138 | if (!hists) |
144 | return -ENOMEM; | 139 | return -ENOMEM; |
145 | 140 | ||
146 | stats->stats.total += data->period; | 141 | hists->stats.total_period += data->period; |
147 | session->events_stats.total += data->period; | 142 | /* |
143 | * FIXME: add_event_total should be moved from here to | ||
144 | * perf_session__process_event so that the proper hist is passed to | ||
145 | * the event_op methods. | ||
146 | */ | ||
147 | hists__inc_nr_events(hists, PERF_RECORD_SAMPLE); | ||
148 | session->hists.stats.total_period += data->period; | ||
148 | return 0; | 149 | return 0; |
149 | } | 150 | } |
150 | 151 | ||
@@ -164,7 +165,7 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
164 | 165 | ||
165 | dump_printf("... chain: nr:%Lu\n", data.callchain->nr); | 166 | dump_printf("... chain: nr:%Lu\n", data.callchain->nr); |
166 | 167 | ||
167 | if (validate_chain(data.callchain, event) < 0) { | 168 | if (!ip_callchain__valid(data.callchain, event)) { |
168 | pr_debug("call-chain problem with event, " | 169 | pr_debug("call-chain problem with event, " |
169 | "skipping it.\n"); | 170 | "skipping it.\n"); |
170 | return 0; | 171 | return 0; |
@@ -187,14 +188,14 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
187 | return 0; | 188 | return 0; |
188 | 189 | ||
189 | if (perf_session__add_hist_entry(session, &al, &data)) { | 190 | if (perf_session__add_hist_entry(session, &al, &data)) { |
190 | pr_debug("problem incrementing symbol count, skipping event\n"); | 191 | pr_debug("problem incrementing symbol period, skipping event\n"); |
191 | return -1; | 192 | return -1; |
192 | } | 193 | } |
193 | 194 | ||
194 | attr = perf_header__find_attr(data.id, &session->header); | 195 | attr = perf_header__find_attr(data.id, &session->header); |
195 | 196 | ||
196 | if (add_event_total(session, &data, attr)) { | 197 | if (add_event_total(session, &data, attr)) { |
197 | pr_debug("problem adding event count\n"); | 198 | pr_debug("problem adding event period\n"); |
198 | return -1; | 199 | return -1; |
199 | } | 200 | } |
200 | 201 | ||
@@ -260,15 +261,43 @@ static struct perf_event_ops event_ops = { | |||
260 | .fork = event__process_task, | 261 | .fork = event__process_task, |
261 | .lost = event__process_lost, | 262 | .lost = event__process_lost, |
262 | .read = process_read_event, | 263 | .read = process_read_event, |
264 | .attr = event__process_attr, | ||
265 | .event_type = event__process_event_type, | ||
266 | .tracing_data = event__process_tracing_data, | ||
267 | .build_id = event__process_build_id, | ||
263 | }; | 268 | }; |
264 | 269 | ||
270 | extern volatile int session_done; | ||
271 | |||
272 | static void sig_handler(int sig __used) | ||
273 | { | ||
274 | session_done = 1; | ||
275 | } | ||
276 | |||
277 | static size_t hists__fprintf_nr_sample_events(struct hists *self, | ||
278 | const char *evname, FILE *fp) | ||
279 | { | ||
280 | size_t ret; | ||
281 | char unit; | ||
282 | unsigned long nr_events = self->stats.nr_events[PERF_RECORD_SAMPLE]; | ||
283 | |||
284 | nr_events = convert_unit(nr_events, &unit); | ||
285 | ret = fprintf(fp, "# Events: %lu%c", nr_events, unit); | ||
286 | if (evname != NULL) | ||
287 | ret += fprintf(fp, " %s", evname); | ||
288 | return ret + fprintf(fp, "\n#\n"); | ||
289 | } | ||
290 | |||
265 | static int __cmd_report(void) | 291 | static int __cmd_report(void) |
266 | { | 292 | { |
267 | int ret = -EINVAL; | 293 | int ret = -EINVAL; |
268 | struct perf_session *session; | 294 | struct perf_session *session; |
269 | struct rb_node *next; | 295 | struct rb_node *next; |
296 | const char *help = "For a higher level overview, try: perf report --sort comm,dso"; | ||
297 | |||
298 | signal(SIGINT, sig_handler); | ||
270 | 299 | ||
271 | session = perf_session__new(input_name, O_RDONLY, force); | 300 | session = perf_session__new(input_name, O_RDONLY, force, false); |
272 | if (session == NULL) | 301 | if (session == NULL) |
273 | return -ENOMEM; | 302 | return -ENOMEM; |
274 | 303 | ||
@@ -284,7 +313,7 @@ static int __cmd_report(void) | |||
284 | goto out_delete; | 313 | goto out_delete; |
285 | 314 | ||
286 | if (dump_trace) { | 315 | if (dump_trace) { |
287 | event__print_totals(); | 316 | perf_session__fprintf_nr_events(session, stdout); |
288 | goto out_delete; | 317 | goto out_delete; |
289 | } | 318 | } |
290 | 319 | ||
@@ -292,39 +321,42 @@ static int __cmd_report(void) | |||
292 | perf_session__fprintf(session, stdout); | 321 | perf_session__fprintf(session, stdout); |
293 | 322 | ||
294 | if (verbose > 2) | 323 | if (verbose > 2) |
295 | dsos__fprintf(stdout); | 324 | perf_session__fprintf_dsos(session, stdout); |
296 | 325 | ||
297 | next = rb_first(&session->stats_by_id); | 326 | next = rb_first(&session->hists_tree); |
298 | while (next) { | 327 | while (next) { |
299 | struct event_stat_id *stats; | 328 | struct hists *hists; |
300 | 329 | ||
301 | stats = rb_entry(next, struct event_stat_id, rb_node); | 330 | hists = rb_entry(next, struct hists, rb_node); |
302 | perf_session__collapse_resort(&stats->hists); | 331 | hists__collapse_resort(hists); |
303 | perf_session__output_resort(&stats->hists, stats->stats.total); | 332 | hists__output_resort(hists); |
304 | if (rb_first(&session->stats_by_id) == | 333 | if (use_browser) |
305 | rb_last(&session->stats_by_id)) | 334 | hists__browse(hists, help, input_name); |
306 | fprintf(stdout, "# Samples: %Ld\n#\n", | 335 | else { |
307 | stats->stats.total); | 336 | const char *evname = NULL; |
308 | else | 337 | if (rb_first(&session->hists.entries) != |
309 | fprintf(stdout, "# Samples: %Ld %s\n#\n", | 338 | rb_last(&session->hists.entries)) |
310 | stats->stats.total, | 339 | evname = __event_name(hists->type, hists->config); |
311 | __event_name(stats->type, stats->config)); | 340 | |
312 | 341 | hists__fprintf_nr_sample_events(hists, evname, stdout); | |
313 | perf_session__fprintf_hists(&stats->hists, NULL, false, stdout, | 342 | |
314 | stats->stats.total); | 343 | hists__fprintf(hists, NULL, false, stdout); |
315 | fprintf(stdout, "\n\n"); | 344 | fprintf(stdout, "\n\n"); |
316 | next = rb_next(&stats->rb_node); | 345 | } |
346 | |||
347 | next = rb_next(&hists->rb_node); | ||
317 | } | 348 | } |
318 | 349 | ||
319 | if (sort_order == default_sort_order && | 350 | if (!use_browser && sort_order == default_sort_order && |
320 | parent_pattern == default_parent_pattern) | 351 | parent_pattern == default_parent_pattern) { |
321 | fprintf(stdout, "#\n# (For a higher level overview, try: perf report --sort comm,dso)\n#\n"); | 352 | fprintf(stdout, "#\n# (%s)\n#\n", help); |
322 | 353 | ||
323 | if (show_threads) { | 354 | if (show_threads) { |
324 | bool raw_printing_style = !strcmp(pretty_printing_style, "raw"); | 355 | bool style = !strcmp(pretty_printing_style, "raw"); |
325 | perf_read_values_display(stdout, &show_threads_values, | 356 | perf_read_values_display(stdout, &show_threads_values, |
326 | raw_printing_style); | 357 | style); |
327 | perf_read_values_destroy(&show_threads_values); | 358 | perf_read_values_destroy(&show_threads_values); |
359 | } | ||
328 | } | 360 | } |
329 | out_delete: | 361 | out_delete: |
330 | perf_session__delete(session); | 362 | perf_session__delete(session); |
@@ -335,7 +367,7 @@ static int | |||
335 | parse_callchain_opt(const struct option *opt __used, const char *arg, | 367 | parse_callchain_opt(const struct option *opt __used, const char *arg, |
336 | int unset) | 368 | int unset) |
337 | { | 369 | { |
338 | char *tok; | 370 | char *tok, *tok2; |
339 | char *endptr; | 371 | char *endptr; |
340 | 372 | ||
341 | /* | 373 | /* |
@@ -380,10 +412,13 @@ parse_callchain_opt(const struct option *opt __used, const char *arg, | |||
380 | if (!tok) | 412 | if (!tok) |
381 | goto setup; | 413 | goto setup; |
382 | 414 | ||
415 | tok2 = strtok(NULL, ","); | ||
383 | callchain_param.min_percent = strtod(tok, &endptr); | 416 | callchain_param.min_percent = strtod(tok, &endptr); |
384 | if (tok == endptr) | 417 | if (tok == endptr) |
385 | return -1; | 418 | return -1; |
386 | 419 | ||
420 | if (tok2) | ||
421 | callchain_param.print_limit = strtod(tok2, &endptr); | ||
387 | setup: | 422 | setup: |
388 | if (register_callchain_param(&callchain_param) < 0) { | 423 | if (register_callchain_param(&callchain_param) < 0) { |
389 | fprintf(stderr, "Can't register callchain params\n"); | 424 | fprintf(stderr, "Can't register callchain params\n"); |
@@ -400,7 +435,7 @@ static const char * const report_usage[] = { | |||
400 | static const struct option options[] = { | 435 | static const struct option options[] = { |
401 | OPT_STRING('i', "input", &input_name, "file", | 436 | OPT_STRING('i', "input", &input_name, "file", |
402 | "input file name"), | 437 | "input file name"), |
403 | OPT_BOOLEAN('v', "verbose", &verbose, | 438 | OPT_INCR('v', "verbose", &verbose, |
404 | "be more verbose (show symbol address, etc)"), | 439 | "be more verbose (show symbol address, etc)"), |
405 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, | 440 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, |
406 | "dump raw trace in ASCII"), | 441 | "dump raw trace in ASCII"), |
@@ -419,12 +454,14 @@ static const struct option options[] = { | |||
419 | "sort by key(s): pid, comm, dso, symbol, parent"), | 454 | "sort by key(s): pid, comm, dso, symbol, parent"), |
420 | OPT_BOOLEAN('P', "full-paths", &symbol_conf.full_paths, | 455 | OPT_BOOLEAN('P', "full-paths", &symbol_conf.full_paths, |
421 | "Don't shorten the pathnames taking into account the cwd"), | 456 | "Don't shorten the pathnames taking into account the cwd"), |
457 | OPT_BOOLEAN(0, "showcpuutilization", &symbol_conf.show_cpu_utilization, | ||
458 | "Show sample percentage for different cpu modes"), | ||
422 | OPT_STRING('p', "parent", &parent_pattern, "regex", | 459 | OPT_STRING('p', "parent", &parent_pattern, "regex", |
423 | "regex filter to identify parent, see: '--sort parent'"), | 460 | "regex filter to identify parent, see: '--sort parent'"), |
424 | OPT_BOOLEAN('x', "exclude-other", &symbol_conf.exclude_other, | 461 | OPT_BOOLEAN('x', "exclude-other", &symbol_conf.exclude_other, |
425 | "Only display entries with parent-match"), | 462 | "Only display entries with parent-match"), |
426 | OPT_CALLBACK_DEFAULT('g', "call-graph", NULL, "output_type,min_percent", | 463 | OPT_CALLBACK_DEFAULT('g', "call-graph", NULL, "output_type,min_percent", |
427 | "Display callchains using output_type and min percent threshold. " | 464 | "Display callchains using output_type (graph, flat, fractal, or none) and min percent threshold. " |
428 | "Default: fractal,0.5", &parse_callchain_opt, callchain_default_opt), | 465 | "Default: fractal,0.5", &parse_callchain_opt, callchain_default_opt), |
429 | OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]", | 466 | OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]", |
430 | "only consider symbols in these dsos"), | 467 | "only consider symbols in these dsos"), |
@@ -447,7 +484,15 @@ int cmd_report(int argc, const char **argv, const char *prefix __used) | |||
447 | { | 484 | { |
448 | argc = parse_options(argc, argv, options, report_usage, 0); | 485 | argc = parse_options(argc, argv, options, report_usage, 0); |
449 | 486 | ||
450 | setup_pager(); | 487 | if (strcmp(input_name, "-") != 0) |
488 | setup_browser(); | ||
489 | /* | ||
490 | * Only in the newt browser we are doing integrated annotation, | ||
491 | * so don't allocate extra space that won't be used in the stdio | ||
492 | * implementation. | ||
493 | */ | ||
494 | if (use_browser) | ||
495 | symbol_conf.priv_size = sizeof(struct sym_priv); | ||
451 | 496 | ||
452 | if (symbol__init() < 0) | 497 | if (symbol__init() < 0) |
453 | return -1; | 498 | return -1; |
@@ -455,7 +500,8 @@ int cmd_report(int argc, const char **argv, const char *prefix __used) | |||
455 | setup_sorting(report_usage, options); | 500 | setup_sorting(report_usage, options); |
456 | 501 | ||
457 | if (parent_pattern != default_parent_pattern) { | 502 | if (parent_pattern != default_parent_pattern) { |
458 | sort_dimension__add("parent"); | 503 | if (sort_dimension__add("parent") < 0) |
504 | return -1; | ||
459 | sort_parent.elide = 1; | 505 | sort_parent.elide = 1; |
460 | } else | 506 | } else |
461 | symbol_conf.exclude_other = false; | 507 | symbol_conf.exclude_other = false; |
diff --git a/tools/perf/builtin-sched.c b/tools/perf/builtin-sched.c index 4f5a03e43444..f67bce2a83b4 100644 --- a/tools/perf/builtin-sched.c +++ b/tools/perf/builtin-sched.c | |||
@@ -22,7 +22,7 @@ | |||
22 | static char const *input_name = "perf.data"; | 22 | static char const *input_name = "perf.data"; |
23 | 23 | ||
24 | static char default_sort_order[] = "avg, max, switch, runtime"; | 24 | static char default_sort_order[] = "avg, max, switch, runtime"; |
25 | static char *sort_order = default_sort_order; | 25 | static const char *sort_order = default_sort_order; |
26 | 26 | ||
27 | static int profile_cpu = -1; | 27 | static int profile_cpu = -1; |
28 | 28 | ||
@@ -68,10 +68,10 @@ enum sched_event_type { | |||
68 | 68 | ||
69 | struct sched_atom { | 69 | struct sched_atom { |
70 | enum sched_event_type type; | 70 | enum sched_event_type type; |
71 | int specific_wait; | ||
71 | u64 timestamp; | 72 | u64 timestamp; |
72 | u64 duration; | 73 | u64 duration; |
73 | unsigned long nr; | 74 | unsigned long nr; |
74 | int specific_wait; | ||
75 | sem_t *wait_sem; | 75 | sem_t *wait_sem; |
76 | struct task_desc *wakee; | 76 | struct task_desc *wakee; |
77 | }; | 77 | }; |
@@ -105,7 +105,7 @@ static u64 sum_runtime; | |||
105 | static u64 sum_fluct; | 105 | static u64 sum_fluct; |
106 | static u64 run_avg; | 106 | static u64 run_avg; |
107 | 107 | ||
108 | static unsigned long replay_repeat = 10; | 108 | static unsigned int replay_repeat = 10; |
109 | static unsigned long nr_timestamps; | 109 | static unsigned long nr_timestamps; |
110 | static unsigned long nr_unordered_timestamps; | 110 | static unsigned long nr_unordered_timestamps; |
111 | static unsigned long nr_state_machine_bugs; | 111 | static unsigned long nr_state_machine_bugs; |
@@ -1641,30 +1641,26 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
1641 | return 0; | 1641 | return 0; |
1642 | } | 1642 | } |
1643 | 1643 | ||
1644 | static int process_lost_event(event_t *event __used, | ||
1645 | struct perf_session *session __used) | ||
1646 | { | ||
1647 | nr_lost_chunks++; | ||
1648 | nr_lost_events += event->lost.lost; | ||
1649 | |||
1650 | return 0; | ||
1651 | } | ||
1652 | |||
1653 | static struct perf_event_ops event_ops = { | 1644 | static struct perf_event_ops event_ops = { |
1654 | .sample = process_sample_event, | 1645 | .sample = process_sample_event, |
1655 | .comm = event__process_comm, | 1646 | .comm = event__process_comm, |
1656 | .lost = process_lost_event, | 1647 | .lost = event__process_lost, |
1648 | .ordered_samples = true, | ||
1657 | }; | 1649 | }; |
1658 | 1650 | ||
1659 | static int read_events(void) | 1651 | static int read_events(void) |
1660 | { | 1652 | { |
1661 | int err = -EINVAL; | 1653 | int err = -EINVAL; |
1662 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0); | 1654 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0, false); |
1663 | if (session == NULL) | 1655 | if (session == NULL) |
1664 | return -ENOMEM; | 1656 | return -ENOMEM; |
1665 | 1657 | ||
1666 | if (perf_session__has_traces(session, "record -R")) | 1658 | if (perf_session__has_traces(session, "record -R")) { |
1667 | err = perf_session__process_events(session, &event_ops); | 1659 | err = perf_session__process_events(session, &event_ops); |
1660 | nr_events = session->hists.stats.nr_events[0]; | ||
1661 | nr_lost_events = session->hists.stats.total_lost; | ||
1662 | nr_lost_chunks = session->hists.stats.nr_events[PERF_RECORD_LOST]; | ||
1663 | } | ||
1668 | 1664 | ||
1669 | perf_session__delete(session); | 1665 | perf_session__delete(session); |
1670 | return err; | 1666 | return err; |
@@ -1790,7 +1786,7 @@ static const char * const sched_usage[] = { | |||
1790 | static const struct option sched_options[] = { | 1786 | static const struct option sched_options[] = { |
1791 | OPT_STRING('i', "input", &input_name, "file", | 1787 | OPT_STRING('i', "input", &input_name, "file", |
1792 | "input file name"), | 1788 | "input file name"), |
1793 | OPT_BOOLEAN('v', "verbose", &verbose, | 1789 | OPT_INCR('v', "verbose", &verbose, |
1794 | "be more verbose (show symbol address, etc)"), | 1790 | "be more verbose (show symbol address, etc)"), |
1795 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, | 1791 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, |
1796 | "dump raw trace in ASCII"), | 1792 | "dump raw trace in ASCII"), |
@@ -1805,7 +1801,7 @@ static const char * const latency_usage[] = { | |||
1805 | static const struct option latency_options[] = { | 1801 | static const struct option latency_options[] = { |
1806 | OPT_STRING('s', "sort", &sort_order, "key[,key2...]", | 1802 | OPT_STRING('s', "sort", &sort_order, "key[,key2...]", |
1807 | "sort by key(s): runtime, switch, avg, max"), | 1803 | "sort by key(s): runtime, switch, avg, max"), |
1808 | OPT_BOOLEAN('v', "verbose", &verbose, | 1804 | OPT_INCR('v', "verbose", &verbose, |
1809 | "be more verbose (show symbol address, etc)"), | 1805 | "be more verbose (show symbol address, etc)"), |
1810 | OPT_INTEGER('C', "CPU", &profile_cpu, | 1806 | OPT_INTEGER('C', "CPU", &profile_cpu, |
1811 | "CPU to profile on"), | 1807 | "CPU to profile on"), |
@@ -1820,9 +1816,9 @@ static const char * const replay_usage[] = { | |||
1820 | }; | 1816 | }; |
1821 | 1817 | ||
1822 | static const struct option replay_options[] = { | 1818 | static const struct option replay_options[] = { |
1823 | OPT_INTEGER('r', "repeat", &replay_repeat, | 1819 | OPT_UINTEGER('r', "repeat", &replay_repeat, |
1824 | "repeat the workload replay N times (-1: infinite)"), | 1820 | "repeat the workload replay N times (-1: infinite)"), |
1825 | OPT_BOOLEAN('v', "verbose", &verbose, | 1821 | OPT_INCR('v', "verbose", &verbose, |
1826 | "be more verbose (show symbol address, etc)"), | 1822 | "be more verbose (show symbol address, etc)"), |
1827 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, | 1823 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, |
1828 | "dump raw trace in ASCII"), | 1824 | "dump raw trace in ASCII"), |
@@ -1850,7 +1846,6 @@ static const char *record_args[] = { | |||
1850 | "record", | 1846 | "record", |
1851 | "-a", | 1847 | "-a", |
1852 | "-R", | 1848 | "-R", |
1853 | "-M", | ||
1854 | "-f", | 1849 | "-f", |
1855 | "-m", "1024", | 1850 | "-m", "1024", |
1856 | "-c", "1", | 1851 | "-c", "1", |
diff --git a/tools/perf/builtin-stat.c b/tools/perf/builtin-stat.c index 95db31cff6fd..ff8c413b7e73 100644 --- a/tools/perf/builtin-stat.c +++ b/tools/perf/builtin-stat.c | |||
@@ -46,6 +46,7 @@ | |||
46 | #include "util/debug.h" | 46 | #include "util/debug.h" |
47 | #include "util/header.h" | 47 | #include "util/header.h" |
48 | #include "util/cpumap.h" | 48 | #include "util/cpumap.h" |
49 | #include "util/thread.h" | ||
49 | 50 | ||
50 | #include <sys/prctl.h> | 51 | #include <sys/prctl.h> |
51 | #include <math.h> | 52 | #include <math.h> |
@@ -66,18 +67,21 @@ static struct perf_event_attr default_attrs[] = { | |||
66 | 67 | ||
67 | }; | 68 | }; |
68 | 69 | ||
69 | static int system_wide = 0; | 70 | static bool system_wide = false; |
70 | static unsigned int nr_cpus = 0; | 71 | static unsigned int nr_cpus = 0; |
71 | static int run_idx = 0; | 72 | static int run_idx = 0; |
72 | 73 | ||
73 | static int run_count = 1; | 74 | static int run_count = 1; |
74 | static int inherit = 1; | 75 | static bool no_inherit = false; |
75 | static int scale = 1; | 76 | static bool scale = true; |
76 | static pid_t target_pid = -1; | 77 | static pid_t target_pid = -1; |
78 | static pid_t target_tid = -1; | ||
79 | static pid_t *all_tids = NULL; | ||
80 | static int thread_num = 0; | ||
77 | static pid_t child_pid = -1; | 81 | static pid_t child_pid = -1; |
78 | static int null_run = 0; | 82 | static bool null_run = false; |
79 | 83 | ||
80 | static int fd[MAX_NR_CPUS][MAX_COUNTERS]; | 84 | static int *fd[MAX_NR_CPUS][MAX_COUNTERS]; |
81 | 85 | ||
82 | static int event_scaled[MAX_COUNTERS]; | 86 | static int event_scaled[MAX_COUNTERS]; |
83 | 87 | ||
@@ -140,9 +144,11 @@ struct stats runtime_branches_stats; | |||
140 | #define ERR_PERF_OPEN \ | 144 | #define ERR_PERF_OPEN \ |
141 | "Error: counter %d, sys_perf_event_open() syscall returned with %d (%s)\n" | 145 | "Error: counter %d, sys_perf_event_open() syscall returned with %d (%s)\n" |
142 | 146 | ||
143 | static void create_perf_stat_counter(int counter, int pid) | 147 | static int create_perf_stat_counter(int counter) |
144 | { | 148 | { |
145 | struct perf_event_attr *attr = attrs + counter; | 149 | struct perf_event_attr *attr = attrs + counter; |
150 | int thread; | ||
151 | int ncreated = 0; | ||
146 | 152 | ||
147 | if (scale) | 153 | if (scale) |
148 | attr->read_format = PERF_FORMAT_TOTAL_TIME_ENABLED | | 154 | attr->read_format = PERF_FORMAT_TOTAL_TIME_ENABLED | |
@@ -152,21 +158,33 @@ static void create_perf_stat_counter(int counter, int pid) | |||
152 | unsigned int cpu; | 158 | unsigned int cpu; |
153 | 159 | ||
154 | for (cpu = 0; cpu < nr_cpus; cpu++) { | 160 | for (cpu = 0; cpu < nr_cpus; cpu++) { |
155 | fd[cpu][counter] = sys_perf_event_open(attr, -1, cpumap[cpu], -1, 0); | 161 | fd[cpu][counter][0] = sys_perf_event_open(attr, |
156 | if (fd[cpu][counter] < 0 && verbose) | 162 | -1, cpumap[cpu], -1, 0); |
157 | fprintf(stderr, ERR_PERF_OPEN, counter, | 163 | if (fd[cpu][counter][0] < 0) |
158 | fd[cpu][counter], strerror(errno)); | 164 | pr_debug(ERR_PERF_OPEN, counter, |
165 | fd[cpu][counter][0], strerror(errno)); | ||
166 | else | ||
167 | ++ncreated; | ||
159 | } | 168 | } |
160 | } else { | 169 | } else { |
161 | attr->inherit = inherit; | 170 | attr->inherit = !no_inherit; |
162 | attr->disabled = 1; | 171 | if (target_pid == -1 && target_tid == -1) { |
163 | attr->enable_on_exec = 1; | 172 | attr->disabled = 1; |
164 | 173 | attr->enable_on_exec = 1; | |
165 | fd[0][counter] = sys_perf_event_open(attr, pid, -1, -1, 0); | 174 | } |
166 | if (fd[0][counter] < 0 && verbose) | 175 | for (thread = 0; thread < thread_num; thread++) { |
167 | fprintf(stderr, ERR_PERF_OPEN, counter, | 176 | fd[0][counter][thread] = sys_perf_event_open(attr, |
168 | fd[0][counter], strerror(errno)); | 177 | all_tids[thread], -1, -1, 0); |
178 | if (fd[0][counter][thread] < 0) | ||
179 | pr_debug(ERR_PERF_OPEN, counter, | ||
180 | fd[0][counter][thread], | ||
181 | strerror(errno)); | ||
182 | else | ||
183 | ++ncreated; | ||
184 | } | ||
169 | } | 185 | } |
186 | |||
187 | return ncreated; | ||
170 | } | 188 | } |
171 | 189 | ||
172 | /* | 190 | /* |
@@ -190,25 +208,28 @@ static void read_counter(int counter) | |||
190 | unsigned int cpu; | 208 | unsigned int cpu; |
191 | size_t res, nv; | 209 | size_t res, nv; |
192 | int scaled; | 210 | int scaled; |
193 | int i; | 211 | int i, thread; |
194 | 212 | ||
195 | count[0] = count[1] = count[2] = 0; | 213 | count[0] = count[1] = count[2] = 0; |
196 | 214 | ||
197 | nv = scale ? 3 : 1; | 215 | nv = scale ? 3 : 1; |
198 | for (cpu = 0; cpu < nr_cpus; cpu++) { | 216 | for (cpu = 0; cpu < nr_cpus; cpu++) { |
199 | if (fd[cpu][counter] < 0) | 217 | for (thread = 0; thread < thread_num; thread++) { |
200 | continue; | 218 | if (fd[cpu][counter][thread] < 0) |
201 | 219 | continue; | |
202 | res = read(fd[cpu][counter], single_count, nv * sizeof(u64)); | 220 | |
203 | assert(res == nv * sizeof(u64)); | 221 | res = read(fd[cpu][counter][thread], |
204 | 222 | single_count, nv * sizeof(u64)); | |
205 | close(fd[cpu][counter]); | 223 | assert(res == nv * sizeof(u64)); |
206 | fd[cpu][counter] = -1; | 224 | |
207 | 225 | close(fd[cpu][counter][thread]); | |
208 | count[0] += single_count[0]; | 226 | fd[cpu][counter][thread] = -1; |
209 | if (scale) { | 227 | |
210 | count[1] += single_count[1]; | 228 | count[0] += single_count[0]; |
211 | count[2] += single_count[2]; | 229 | if (scale) { |
230 | count[1] += single_count[1]; | ||
231 | count[2] += single_count[2]; | ||
232 | } | ||
212 | } | 233 | } |
213 | } | 234 | } |
214 | 235 | ||
@@ -250,10 +271,9 @@ static int run_perf_stat(int argc __used, const char **argv) | |||
250 | { | 271 | { |
251 | unsigned long long t0, t1; | 272 | unsigned long long t0, t1; |
252 | int status = 0; | 273 | int status = 0; |
253 | int counter; | 274 | int counter, ncreated = 0; |
254 | int pid = target_pid; | ||
255 | int child_ready_pipe[2], go_pipe[2]; | 275 | int child_ready_pipe[2], go_pipe[2]; |
256 | const bool forks = (target_pid == -1 && argc > 0); | 276 | const bool forks = (argc > 0); |
257 | char buf; | 277 | char buf; |
258 | 278 | ||
259 | if (!system_wide) | 279 | if (!system_wide) |
@@ -265,10 +285,10 @@ static int run_perf_stat(int argc __used, const char **argv) | |||
265 | } | 285 | } |
266 | 286 | ||
267 | if (forks) { | 287 | if (forks) { |
268 | if ((pid = fork()) < 0) | 288 | if ((child_pid = fork()) < 0) |
269 | perror("failed to fork"); | 289 | perror("failed to fork"); |
270 | 290 | ||
271 | if (!pid) { | 291 | if (!child_pid) { |
272 | close(child_ready_pipe[0]); | 292 | close(child_ready_pipe[0]); |
273 | close(go_pipe[1]); | 293 | close(go_pipe[1]); |
274 | fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC); | 294 | fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC); |
@@ -297,7 +317,8 @@ static int run_perf_stat(int argc __used, const char **argv) | |||
297 | exit(-1); | 317 | exit(-1); |
298 | } | 318 | } |
299 | 319 | ||
300 | child_pid = pid; | 320 | if (target_tid == -1 && target_pid == -1 && !system_wide) |
321 | all_tids[0] = child_pid; | ||
301 | 322 | ||
302 | /* | 323 | /* |
303 | * Wait for the child to be ready to exec. | 324 | * Wait for the child to be ready to exec. |
@@ -310,7 +331,16 @@ static int run_perf_stat(int argc __used, const char **argv) | |||
310 | } | 331 | } |
311 | 332 | ||
312 | for (counter = 0; counter < nr_counters; counter++) | 333 | for (counter = 0; counter < nr_counters; counter++) |
313 | create_perf_stat_counter(counter, pid); | 334 | ncreated += create_perf_stat_counter(counter); |
335 | |||
336 | if (ncreated == 0) { | ||
337 | pr_err("No permission to collect %sstats.\n" | ||
338 | "Consider tweaking /proc/sys/kernel/perf_event_paranoid.\n", | ||
339 | system_wide ? "system-wide " : ""); | ||
340 | if (child_pid != -1) | ||
341 | kill(child_pid, SIGTERM); | ||
342 | return -1; | ||
343 | } | ||
314 | 344 | ||
315 | /* | 345 | /* |
316 | * Enable counters and exec the command: | 346 | * Enable counters and exec the command: |
@@ -321,7 +351,7 @@ static int run_perf_stat(int argc __used, const char **argv) | |||
321 | close(go_pipe[1]); | 351 | close(go_pipe[1]); |
322 | wait(&status); | 352 | wait(&status); |
323 | } else { | 353 | } else { |
324 | while(!done); | 354 | while(!done) sleep(1); |
325 | } | 355 | } |
326 | 356 | ||
327 | t1 = rdclock(); | 357 | t1 = rdclock(); |
@@ -429,12 +459,14 @@ static void print_stat(int argc, const char **argv) | |||
429 | 459 | ||
430 | fprintf(stderr, "\n"); | 460 | fprintf(stderr, "\n"); |
431 | fprintf(stderr, " Performance counter stats for "); | 461 | fprintf(stderr, " Performance counter stats for "); |
432 | if(target_pid == -1) { | 462 | if(target_pid == -1 && target_tid == -1) { |
433 | fprintf(stderr, "\'%s", argv[0]); | 463 | fprintf(stderr, "\'%s", argv[0]); |
434 | for (i = 1; i < argc; i++) | 464 | for (i = 1; i < argc; i++) |
435 | fprintf(stderr, " %s", argv[i]); | 465 | fprintf(stderr, " %s", argv[i]); |
436 | }else | 466 | } else if (target_pid != -1) |
437 | fprintf(stderr, "task pid \'%d", target_pid); | 467 | fprintf(stderr, "process id \'%d", target_pid); |
468 | else | ||
469 | fprintf(stderr, "thread id \'%d", target_tid); | ||
438 | 470 | ||
439 | fprintf(stderr, "\'"); | 471 | fprintf(stderr, "\'"); |
440 | if (run_count > 1) | 472 | if (run_count > 1) |
@@ -459,7 +491,7 @@ static volatile int signr = -1; | |||
459 | 491 | ||
460 | static void skip_signal(int signo) | 492 | static void skip_signal(int signo) |
461 | { | 493 | { |
462 | if(target_pid != -1) | 494 | if(child_pid == -1) |
463 | done = 1; | 495 | done = 1; |
464 | 496 | ||
465 | signr = signo; | 497 | signr = signo; |
@@ -486,15 +518,17 @@ static const struct option options[] = { | |||
486 | OPT_CALLBACK('e', "event", NULL, "event", | 518 | OPT_CALLBACK('e', "event", NULL, "event", |
487 | "event selector. use 'perf list' to list available events", | 519 | "event selector. use 'perf list' to list available events", |
488 | parse_events), | 520 | parse_events), |
489 | OPT_BOOLEAN('i', "inherit", &inherit, | 521 | OPT_BOOLEAN('i', "no-inherit", &no_inherit, |
490 | "child tasks inherit counters"), | 522 | "child tasks do not inherit counters"), |
491 | OPT_INTEGER('p', "pid", &target_pid, | 523 | OPT_INTEGER('p', "pid", &target_pid, |
492 | "stat events on existing pid"), | 524 | "stat events on existing process id"), |
525 | OPT_INTEGER('t', "tid", &target_tid, | ||
526 | "stat events on existing thread id"), | ||
493 | OPT_BOOLEAN('a', "all-cpus", &system_wide, | 527 | OPT_BOOLEAN('a', "all-cpus", &system_wide, |
494 | "system-wide collection from all CPUs"), | 528 | "system-wide collection from all CPUs"), |
495 | OPT_BOOLEAN('c', "scale", &scale, | 529 | OPT_BOOLEAN('c', "scale", &scale, |
496 | "scale/normalize counters"), | 530 | "scale/normalize counters"), |
497 | OPT_BOOLEAN('v', "verbose", &verbose, | 531 | OPT_INCR('v', "verbose", &verbose, |
498 | "be more verbose (show counter open errors, etc)"), | 532 | "be more verbose (show counter open errors, etc)"), |
499 | OPT_INTEGER('r', "repeat", &run_count, | 533 | OPT_INTEGER('r', "repeat", &run_count, |
500 | "repeat command and print average + stddev (max: 100)"), | 534 | "repeat command and print average + stddev (max: 100)"), |
@@ -506,10 +540,11 @@ static const struct option options[] = { | |||
506 | int cmd_stat(int argc, const char **argv, const char *prefix __used) | 540 | int cmd_stat(int argc, const char **argv, const char *prefix __used) |
507 | { | 541 | { |
508 | int status; | 542 | int status; |
543 | int i,j; | ||
509 | 544 | ||
510 | argc = parse_options(argc, argv, options, stat_usage, | 545 | argc = parse_options(argc, argv, options, stat_usage, |
511 | PARSE_OPT_STOP_AT_NON_OPTION); | 546 | PARSE_OPT_STOP_AT_NON_OPTION); |
512 | if (!argc && target_pid == -1) | 547 | if (!argc && target_pid == -1 && target_tid == -1) |
513 | usage_with_options(stat_usage, options); | 548 | usage_with_options(stat_usage, options); |
514 | if (run_count <= 0) | 549 | if (run_count <= 0) |
515 | usage_with_options(stat_usage, options); | 550 | usage_with_options(stat_usage, options); |
@@ -525,6 +560,31 @@ int cmd_stat(int argc, const char **argv, const char *prefix __used) | |||
525 | else | 560 | else |
526 | nr_cpus = 1; | 561 | nr_cpus = 1; |
527 | 562 | ||
563 | if (target_pid != -1) { | ||
564 | target_tid = target_pid; | ||
565 | thread_num = find_all_tid(target_pid, &all_tids); | ||
566 | if (thread_num <= 0) { | ||
567 | fprintf(stderr, "Can't find all threads of pid %d\n", | ||
568 | target_pid); | ||
569 | usage_with_options(stat_usage, options); | ||
570 | } | ||
571 | } else { | ||
572 | all_tids=malloc(sizeof(pid_t)); | ||
573 | if (!all_tids) | ||
574 | return -ENOMEM; | ||
575 | |||
576 | all_tids[0] = target_tid; | ||
577 | thread_num = 1; | ||
578 | } | ||
579 | |||
580 | for (i = 0; i < MAX_NR_CPUS; i++) { | ||
581 | for (j = 0; j < MAX_COUNTERS; j++) { | ||
582 | fd[i][j] = malloc(sizeof(int)*thread_num); | ||
583 | if (!fd[i][j]) | ||
584 | return -ENOMEM; | ||
585 | } | ||
586 | } | ||
587 | |||
528 | /* | 588 | /* |
529 | * We dont want to block the signals - that would cause | 589 | * We dont want to block the signals - that would cause |
530 | * child tasks to inherit that and Ctrl-C would not work. | 590 | * child tasks to inherit that and Ctrl-C would not work. |
@@ -543,7 +603,8 @@ int cmd_stat(int argc, const char **argv, const char *prefix __used) | |||
543 | status = run_perf_stat(argc, argv); | 603 | status = run_perf_stat(argc, argv); |
544 | } | 604 | } |
545 | 605 | ||
546 | print_stat(argc, argv); | 606 | if (status != -1) |
607 | print_stat(argc, argv); | ||
547 | 608 | ||
548 | return status; | 609 | return status; |
549 | } | 610 | } |
diff --git a/tools/perf/builtin-test.c b/tools/perf/builtin-test.c new file mode 100644 index 000000000000..035b9fa063a9 --- /dev/null +++ b/tools/perf/builtin-test.c | |||
@@ -0,0 +1,281 @@ | |||
1 | /* | ||
2 | * builtin-test.c | ||
3 | * | ||
4 | * Builtin regression testing command: ever growing number of sanity tests | ||
5 | */ | ||
6 | #include "builtin.h" | ||
7 | |||
8 | #include "util/cache.h" | ||
9 | #include "util/debug.h" | ||
10 | #include "util/parse-options.h" | ||
11 | #include "util/session.h" | ||
12 | #include "util/symbol.h" | ||
13 | #include "util/thread.h" | ||
14 | |||
15 | static long page_size; | ||
16 | |||
17 | static int vmlinux_matches_kallsyms_filter(struct map *map __used, struct symbol *sym) | ||
18 | { | ||
19 | bool *visited = symbol__priv(sym); | ||
20 | *visited = true; | ||
21 | return 0; | ||
22 | } | ||
23 | |||
24 | static int test__vmlinux_matches_kallsyms(void) | ||
25 | { | ||
26 | int err = -1; | ||
27 | struct rb_node *nd; | ||
28 | struct symbol *sym; | ||
29 | struct map *kallsyms_map, *vmlinux_map; | ||
30 | struct machine kallsyms, vmlinux; | ||
31 | enum map_type type = MAP__FUNCTION; | ||
32 | struct ref_reloc_sym ref_reloc_sym = { .name = "_stext", }; | ||
33 | |||
34 | /* | ||
35 | * Step 1: | ||
36 | * | ||
37 | * Init the machines that will hold kernel, modules obtained from | ||
38 | * both vmlinux + .ko files and from /proc/kallsyms split by modules. | ||
39 | */ | ||
40 | machine__init(&kallsyms, "", HOST_KERNEL_ID); | ||
41 | machine__init(&vmlinux, "", HOST_KERNEL_ID); | ||
42 | |||
43 | /* | ||
44 | * Step 2: | ||
45 | * | ||
46 | * Create the kernel maps for kallsyms and the DSO where we will then | ||
47 | * load /proc/kallsyms. Also create the modules maps from /proc/modules | ||
48 | * and find the .ko files that match them in /lib/modules/`uname -r`/. | ||
49 | */ | ||
50 | if (machine__create_kernel_maps(&kallsyms) < 0) { | ||
51 | pr_debug("machine__create_kernel_maps "); | ||
52 | return -1; | ||
53 | } | ||
54 | |||
55 | /* | ||
56 | * Step 3: | ||
57 | * | ||
58 | * Load and split /proc/kallsyms into multiple maps, one per module. | ||
59 | */ | ||
60 | if (machine__load_kallsyms(&kallsyms, "/proc/kallsyms", type, NULL) <= 0) { | ||
61 | pr_debug("dso__load_kallsyms "); | ||
62 | goto out; | ||
63 | } | ||
64 | |||
65 | /* | ||
66 | * Step 4: | ||
67 | * | ||
68 | * kallsyms will be internally on demand sorted by name so that we can | ||
69 | * find the reference relocation * symbol, i.e. the symbol we will use | ||
70 | * to see if the running kernel was relocated by checking if it has the | ||
71 | * same value in the vmlinux file we load. | ||
72 | */ | ||
73 | kallsyms_map = machine__kernel_map(&kallsyms, type); | ||
74 | |||
75 | sym = map__find_symbol_by_name(kallsyms_map, ref_reloc_sym.name, NULL); | ||
76 | if (sym == NULL) { | ||
77 | pr_debug("dso__find_symbol_by_name "); | ||
78 | goto out; | ||
79 | } | ||
80 | |||
81 | ref_reloc_sym.addr = sym->start; | ||
82 | |||
83 | /* | ||
84 | * Step 5: | ||
85 | * | ||
86 | * Now repeat step 2, this time for the vmlinux file we'll auto-locate. | ||
87 | */ | ||
88 | if (machine__create_kernel_maps(&vmlinux) < 0) { | ||
89 | pr_debug("machine__create_kernel_maps "); | ||
90 | goto out; | ||
91 | } | ||
92 | |||
93 | vmlinux_map = machine__kernel_map(&vmlinux, type); | ||
94 | map__kmap(vmlinux_map)->ref_reloc_sym = &ref_reloc_sym; | ||
95 | |||
96 | /* | ||
97 | * Step 6: | ||
98 | * | ||
99 | * Locate a vmlinux file in the vmlinux path that has a buildid that | ||
100 | * matches the one of the running kernel. | ||
101 | * | ||
102 | * While doing that look if we find the ref reloc symbol, if we find it | ||
103 | * we'll have its ref_reloc_symbol.unrelocated_addr and then | ||
104 | * maps__reloc_vmlinux will notice and set proper ->[un]map_ip routines | ||
105 | * to fixup the symbols. | ||
106 | */ | ||
107 | if (machine__load_vmlinux_path(&vmlinux, type, | ||
108 | vmlinux_matches_kallsyms_filter) <= 0) { | ||
109 | pr_debug("machine__load_vmlinux_path "); | ||
110 | goto out; | ||
111 | } | ||
112 | |||
113 | err = 0; | ||
114 | /* | ||
115 | * Step 7: | ||
116 | * | ||
117 | * Now look at the symbols in the vmlinux DSO and check if we find all of them | ||
118 | * in the kallsyms dso. For the ones that are in both, check its names and | ||
119 | * end addresses too. | ||
120 | */ | ||
121 | for (nd = rb_first(&vmlinux_map->dso->symbols[type]); nd; nd = rb_next(nd)) { | ||
122 | struct symbol *pair; | ||
123 | |||
124 | sym = rb_entry(nd, struct symbol, rb_node); | ||
125 | pair = machine__find_kernel_symbol(&kallsyms, type, sym->start, NULL, NULL); | ||
126 | |||
127 | if (pair && pair->start == sym->start) { | ||
128 | next_pair: | ||
129 | if (strcmp(sym->name, pair->name) == 0) { | ||
130 | /* | ||
131 | * kallsyms don't have the symbol end, so we | ||
132 | * set that by using the next symbol start - 1, | ||
133 | * in some cases we get this up to a page | ||
134 | * wrong, trace_kmalloc when I was developing | ||
135 | * this code was one such example, 2106 bytes | ||
136 | * off the real size. More than that and we | ||
137 | * _really_ have a problem. | ||
138 | */ | ||
139 | s64 skew = sym->end - pair->end; | ||
140 | if (llabs(skew) < page_size) | ||
141 | continue; | ||
142 | |||
143 | pr_debug("%#Lx: diff end addr for %s v: %#Lx k: %#Lx\n", | ||
144 | sym->start, sym->name, sym->end, pair->end); | ||
145 | } else { | ||
146 | struct rb_node *nnd = rb_prev(&pair->rb_node); | ||
147 | |||
148 | if (nnd) { | ||
149 | struct symbol *next = rb_entry(nnd, struct symbol, rb_node); | ||
150 | |||
151 | if (next->start == sym->start) { | ||
152 | pair = next; | ||
153 | goto next_pair; | ||
154 | } | ||
155 | } | ||
156 | pr_debug("%#Lx: diff name v: %s k: %s\n", | ||
157 | sym->start, sym->name, pair->name); | ||
158 | } | ||
159 | } else | ||
160 | pr_debug("%#Lx: %s not on kallsyms\n", sym->start, sym->name); | ||
161 | |||
162 | err = -1; | ||
163 | } | ||
164 | |||
165 | if (!verbose) | ||
166 | goto out; | ||
167 | |||
168 | pr_info("Maps only in vmlinux:\n"); | ||
169 | |||
170 | for (nd = rb_first(&vmlinux.kmaps.maps[type]); nd; nd = rb_next(nd)) { | ||
171 | struct map *pos = rb_entry(nd, struct map, rb_node), *pair; | ||
172 | /* | ||
173 | * If it is the kernel, kallsyms is always "[kernel.kallsyms]", while | ||
174 | * the kernel will have the path for the vmlinux file being used, | ||
175 | * so use the short name, less descriptive but the same ("[kernel]" in | ||
176 | * both cases. | ||
177 | */ | ||
178 | pair = map_groups__find_by_name(&kallsyms.kmaps, type, | ||
179 | (pos->dso->kernel ? | ||
180 | pos->dso->short_name : | ||
181 | pos->dso->name)); | ||
182 | if (pair) | ||
183 | pair->priv = 1; | ||
184 | else | ||
185 | map__fprintf(pos, stderr); | ||
186 | } | ||
187 | |||
188 | pr_info("Maps in vmlinux with a different name in kallsyms:\n"); | ||
189 | |||
190 | for (nd = rb_first(&vmlinux.kmaps.maps[type]); nd; nd = rb_next(nd)) { | ||
191 | struct map *pos = rb_entry(nd, struct map, rb_node), *pair; | ||
192 | |||
193 | pair = map_groups__find(&kallsyms.kmaps, type, pos->start); | ||
194 | if (pair == NULL || pair->priv) | ||
195 | continue; | ||
196 | |||
197 | if (pair->start == pos->start) { | ||
198 | pair->priv = 1; | ||
199 | pr_info(" %Lx-%Lx %Lx %s in kallsyms as", | ||
200 | pos->start, pos->end, pos->pgoff, pos->dso->name); | ||
201 | if (pos->pgoff != pair->pgoff || pos->end != pair->end) | ||
202 | pr_info(": \n*%Lx-%Lx %Lx", | ||
203 | pair->start, pair->end, pair->pgoff); | ||
204 | pr_info(" %s\n", pair->dso->name); | ||
205 | pair->priv = 1; | ||
206 | } | ||
207 | } | ||
208 | |||
209 | pr_info("Maps only in kallsyms:\n"); | ||
210 | |||
211 | for (nd = rb_first(&kallsyms.kmaps.maps[type]); | ||
212 | nd; nd = rb_next(nd)) { | ||
213 | struct map *pos = rb_entry(nd, struct map, rb_node); | ||
214 | |||
215 | if (!pos->priv) | ||
216 | map__fprintf(pos, stderr); | ||
217 | } | ||
218 | out: | ||
219 | return err; | ||
220 | } | ||
221 | |||
222 | static struct test { | ||
223 | const char *desc; | ||
224 | int (*func)(void); | ||
225 | } tests[] = { | ||
226 | { | ||
227 | .desc = "vmlinux symtab matches kallsyms", | ||
228 | .func = test__vmlinux_matches_kallsyms, | ||
229 | }, | ||
230 | { | ||
231 | .func = NULL, | ||
232 | }, | ||
233 | }; | ||
234 | |||
235 | static int __cmd_test(void) | ||
236 | { | ||
237 | int i = 0; | ||
238 | |||
239 | page_size = sysconf(_SC_PAGE_SIZE); | ||
240 | |||
241 | while (tests[i].func) { | ||
242 | int err; | ||
243 | pr_info("%2d: %s:", i + 1, tests[i].desc); | ||
244 | pr_debug("\n--- start ---\n"); | ||
245 | err = tests[i].func(); | ||
246 | pr_debug("---- end ----\n%s:", tests[i].desc); | ||
247 | pr_info(" %s\n", err ? "FAILED!\n" : "Ok"); | ||
248 | ++i; | ||
249 | } | ||
250 | |||
251 | return 0; | ||
252 | } | ||
253 | |||
254 | static const char * const test_usage[] = { | ||
255 | "perf test [<options>]", | ||
256 | NULL, | ||
257 | }; | ||
258 | |||
259 | static const struct option test_options[] = { | ||
260 | OPT_INTEGER('v', "verbose", &verbose, | ||
261 | "be more verbose (show symbol address, etc)"), | ||
262 | OPT_END() | ||
263 | }; | ||
264 | |||
265 | int cmd_test(int argc, const char **argv, const char *prefix __used) | ||
266 | { | ||
267 | argc = parse_options(argc, argv, test_options, test_usage, 0); | ||
268 | if (argc) | ||
269 | usage_with_options(test_usage, test_options); | ||
270 | |||
271 | symbol_conf.priv_size = sizeof(int); | ||
272 | symbol_conf.sort_by_name = true; | ||
273 | symbol_conf.try_vmlinux_path = true; | ||
274 | |||
275 | if (symbol__init() < 0) | ||
276 | return -1; | ||
277 | |||
278 | setup_pager(); | ||
279 | |||
280 | return __cmd_test(); | ||
281 | } | ||
diff --git a/tools/perf/builtin-timechart.c b/tools/perf/builtin-timechart.c index 0d4d8ff7914b..5a52ed9fc10b 100644 --- a/tools/perf/builtin-timechart.c +++ b/tools/perf/builtin-timechart.c | |||
@@ -21,7 +21,6 @@ | |||
21 | #include "util/cache.h" | 21 | #include "util/cache.h" |
22 | #include <linux/rbtree.h> | 22 | #include <linux/rbtree.h> |
23 | #include "util/symbol.h" | 23 | #include "util/symbol.h" |
24 | #include "util/string.h" | ||
25 | #include "util/callchain.h" | 24 | #include "util/callchain.h" |
26 | #include "util/strlist.h" | 25 | #include "util/strlist.h" |
27 | 26 | ||
@@ -43,7 +42,7 @@ static u64 turbo_frequency; | |||
43 | 42 | ||
44 | static u64 first_time, last_time; | 43 | static u64 first_time, last_time; |
45 | 44 | ||
46 | static int power_only; | 45 | static bool power_only; |
47 | 46 | ||
48 | 47 | ||
49 | struct per_pid; | 48 | struct per_pid; |
@@ -78,8 +77,6 @@ struct per_pid { | |||
78 | 77 | ||
79 | struct per_pidcomm *all; | 78 | struct per_pidcomm *all; |
80 | struct per_pidcomm *current; | 79 | struct per_pidcomm *current; |
81 | |||
82 | int painted; | ||
83 | }; | 80 | }; |
84 | 81 | ||
85 | 82 | ||
@@ -146,9 +143,6 @@ struct wake_event { | |||
146 | static struct power_event *power_events; | 143 | static struct power_event *power_events; |
147 | static struct wake_event *wake_events; | 144 | static struct wake_event *wake_events; |
148 | 145 | ||
149 | struct sample_wrapper *all_samples; | ||
150 | |||
151 | |||
152 | struct process_filter; | 146 | struct process_filter; |
153 | struct process_filter { | 147 | struct process_filter { |
154 | char *name; | 148 | char *name; |
@@ -569,88 +563,6 @@ static void end_sample_processing(void) | |||
569 | } | 563 | } |
570 | } | 564 | } |
571 | 565 | ||
572 | static u64 sample_time(event_t *event, const struct perf_session *session) | ||
573 | { | ||
574 | int cursor; | ||
575 | |||
576 | cursor = 0; | ||
577 | if (session->sample_type & PERF_SAMPLE_IP) | ||
578 | cursor++; | ||
579 | if (session->sample_type & PERF_SAMPLE_TID) | ||
580 | cursor++; | ||
581 | if (session->sample_type & PERF_SAMPLE_TIME) | ||
582 | return event->sample.array[cursor]; | ||
583 | return 0; | ||
584 | } | ||
585 | |||
586 | |||
587 | /* | ||
588 | * We first queue all events, sorted backwards by insertion. | ||
589 | * The order will get flipped later. | ||
590 | */ | ||
591 | static int queue_sample_event(event_t *event, struct perf_session *session) | ||
592 | { | ||
593 | struct sample_wrapper *copy, *prev; | ||
594 | int size; | ||
595 | |||
596 | size = event->sample.header.size + sizeof(struct sample_wrapper) + 8; | ||
597 | |||
598 | copy = malloc(size); | ||
599 | if (!copy) | ||
600 | return 1; | ||
601 | |||
602 | memset(copy, 0, size); | ||
603 | |||
604 | copy->next = NULL; | ||
605 | copy->timestamp = sample_time(event, session); | ||
606 | |||
607 | memcpy(©->data, event, event->sample.header.size); | ||
608 | |||
609 | /* insert in the right place in the list */ | ||
610 | |||
611 | if (!all_samples) { | ||
612 | /* first sample ever */ | ||
613 | all_samples = copy; | ||
614 | return 0; | ||
615 | } | ||
616 | |||
617 | if (all_samples->timestamp < copy->timestamp) { | ||
618 | /* insert at the head of the list */ | ||
619 | copy->next = all_samples; | ||
620 | all_samples = copy; | ||
621 | return 0; | ||
622 | } | ||
623 | |||
624 | prev = all_samples; | ||
625 | while (prev->next) { | ||
626 | if (prev->next->timestamp < copy->timestamp) { | ||
627 | copy->next = prev->next; | ||
628 | prev->next = copy; | ||
629 | return 0; | ||
630 | } | ||
631 | prev = prev->next; | ||
632 | } | ||
633 | /* insert at the end of the list */ | ||
634 | prev->next = copy; | ||
635 | |||
636 | return 0; | ||
637 | } | ||
638 | |||
639 | static void sort_queued_samples(void) | ||
640 | { | ||
641 | struct sample_wrapper *cursor, *next; | ||
642 | |||
643 | cursor = all_samples; | ||
644 | all_samples = NULL; | ||
645 | |||
646 | while (cursor) { | ||
647 | next = cursor->next; | ||
648 | cursor->next = all_samples; | ||
649 | all_samples = cursor; | ||
650 | cursor = next; | ||
651 | } | ||
652 | } | ||
653 | |||
654 | /* | 566 | /* |
655 | * Sort the pid datastructure | 567 | * Sort the pid datastructure |
656 | */ | 568 | */ |
@@ -1014,31 +926,17 @@ static void write_svg_file(const char *filename) | |||
1014 | svg_close(); | 926 | svg_close(); |
1015 | } | 927 | } |
1016 | 928 | ||
1017 | static void process_samples(struct perf_session *session) | ||
1018 | { | ||
1019 | struct sample_wrapper *cursor; | ||
1020 | event_t *event; | ||
1021 | |||
1022 | sort_queued_samples(); | ||
1023 | |||
1024 | cursor = all_samples; | ||
1025 | while (cursor) { | ||
1026 | event = (void *)&cursor->data; | ||
1027 | cursor = cursor->next; | ||
1028 | process_sample_event(event, session); | ||
1029 | } | ||
1030 | } | ||
1031 | |||
1032 | static struct perf_event_ops event_ops = { | 929 | static struct perf_event_ops event_ops = { |
1033 | .comm = process_comm_event, | 930 | .comm = process_comm_event, |
1034 | .fork = process_fork_event, | 931 | .fork = process_fork_event, |
1035 | .exit = process_exit_event, | 932 | .exit = process_exit_event, |
1036 | .sample = queue_sample_event, | 933 | .sample = process_sample_event, |
934 | .ordered_samples = true, | ||
1037 | }; | 935 | }; |
1038 | 936 | ||
1039 | static int __cmd_timechart(void) | 937 | static int __cmd_timechart(void) |
1040 | { | 938 | { |
1041 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0); | 939 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0, false); |
1042 | int ret = -EINVAL; | 940 | int ret = -EINVAL; |
1043 | 941 | ||
1044 | if (session == NULL) | 942 | if (session == NULL) |
@@ -1051,8 +949,6 @@ static int __cmd_timechart(void) | |||
1051 | if (ret) | 949 | if (ret) |
1052 | goto out_delete; | 950 | goto out_delete; |
1053 | 951 | ||
1054 | process_samples(session); | ||
1055 | |||
1056 | end_sample_processing(); | 952 | end_sample_processing(); |
1057 | 953 | ||
1058 | sort_pids(); | 954 | sort_pids(); |
@@ -1075,7 +971,6 @@ static const char *record_args[] = { | |||
1075 | "record", | 971 | "record", |
1076 | "-a", | 972 | "-a", |
1077 | "-R", | 973 | "-R", |
1078 | "-M", | ||
1079 | "-f", | 974 | "-f", |
1080 | "-c", "1", | 975 | "-c", "1", |
1081 | "-e", "power:power_start", | 976 | "-e", "power:power_start", |
diff --git a/tools/perf/builtin-top.c b/tools/perf/builtin-top.c index 1f529321607e..397290a0a76e 100644 --- a/tools/perf/builtin-top.c +++ b/tools/perf/builtin-top.c | |||
@@ -55,9 +55,9 @@ | |||
55 | #include <linux/unistd.h> | 55 | #include <linux/unistd.h> |
56 | #include <linux/types.h> | 56 | #include <linux/types.h> |
57 | 57 | ||
58 | static int fd[MAX_NR_CPUS][MAX_COUNTERS]; | 58 | static int *fd[MAX_NR_CPUS][MAX_COUNTERS]; |
59 | 59 | ||
60 | static int system_wide = 0; | 60 | static bool system_wide = false; |
61 | 61 | ||
62 | static int default_interval = 0; | 62 | static int default_interval = 0; |
63 | 63 | ||
@@ -65,18 +65,21 @@ static int count_filter = 5; | |||
65 | static int print_entries; | 65 | static int print_entries; |
66 | 66 | ||
67 | static int target_pid = -1; | 67 | static int target_pid = -1; |
68 | static int inherit = 0; | 68 | static int target_tid = -1; |
69 | static pid_t *all_tids = NULL; | ||
70 | static int thread_num = 0; | ||
71 | static bool inherit = false; | ||
69 | static int profile_cpu = -1; | 72 | static int profile_cpu = -1; |
70 | static int nr_cpus = 0; | 73 | static int nr_cpus = 0; |
71 | static unsigned int realtime_prio = 0; | 74 | static int realtime_prio = 0; |
72 | static int group = 0; | 75 | static bool group = false; |
73 | static unsigned int page_size; | 76 | static unsigned int page_size; |
74 | static unsigned int mmap_pages = 16; | 77 | static unsigned int mmap_pages = 16; |
75 | static int freq = 1000; /* 1 KHz */ | 78 | static int freq = 1000; /* 1 KHz */ |
76 | 79 | ||
77 | static int delay_secs = 2; | 80 | static int delay_secs = 2; |
78 | static int zero = 0; | 81 | static bool zero = false; |
79 | static int dump_symtab = 0; | 82 | static bool dump_symtab = false; |
80 | 83 | ||
81 | static bool hide_kernel_symbols = false; | 84 | static bool hide_kernel_symbols = false; |
82 | static bool hide_user_symbols = false; | 85 | static bool hide_user_symbols = false; |
@@ -93,7 +96,7 @@ struct source_line { | |||
93 | struct source_line *next; | 96 | struct source_line *next; |
94 | }; | 97 | }; |
95 | 98 | ||
96 | static char *sym_filter = NULL; | 99 | static const char *sym_filter = NULL; |
97 | struct sym_entry *sym_filter_entry = NULL; | 100 | struct sym_entry *sym_filter_entry = NULL; |
98 | struct sym_entry *sym_filter_entry_sched = NULL; | 101 | struct sym_entry *sym_filter_entry_sched = NULL; |
99 | static int sym_pcnt_filter = 5; | 102 | static int sym_pcnt_filter = 5; |
@@ -133,7 +136,7 @@ static inline struct symbol *sym_entry__symbol(struct sym_entry *self) | |||
133 | return ((void *)self) + symbol_conf.priv_size; | 136 | return ((void *)self) + symbol_conf.priv_size; |
134 | } | 137 | } |
135 | 138 | ||
136 | static void get_term_dimensions(struct winsize *ws) | 139 | void get_term_dimensions(struct winsize *ws) |
137 | { | 140 | { |
138 | char *s = getenv("LINES"); | 141 | char *s = getenv("LINES"); |
139 | 142 | ||
@@ -169,7 +172,7 @@ static void sig_winch_handler(int sig __used) | |||
169 | update_print_entries(&winsize); | 172 | update_print_entries(&winsize); |
170 | } | 173 | } |
171 | 174 | ||
172 | static void parse_source(struct sym_entry *syme) | 175 | static int parse_source(struct sym_entry *syme) |
173 | { | 176 | { |
174 | struct symbol *sym; | 177 | struct symbol *sym; |
175 | struct sym_entry_source *source; | 178 | struct sym_entry_source *source; |
@@ -180,12 +183,21 @@ static void parse_source(struct sym_entry *syme) | |||
180 | u64 len; | 183 | u64 len; |
181 | 184 | ||
182 | if (!syme) | 185 | if (!syme) |
183 | return; | 186 | return -1; |
187 | |||
188 | sym = sym_entry__symbol(syme); | ||
189 | map = syme->map; | ||
190 | |||
191 | /* | ||
192 | * We can't annotate with just /proc/kallsyms | ||
193 | */ | ||
194 | if (map->dso->origin == DSO__ORIG_KERNEL) | ||
195 | return -1; | ||
184 | 196 | ||
185 | if (syme->src == NULL) { | 197 | if (syme->src == NULL) { |
186 | syme->src = zalloc(sizeof(*source)); | 198 | syme->src = zalloc(sizeof(*source)); |
187 | if (syme->src == NULL) | 199 | if (syme->src == NULL) |
188 | return; | 200 | return -1; |
189 | pthread_mutex_init(&syme->src->lock, NULL); | 201 | pthread_mutex_init(&syme->src->lock, NULL); |
190 | } | 202 | } |
191 | 203 | ||
@@ -195,9 +207,6 @@ static void parse_source(struct sym_entry *syme) | |||
195 | pthread_mutex_lock(&source->lock); | 207 | pthread_mutex_lock(&source->lock); |
196 | goto out_assign; | 208 | goto out_assign; |
197 | } | 209 | } |
198 | |||
199 | sym = sym_entry__symbol(syme); | ||
200 | map = syme->map; | ||
201 | path = map->dso->long_name; | 210 | path = map->dso->long_name; |
202 | 211 | ||
203 | len = sym->end - sym->start; | 212 | len = sym->end - sym->start; |
@@ -209,7 +218,7 @@ static void parse_source(struct sym_entry *syme) | |||
209 | 218 | ||
210 | file = popen(command, "r"); | 219 | file = popen(command, "r"); |
211 | if (!file) | 220 | if (!file) |
212 | return; | 221 | return -1; |
213 | 222 | ||
214 | pthread_mutex_lock(&source->lock); | 223 | pthread_mutex_lock(&source->lock); |
215 | source->lines_tail = &source->lines; | 224 | source->lines_tail = &source->lines; |
@@ -245,6 +254,7 @@ static void parse_source(struct sym_entry *syme) | |||
245 | out_assign: | 254 | out_assign: |
246 | sym_filter_entry = syme; | 255 | sym_filter_entry = syme; |
247 | pthread_mutex_unlock(&source->lock); | 256 | pthread_mutex_unlock(&source->lock); |
257 | return 0; | ||
248 | } | 258 | } |
249 | 259 | ||
250 | static void __zero_source_counters(struct sym_entry *syme) | 260 | static void __zero_source_counters(struct sym_entry *syme) |
@@ -410,7 +420,9 @@ static double sym_weight(const struct sym_entry *sym) | |||
410 | } | 420 | } |
411 | 421 | ||
412 | static long samples; | 422 | static long samples; |
413 | static long userspace_samples; | 423 | static long kernel_samples, us_samples; |
424 | static long exact_samples; | ||
425 | static long guest_us_samples, guest_kernel_samples; | ||
414 | static const char CONSOLE_CLEAR[] = "[H[2J"; | 426 | static const char CONSOLE_CLEAR[] = "[H[2J"; |
415 | 427 | ||
416 | static void __list_insert_active_sym(struct sym_entry *syme) | 428 | static void __list_insert_active_sym(struct sym_entry *syme) |
@@ -450,7 +462,11 @@ static void print_sym_table(void) | |||
450 | int printed = 0, j; | 462 | int printed = 0, j; |
451 | int counter, snap = !display_weighted ? sym_counter : 0; | 463 | int counter, snap = !display_weighted ? sym_counter : 0; |
452 | float samples_per_sec = samples/delay_secs; | 464 | float samples_per_sec = samples/delay_secs; |
453 | float ksamples_per_sec = (samples-userspace_samples)/delay_secs; | 465 | float ksamples_per_sec = kernel_samples/delay_secs; |
466 | float us_samples_per_sec = (us_samples)/delay_secs; | ||
467 | float guest_kernel_samples_per_sec = (guest_kernel_samples)/delay_secs; | ||
468 | float guest_us_samples_per_sec = (guest_us_samples)/delay_secs; | ||
469 | float esamples_percent = (100.0*exact_samples)/samples; | ||
454 | float sum_ksamples = 0.0; | 470 | float sum_ksamples = 0.0; |
455 | struct sym_entry *syme, *n; | 471 | struct sym_entry *syme, *n; |
456 | struct rb_root tmp = RB_ROOT; | 472 | struct rb_root tmp = RB_ROOT; |
@@ -458,7 +474,8 @@ static void print_sym_table(void) | |||
458 | int sym_width = 0, dso_width = 0, dso_short_width = 0; | 474 | int sym_width = 0, dso_width = 0, dso_short_width = 0; |
459 | const int win_width = winsize.ws_col - 1; | 475 | const int win_width = winsize.ws_col - 1; |
460 | 476 | ||
461 | samples = userspace_samples = 0; | 477 | samples = us_samples = kernel_samples = exact_samples = 0; |
478 | guest_kernel_samples = guest_us_samples = 0; | ||
462 | 479 | ||
463 | /* Sort the active symbols */ | 480 | /* Sort the active symbols */ |
464 | pthread_mutex_lock(&active_symbols_lock); | 481 | pthread_mutex_lock(&active_symbols_lock); |
@@ -489,9 +506,30 @@ static void print_sym_table(void) | |||
489 | puts(CONSOLE_CLEAR); | 506 | puts(CONSOLE_CLEAR); |
490 | 507 | ||
491 | printf("%-*.*s\n", win_width, win_width, graph_dotted_line); | 508 | printf("%-*.*s\n", win_width, win_width, graph_dotted_line); |
492 | printf( " PerfTop:%8.0f irqs/sec kernel:%4.1f%% [", | 509 | if (!perf_guest) { |
493 | samples_per_sec, | 510 | printf(" PerfTop:%8.0f irqs/sec kernel:%4.1f%%" |
494 | 100.0 - (100.0*((samples_per_sec-ksamples_per_sec)/samples_per_sec))); | 511 | " exact: %4.1f%% [", |
512 | samples_per_sec, | ||
513 | 100.0 - (100.0 * ((samples_per_sec - ksamples_per_sec) / | ||
514 | samples_per_sec)), | ||
515 | esamples_percent); | ||
516 | } else { | ||
517 | printf(" PerfTop:%8.0f irqs/sec kernel:%4.1f%% us:%4.1f%%" | ||
518 | " guest kernel:%4.1f%% guest us:%4.1f%%" | ||
519 | " exact: %4.1f%% [", | ||
520 | samples_per_sec, | ||
521 | 100.0 - (100.0 * ((samples_per_sec-ksamples_per_sec) / | ||
522 | samples_per_sec)), | ||
523 | 100.0 - (100.0 * ((samples_per_sec-us_samples_per_sec) / | ||
524 | samples_per_sec)), | ||
525 | 100.0 - (100.0 * ((samples_per_sec - | ||
526 | guest_kernel_samples_per_sec) / | ||
527 | samples_per_sec)), | ||
528 | 100.0 - (100.0 * ((samples_per_sec - | ||
529 | guest_us_samples_per_sec) / | ||
530 | samples_per_sec)), | ||
531 | esamples_percent); | ||
532 | } | ||
495 | 533 | ||
496 | if (nr_counters == 1 || !display_weighted) { | 534 | if (nr_counters == 1 || !display_weighted) { |
497 | printf("%Ld", (u64)attrs[0].sample_period); | 535 | printf("%Ld", (u64)attrs[0].sample_period); |
@@ -514,13 +552,15 @@ static void print_sym_table(void) | |||
514 | 552 | ||
515 | if (target_pid != -1) | 553 | if (target_pid != -1) |
516 | printf(" (target_pid: %d", target_pid); | 554 | printf(" (target_pid: %d", target_pid); |
555 | else if (target_tid != -1) | ||
556 | printf(" (target_tid: %d", target_tid); | ||
517 | else | 557 | else |
518 | printf(" (all"); | 558 | printf(" (all"); |
519 | 559 | ||
520 | if (profile_cpu != -1) | 560 | if (profile_cpu != -1) |
521 | printf(", cpu: %d)\n", profile_cpu); | 561 | printf(", cpu: %d)\n", profile_cpu); |
522 | else { | 562 | else { |
523 | if (target_pid != -1) | 563 | if (target_tid != -1) |
524 | printf(")\n"); | 564 | printf(")\n"); |
525 | else | 565 | else |
526 | printf(", %d CPUs)\n", nr_cpus); | 566 | printf(", %d CPUs)\n", nr_cpus); |
@@ -582,7 +622,6 @@ static void print_sym_table(void) | |||
582 | 622 | ||
583 | syme = rb_entry(nd, struct sym_entry, rb_node); | 623 | syme = rb_entry(nd, struct sym_entry, rb_node); |
584 | sym = sym_entry__symbol(syme); | 624 | sym = sym_entry__symbol(syme); |
585 | |||
586 | if (++printed > print_entries || (int)syme->snap_count < count_filter) | 625 | if (++printed > print_entries || (int)syme->snap_count < count_filter) |
587 | continue; | 626 | continue; |
588 | 627 | ||
@@ -746,7 +785,7 @@ static int key_mapped(int c) | |||
746 | return 0; | 785 | return 0; |
747 | } | 786 | } |
748 | 787 | ||
749 | static void handle_keypress(int c) | 788 | static void handle_keypress(struct perf_session *session, int c) |
750 | { | 789 | { |
751 | if (!key_mapped(c)) { | 790 | if (!key_mapped(c)) { |
752 | struct pollfd stdin_poll = { .fd = 0, .events = POLLIN }; | 791 | struct pollfd stdin_poll = { .fd = 0, .events = POLLIN }; |
@@ -815,7 +854,7 @@ static void handle_keypress(int c) | |||
815 | case 'Q': | 854 | case 'Q': |
816 | printf("exiting.\n"); | 855 | printf("exiting.\n"); |
817 | if (dump_symtab) | 856 | if (dump_symtab) |
818 | dsos__fprintf(stderr); | 857 | perf_session__fprintf_dsos(session, stderr); |
819 | exit(0); | 858 | exit(0); |
820 | case 's': | 859 | case 's': |
821 | prompt_symbol(&sym_filter_entry, "Enter details symbol"); | 860 | prompt_symbol(&sym_filter_entry, "Enter details symbol"); |
@@ -839,7 +878,7 @@ static void handle_keypress(int c) | |||
839 | display_weighted = ~display_weighted; | 878 | display_weighted = ~display_weighted; |
840 | break; | 879 | break; |
841 | case 'z': | 880 | case 'z': |
842 | zero = ~zero; | 881 | zero = !zero; |
843 | break; | 882 | break; |
844 | default: | 883 | default: |
845 | break; | 884 | break; |
@@ -851,6 +890,7 @@ static void *display_thread(void *arg __used) | |||
851 | struct pollfd stdin_poll = { .fd = 0, .events = POLLIN }; | 890 | struct pollfd stdin_poll = { .fd = 0, .events = POLLIN }; |
852 | struct termios tc, save; | 891 | struct termios tc, save; |
853 | int delay_msecs, c; | 892 | int delay_msecs, c; |
893 | struct perf_session *session = (struct perf_session *) arg; | ||
854 | 894 | ||
855 | tcgetattr(0, &save); | 895 | tcgetattr(0, &save); |
856 | tc = save; | 896 | tc = save; |
@@ -871,7 +911,7 @@ repeat: | |||
871 | c = getc(stdin); | 911 | c = getc(stdin); |
872 | tcsetattr(0, TCSAFLUSH, &save); | 912 | tcsetattr(0, TCSAFLUSH, &save); |
873 | 913 | ||
874 | handle_keypress(c); | 914 | handle_keypress(session, c); |
875 | goto repeat; | 915 | goto repeat; |
876 | 916 | ||
877 | return NULL; | 917 | return NULL; |
@@ -942,24 +982,48 @@ static void event__process_sample(const event_t *self, | |||
942 | u64 ip = self->ip.ip; | 982 | u64 ip = self->ip.ip; |
943 | struct sym_entry *syme; | 983 | struct sym_entry *syme; |
944 | struct addr_location al; | 984 | struct addr_location al; |
985 | struct machine *machine; | ||
945 | u8 origin = self->header.misc & PERF_RECORD_MISC_CPUMODE_MASK; | 986 | u8 origin = self->header.misc & PERF_RECORD_MISC_CPUMODE_MASK; |
946 | 987 | ||
947 | ++samples; | 988 | ++samples; |
948 | 989 | ||
949 | switch (origin) { | 990 | switch (origin) { |
950 | case PERF_RECORD_MISC_USER: | 991 | case PERF_RECORD_MISC_USER: |
951 | ++userspace_samples; | 992 | ++us_samples; |
952 | if (hide_user_symbols) | 993 | if (hide_user_symbols) |
953 | return; | 994 | return; |
995 | machine = perf_session__find_host_machine(session); | ||
954 | break; | 996 | break; |
955 | case PERF_RECORD_MISC_KERNEL: | 997 | case PERF_RECORD_MISC_KERNEL: |
998 | ++kernel_samples; | ||
956 | if (hide_kernel_symbols) | 999 | if (hide_kernel_symbols) |
957 | return; | 1000 | return; |
1001 | machine = perf_session__find_host_machine(session); | ||
1002 | break; | ||
1003 | case PERF_RECORD_MISC_GUEST_KERNEL: | ||
1004 | ++guest_kernel_samples; | ||
1005 | machine = perf_session__find_machine(session, self->ip.pid); | ||
958 | break; | 1006 | break; |
1007 | case PERF_RECORD_MISC_GUEST_USER: | ||
1008 | ++guest_us_samples; | ||
1009 | /* | ||
1010 | * TODO: we don't process guest user from host side | ||
1011 | * except simple counting. | ||
1012 | */ | ||
1013 | return; | ||
959 | default: | 1014 | default: |
960 | return; | 1015 | return; |
961 | } | 1016 | } |
962 | 1017 | ||
1018 | if (!machine && perf_guest) { | ||
1019 | pr_err("Can't find guest [%d]'s kernel information\n", | ||
1020 | self->ip.pid); | ||
1021 | return; | ||
1022 | } | ||
1023 | |||
1024 | if (self->header.misc & PERF_RECORD_MISC_EXACT_IP) | ||
1025 | exact_samples++; | ||
1026 | |||
963 | if (event__preprocess_sample(self, session, &al, symbol_filter) < 0 || | 1027 | if (event__preprocess_sample(self, session, &al, symbol_filter) < 0 || |
964 | al.filtered) | 1028 | al.filtered) |
965 | return; | 1029 | return; |
@@ -976,7 +1040,7 @@ static void event__process_sample(const event_t *self, | |||
976 | * --hide-kernel-symbols, even if the user specifies an | 1040 | * --hide-kernel-symbols, even if the user specifies an |
977 | * invalid --vmlinux ;-) | 1041 | * invalid --vmlinux ;-) |
978 | */ | 1042 | */ |
979 | if (al.map == session->vmlinux_maps[MAP__FUNCTION] && | 1043 | if (al.map == machine->vmlinux_maps[MAP__FUNCTION] && |
980 | RB_EMPTY_ROOT(&al.map->dso->symbols[MAP__FUNCTION])) { | 1044 | RB_EMPTY_ROOT(&al.map->dso->symbols[MAP__FUNCTION])) { |
981 | pr_err("The %s file can't be used\n", | 1045 | pr_err("The %s file can't be used\n", |
982 | symbol_conf.vmlinux_name); | 1046 | symbol_conf.vmlinux_name); |
@@ -990,7 +1054,17 @@ static void event__process_sample(const event_t *self, | |||
990 | if (sym_filter_entry_sched) { | 1054 | if (sym_filter_entry_sched) { |
991 | sym_filter_entry = sym_filter_entry_sched; | 1055 | sym_filter_entry = sym_filter_entry_sched; |
992 | sym_filter_entry_sched = NULL; | 1056 | sym_filter_entry_sched = NULL; |
993 | parse_source(sym_filter_entry); | 1057 | if (parse_source(sym_filter_entry) < 0) { |
1058 | struct symbol *sym = sym_entry__symbol(sym_filter_entry); | ||
1059 | |||
1060 | pr_err("Can't annotate %s", sym->name); | ||
1061 | if (sym_filter_entry->map->dso->origin == DSO__ORIG_KERNEL) { | ||
1062 | pr_err(": No vmlinux file was found in the path:\n"); | ||
1063 | vmlinux_path__fprintf(stderr); | ||
1064 | } else | ||
1065 | pr_err(".\n"); | ||
1066 | exit(1); | ||
1067 | } | ||
994 | } | 1068 | } |
995 | 1069 | ||
996 | syme = symbol__priv(al.sym); | 1070 | syme = symbol__priv(al.sym); |
@@ -1106,16 +1180,21 @@ static void perf_session__mmap_read_counter(struct perf_session *self, | |||
1106 | md->prev = old; | 1180 | md->prev = old; |
1107 | } | 1181 | } |
1108 | 1182 | ||
1109 | static struct pollfd event_array[MAX_NR_CPUS * MAX_COUNTERS]; | 1183 | static struct pollfd *event_array; |
1110 | static struct mmap_data mmap_array[MAX_NR_CPUS][MAX_COUNTERS]; | 1184 | static struct mmap_data *mmap_array[MAX_NR_CPUS][MAX_COUNTERS]; |
1111 | 1185 | ||
1112 | static void perf_session__mmap_read(struct perf_session *self) | 1186 | static void perf_session__mmap_read(struct perf_session *self) |
1113 | { | 1187 | { |
1114 | int i, counter; | 1188 | int i, counter, thread_index; |
1115 | 1189 | ||
1116 | for (i = 0; i < nr_cpus; i++) { | 1190 | for (i = 0; i < nr_cpus; i++) { |
1117 | for (counter = 0; counter < nr_counters; counter++) | 1191 | for (counter = 0; counter < nr_counters; counter++) |
1118 | perf_session__mmap_read_counter(self, &mmap_array[i][counter]); | 1192 | for (thread_index = 0; |
1193 | thread_index < thread_num; | ||
1194 | thread_index++) { | ||
1195 | perf_session__mmap_read_counter(self, | ||
1196 | &mmap_array[i][counter][thread_index]); | ||
1197 | } | ||
1119 | } | 1198 | } |
1120 | } | 1199 | } |
1121 | 1200 | ||
@@ -1126,9 +1205,10 @@ static void start_counter(int i, int counter) | |||
1126 | { | 1205 | { |
1127 | struct perf_event_attr *attr; | 1206 | struct perf_event_attr *attr; |
1128 | int cpu; | 1207 | int cpu; |
1208 | int thread_index; | ||
1129 | 1209 | ||
1130 | cpu = profile_cpu; | 1210 | cpu = profile_cpu; |
1131 | if (target_pid == -1 && profile_cpu == -1) | 1211 | if (target_tid == -1 && profile_cpu == -1) |
1132 | cpu = cpumap[i]; | 1212 | cpu = cpumap[i]; |
1133 | 1213 | ||
1134 | attr = attrs + counter; | 1214 | attr = attrs + counter; |
@@ -1144,55 +1224,58 @@ static void start_counter(int i, int counter) | |||
1144 | attr->inherit = (cpu < 0) && inherit; | 1224 | attr->inherit = (cpu < 0) && inherit; |
1145 | attr->mmap = 1; | 1225 | attr->mmap = 1; |
1146 | 1226 | ||
1227 | for (thread_index = 0; thread_index < thread_num; thread_index++) { | ||
1147 | try_again: | 1228 | try_again: |
1148 | fd[i][counter] = sys_perf_event_open(attr, target_pid, cpu, group_fd, 0); | 1229 | fd[i][counter][thread_index] = sys_perf_event_open(attr, |
1149 | 1230 | all_tids[thread_index], cpu, group_fd, 0); | |
1150 | if (fd[i][counter] < 0) { | 1231 | |
1151 | int err = errno; | 1232 | if (fd[i][counter][thread_index] < 0) { |
1233 | int err = errno; | ||
1234 | |||
1235 | if (err == EPERM || err == EACCES) | ||
1236 | die("No permission - are you root?\n"); | ||
1237 | /* | ||
1238 | * If it's cycles then fall back to hrtimer | ||
1239 | * based cpu-clock-tick sw counter, which | ||
1240 | * is always available even if no PMU support: | ||
1241 | */ | ||
1242 | if (attr->type == PERF_TYPE_HARDWARE | ||
1243 | && attr->config == PERF_COUNT_HW_CPU_CYCLES) { | ||
1244 | |||
1245 | if (verbose) | ||
1246 | warning(" ... trying to fall back to cpu-clock-ticks\n"); | ||
1247 | |||
1248 | attr->type = PERF_TYPE_SOFTWARE; | ||
1249 | attr->config = PERF_COUNT_SW_CPU_CLOCK; | ||
1250 | goto try_again; | ||
1251 | } | ||
1252 | printf("\n"); | ||
1253 | error("perfcounter syscall returned with %d (%s)\n", | ||
1254 | fd[i][counter][thread_index], strerror(err)); | ||
1255 | die("No CONFIG_PERF_EVENTS=y kernel support configured?\n"); | ||
1256 | exit(-1); | ||
1257 | } | ||
1258 | assert(fd[i][counter][thread_index] >= 0); | ||
1259 | fcntl(fd[i][counter][thread_index], F_SETFL, O_NONBLOCK); | ||
1152 | 1260 | ||
1153 | if (err == EPERM || err == EACCES) | ||
1154 | die("No permission - are you root?\n"); | ||
1155 | /* | 1261 | /* |
1156 | * If it's cycles then fall back to hrtimer | 1262 | * First counter acts as the group leader: |
1157 | * based cpu-clock-tick sw counter, which | ||
1158 | * is always available even if no PMU support: | ||
1159 | */ | 1263 | */ |
1160 | if (attr->type == PERF_TYPE_HARDWARE | 1264 | if (group && group_fd == -1) |
1161 | && attr->config == PERF_COUNT_HW_CPU_CYCLES) { | 1265 | group_fd = fd[i][counter][thread_index]; |
1162 | 1266 | ||
1163 | if (verbose) | 1267 | event_array[nr_poll].fd = fd[i][counter][thread_index]; |
1164 | warning(" ... trying to fall back to cpu-clock-ticks\n"); | 1268 | event_array[nr_poll].events = POLLIN; |
1165 | 1269 | nr_poll++; | |
1166 | attr->type = PERF_TYPE_SOFTWARE; | 1270 | |
1167 | attr->config = PERF_COUNT_SW_CPU_CLOCK; | 1271 | mmap_array[i][counter][thread_index].counter = counter; |
1168 | goto try_again; | 1272 | mmap_array[i][counter][thread_index].prev = 0; |
1169 | } | 1273 | mmap_array[i][counter][thread_index].mask = mmap_pages*page_size - 1; |
1170 | printf("\n"); | 1274 | mmap_array[i][counter][thread_index].base = mmap(NULL, (mmap_pages+1)*page_size, |
1171 | error("perfcounter syscall returned with %d (%s)\n", | 1275 | PROT_READ, MAP_SHARED, fd[i][counter][thread_index], 0); |
1172 | fd[i][counter], strerror(err)); | 1276 | if (mmap_array[i][counter][thread_index].base == MAP_FAILED) |
1173 | die("No CONFIG_PERF_EVENTS=y kernel support configured?\n"); | 1277 | die("failed to mmap with %d (%s)\n", errno, strerror(errno)); |
1174 | exit(-1); | ||
1175 | } | 1278 | } |
1176 | assert(fd[i][counter] >= 0); | ||
1177 | fcntl(fd[i][counter], F_SETFL, O_NONBLOCK); | ||
1178 | |||
1179 | /* | ||
1180 | * First counter acts as the group leader: | ||
1181 | */ | ||
1182 | if (group && group_fd == -1) | ||
1183 | group_fd = fd[i][counter]; | ||
1184 | |||
1185 | event_array[nr_poll].fd = fd[i][counter]; | ||
1186 | event_array[nr_poll].events = POLLIN; | ||
1187 | nr_poll++; | ||
1188 | |||
1189 | mmap_array[i][counter].counter = counter; | ||
1190 | mmap_array[i][counter].prev = 0; | ||
1191 | mmap_array[i][counter].mask = mmap_pages*page_size - 1; | ||
1192 | mmap_array[i][counter].base = mmap(NULL, (mmap_pages+1)*page_size, | ||
1193 | PROT_READ, MAP_SHARED, fd[i][counter], 0); | ||
1194 | if (mmap_array[i][counter].base == MAP_FAILED) | ||
1195 | die("failed to mmap with %d (%s)\n", errno, strerror(errno)); | ||
1196 | } | 1279 | } |
1197 | 1280 | ||
1198 | static int __cmd_top(void) | 1281 | static int __cmd_top(void) |
@@ -1204,12 +1287,12 @@ static int __cmd_top(void) | |||
1204 | * FIXME: perf_session__new should allow passing a O_MMAP, so that all this | 1287 | * FIXME: perf_session__new should allow passing a O_MMAP, so that all this |
1205 | * mmap reading, etc is encapsulated in it. Use O_WRONLY for now. | 1288 | * mmap reading, etc is encapsulated in it. Use O_WRONLY for now. |
1206 | */ | 1289 | */ |
1207 | struct perf_session *session = perf_session__new(NULL, O_WRONLY, false); | 1290 | struct perf_session *session = perf_session__new(NULL, O_WRONLY, false, false); |
1208 | if (session == NULL) | 1291 | if (session == NULL) |
1209 | return -ENOMEM; | 1292 | return -ENOMEM; |
1210 | 1293 | ||
1211 | if (target_pid != -1) | 1294 | if (target_tid != -1) |
1212 | event__synthesize_thread(target_pid, event__process, session); | 1295 | event__synthesize_thread(target_tid, event__process, session); |
1213 | else | 1296 | else |
1214 | event__synthesize_threads(event__process, session); | 1297 | event__synthesize_threads(event__process, session); |
1215 | 1298 | ||
@@ -1220,11 +1303,11 @@ static int __cmd_top(void) | |||
1220 | } | 1303 | } |
1221 | 1304 | ||
1222 | /* Wait for a minimal set of events before starting the snapshot */ | 1305 | /* Wait for a minimal set of events before starting the snapshot */ |
1223 | poll(event_array, nr_poll, 100); | 1306 | poll(&event_array[0], nr_poll, 100); |
1224 | 1307 | ||
1225 | perf_session__mmap_read(session); | 1308 | perf_session__mmap_read(session); |
1226 | 1309 | ||
1227 | if (pthread_create(&thread, NULL, display_thread, NULL)) { | 1310 | if (pthread_create(&thread, NULL, display_thread, session)) { |
1228 | printf("Could not create display thread.\n"); | 1311 | printf("Could not create display thread.\n"); |
1229 | exit(-1); | 1312 | exit(-1); |
1230 | } | 1313 | } |
@@ -1263,7 +1346,9 @@ static const struct option options[] = { | |||
1263 | OPT_INTEGER('c', "count", &default_interval, | 1346 | OPT_INTEGER('c', "count", &default_interval, |
1264 | "event period to sample"), | 1347 | "event period to sample"), |
1265 | OPT_INTEGER('p', "pid", &target_pid, | 1348 | OPT_INTEGER('p', "pid", &target_pid, |
1266 | "profile events on existing pid"), | 1349 | "profile events on existing process id"), |
1350 | OPT_INTEGER('t', "tid", &target_tid, | ||
1351 | "profile events on existing thread id"), | ||
1267 | OPT_BOOLEAN('a', "all-cpus", &system_wide, | 1352 | OPT_BOOLEAN('a', "all-cpus", &system_wide, |
1268 | "system-wide collection from all CPUs"), | 1353 | "system-wide collection from all CPUs"), |
1269 | OPT_INTEGER('C', "CPU", &profile_cpu, | 1354 | OPT_INTEGER('C', "CPU", &profile_cpu, |
@@ -1272,8 +1357,7 @@ static const struct option options[] = { | |||
1272 | "file", "vmlinux pathname"), | 1357 | "file", "vmlinux pathname"), |
1273 | OPT_BOOLEAN('K', "hide_kernel_symbols", &hide_kernel_symbols, | 1358 | OPT_BOOLEAN('K', "hide_kernel_symbols", &hide_kernel_symbols, |
1274 | "hide kernel symbols"), | 1359 | "hide kernel symbols"), |
1275 | OPT_INTEGER('m', "mmap-pages", &mmap_pages, | 1360 | OPT_UINTEGER('m', "mmap-pages", &mmap_pages, "number of mmap data pages"), |
1276 | "number of mmap data pages"), | ||
1277 | OPT_INTEGER('r', "realtime", &realtime_prio, | 1361 | OPT_INTEGER('r', "realtime", &realtime_prio, |
1278 | "collect data with this RT SCHED_FIFO priority"), | 1362 | "collect data with this RT SCHED_FIFO priority"), |
1279 | OPT_INTEGER('d', "delay", &delay_secs, | 1363 | OPT_INTEGER('d', "delay", &delay_secs, |
@@ -1296,7 +1380,7 @@ static const struct option options[] = { | |||
1296 | "display this many functions"), | 1380 | "display this many functions"), |
1297 | OPT_BOOLEAN('U', "hide_user_symbols", &hide_user_symbols, | 1381 | OPT_BOOLEAN('U', "hide_user_symbols", &hide_user_symbols, |
1298 | "hide user symbols"), | 1382 | "hide user symbols"), |
1299 | OPT_BOOLEAN('v', "verbose", &verbose, | 1383 | OPT_INCR('v', "verbose", &verbose, |
1300 | "be more verbose (show counter open errors, etc)"), | 1384 | "be more verbose (show counter open errors, etc)"), |
1301 | OPT_END() | 1385 | OPT_END() |
1302 | }; | 1386 | }; |
@@ -1304,6 +1388,7 @@ static const struct option options[] = { | |||
1304 | int cmd_top(int argc, const char **argv, const char *prefix __used) | 1388 | int cmd_top(int argc, const char **argv, const char *prefix __used) |
1305 | { | 1389 | { |
1306 | int counter; | 1390 | int counter; |
1391 | int i,j; | ||
1307 | 1392 | ||
1308 | page_size = sysconf(_SC_PAGE_SIZE); | 1393 | page_size = sysconf(_SC_PAGE_SIZE); |
1309 | 1394 | ||
@@ -1311,8 +1396,39 @@ int cmd_top(int argc, const char **argv, const char *prefix __used) | |||
1311 | if (argc) | 1396 | if (argc) |
1312 | usage_with_options(top_usage, options); | 1397 | usage_with_options(top_usage, options); |
1313 | 1398 | ||
1399 | if (target_pid != -1) { | ||
1400 | target_tid = target_pid; | ||
1401 | thread_num = find_all_tid(target_pid, &all_tids); | ||
1402 | if (thread_num <= 0) { | ||
1403 | fprintf(stderr, "Can't find all threads of pid %d\n", | ||
1404 | target_pid); | ||
1405 | usage_with_options(top_usage, options); | ||
1406 | } | ||
1407 | } else { | ||
1408 | all_tids=malloc(sizeof(pid_t)); | ||
1409 | if (!all_tids) | ||
1410 | return -ENOMEM; | ||
1411 | |||
1412 | all_tids[0] = target_tid; | ||
1413 | thread_num = 1; | ||
1414 | } | ||
1415 | |||
1416 | for (i = 0; i < MAX_NR_CPUS; i++) { | ||
1417 | for (j = 0; j < MAX_COUNTERS; j++) { | ||
1418 | fd[i][j] = malloc(sizeof(int)*thread_num); | ||
1419 | mmap_array[i][j] = zalloc( | ||
1420 | sizeof(struct mmap_data)*thread_num); | ||
1421 | if (!fd[i][j] || !mmap_array[i][j]) | ||
1422 | return -ENOMEM; | ||
1423 | } | ||
1424 | } | ||
1425 | event_array = malloc( | ||
1426 | sizeof(struct pollfd)*MAX_NR_CPUS*MAX_COUNTERS*thread_num); | ||
1427 | if (!event_array) | ||
1428 | return -ENOMEM; | ||
1429 | |||
1314 | /* CPU and PID are mutually exclusive */ | 1430 | /* CPU and PID are mutually exclusive */ |
1315 | if (target_pid != -1 && profile_cpu != -1) { | 1431 | if (target_tid > 0 && profile_cpu != -1) { |
1316 | printf("WARNING: PID switch overriding CPU\n"); | 1432 | printf("WARNING: PID switch overriding CPU\n"); |
1317 | sleep(1); | 1433 | sleep(1); |
1318 | profile_cpu = -1; | 1434 | profile_cpu = -1; |
@@ -1353,7 +1469,7 @@ int cmd_top(int argc, const char **argv, const char *prefix __used) | |||
1353 | attrs[counter].sample_period = default_interval; | 1469 | attrs[counter].sample_period = default_interval; |
1354 | } | 1470 | } |
1355 | 1471 | ||
1356 | if (target_pid != -1 || profile_cpu != -1) | 1472 | if (target_tid != -1 || profile_cpu != -1) |
1357 | nr_cpus = 1; | 1473 | nr_cpus = 1; |
1358 | else | 1474 | else |
1359 | nr_cpus = read_cpu_map(); | 1475 | nr_cpus = read_cpu_map(); |
diff --git a/tools/perf/builtin-trace.c b/tools/perf/builtin-trace.c index 407041d20de0..dddf3f01b5ab 100644 --- a/tools/perf/builtin-trace.c +++ b/tools/perf/builtin-trace.c | |||
@@ -11,6 +11,8 @@ | |||
11 | 11 | ||
12 | static char const *script_name; | 12 | static char const *script_name; |
13 | static char const *generate_script_lang; | 13 | static char const *generate_script_lang; |
14 | static bool debug_ordering; | ||
15 | static u64 last_timestamp; | ||
14 | 16 | ||
15 | static int default_start_script(const char *script __unused, | 17 | static int default_start_script(const char *script __unused, |
16 | int argc __unused, | 18 | int argc __unused, |
@@ -51,6 +53,8 @@ static void setup_scripting(void) | |||
51 | 53 | ||
52 | static int cleanup_scripting(void) | 54 | static int cleanup_scripting(void) |
53 | { | 55 | { |
56 | pr_debug("\nperf trace script stopped\n"); | ||
57 | |||
54 | return scripting_ops->stop_script(); | 58 | return scripting_ops->stop_script(); |
55 | } | 59 | } |
56 | 60 | ||
@@ -87,6 +91,14 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
87 | } | 91 | } |
88 | 92 | ||
89 | if (session->sample_type & PERF_SAMPLE_RAW) { | 93 | if (session->sample_type & PERF_SAMPLE_RAW) { |
94 | if (debug_ordering) { | ||
95 | if (data.time < last_timestamp) { | ||
96 | pr_err("Samples misordered, previous: %llu " | ||
97 | "this: %llu\n", last_timestamp, | ||
98 | data.time); | ||
99 | } | ||
100 | last_timestamp = data.time; | ||
101 | } | ||
90 | /* | 102 | /* |
91 | * FIXME: better resolve from pid from the struct trace_entry | 103 | * FIXME: better resolve from pid from the struct trace_entry |
92 | * field, although it should be the same than this perf | 104 | * field, although it should be the same than this perf |
@@ -97,17 +109,31 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
97 | data.time, thread->comm); | 109 | data.time, thread->comm); |
98 | } | 110 | } |
99 | 111 | ||
100 | session->events_stats.total += data.period; | 112 | session->hists.stats.total_period += data.period; |
101 | return 0; | 113 | return 0; |
102 | } | 114 | } |
103 | 115 | ||
104 | static struct perf_event_ops event_ops = { | 116 | static struct perf_event_ops event_ops = { |
105 | .sample = process_sample_event, | 117 | .sample = process_sample_event, |
106 | .comm = event__process_comm, | 118 | .comm = event__process_comm, |
119 | .attr = event__process_attr, | ||
120 | .event_type = event__process_event_type, | ||
121 | .tracing_data = event__process_tracing_data, | ||
122 | .build_id = event__process_build_id, | ||
123 | .ordered_samples = true, | ||
107 | }; | 124 | }; |
108 | 125 | ||
126 | extern volatile int session_done; | ||
127 | |||
128 | static void sig_handler(int sig __unused) | ||
129 | { | ||
130 | session_done = 1; | ||
131 | } | ||
132 | |||
109 | static int __cmd_trace(struct perf_session *session) | 133 | static int __cmd_trace(struct perf_session *session) |
110 | { | 134 | { |
135 | signal(SIGINT, sig_handler); | ||
136 | |||
111 | return perf_session__process_events(session, &event_ops); | 137 | return perf_session__process_events(session, &event_ops); |
112 | } | 138 | } |
113 | 139 | ||
@@ -505,7 +531,7 @@ static const char * const trace_usage[] = { | |||
505 | static const struct option options[] = { | 531 | static const struct option options[] = { |
506 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, | 532 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, |
507 | "dump raw trace in ASCII"), | 533 | "dump raw trace in ASCII"), |
508 | OPT_BOOLEAN('v', "verbose", &verbose, | 534 | OPT_INCR('v', "verbose", &verbose, |
509 | "be more verbose (show symbol address, etc)"), | 535 | "be more verbose (show symbol address, etc)"), |
510 | OPT_BOOLEAN('L', "Latency", &latency_format, | 536 | OPT_BOOLEAN('L', "Latency", &latency_format, |
511 | "show latency attributes (irqs/preemption disabled, etc)"), | 537 | "show latency attributes (irqs/preemption disabled, etc)"), |
@@ -518,6 +544,8 @@ static const struct option options[] = { | |||
518 | "generate perf-trace.xx script in specified language"), | 544 | "generate perf-trace.xx script in specified language"), |
519 | OPT_STRING('i', "input", &input_name, "file", | 545 | OPT_STRING('i', "input", &input_name, "file", |
520 | "input file name"), | 546 | "input file name"), |
547 | OPT_BOOLEAN('d', "debug-ordering", &debug_ordering, | ||
548 | "check that samples time ordering is monotonic"), | ||
521 | 549 | ||
522 | OPT_END() | 550 | OPT_END() |
523 | }; | 551 | }; |
@@ -548,6 +576,65 @@ int cmd_trace(int argc, const char **argv, const char *prefix __used) | |||
548 | suffix = REPORT_SUFFIX; | 576 | suffix = REPORT_SUFFIX; |
549 | } | 577 | } |
550 | 578 | ||
579 | if (!suffix && argc >= 2 && strncmp(argv[1], "-", strlen("-")) != 0) { | ||
580 | char *record_script_path, *report_script_path; | ||
581 | int live_pipe[2]; | ||
582 | pid_t pid; | ||
583 | |||
584 | record_script_path = get_script_path(argv[1], RECORD_SUFFIX); | ||
585 | if (!record_script_path) { | ||
586 | fprintf(stderr, "record script not found\n"); | ||
587 | return -1; | ||
588 | } | ||
589 | |||
590 | report_script_path = get_script_path(argv[1], REPORT_SUFFIX); | ||
591 | if (!report_script_path) { | ||
592 | fprintf(stderr, "report script not found\n"); | ||
593 | return -1; | ||
594 | } | ||
595 | |||
596 | if (pipe(live_pipe) < 0) { | ||
597 | perror("failed to create pipe"); | ||
598 | exit(-1); | ||
599 | } | ||
600 | |||
601 | pid = fork(); | ||
602 | if (pid < 0) { | ||
603 | perror("failed to fork"); | ||
604 | exit(-1); | ||
605 | } | ||
606 | |||
607 | if (!pid) { | ||
608 | dup2(live_pipe[1], 1); | ||
609 | close(live_pipe[0]); | ||
610 | |||
611 | __argv = malloc(5 * sizeof(const char *)); | ||
612 | __argv[0] = "/bin/sh"; | ||
613 | __argv[1] = record_script_path; | ||
614 | __argv[2] = "-o"; | ||
615 | __argv[3] = "-"; | ||
616 | __argv[4] = NULL; | ||
617 | |||
618 | execvp("/bin/sh", (char **)__argv); | ||
619 | exit(-1); | ||
620 | } | ||
621 | |||
622 | dup2(live_pipe[0], 0); | ||
623 | close(live_pipe[1]); | ||
624 | |||
625 | __argv = malloc((argc + 3) * sizeof(const char *)); | ||
626 | __argv[0] = "/bin/sh"; | ||
627 | __argv[1] = report_script_path; | ||
628 | for (i = 2; i < argc; i++) | ||
629 | __argv[i] = argv[i]; | ||
630 | __argv[i++] = "-i"; | ||
631 | __argv[i++] = "-"; | ||
632 | __argv[i++] = NULL; | ||
633 | |||
634 | execvp("/bin/sh", (char **)__argv); | ||
635 | exit(-1); | ||
636 | } | ||
637 | |||
551 | if (suffix) { | 638 | if (suffix) { |
552 | script_path = get_script_path(argv[2], suffix); | 639 | script_path = get_script_path(argv[2], suffix); |
553 | if (!script_path) { | 640 | if (!script_path) { |
@@ -576,11 +663,12 @@ int cmd_trace(int argc, const char **argv, const char *prefix __used) | |||
576 | if (!script_name) | 663 | if (!script_name) |
577 | setup_pager(); | 664 | setup_pager(); |
578 | 665 | ||
579 | session = perf_session__new(input_name, O_RDONLY, 0); | 666 | session = perf_session__new(input_name, O_RDONLY, 0, false); |
580 | if (session == NULL) | 667 | if (session == NULL) |
581 | return -ENOMEM; | 668 | return -ENOMEM; |
582 | 669 | ||
583 | if (!perf_session__has_traces(session, "record -R")) | 670 | if (strcmp(input_name, "-") && |
671 | !perf_session__has_traces(session, "record -R")) | ||
584 | return -EINVAL; | 672 | return -EINVAL; |
585 | 673 | ||
586 | if (generate_script_lang) { | 674 | if (generate_script_lang) { |
@@ -617,6 +705,7 @@ int cmd_trace(int argc, const char **argv, const char *prefix __used) | |||
617 | err = scripting_ops->start_script(script_name, argc, argv); | 705 | err = scripting_ops->start_script(script_name, argc, argv); |
618 | if (err) | 706 | if (err) |
619 | goto out; | 707 | goto out; |
708 | pr_debug("perf trace started with script %s\n\n", script_name); | ||
620 | } | 709 | } |
621 | 710 | ||
622 | err = __cmd_trace(session); | 711 | err = __cmd_trace(session); |
diff --git a/tools/perf/builtin.h b/tools/perf/builtin.h index 10fe49e7048a..921245b28583 100644 --- a/tools/perf/builtin.h +++ b/tools/perf/builtin.h | |||
@@ -32,5 +32,8 @@ extern int cmd_version(int argc, const char **argv, const char *prefix); | |||
32 | extern int cmd_probe(int argc, const char **argv, const char *prefix); | 32 | extern int cmd_probe(int argc, const char **argv, const char *prefix); |
33 | extern int cmd_kmem(int argc, const char **argv, const char *prefix); | 33 | extern int cmd_kmem(int argc, const char **argv, const char *prefix); |
34 | extern int cmd_lock(int argc, const char **argv, const char *prefix); | 34 | extern int cmd_lock(int argc, const char **argv, const char *prefix); |
35 | extern int cmd_kvm(int argc, const char **argv, const char *prefix); | ||
36 | extern int cmd_test(int argc, const char **argv, const char *prefix); | ||
37 | extern int cmd_inject(int argc, const char **argv, const char *prefix); | ||
35 | 38 | ||
36 | #endif | 39 | #endif |
diff --git a/tools/perf/command-list.txt b/tools/perf/command-list.txt index db6ee94d4a8e..949d77fc0b97 100644 --- a/tools/perf/command-list.txt +++ b/tools/perf/command-list.txt | |||
@@ -8,6 +8,7 @@ perf-bench mainporcelain common | |||
8 | perf-buildid-cache mainporcelain common | 8 | perf-buildid-cache mainporcelain common |
9 | perf-buildid-list mainporcelain common | 9 | perf-buildid-list mainporcelain common |
10 | perf-diff mainporcelain common | 10 | perf-diff mainporcelain common |
11 | perf-inject mainporcelain common | ||
11 | perf-list mainporcelain common | 12 | perf-list mainporcelain common |
12 | perf-sched mainporcelain common | 13 | perf-sched mainporcelain common |
13 | perf-record mainporcelain common | 14 | perf-record mainporcelain common |
@@ -19,3 +20,5 @@ perf-trace mainporcelain common | |||
19 | perf-probe mainporcelain common | 20 | perf-probe mainporcelain common |
20 | perf-kmem mainporcelain common | 21 | perf-kmem mainporcelain common |
21 | perf-lock mainporcelain common | 22 | perf-lock mainporcelain common |
23 | perf-kvm mainporcelain common | ||
24 | perf-test mainporcelain common | ||
diff --git a/tools/perf/perf-archive.sh b/tools/perf/perf-archive.sh index 910468e6e01c..2e7a4f417e20 100644 --- a/tools/perf/perf-archive.sh +++ b/tools/perf/perf-archive.sh | |||
@@ -30,4 +30,7 @@ done | |||
30 | 30 | ||
31 | tar cfj $PERF_DATA.tar.bz2 -C $DEBUGDIR -T $MANIFEST | 31 | tar cfj $PERF_DATA.tar.bz2 -C $DEBUGDIR -T $MANIFEST |
32 | rm -f $MANIFEST $BUILDIDS | 32 | rm -f $MANIFEST $BUILDIDS |
33 | echo -e "Now please run:\n" | ||
34 | echo -e "$ tar xvf $PERF_DATA.tar.bz2 -C ~/.debug\n" | ||
35 | echo "wherever you need to run 'perf report' on." | ||
33 | exit 0 | 36 | exit 0 |
diff --git a/tools/perf/perf.c b/tools/perf/perf.c index cd32c200cdb3..08e0e5d2b50e 100644 --- a/tools/perf/perf.c +++ b/tools/perf/perf.c | |||
@@ -13,9 +13,10 @@ | |||
13 | #include "util/quote.h" | 13 | #include "util/quote.h" |
14 | #include "util/run-command.h" | 14 | #include "util/run-command.h" |
15 | #include "util/parse-events.h" | 15 | #include "util/parse-events.h" |
16 | #include "util/string.h" | ||
17 | #include "util/debugfs.h" | 16 | #include "util/debugfs.h" |
18 | 17 | ||
18 | bool use_browser; | ||
19 | |||
19 | const char perf_usage_string[] = | 20 | const char perf_usage_string[] = |
20 | "perf [--version] [--help] COMMAND [ARGS]"; | 21 | "perf [--version] [--help] COMMAND [ARGS]"; |
21 | 22 | ||
@@ -262,6 +263,8 @@ static int run_builtin(struct cmd_struct *p, int argc, const char **argv) | |||
262 | set_debugfs_path(); | 263 | set_debugfs_path(); |
263 | 264 | ||
264 | status = p->fn(argc, argv, prefix); | 265 | status = p->fn(argc, argv, prefix); |
266 | exit_browser(status); | ||
267 | |||
265 | if (status) | 268 | if (status) |
266 | return status & 0xff; | 269 | return status & 0xff; |
267 | 270 | ||
@@ -304,6 +307,9 @@ static void handle_internal_command(int argc, const char **argv) | |||
304 | { "probe", cmd_probe, 0 }, | 307 | { "probe", cmd_probe, 0 }, |
305 | { "kmem", cmd_kmem, 0 }, | 308 | { "kmem", cmd_kmem, 0 }, |
306 | { "lock", cmd_lock, 0 }, | 309 | { "lock", cmd_lock, 0 }, |
310 | { "kvm", cmd_kvm, 0 }, | ||
311 | { "test", cmd_test, 0 }, | ||
312 | { "inject", cmd_inject, 0 }, | ||
307 | }; | 313 | }; |
308 | unsigned int i; | 314 | unsigned int i; |
309 | static const char ext[] = STRIP_EXTENSION; | 315 | static const char ext[] = STRIP_EXTENSION; |
diff --git a/tools/perf/perf.h b/tools/perf/perf.h index 6fb379bc1d1f..ef7aa0a0c526 100644 --- a/tools/perf/perf.h +++ b/tools/perf/perf.h | |||
@@ -1,6 +1,10 @@ | |||
1 | #ifndef _PERF_PERF_H | 1 | #ifndef _PERF_PERF_H |
2 | #define _PERF_PERF_H | 2 | #define _PERF_PERF_H |
3 | 3 | ||
4 | struct winsize; | ||
5 | |||
6 | void get_term_dimensions(struct winsize *ws); | ||
7 | |||
4 | #if defined(__i386__) | 8 | #if defined(__i386__) |
5 | #include "../../arch/x86/include/asm/unistd.h" | 9 | #include "../../arch/x86/include/asm/unistd.h" |
6 | #define rmb() asm volatile("lock; addl $0,0(%%esp)" ::: "memory") | 10 | #define rmb() asm volatile("lock; addl $0,0(%%esp)" ::: "memory") |
@@ -76,6 +80,7 @@ | |||
76 | 80 | ||
77 | #include "../../include/linux/perf_event.h" | 81 | #include "../../include/linux/perf_event.h" |
78 | #include "util/types.h" | 82 | #include "util/types.h" |
83 | #include <stdbool.h> | ||
79 | 84 | ||
80 | /* | 85 | /* |
81 | * prctl(PR_TASK_PERF_EVENTS_DISABLE) will (cheaply) disable all | 86 | * prctl(PR_TASK_PERF_EVENTS_DISABLE) will (cheaply) disable all |
@@ -102,8 +107,6 @@ static inline unsigned long long rdclock(void) | |||
102 | #define __user | 107 | #define __user |
103 | #define asmlinkage | 108 | #define asmlinkage |
104 | 109 | ||
105 | #define __used __attribute__((__unused__)) | ||
106 | |||
107 | #define unlikely(x) __builtin_expect(!!(x), 0) | 110 | #define unlikely(x) __builtin_expect(!!(x), 0) |
108 | #define min(x, y) ({ \ | 111 | #define min(x, y) ({ \ |
109 | typeof(x) _min1 = (x); \ | 112 | typeof(x) _min1 = (x); \ |
@@ -129,4 +132,6 @@ struct ip_callchain { | |||
129 | u64 ips[0]; | 132 | u64 ips[0]; |
130 | }; | 133 | }; |
131 | 134 | ||
135 | extern bool perf_host, perf_guest; | ||
136 | |||
132 | #endif | 137 | #endif |
diff --git a/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm b/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm index f869c48dc9b0..d94b40c8ac85 100644 --- a/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm +++ b/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm | |||
@@ -15,6 +15,7 @@ our @EXPORT_OK = ( @{ $EXPORT_TAGS{'all'} } ); | |||
15 | 15 | ||
16 | our @EXPORT = qw( | 16 | our @EXPORT = qw( |
17 | avg nsecs nsecs_secs nsecs_nsecs nsecs_usecs print_nsecs | 17 | avg nsecs nsecs_secs nsecs_nsecs nsecs_usecs print_nsecs |
18 | clear_term | ||
18 | ); | 19 | ); |
19 | 20 | ||
20 | our $VERSION = '0.01'; | 21 | our $VERSION = '0.01'; |
@@ -55,6 +56,11 @@ sub nsecs_str { | |||
55 | return $str; | 56 | return $str; |
56 | } | 57 | } |
57 | 58 | ||
59 | sub clear_term | ||
60 | { | ||
61 | print "\x1b[H\x1b[2J"; | ||
62 | } | ||
63 | |||
58 | 1; | 64 | 1; |
59 | __END__ | 65 | __END__ |
60 | =head1 NAME | 66 | =head1 NAME |
diff --git a/tools/perf/scripts/perl/bin/check-perf-trace-record b/tools/perf/scripts/perl/bin/check-perf-trace-record index e6cb1474f8e8..423ad6aed056 100644 --- a/tools/perf/scripts/perl/bin/check-perf-trace-record +++ b/tools/perf/scripts/perl/bin/check-perf-trace-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e kmem:kmalloc -e irq:softirq_entry -e kmem:kfree | 2 | perf record -a -e kmem:kmalloc -e irq:softirq_entry -e kmem:kfree |
diff --git a/tools/perf/scripts/perl/bin/failed-syscalls-record b/tools/perf/scripts/perl/bin/failed-syscalls-record index f8885d389e6f..eb5846bcb565 100644 --- a/tools/perf/scripts/perl/bin/failed-syscalls-record +++ b/tools/perf/scripts/perl/bin/failed-syscalls-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e raw_syscalls:sys_exit | 2 | perf record -a -e raw_syscalls:sys_exit $@ |
diff --git a/tools/perf/scripts/perl/bin/failed-syscalls-report b/tools/perf/scripts/perl/bin/failed-syscalls-report index 8bfc660e5056..e3a5e55d54ff 100644 --- a/tools/perf/scripts/perl/bin/failed-syscalls-report +++ b/tools/perf/scripts/perl/bin/failed-syscalls-report | |||
@@ -1,4 +1,10 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide failed syscalls | 2 | # description: system-wide failed syscalls |
3 | # args: [comm] | 3 | # args: [comm] |
4 | perf trace -s ~/libexec/perf-core/scripts/perl/failed-syscalls.pl $1 | 4 | if [ $# -gt 0 ] ; then |
5 | if ! expr match "$1" "-" > /dev/null ; then | ||
6 | comm=$1 | ||
7 | shift | ||
8 | fi | ||
9 | fi | ||
10 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/failed-syscalls.pl $comm | ||
diff --git a/tools/perf/scripts/perl/bin/rw-by-file-record b/tools/perf/scripts/perl/bin/rw-by-file-record index b25056ebf963..5bfaae5a6cba 100644 --- a/tools/perf/scripts/perl/bin/rw-by-file-record +++ b/tools/perf/scripts/perl/bin/rw-by-file-record | |||
@@ -1,2 +1,3 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e syscalls:sys_enter_read -e syscalls:sys_enter_write | 2 | perf record -a -e syscalls:sys_enter_read -e syscalls:sys_enter_write $@ |
3 | |||
diff --git a/tools/perf/scripts/perl/bin/rw-by-file-report b/tools/perf/scripts/perl/bin/rw-by-file-report index eddb9ccce6a5..d83070b7eeb5 100644 --- a/tools/perf/scripts/perl/bin/rw-by-file-report +++ b/tools/perf/scripts/perl/bin/rw-by-file-report | |||
@@ -1,7 +1,13 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: r/w activity for a program, by file | 2 | # description: r/w activity for a program, by file |
3 | # args: <comm> | 3 | # args: <comm> |
4 | perf trace -s ~/libexec/perf-core/scripts/perl/rw-by-file.pl $1 | 4 | if [ $# -lt 1 ] ; then |
5 | echo "usage: rw-by-file <comm>" | ||
6 | exit | ||
7 | fi | ||
8 | comm=$1 | ||
9 | shift | ||
10 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/rw-by-file.pl $comm | ||
5 | 11 | ||
6 | 12 | ||
7 | 13 | ||
diff --git a/tools/perf/scripts/perl/bin/rw-by-pid-record b/tools/perf/scripts/perl/bin/rw-by-pid-record index 8903979c5b6c..6e0b2f7755ac 100644 --- a/tools/perf/scripts/perl/bin/rw-by-pid-record +++ b/tools/perf/scripts/perl/bin/rw-by-pid-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e syscalls:sys_enter_read -e syscalls:sys_exit_read -e syscalls:sys_enter_write -e syscalls:sys_exit_write | 2 | perf record -a -e syscalls:sys_enter_read -e syscalls:sys_exit_read -e syscalls:sys_enter_write -e syscalls:sys_exit_write $@ |
diff --git a/tools/perf/scripts/perl/bin/rw-by-pid-report b/tools/perf/scripts/perl/bin/rw-by-pid-report index 7f44c25cc857..7ef46983f62f 100644 --- a/tools/perf/scripts/perl/bin/rw-by-pid-report +++ b/tools/perf/scripts/perl/bin/rw-by-pid-report | |||
@@ -1,6 +1,6 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide r/w activity | 2 | # description: system-wide r/w activity |
3 | perf trace -s ~/libexec/perf-core/scripts/perl/rw-by-pid.pl | 3 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/rw-by-pid.pl |
4 | 4 | ||
5 | 5 | ||
6 | 6 | ||
diff --git a/tools/perf/scripts/perl/bin/rwtop-record b/tools/perf/scripts/perl/bin/rwtop-record new file mode 100644 index 000000000000..6e0b2f7755ac --- /dev/null +++ b/tools/perf/scripts/perl/bin/rwtop-record | |||
@@ -0,0 +1,2 @@ | |||
1 | #!/bin/bash | ||
2 | perf record -a -e syscalls:sys_enter_read -e syscalls:sys_exit_read -e syscalls:sys_enter_write -e syscalls:sys_exit_write $@ | ||
diff --git a/tools/perf/scripts/perl/bin/rwtop-report b/tools/perf/scripts/perl/bin/rwtop-report new file mode 100644 index 000000000000..93e698cd3f38 --- /dev/null +++ b/tools/perf/scripts/perl/bin/rwtop-report | |||
@@ -0,0 +1,23 @@ | |||
1 | #!/bin/bash | ||
2 | # description: system-wide r/w top | ||
3 | # args: [interval] | ||
4 | n_args=0 | ||
5 | for i in "$@" | ||
6 | do | ||
7 | if expr match "$i" "-" > /dev/null ; then | ||
8 | break | ||
9 | fi | ||
10 | n_args=$(( $n_args + 1 )) | ||
11 | done | ||
12 | if [ "$n_args" -gt 1 ] ; then | ||
13 | echo "usage: rwtop-report [interval]" | ||
14 | exit | ||
15 | fi | ||
16 | if [ "$n_args" -gt 0 ] ; then | ||
17 | interval=$1 | ||
18 | shift | ||
19 | fi | ||
20 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/rwtop.pl $interval | ||
21 | |||
22 | |||
23 | |||
diff --git a/tools/perf/scripts/perl/bin/wakeup-latency-record b/tools/perf/scripts/perl/bin/wakeup-latency-record index 6abedda911a4..9f2acaaae9f0 100644 --- a/tools/perf/scripts/perl/bin/wakeup-latency-record +++ b/tools/perf/scripts/perl/bin/wakeup-latency-record | |||
@@ -1,5 +1,5 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e sched:sched_switch -e sched:sched_wakeup | 2 | perf record -a -e sched:sched_switch -e sched:sched_wakeup $@ |
3 | 3 | ||
4 | 4 | ||
5 | 5 | ||
diff --git a/tools/perf/scripts/perl/bin/wakeup-latency-report b/tools/perf/scripts/perl/bin/wakeup-latency-report index fce3adcb3249..a0d898f9ca1d 100644 --- a/tools/perf/scripts/perl/bin/wakeup-latency-report +++ b/tools/perf/scripts/perl/bin/wakeup-latency-report | |||
@@ -1,6 +1,6 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide min/max/avg wakeup latency | 2 | # description: system-wide min/max/avg wakeup latency |
3 | perf trace -s ~/libexec/perf-core/scripts/perl/wakeup-latency.pl | 3 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/wakeup-latency.pl |
4 | 4 | ||
5 | 5 | ||
6 | 6 | ||
diff --git a/tools/perf/scripts/perl/bin/workqueue-stats-record b/tools/perf/scripts/perl/bin/workqueue-stats-record index fce6637b19ba..85301f2471ff 100644 --- a/tools/perf/scripts/perl/bin/workqueue-stats-record +++ b/tools/perf/scripts/perl/bin/workqueue-stats-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e workqueue:workqueue_creation -e workqueue:workqueue_destruction -e workqueue:workqueue_execution -e workqueue:workqueue_insertion | 2 | perf record -a -e workqueue:workqueue_creation -e workqueue:workqueue_destruction -e workqueue:workqueue_execution -e workqueue:workqueue_insertion $@ |
diff --git a/tools/perf/scripts/perl/bin/workqueue-stats-report b/tools/perf/scripts/perl/bin/workqueue-stats-report index 71cfbd182fb9..35081132ef97 100644 --- a/tools/perf/scripts/perl/bin/workqueue-stats-report +++ b/tools/perf/scripts/perl/bin/workqueue-stats-report | |||
@@ -1,6 +1,6 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: workqueue stats (ins/exe/create/destroy) | 2 | # description: workqueue stats (ins/exe/create/destroy) |
3 | perf trace -s ~/libexec/perf-core/scripts/perl/workqueue-stats.pl | 3 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/workqueue-stats.pl |
4 | 4 | ||
5 | 5 | ||
6 | 6 | ||
diff --git a/tools/perf/scripts/perl/failed-syscalls.pl b/tools/perf/scripts/perl/failed-syscalls.pl index c18e7e27a84b..94bc25a347eb 100644 --- a/tools/perf/scripts/perl/failed-syscalls.pl +++ b/tools/perf/scripts/perl/failed-syscalls.pl | |||
@@ -11,6 +11,8 @@ use Perf::Trace::Core; | |||
11 | use Perf::Trace::Context; | 11 | use Perf::Trace::Context; |
12 | use Perf::Trace::Util; | 12 | use Perf::Trace::Util; |
13 | 13 | ||
14 | my $for_comm = shift; | ||
15 | |||
14 | my %failed_syscalls; | 16 | my %failed_syscalls; |
15 | 17 | ||
16 | sub raw_syscalls::sys_exit | 18 | sub raw_syscalls::sys_exit |
@@ -33,6 +35,8 @@ sub trace_end | |||
33 | 35 | ||
34 | foreach my $comm (sort {$failed_syscalls{$b} <=> $failed_syscalls{$a}} | 36 | foreach my $comm (sort {$failed_syscalls{$b} <=> $failed_syscalls{$a}} |
35 | keys %failed_syscalls) { | 37 | keys %failed_syscalls) { |
36 | printf("%-20s %10s\n", $comm, $failed_syscalls{$comm}); | 38 | next if ($for_comm && $comm ne $for_comm); |
39 | |||
40 | printf("%-20s %10s\n", $comm, $failed_syscalls{$comm}); | ||
37 | } | 41 | } |
38 | } | 42 | } |
diff --git a/tools/perf/scripts/perl/rw-by-pid.pl b/tools/perf/scripts/perl/rw-by-pid.pl index da601fae1a00..9db23c9daf55 100644 --- a/tools/perf/scripts/perl/rw-by-pid.pl +++ b/tools/perf/scripts/perl/rw-by-pid.pl | |||
@@ -79,12 +79,12 @@ sub trace_end | |||
79 | printf("%6s %-20s %10s %10s %10s\n", "------", "--------------------", | 79 | printf("%6s %-20s %10s %10s %10s\n", "------", "--------------------", |
80 | "-----------", "----------", "----------"); | 80 | "-----------", "----------", "----------"); |
81 | 81 | ||
82 | foreach my $pid (sort {$reads{$b}{bytes_read} <=> | 82 | foreach my $pid (sort { ($reads{$b}{bytes_read} || 0) <=> |
83 | $reads{$a}{bytes_read}} keys %reads) { | 83 | ($reads{$a}{bytes_read} || 0) } keys %reads) { |
84 | my $comm = $reads{$pid}{comm}; | 84 | my $comm = $reads{$pid}{comm} || ""; |
85 | my $total_reads = $reads{$pid}{total_reads}; | 85 | my $total_reads = $reads{$pid}{total_reads} || 0; |
86 | my $bytes_requested = $reads{$pid}{bytes_requested}; | 86 | my $bytes_requested = $reads{$pid}{bytes_requested} || 0; |
87 | my $bytes_read = $reads{$pid}{bytes_read}; | 87 | my $bytes_read = $reads{$pid}{bytes_read} || 0; |
88 | 88 | ||
89 | printf("%6s %-20s %10s %10s %10s\n", $pid, $comm, | 89 | printf("%6s %-20s %10s %10s %10s\n", $pid, $comm, |
90 | $total_reads, $bytes_requested, $bytes_read); | 90 | $total_reads, $bytes_requested, $bytes_read); |
@@ -96,16 +96,23 @@ sub trace_end | |||
96 | printf("%6s %20s %6s %10s\n", "------", "--------------------", | 96 | printf("%6s %20s %6s %10s\n", "------", "--------------------", |
97 | "------", "----------"); | 97 | "------", "----------"); |
98 | 98 | ||
99 | foreach my $pid (keys %reads) { | 99 | my @errcounts = (); |
100 | my $comm = $reads{$pid}{comm}; | ||
101 | foreach my $err (sort {$reads{$b}{comm} cmp $reads{$a}{comm}} | ||
102 | keys %{$reads{$pid}{errors}}) { | ||
103 | my $errors = $reads{$pid}{errors}{$err}; | ||
104 | 100 | ||
105 | printf("%6d %-20s %6d %10s\n", $pid, $comm, $err, $errors); | 101 | foreach my $pid (keys %reads) { |
102 | foreach my $error (keys %{$reads{$pid}{errors}}) { | ||
103 | my $comm = $reads{$pid}{comm} || ""; | ||
104 | my $errcount = $reads{$pid}{errors}{$error} || 0; | ||
105 | push @errcounts, [$pid, $comm, $error, $errcount]; | ||
106 | } | 106 | } |
107 | } | 107 | } |
108 | 108 | ||
109 | @errcounts = sort { $b->[3] <=> $a->[3] } @errcounts; | ||
110 | |||
111 | for my $i (0 .. $#errcounts) { | ||
112 | printf("%6d %-20s %6d %10s\n", $errcounts[$i][0], | ||
113 | $errcounts[$i][1], $errcounts[$i][2], $errcounts[$i][3]); | ||
114 | } | ||
115 | |||
109 | printf("\nwrite counts by pid:\n\n"); | 116 | printf("\nwrite counts by pid:\n\n"); |
110 | 117 | ||
111 | printf("%6s %20s %10s %10s\n", "pid", "comm", | 118 | printf("%6s %20s %10s %10s\n", "pid", "comm", |
@@ -113,11 +120,11 @@ sub trace_end | |||
113 | printf("%6s %-20s %10s %10s\n", "------", "--------------------", | 120 | printf("%6s %-20s %10s %10s\n", "------", "--------------------", |
114 | "-----------", "----------"); | 121 | "-----------", "----------"); |
115 | 122 | ||
116 | foreach my $pid (sort {$writes{$b}{bytes_written} <=> | 123 | foreach my $pid (sort { ($writes{$b}{bytes_written} || 0) <=> |
117 | $writes{$a}{bytes_written}} keys %writes) { | 124 | ($writes{$a}{bytes_written} || 0)} keys %writes) { |
118 | my $comm = $writes{$pid}{comm}; | 125 | my $comm = $writes{$pid}{comm} || ""; |
119 | my $total_writes = $writes{$pid}{total_writes}; | 126 | my $total_writes = $writes{$pid}{total_writes} || 0; |
120 | my $bytes_written = $writes{$pid}{bytes_written}; | 127 | my $bytes_written = $writes{$pid}{bytes_written} || 0; |
121 | 128 | ||
122 | printf("%6s %-20s %10s %10s\n", $pid, $comm, | 129 | printf("%6s %-20s %10s %10s\n", $pid, $comm, |
123 | $total_writes, $bytes_written); | 130 | $total_writes, $bytes_written); |
@@ -129,16 +136,23 @@ sub trace_end | |||
129 | printf("%6s %20s %6s %10s\n", "------", "--------------------", | 136 | printf("%6s %20s %6s %10s\n", "------", "--------------------", |
130 | "------", "----------"); | 137 | "------", "----------"); |
131 | 138 | ||
132 | foreach my $pid (keys %writes) { | 139 | @errcounts = (); |
133 | my $comm = $writes{$pid}{comm}; | ||
134 | foreach my $err (sort {$writes{$b}{comm} cmp $writes{$a}{comm}} | ||
135 | keys %{$writes{$pid}{errors}}) { | ||
136 | my $errors = $writes{$pid}{errors}{$err}; | ||
137 | 140 | ||
138 | printf("%6d %-20s %6d %10s\n", $pid, $comm, $err, $errors); | 141 | foreach my $pid (keys %writes) { |
142 | foreach my $error (keys %{$writes{$pid}{errors}}) { | ||
143 | my $comm = $writes{$pid}{comm} || ""; | ||
144 | my $errcount = $writes{$pid}{errors}{$error} || 0; | ||
145 | push @errcounts, [$pid, $comm, $error, $errcount]; | ||
139 | } | 146 | } |
140 | } | 147 | } |
141 | 148 | ||
149 | @errcounts = sort { $b->[3] <=> $a->[3] } @errcounts; | ||
150 | |||
151 | for my $i (0 .. $#errcounts) { | ||
152 | printf("%6d %-20s %6d %10s\n", $errcounts[$i][0], | ||
153 | $errcounts[$i][1], $errcounts[$i][2], $errcounts[$i][3]); | ||
154 | } | ||
155 | |||
142 | print_unhandled(); | 156 | print_unhandled(); |
143 | } | 157 | } |
144 | 158 | ||
diff --git a/tools/perf/scripts/perl/rwtop.pl b/tools/perf/scripts/perl/rwtop.pl new file mode 100644 index 000000000000..4bb3ecd33472 --- /dev/null +++ b/tools/perf/scripts/perl/rwtop.pl | |||
@@ -0,0 +1,199 @@ | |||
1 | #!/usr/bin/perl -w | ||
2 | # (c) 2010, Tom Zanussi <tzanussi@gmail.com> | ||
3 | # Licensed under the terms of the GNU GPL License version 2 | ||
4 | |||
5 | # read/write top | ||
6 | # | ||
7 | # Periodically displays system-wide r/w call activity, broken down by | ||
8 | # pid. If an [interval] arg is specified, the display will be | ||
9 | # refreshed every [interval] seconds. The default interval is 3 | ||
10 | # seconds. | ||
11 | |||
12 | use 5.010000; | ||
13 | use strict; | ||
14 | use warnings; | ||
15 | |||
16 | use lib "$ENV{'PERF_EXEC_PATH'}/scripts/perl/Perf-Trace-Util/lib"; | ||
17 | use lib "./Perf-Trace-Util/lib"; | ||
18 | use Perf::Trace::Core; | ||
19 | use Perf::Trace::Util; | ||
20 | |||
21 | my $default_interval = 3; | ||
22 | my $nlines = 20; | ||
23 | my $print_thread; | ||
24 | my $print_pending = 0; | ||
25 | |||
26 | my %reads; | ||
27 | my %writes; | ||
28 | |||
29 | my $interval = shift; | ||
30 | if (!$interval) { | ||
31 | $interval = $default_interval; | ||
32 | } | ||
33 | |||
34 | sub syscalls::sys_exit_read | ||
35 | { | ||
36 | my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs, | ||
37 | $common_pid, $common_comm, | ||
38 | $nr, $ret) = @_; | ||
39 | |||
40 | print_check(); | ||
41 | |||
42 | if ($ret > 0) { | ||
43 | $reads{$common_pid}{bytes_read} += $ret; | ||
44 | } else { | ||
45 | if (!defined ($reads{$common_pid}{bytes_read})) { | ||
46 | $reads{$common_pid}{bytes_read} = 0; | ||
47 | } | ||
48 | $reads{$common_pid}{errors}{$ret}++; | ||
49 | } | ||
50 | } | ||
51 | |||
52 | sub syscalls::sys_enter_read | ||
53 | { | ||
54 | my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs, | ||
55 | $common_pid, $common_comm, | ||
56 | $nr, $fd, $buf, $count) = @_; | ||
57 | |||
58 | print_check(); | ||
59 | |||
60 | $reads{$common_pid}{bytes_requested} += $count; | ||
61 | $reads{$common_pid}{total_reads}++; | ||
62 | $reads{$common_pid}{comm} = $common_comm; | ||
63 | } | ||
64 | |||
65 | sub syscalls::sys_exit_write | ||
66 | { | ||
67 | my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs, | ||
68 | $common_pid, $common_comm, | ||
69 | $nr, $ret) = @_; | ||
70 | |||
71 | print_check(); | ||
72 | |||
73 | if ($ret <= 0) { | ||
74 | $writes{$common_pid}{errors}{$ret}++; | ||
75 | } | ||
76 | } | ||
77 | |||
78 | sub syscalls::sys_enter_write | ||
79 | { | ||
80 | my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs, | ||
81 | $common_pid, $common_comm, | ||
82 | $nr, $fd, $buf, $count) = @_; | ||
83 | |||
84 | print_check(); | ||
85 | |||
86 | $writes{$common_pid}{bytes_written} += $count; | ||
87 | $writes{$common_pid}{total_writes}++; | ||
88 | $writes{$common_pid}{comm} = $common_comm; | ||
89 | } | ||
90 | |||
91 | sub trace_begin | ||
92 | { | ||
93 | $SIG{ALRM} = \&set_print_pending; | ||
94 | alarm 1; | ||
95 | } | ||
96 | |||
97 | sub trace_end | ||
98 | { | ||
99 | print_unhandled(); | ||
100 | print_totals(); | ||
101 | } | ||
102 | |||
103 | sub print_check() | ||
104 | { | ||
105 | if ($print_pending == 1) { | ||
106 | $print_pending = 0; | ||
107 | print_totals(); | ||
108 | } | ||
109 | } | ||
110 | |||
111 | sub set_print_pending() | ||
112 | { | ||
113 | $print_pending = 1; | ||
114 | alarm $interval; | ||
115 | } | ||
116 | |||
117 | sub print_totals | ||
118 | { | ||
119 | my $count; | ||
120 | |||
121 | $count = 0; | ||
122 | |||
123 | clear_term(); | ||
124 | |||
125 | printf("\nread counts by pid:\n\n"); | ||
126 | |||
127 | printf("%6s %20s %10s %10s %10s\n", "pid", "comm", | ||
128 | "# reads", "bytes_req", "bytes_read"); | ||
129 | printf("%6s %-20s %10s %10s %10s\n", "------", "--------------------", | ||
130 | "----------", "----------", "----------"); | ||
131 | |||
132 | foreach my $pid (sort { ($reads{$b}{bytes_read} || 0) <=> | ||
133 | ($reads{$a}{bytes_read} || 0) } keys %reads) { | ||
134 | my $comm = $reads{$pid}{comm} || ""; | ||
135 | my $total_reads = $reads{$pid}{total_reads} || 0; | ||
136 | my $bytes_requested = $reads{$pid}{bytes_requested} || 0; | ||
137 | my $bytes_read = $reads{$pid}{bytes_read} || 0; | ||
138 | |||
139 | printf("%6s %-20s %10s %10s %10s\n", $pid, $comm, | ||
140 | $total_reads, $bytes_requested, $bytes_read); | ||
141 | |||
142 | if (++$count == $nlines) { | ||
143 | last; | ||
144 | } | ||
145 | } | ||
146 | |||
147 | $count = 0; | ||
148 | |||
149 | printf("\nwrite counts by pid:\n\n"); | ||
150 | |||
151 | printf("%6s %20s %10s %13s\n", "pid", "comm", | ||
152 | "# writes", "bytes_written"); | ||
153 | printf("%6s %-20s %10s %13s\n", "------", "--------------------", | ||
154 | "----------", "-------------"); | ||
155 | |||
156 | foreach my $pid (sort { ($writes{$b}{bytes_written} || 0) <=> | ||
157 | ($writes{$a}{bytes_written} || 0)} keys %writes) { | ||
158 | my $comm = $writes{$pid}{comm} || ""; | ||
159 | my $total_writes = $writes{$pid}{total_writes} || 0; | ||
160 | my $bytes_written = $writes{$pid}{bytes_written} || 0; | ||
161 | |||
162 | printf("%6s %-20s %10s %13s\n", $pid, $comm, | ||
163 | $total_writes, $bytes_written); | ||
164 | |||
165 | if (++$count == $nlines) { | ||
166 | last; | ||
167 | } | ||
168 | } | ||
169 | |||
170 | %reads = (); | ||
171 | %writes = (); | ||
172 | } | ||
173 | |||
174 | my %unhandled; | ||
175 | |||
176 | sub print_unhandled | ||
177 | { | ||
178 | if ((scalar keys %unhandled) == 0) { | ||
179 | return; | ||
180 | } | ||
181 | |||
182 | print "\nunhandled events:\n\n"; | ||
183 | |||
184 | printf("%-40s %10s\n", "event", "count"); | ||
185 | printf("%-40s %10s\n", "----------------------------------------", | ||
186 | "-----------"); | ||
187 | |||
188 | foreach my $event_name (keys %unhandled) { | ||
189 | printf("%-40s %10d\n", $event_name, $unhandled{$event_name}); | ||
190 | } | ||
191 | } | ||
192 | |||
193 | sub trace_unhandled | ||
194 | { | ||
195 | my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs, | ||
196 | $common_pid, $common_comm) = @_; | ||
197 | |||
198 | $unhandled{$event_name}++; | ||
199 | } | ||
diff --git a/tools/perf/scripts/perl/wakeup-latency.pl b/tools/perf/scripts/perl/wakeup-latency.pl index ed58ef284e23..d9143dcec6c6 100644 --- a/tools/perf/scripts/perl/wakeup-latency.pl +++ b/tools/perf/scripts/perl/wakeup-latency.pl | |||
@@ -22,8 +22,8 @@ my %last_wakeup; | |||
22 | 22 | ||
23 | my $max_wakeup_latency; | 23 | my $max_wakeup_latency; |
24 | my $min_wakeup_latency; | 24 | my $min_wakeup_latency; |
25 | my $total_wakeup_latency; | 25 | my $total_wakeup_latency = 0; |
26 | my $total_wakeups; | 26 | my $total_wakeups = 0; |
27 | 27 | ||
28 | sub sched::sched_switch | 28 | sub sched::sched_switch |
29 | { | 29 | { |
@@ -67,8 +67,12 @@ sub trace_end | |||
67 | { | 67 | { |
68 | printf("wakeup_latency stats:\n\n"); | 68 | printf("wakeup_latency stats:\n\n"); |
69 | print "total_wakeups: $total_wakeups\n"; | 69 | print "total_wakeups: $total_wakeups\n"; |
70 | printf("avg_wakeup_latency (ns): %u\n", | 70 | if ($total_wakeups) { |
71 | avg($total_wakeup_latency, $total_wakeups)); | 71 | printf("avg_wakeup_latency (ns): %u\n", |
72 | avg($total_wakeup_latency, $total_wakeups)); | ||
73 | } else { | ||
74 | printf("avg_wakeup_latency (ns): N/A\n"); | ||
75 | } | ||
72 | printf("min_wakeup_latency (ns): %u\n", $min_wakeup_latency); | 76 | printf("min_wakeup_latency (ns): %u\n", $min_wakeup_latency); |
73 | printf("max_wakeup_latency (ns): %u\n", $max_wakeup_latency); | 77 | printf("max_wakeup_latency (ns): %u\n", $max_wakeup_latency); |
74 | 78 | ||
diff --git a/tools/perf/scripts/perl/workqueue-stats.pl b/tools/perf/scripts/perl/workqueue-stats.pl index 511302c8a494..b84b12699b70 100644 --- a/tools/perf/scripts/perl/workqueue-stats.pl +++ b/tools/perf/scripts/perl/workqueue-stats.pl | |||
@@ -71,9 +71,9 @@ sub trace_end | |||
71 | printf("%3s %6s %6s\t%-20s\n", "---", "---", "----", "----"); | 71 | printf("%3s %6s %6s\t%-20s\n", "---", "---", "----", "----"); |
72 | foreach my $pidhash (@cpus) { | 72 | foreach my $pidhash (@cpus) { |
73 | while ((my $pid, my $wqhash) = each %$pidhash) { | 73 | while ((my $pid, my $wqhash) = each %$pidhash) { |
74 | my $ins = $$wqhash{'inserted'}; | 74 | my $ins = $$wqhash{'inserted'} || 0; |
75 | my $exe = $$wqhash{'executed'}; | 75 | my $exe = $$wqhash{'executed'} || 0; |
76 | my $comm = $$wqhash{'comm'}; | 76 | my $comm = $$wqhash{'comm'} || ""; |
77 | if ($ins || $exe) { | 77 | if ($ins || $exe) { |
78 | printf("%3u %6u %6u\t%-20s\n", $cpu, $ins, $exe, $comm); | 78 | printf("%3u %6u %6u\t%-20s\n", $cpu, $ins, $exe, $comm); |
79 | } | 79 | } |
@@ -87,9 +87,9 @@ sub trace_end | |||
87 | printf("%3s %6s %6s\t%-20s\n", "---", "-------", "---------", "----"); | 87 | printf("%3s %6s %6s\t%-20s\n", "---", "-------", "---------", "----"); |
88 | foreach my $pidhash (@cpus) { | 88 | foreach my $pidhash (@cpus) { |
89 | while ((my $pid, my $wqhash) = each %$pidhash) { | 89 | while ((my $pid, my $wqhash) = each %$pidhash) { |
90 | my $created = $$wqhash{'created'}; | 90 | my $created = $$wqhash{'created'} || 0; |
91 | my $destroyed = $$wqhash{'destroyed'}; | 91 | my $destroyed = $$wqhash{'destroyed'} || 0; |
92 | my $comm = $$wqhash{'comm'}; | 92 | my $comm = $$wqhash{'comm'} || ""; |
93 | if ($created || $destroyed) { | 93 | if ($created || $destroyed) { |
94 | printf("%3u %6u %6u\t%-20s\n", $cpu, $created, $destroyed, | 94 | printf("%3u %6u %6u\t%-20s\n", $cpu, $created, $destroyed, |
95 | $comm); | 95 | $comm); |
diff --git a/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py b/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py index 83e91435ed09..9689bc0acd9f 100644 --- a/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py +++ b/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py | |||
@@ -23,3 +23,6 @@ def nsecs_nsecs(nsecs): | |||
23 | def nsecs_str(nsecs): | 23 | def nsecs_str(nsecs): |
24 | str = "%5u.%09u" % (nsecs_secs(nsecs), nsecs_nsecs(nsecs)), | 24 | str = "%5u.%09u" % (nsecs_secs(nsecs), nsecs_nsecs(nsecs)), |
25 | return str | 25 | return str |
26 | |||
27 | def clear_term(): | ||
28 | print("\x1b[H\x1b[2J") | ||
diff --git a/tools/perf/scripts/python/bin/failed-syscalls-by-pid-record b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-record index f8885d389e6f..eb5846bcb565 100644 --- a/tools/perf/scripts/python/bin/failed-syscalls-by-pid-record +++ b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e raw_syscalls:sys_exit | 2 | perf record -a -e raw_syscalls:sys_exit $@ |
diff --git a/tools/perf/scripts/python/bin/failed-syscalls-by-pid-report b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-report index 1e0c0a860c87..30293545fcc2 100644 --- a/tools/perf/scripts/python/bin/failed-syscalls-by-pid-report +++ b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-report | |||
@@ -1,4 +1,10 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide failed syscalls, by pid | 2 | # description: system-wide failed syscalls, by pid |
3 | # args: [comm] | 3 | # args: [comm] |
4 | perf trace -s ~/libexec/perf-core/scripts/python/failed-syscalls-by-pid.py $1 | 4 | if [ $# -gt 0 ] ; then |
5 | if ! expr match "$1" "-" > /dev/null ; then | ||
6 | comm=$1 | ||
7 | shift | ||
8 | fi | ||
9 | fi | ||
10 | perf trace $@ -s ~/libexec/perf-core/scripts/python/failed-syscalls-by-pid.py $comm | ||
diff --git a/tools/perf/scripts/python/bin/sctop-record b/tools/perf/scripts/python/bin/sctop-record new file mode 100644 index 000000000000..1fc5998b721d --- /dev/null +++ b/tools/perf/scripts/python/bin/sctop-record | |||
@@ -0,0 +1,2 @@ | |||
1 | #!/bin/bash | ||
2 | perf record -a -e raw_syscalls:sys_enter $@ | ||
diff --git a/tools/perf/scripts/python/bin/sctop-report b/tools/perf/scripts/python/bin/sctop-report new file mode 100644 index 000000000000..b01c842ae7b4 --- /dev/null +++ b/tools/perf/scripts/python/bin/sctop-report | |||
@@ -0,0 +1,24 @@ | |||
1 | #!/bin/bash | ||
2 | # description: syscall top | ||
3 | # args: [comm] [interval] | ||
4 | n_args=0 | ||
5 | for i in "$@" | ||
6 | do | ||
7 | if expr match "$i" "-" > /dev/null ; then | ||
8 | break | ||
9 | fi | ||
10 | n_args=$(( $n_args + 1 )) | ||
11 | done | ||
12 | if [ "$n_args" -gt 2 ] ; then | ||
13 | echo "usage: sctop-report [comm] [interval]" | ||
14 | exit | ||
15 | fi | ||
16 | if [ "$n_args" -gt 1 ] ; then | ||
17 | comm=$1 | ||
18 | interval=$2 | ||
19 | shift 2 | ||
20 | elif [ "$n_args" -gt 0 ] ; then | ||
21 | interval=$1 | ||
22 | shift | ||
23 | fi | ||
24 | perf trace $@ -s ~/libexec/perf-core/scripts/python/sctop.py $comm $interval | ||
diff --git a/tools/perf/scripts/python/bin/syscall-counts-by-pid-record b/tools/perf/scripts/python/bin/syscall-counts-by-pid-record index 45a8c50359da..1fc5998b721d 100644 --- a/tools/perf/scripts/python/bin/syscall-counts-by-pid-record +++ b/tools/perf/scripts/python/bin/syscall-counts-by-pid-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e raw_syscalls:sys_enter | 2 | perf record -a -e raw_syscalls:sys_enter $@ |
diff --git a/tools/perf/scripts/python/bin/syscall-counts-by-pid-report b/tools/perf/scripts/python/bin/syscall-counts-by-pid-report index f8044d192271..9e9d8ddd72ce 100644 --- a/tools/perf/scripts/python/bin/syscall-counts-by-pid-report +++ b/tools/perf/scripts/python/bin/syscall-counts-by-pid-report | |||
@@ -1,4 +1,10 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide syscall counts, by pid | 2 | # description: system-wide syscall counts, by pid |
3 | # args: [comm] | 3 | # args: [comm] |
4 | perf trace -s ~/libexec/perf-core/scripts/python/syscall-counts-by-pid.py $1 | 4 | if [ $# -gt 0 ] ; then |
5 | if ! expr match "$1" "-" > /dev/null ; then | ||
6 | comm=$1 | ||
7 | shift | ||
8 | fi | ||
9 | fi | ||
10 | perf trace $@ -s ~/libexec/perf-core/scripts/python/syscall-counts-by-pid.py $comm | ||
diff --git a/tools/perf/scripts/python/bin/syscall-counts-record b/tools/perf/scripts/python/bin/syscall-counts-record index 45a8c50359da..1fc5998b721d 100644 --- a/tools/perf/scripts/python/bin/syscall-counts-record +++ b/tools/perf/scripts/python/bin/syscall-counts-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e raw_syscalls:sys_enter | 2 | perf record -a -e raw_syscalls:sys_enter $@ |
diff --git a/tools/perf/scripts/python/bin/syscall-counts-report b/tools/perf/scripts/python/bin/syscall-counts-report index a366aa61612f..dc076b618796 100644 --- a/tools/perf/scripts/python/bin/syscall-counts-report +++ b/tools/perf/scripts/python/bin/syscall-counts-report | |||
@@ -1,4 +1,10 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide syscall counts | 2 | # description: system-wide syscall counts |
3 | # args: [comm] | 3 | # args: [comm] |
4 | perf trace -s ~/libexec/perf-core/scripts/python/syscall-counts.py $1 | 4 | if [ $# -gt 0 ] ; then |
5 | if ! expr match "$1" "-" > /dev/null ; then | ||
6 | comm=$1 | ||
7 | shift | ||
8 | fi | ||
9 | fi | ||
10 | perf trace $@ -s ~/libexec/perf-core/scripts/python/syscall-counts.py $comm | ||
diff --git a/tools/perf/scripts/python/sctop.py b/tools/perf/scripts/python/sctop.py new file mode 100644 index 000000000000..6cafad40c296 --- /dev/null +++ b/tools/perf/scripts/python/sctop.py | |||
@@ -0,0 +1,78 @@ | |||
1 | # system call top | ||
2 | # (c) 2010, Tom Zanussi <tzanussi@gmail.com> | ||
3 | # Licensed under the terms of the GNU GPL License version 2 | ||
4 | # | ||
5 | # Periodically displays system-wide system call totals, broken down by | ||
6 | # syscall. If a [comm] arg is specified, only syscalls called by | ||
7 | # [comm] are displayed. If an [interval] arg is specified, the display | ||
8 | # will be refreshed every [interval] seconds. The default interval is | ||
9 | # 3 seconds. | ||
10 | |||
11 | import thread | ||
12 | import time | ||
13 | import os | ||
14 | import sys | ||
15 | |||
16 | sys.path.append(os.environ['PERF_EXEC_PATH'] + \ | ||
17 | '/scripts/python/Perf-Trace-Util/lib/Perf/Trace') | ||
18 | |||
19 | from perf_trace_context import * | ||
20 | from Core import * | ||
21 | from Util import * | ||
22 | |||
23 | usage = "perf trace -s syscall-counts.py [comm] [interval]\n"; | ||
24 | |||
25 | for_comm = None | ||
26 | default_interval = 3 | ||
27 | interval = default_interval | ||
28 | |||
29 | if len(sys.argv) > 3: | ||
30 | sys.exit(usage) | ||
31 | |||
32 | if len(sys.argv) > 2: | ||
33 | for_comm = sys.argv[1] | ||
34 | interval = int(sys.argv[2]) | ||
35 | elif len(sys.argv) > 1: | ||
36 | try: | ||
37 | interval = int(sys.argv[1]) | ||
38 | except ValueError: | ||
39 | for_comm = sys.argv[1] | ||
40 | interval = default_interval | ||
41 | |||
42 | syscalls = autodict() | ||
43 | |||
44 | def trace_begin(): | ||
45 | thread.start_new_thread(print_syscall_totals, (interval,)) | ||
46 | pass | ||
47 | |||
48 | def raw_syscalls__sys_enter(event_name, context, common_cpu, | ||
49 | common_secs, common_nsecs, common_pid, common_comm, | ||
50 | id, args): | ||
51 | if for_comm is not None: | ||
52 | if common_comm != for_comm: | ||
53 | return | ||
54 | try: | ||
55 | syscalls[id] += 1 | ||
56 | except TypeError: | ||
57 | syscalls[id] = 1 | ||
58 | |||
59 | def print_syscall_totals(interval): | ||
60 | while 1: | ||
61 | clear_term() | ||
62 | if for_comm is not None: | ||
63 | print "\nsyscall events for %s:\n\n" % (for_comm), | ||
64 | else: | ||
65 | print "\nsyscall events:\n\n", | ||
66 | |||
67 | print "%-40s %10s\n" % ("event", "count"), | ||
68 | print "%-40s %10s\n" % ("----------------------------------------", \ | ||
69 | "----------"), | ||
70 | |||
71 | for id, val in sorted(syscalls.iteritems(), key = lambda(k, v): (v, k), \ | ||
72 | reverse = True): | ||
73 | try: | ||
74 | print "%-40d %10d\n" % (id, val), | ||
75 | except TypeError: | ||
76 | pass | ||
77 | syscalls.clear() | ||
78 | time.sleep(interval) | ||
diff --git a/tools/perf/util/PERF-VERSION-GEN b/tools/perf/util/PERF-VERSION-GEN index 54552a00a117..49ece7921914 100755 --- a/tools/perf/util/PERF-VERSION-GEN +++ b/tools/perf/util/PERF-VERSION-GEN | |||
@@ -1,6 +1,10 @@ | |||
1 | #!/bin/sh | 1 | #!/bin/sh |
2 | 2 | ||
3 | GVF=PERF-VERSION-FILE | 3 | if [ $# -eq 1 ] ; then |
4 | OUTPUT=$1 | ||
5 | fi | ||
6 | |||
7 | GVF=${OUTPUT}PERF-VERSION-FILE | ||
4 | DEF_VER=v0.0.2.PERF | 8 | DEF_VER=v0.0.2.PERF |
5 | 9 | ||
6 | LF=' | 10 | LF=' |
diff --git a/tools/perf/util/bitmap.c b/tools/perf/util/bitmap.c new file mode 100644 index 000000000000..5e230acae1e9 --- /dev/null +++ b/tools/perf/util/bitmap.c | |||
@@ -0,0 +1,21 @@ | |||
1 | /* | ||
2 | * From lib/bitmap.c | ||
3 | * Helper functions for bitmap.h. | ||
4 | * | ||
5 | * This source code is licensed under the GNU General Public License, | ||
6 | * Version 2. See the file COPYING for more details. | ||
7 | */ | ||
8 | #include <linux/bitmap.h> | ||
9 | |||
10 | int __bitmap_weight(const unsigned long *bitmap, int bits) | ||
11 | { | ||
12 | int k, w = 0, lim = bits/BITS_PER_LONG; | ||
13 | |||
14 | for (k = 0; k < lim; k++) | ||
15 | w += hweight_long(bitmap[k]); | ||
16 | |||
17 | if (bits % BITS_PER_LONG) | ||
18 | w += hweight_long(bitmap[k] & BITMAP_LAST_WORD_MASK(bits)); | ||
19 | |||
20 | return w; | ||
21 | } | ||
diff --git a/tools/perf/util/build-id.c b/tools/perf/util/build-id.c index 04904b35ba81..0f60a3906808 100644 --- a/tools/perf/util/build-id.c +++ b/tools/perf/util/build-id.c | |||
@@ -24,7 +24,7 @@ static int build_id__mark_dso_hit(event_t *event, struct perf_session *session) | |||
24 | } | 24 | } |
25 | 25 | ||
26 | thread__find_addr_map(thread, session, cpumode, MAP__FUNCTION, | 26 | thread__find_addr_map(thread, session, cpumode, MAP__FUNCTION, |
27 | event->ip.ip, &al); | 27 | event->ip.pid, event->ip.ip, &al); |
28 | 28 | ||
29 | if (al.map != NULL) | 29 | if (al.map != NULL) |
30 | al.map->dso->hit = 1; | 30 | al.map->dso->hit = 1; |
diff --git a/tools/perf/util/cache.h b/tools/perf/util/cache.h index 918eb376abe3..4b9aab7f0405 100644 --- a/tools/perf/util/cache.h +++ b/tools/perf/util/cache.h | |||
@@ -1,6 +1,7 @@ | |||
1 | #ifndef __PERF_CACHE_H | 1 | #ifndef __PERF_CACHE_H |
2 | #define __PERF_CACHE_H | 2 | #define __PERF_CACHE_H |
3 | 3 | ||
4 | #include <stdbool.h> | ||
4 | #include "util.h" | 5 | #include "util.h" |
5 | #include "strbuf.h" | 6 | #include "strbuf.h" |
6 | #include "../perf.h" | 7 | #include "../perf.h" |
@@ -69,6 +70,19 @@ extern const char *pager_program; | |||
69 | extern int pager_in_use(void); | 70 | extern int pager_in_use(void); |
70 | extern int pager_use_color; | 71 | extern int pager_use_color; |
71 | 72 | ||
73 | extern bool use_browser; | ||
74 | |||
75 | #ifdef NO_NEWT_SUPPORT | ||
76 | static inline void setup_browser(void) | ||
77 | { | ||
78 | setup_pager(); | ||
79 | } | ||
80 | static inline void exit_browser(bool wait_for_ok __used) {} | ||
81 | #else | ||
82 | void setup_browser(void); | ||
83 | void exit_browser(bool wait_for_ok); | ||
84 | #endif | ||
85 | |||
72 | extern const char *editor_program; | 86 | extern const char *editor_program; |
73 | extern const char *excludes_file; | 87 | extern const char *excludes_file; |
74 | 88 | ||
diff --git a/tools/perf/util/callchain.c b/tools/perf/util/callchain.c index b3b71258272a..21a52e0a4435 100644 --- a/tools/perf/util/callchain.c +++ b/tools/perf/util/callchain.c | |||
@@ -1,5 +1,5 @@ | |||
1 | /* | 1 | /* |
2 | * Copyright (C) 2009, Frederic Weisbecker <fweisbec@gmail.com> | 2 | * Copyright (C) 2009-2010, Frederic Weisbecker <fweisbec@gmail.com> |
3 | * | 3 | * |
4 | * Handle the callchains from the stream in an ad-hoc radix tree and then | 4 | * Handle the callchains from the stream in an ad-hoc radix tree and then |
5 | * sort them in an rbtree. | 5 | * sort them in an rbtree. |
@@ -17,6 +17,13 @@ | |||
17 | 17 | ||
18 | #include "callchain.h" | 18 | #include "callchain.h" |
19 | 19 | ||
20 | bool ip_callchain__valid(struct ip_callchain *chain, event_t *event) | ||
21 | { | ||
22 | unsigned int chain_size = event->header.size; | ||
23 | chain_size -= (unsigned long)&event->ip.__more_data - (unsigned long)event; | ||
24 | return chain->nr * sizeof(u64) <= chain_size; | ||
25 | } | ||
26 | |||
20 | #define chain_for_each_child(child, parent) \ | 27 | #define chain_for_each_child(child, parent) \ |
21 | list_for_each_entry(child, &parent->children, brothers) | 28 | list_for_each_entry(child, &parent->children, brothers) |
22 | 29 | ||
@@ -160,7 +167,7 @@ create_child(struct callchain_node *parent, bool inherit_children) | |||
160 | { | 167 | { |
161 | struct callchain_node *new; | 168 | struct callchain_node *new; |
162 | 169 | ||
163 | new = malloc(sizeof(*new)); | 170 | new = zalloc(sizeof(*new)); |
164 | if (!new) { | 171 | if (!new) { |
165 | perror("not enough memory to create child for code path tree"); | 172 | perror("not enough memory to create child for code path tree"); |
166 | return NULL; | 173 | return NULL; |
@@ -183,25 +190,36 @@ create_child(struct callchain_node *parent, bool inherit_children) | |||
183 | return new; | 190 | return new; |
184 | } | 191 | } |
185 | 192 | ||
193 | |||
194 | struct resolved_ip { | ||
195 | u64 ip; | ||
196 | struct map_symbol ms; | ||
197 | }; | ||
198 | |||
199 | struct resolved_chain { | ||
200 | u64 nr; | ||
201 | struct resolved_ip ips[0]; | ||
202 | }; | ||
203 | |||
204 | |||
186 | /* | 205 | /* |
187 | * Fill the node with callchain values | 206 | * Fill the node with callchain values |
188 | */ | 207 | */ |
189 | static void | 208 | static void |
190 | fill_node(struct callchain_node *node, struct ip_callchain *chain, | 209 | fill_node(struct callchain_node *node, struct resolved_chain *chain, int start) |
191 | int start, struct symbol **syms) | ||
192 | { | 210 | { |
193 | unsigned int i; | 211 | unsigned int i; |
194 | 212 | ||
195 | for (i = start; i < chain->nr; i++) { | 213 | for (i = start; i < chain->nr; i++) { |
196 | struct callchain_list *call; | 214 | struct callchain_list *call; |
197 | 215 | ||
198 | call = malloc(sizeof(*call)); | 216 | call = zalloc(sizeof(*call)); |
199 | if (!call) { | 217 | if (!call) { |
200 | perror("not enough memory for the code path tree"); | 218 | perror("not enough memory for the code path tree"); |
201 | return; | 219 | return; |
202 | } | 220 | } |
203 | call->ip = chain->ips[i]; | 221 | call->ip = chain->ips[i].ip; |
204 | call->sym = syms[i]; | 222 | call->ms = chain->ips[i].ms; |
205 | list_add_tail(&call->list, &node->val); | 223 | list_add_tail(&call->list, &node->val); |
206 | } | 224 | } |
207 | node->val_nr = chain->nr - start; | 225 | node->val_nr = chain->nr - start; |
@@ -210,13 +228,13 @@ fill_node(struct callchain_node *node, struct ip_callchain *chain, | |||
210 | } | 228 | } |
211 | 229 | ||
212 | static void | 230 | static void |
213 | add_child(struct callchain_node *parent, struct ip_callchain *chain, | 231 | add_child(struct callchain_node *parent, struct resolved_chain *chain, |
214 | int start, struct symbol **syms) | 232 | int start) |
215 | { | 233 | { |
216 | struct callchain_node *new; | 234 | struct callchain_node *new; |
217 | 235 | ||
218 | new = create_child(parent, false); | 236 | new = create_child(parent, false); |
219 | fill_node(new, chain, start, syms); | 237 | fill_node(new, chain, start); |
220 | 238 | ||
221 | new->children_hit = 0; | 239 | new->children_hit = 0; |
222 | new->hit = 1; | 240 | new->hit = 1; |
@@ -228,9 +246,8 @@ add_child(struct callchain_node *parent, struct ip_callchain *chain, | |||
228 | * Then create another child to host the given callchain of new branch | 246 | * Then create another child to host the given callchain of new branch |
229 | */ | 247 | */ |
230 | static void | 248 | static void |
231 | split_add_child(struct callchain_node *parent, struct ip_callchain *chain, | 249 | split_add_child(struct callchain_node *parent, struct resolved_chain *chain, |
232 | struct callchain_list *to_split, int idx_parents, int idx_local, | 250 | struct callchain_list *to_split, int idx_parents, int idx_local) |
233 | struct symbol **syms) | ||
234 | { | 251 | { |
235 | struct callchain_node *new; | 252 | struct callchain_node *new; |
236 | struct list_head *old_tail; | 253 | struct list_head *old_tail; |
@@ -257,7 +274,7 @@ split_add_child(struct callchain_node *parent, struct ip_callchain *chain, | |||
257 | /* create a new child for the new branch if any */ | 274 | /* create a new child for the new branch if any */ |
258 | if (idx_total < chain->nr) { | 275 | if (idx_total < chain->nr) { |
259 | parent->hit = 0; | 276 | parent->hit = 0; |
260 | add_child(parent, chain, idx_total, syms); | 277 | add_child(parent, chain, idx_total); |
261 | parent->children_hit++; | 278 | parent->children_hit++; |
262 | } else { | 279 | } else { |
263 | parent->hit = 1; | 280 | parent->hit = 1; |
@@ -265,32 +282,33 @@ split_add_child(struct callchain_node *parent, struct ip_callchain *chain, | |||
265 | } | 282 | } |
266 | 283 | ||
267 | static int | 284 | static int |
268 | __append_chain(struct callchain_node *root, struct ip_callchain *chain, | 285 | __append_chain(struct callchain_node *root, struct resolved_chain *chain, |
269 | unsigned int start, struct symbol **syms); | 286 | unsigned int start); |
270 | 287 | ||
271 | static void | 288 | static void |
272 | __append_chain_children(struct callchain_node *root, struct ip_callchain *chain, | 289 | __append_chain_children(struct callchain_node *root, |
273 | struct symbol **syms, unsigned int start) | 290 | struct resolved_chain *chain, |
291 | unsigned int start) | ||
274 | { | 292 | { |
275 | struct callchain_node *rnode; | 293 | struct callchain_node *rnode; |
276 | 294 | ||
277 | /* lookup in childrens */ | 295 | /* lookup in childrens */ |
278 | chain_for_each_child(rnode, root) { | 296 | chain_for_each_child(rnode, root) { |
279 | unsigned int ret = __append_chain(rnode, chain, start, syms); | 297 | unsigned int ret = __append_chain(rnode, chain, start); |
280 | 298 | ||
281 | if (!ret) | 299 | if (!ret) |
282 | goto inc_children_hit; | 300 | goto inc_children_hit; |
283 | } | 301 | } |
284 | /* nothing in children, add to the current node */ | 302 | /* nothing in children, add to the current node */ |
285 | add_child(root, chain, start, syms); | 303 | add_child(root, chain, start); |
286 | 304 | ||
287 | inc_children_hit: | 305 | inc_children_hit: |
288 | root->children_hit++; | 306 | root->children_hit++; |
289 | } | 307 | } |
290 | 308 | ||
291 | static int | 309 | static int |
292 | __append_chain(struct callchain_node *root, struct ip_callchain *chain, | 310 | __append_chain(struct callchain_node *root, struct resolved_chain *chain, |
293 | unsigned int start, struct symbol **syms) | 311 | unsigned int start) |
294 | { | 312 | { |
295 | struct callchain_list *cnode; | 313 | struct callchain_list *cnode; |
296 | unsigned int i = start; | 314 | unsigned int i = start; |
@@ -302,13 +320,19 @@ __append_chain(struct callchain_node *root, struct ip_callchain *chain, | |||
302 | * anywhere inside a function. | 320 | * anywhere inside a function. |
303 | */ | 321 | */ |
304 | list_for_each_entry(cnode, &root->val, list) { | 322 | list_for_each_entry(cnode, &root->val, list) { |
323 | struct symbol *sym; | ||
324 | |||
305 | if (i == chain->nr) | 325 | if (i == chain->nr) |
306 | break; | 326 | break; |
307 | if (cnode->sym && syms[i]) { | 327 | |
308 | if (cnode->sym->start != syms[i]->start) | 328 | sym = chain->ips[i].ms.sym; |
329 | |||
330 | if (cnode->ms.sym && sym) { | ||
331 | if (cnode->ms.sym->start != sym->start) | ||
309 | break; | 332 | break; |
310 | } else if (cnode->ip != chain->ips[i]) | 333 | } else if (cnode->ip != chain->ips[i].ip) |
311 | break; | 334 | break; |
335 | |||
312 | if (!found) | 336 | if (!found) |
313 | found = true; | 337 | found = true; |
314 | i++; | 338 | i++; |
@@ -320,7 +344,7 @@ __append_chain(struct callchain_node *root, struct ip_callchain *chain, | |||
320 | 344 | ||
321 | /* we match only a part of the node. Split it and add the new chain */ | 345 | /* we match only a part of the node. Split it and add the new chain */ |
322 | if (i - start < root->val_nr) { | 346 | if (i - start < root->val_nr) { |
323 | split_add_child(root, chain, cnode, start, i - start, syms); | 347 | split_add_child(root, chain, cnode, start, i - start); |
324 | return 0; | 348 | return 0; |
325 | } | 349 | } |
326 | 350 | ||
@@ -331,15 +355,50 @@ __append_chain(struct callchain_node *root, struct ip_callchain *chain, | |||
331 | } | 355 | } |
332 | 356 | ||
333 | /* We match the node and still have a part remaining */ | 357 | /* We match the node and still have a part remaining */ |
334 | __append_chain_children(root, chain, syms, i); | 358 | __append_chain_children(root, chain, i); |
335 | 359 | ||
336 | return 0; | 360 | return 0; |
337 | } | 361 | } |
338 | 362 | ||
339 | void append_chain(struct callchain_node *root, struct ip_callchain *chain, | 363 | static void filter_context(struct ip_callchain *old, struct resolved_chain *new, |
340 | struct symbol **syms) | 364 | struct map_symbol *syms) |
341 | { | 365 | { |
366 | int i, j = 0; | ||
367 | |||
368 | for (i = 0; i < (int)old->nr; i++) { | ||
369 | if (old->ips[i] >= PERF_CONTEXT_MAX) | ||
370 | continue; | ||
371 | |||
372 | new->ips[j].ip = old->ips[i]; | ||
373 | new->ips[j].ms = syms[i]; | ||
374 | j++; | ||
375 | } | ||
376 | |||
377 | new->nr = j; | ||
378 | } | ||
379 | |||
380 | |||
381 | int append_chain(struct callchain_node *root, struct ip_callchain *chain, | ||
382 | struct map_symbol *syms) | ||
383 | { | ||
384 | struct resolved_chain *filtered; | ||
385 | |||
342 | if (!chain->nr) | 386 | if (!chain->nr) |
343 | return; | 387 | return 0; |
344 | __append_chain_children(root, chain, syms, 0); | 388 | |
389 | filtered = zalloc(sizeof(*filtered) + | ||
390 | chain->nr * sizeof(struct resolved_ip)); | ||
391 | if (!filtered) | ||
392 | return -ENOMEM; | ||
393 | |||
394 | filter_context(chain, filtered, syms); | ||
395 | |||
396 | if (!filtered->nr) | ||
397 | goto end; | ||
398 | |||
399 | __append_chain_children(root, filtered, 0); | ||
400 | end: | ||
401 | free(filtered); | ||
402 | |||
403 | return 0; | ||
345 | } | 404 | } |
diff --git a/tools/perf/util/callchain.h b/tools/perf/util/callchain.h index ad4626de4c2b..1cba1f5504e7 100644 --- a/tools/perf/util/callchain.h +++ b/tools/perf/util/callchain.h | |||
@@ -4,6 +4,7 @@ | |||
4 | #include "../perf.h" | 4 | #include "../perf.h" |
5 | #include <linux/list.h> | 5 | #include <linux/list.h> |
6 | #include <linux/rbtree.h> | 6 | #include <linux/rbtree.h> |
7 | #include "event.h" | ||
7 | #include "util.h" | 8 | #include "util.h" |
8 | #include "symbol.h" | 9 | #include "symbol.h" |
9 | 10 | ||
@@ -33,13 +34,14 @@ typedef void (*sort_chain_func_t)(struct rb_root *, struct callchain_node *, | |||
33 | 34 | ||
34 | struct callchain_param { | 35 | struct callchain_param { |
35 | enum chain_mode mode; | 36 | enum chain_mode mode; |
37 | u32 print_limit; | ||
36 | double min_percent; | 38 | double min_percent; |
37 | sort_chain_func_t sort; | 39 | sort_chain_func_t sort; |
38 | }; | 40 | }; |
39 | 41 | ||
40 | struct callchain_list { | 42 | struct callchain_list { |
41 | u64 ip; | 43 | u64 ip; |
42 | struct symbol *sym; | 44 | struct map_symbol ms; |
43 | struct list_head list; | 45 | struct list_head list; |
44 | }; | 46 | }; |
45 | 47 | ||
@@ -56,6 +58,8 @@ static inline u64 cumul_hits(struct callchain_node *node) | |||
56 | } | 58 | } |
57 | 59 | ||
58 | int register_callchain_param(struct callchain_param *param); | 60 | int register_callchain_param(struct callchain_param *param); |
59 | void append_chain(struct callchain_node *root, struct ip_callchain *chain, | 61 | int append_chain(struct callchain_node *root, struct ip_callchain *chain, |
60 | struct symbol **syms); | 62 | struct map_symbol *syms); |
63 | |||
64 | bool ip_callchain__valid(struct ip_callchain *chain, event_t *event); | ||
61 | #endif /* __PERF_CALLCHAIN_H */ | 65 | #endif /* __PERF_CALLCHAIN_H */ |
diff --git a/tools/perf/util/color.c b/tools/perf/util/color.c index e88bca55a599..e191eb9a667f 100644 --- a/tools/perf/util/color.c +++ b/tools/perf/util/color.c | |||
@@ -166,6 +166,31 @@ int perf_color_default_config(const char *var, const char *value, void *cb) | |||
166 | return perf_default_config(var, value, cb); | 166 | return perf_default_config(var, value, cb); |
167 | } | 167 | } |
168 | 168 | ||
169 | static int __color_vsnprintf(char *bf, size_t size, const char *color, | ||
170 | const char *fmt, va_list args, const char *trail) | ||
171 | { | ||
172 | int r = 0; | ||
173 | |||
174 | /* | ||
175 | * Auto-detect: | ||
176 | */ | ||
177 | if (perf_use_color_default < 0) { | ||
178 | if (isatty(1) || pager_in_use()) | ||
179 | perf_use_color_default = 1; | ||
180 | else | ||
181 | perf_use_color_default = 0; | ||
182 | } | ||
183 | |||
184 | if (perf_use_color_default && *color) | ||
185 | r += snprintf(bf, size, "%s", color); | ||
186 | r += vsnprintf(bf + r, size - r, fmt, args); | ||
187 | if (perf_use_color_default && *color) | ||
188 | r += snprintf(bf + r, size - r, "%s", PERF_COLOR_RESET); | ||
189 | if (trail) | ||
190 | r += snprintf(bf + r, size - r, "%s", trail); | ||
191 | return r; | ||
192 | } | ||
193 | |||
169 | static int __color_vfprintf(FILE *fp, const char *color, const char *fmt, | 194 | static int __color_vfprintf(FILE *fp, const char *color, const char *fmt, |
170 | va_list args, const char *trail) | 195 | va_list args, const char *trail) |
171 | { | 196 | { |
@@ -191,11 +216,28 @@ static int __color_vfprintf(FILE *fp, const char *color, const char *fmt, | |||
191 | return r; | 216 | return r; |
192 | } | 217 | } |
193 | 218 | ||
219 | int color_vsnprintf(char *bf, size_t size, const char *color, | ||
220 | const char *fmt, va_list args) | ||
221 | { | ||
222 | return __color_vsnprintf(bf, size, color, fmt, args, NULL); | ||
223 | } | ||
224 | |||
194 | int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args) | 225 | int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args) |
195 | { | 226 | { |
196 | return __color_vfprintf(fp, color, fmt, args, NULL); | 227 | return __color_vfprintf(fp, color, fmt, args, NULL); |
197 | } | 228 | } |
198 | 229 | ||
230 | int color_snprintf(char *bf, size_t size, const char *color, | ||
231 | const char *fmt, ...) | ||
232 | { | ||
233 | va_list args; | ||
234 | int r; | ||
235 | |||
236 | va_start(args, fmt); | ||
237 | r = color_vsnprintf(bf, size, color, fmt, args); | ||
238 | va_end(args); | ||
239 | return r; | ||
240 | } | ||
199 | 241 | ||
200 | int color_fprintf(FILE *fp, const char *color, const char *fmt, ...) | 242 | int color_fprintf(FILE *fp, const char *color, const char *fmt, ...) |
201 | { | 243 | { |
@@ -274,3 +316,9 @@ int percent_color_fprintf(FILE *fp, const char *fmt, double percent) | |||
274 | 316 | ||
275 | return r; | 317 | return r; |
276 | } | 318 | } |
319 | |||
320 | int percent_color_snprintf(char *bf, size_t size, const char *fmt, double percent) | ||
321 | { | ||
322 | const char *color = get_percent_color(percent); | ||
323 | return color_snprintf(bf, size, color, fmt, percent); | ||
324 | } | ||
diff --git a/tools/perf/util/color.h b/tools/perf/util/color.h index 24e8809210bb..dea082b79602 100644 --- a/tools/perf/util/color.h +++ b/tools/perf/util/color.h | |||
@@ -32,10 +32,14 @@ int perf_color_default_config(const char *var, const char *value, void *cb); | |||
32 | int perf_config_colorbool(const char *var, const char *value, int stdout_is_tty); | 32 | int perf_config_colorbool(const char *var, const char *value, int stdout_is_tty); |
33 | void color_parse(const char *value, const char *var, char *dst); | 33 | void color_parse(const char *value, const char *var, char *dst); |
34 | void color_parse_mem(const char *value, int len, const char *var, char *dst); | 34 | void color_parse_mem(const char *value, int len, const char *var, char *dst); |
35 | int color_vsnprintf(char *bf, size_t size, const char *color, | ||
36 | const char *fmt, va_list args); | ||
35 | int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args); | 37 | int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args); |
36 | int color_fprintf(FILE *fp, const char *color, const char *fmt, ...); | 38 | int color_fprintf(FILE *fp, const char *color, const char *fmt, ...); |
39 | int color_snprintf(char *bf, size_t size, const char *color, const char *fmt, ...); | ||
37 | int color_fprintf_ln(FILE *fp, const char *color, const char *fmt, ...); | 40 | int color_fprintf_ln(FILE *fp, const char *color, const char *fmt, ...); |
38 | int color_fwrite_lines(FILE *fp, const char *color, size_t count, const char *buf); | 41 | int color_fwrite_lines(FILE *fp, const char *color, size_t count, const char *buf); |
42 | int percent_color_snprintf(char *bf, size_t size, const char *fmt, double percent); | ||
39 | int percent_color_fprintf(FILE *fp, const char *fmt, double percent); | 43 | int percent_color_fprintf(FILE *fp, const char *fmt, double percent); |
40 | const char *get_percent_color(double percent); | 44 | const char *get_percent_color(double percent); |
41 | 45 | ||
diff --git a/tools/perf/util/debug.c b/tools/perf/util/debug.c index 0905600c3851..dd824cf3b628 100644 --- a/tools/perf/util/debug.c +++ b/tools/perf/util/debug.c | |||
@@ -6,13 +6,14 @@ | |||
6 | #include <stdarg.h> | 6 | #include <stdarg.h> |
7 | #include <stdio.h> | 7 | #include <stdio.h> |
8 | 8 | ||
9 | #include "cache.h" | ||
9 | #include "color.h" | 10 | #include "color.h" |
10 | #include "event.h" | 11 | #include "event.h" |
11 | #include "debug.h" | 12 | #include "debug.h" |
12 | #include "util.h" | 13 | #include "util.h" |
13 | 14 | ||
14 | int verbose = 0; | 15 | int verbose = 0; |
15 | int dump_trace = 0; | 16 | bool dump_trace = false; |
16 | 17 | ||
17 | int eprintf(int level, const char *fmt, ...) | 18 | int eprintf(int level, const char *fmt, ...) |
18 | { | 19 | { |
@@ -21,7 +22,10 @@ int eprintf(int level, const char *fmt, ...) | |||
21 | 22 | ||
22 | if (verbose >= level) { | 23 | if (verbose >= level) { |
23 | va_start(args, fmt); | 24 | va_start(args, fmt); |
24 | ret = vfprintf(stderr, fmt, args); | 25 | if (use_browser) |
26 | ret = browser__show_help(fmt, args); | ||
27 | else | ||
28 | ret = vfprintf(stderr, fmt, args); | ||
25 | va_end(args); | 29 | va_end(args); |
26 | } | 30 | } |
27 | 31 | ||
diff --git a/tools/perf/util/debug.h b/tools/perf/util/debug.h index c6c24c522dea..047ac3324ebe 100644 --- a/tools/perf/util/debug.h +++ b/tools/perf/util/debug.h | |||
@@ -2,14 +2,38 @@ | |||
2 | #ifndef __PERF_DEBUG_H | 2 | #ifndef __PERF_DEBUG_H |
3 | #define __PERF_DEBUG_H | 3 | #define __PERF_DEBUG_H |
4 | 4 | ||
5 | #include <stdbool.h> | ||
5 | #include "event.h" | 6 | #include "event.h" |
6 | 7 | ||
7 | extern int verbose; | 8 | extern int verbose; |
8 | extern int dump_trace; | 9 | extern bool dump_trace; |
9 | 10 | ||
10 | int eprintf(int level, | ||
11 | const char *fmt, ...) __attribute__((format(printf, 2, 3))); | ||
12 | int dump_printf(const char *fmt, ...) __attribute__((format(printf, 1, 2))); | 11 | int dump_printf(const char *fmt, ...) __attribute__((format(printf, 1, 2))); |
13 | void trace_event(event_t *event); | 12 | void trace_event(event_t *event); |
14 | 13 | ||
14 | struct ui_progress; | ||
15 | |||
16 | #ifdef NO_NEWT_SUPPORT | ||
17 | static inline int browser__show_help(const char *format __used, va_list ap __used) | ||
18 | { | ||
19 | return 0; | ||
20 | } | ||
21 | |||
22 | static inline struct ui_progress *ui_progress__new(const char *title __used, | ||
23 | u64 total __used) | ||
24 | { | ||
25 | return (struct ui_progress *)1; | ||
26 | } | ||
27 | |||
28 | static inline void ui_progress__update(struct ui_progress *self __used, | ||
29 | u64 curr __used) {} | ||
30 | |||
31 | static inline void ui_progress__delete(struct ui_progress *self __used) {} | ||
32 | #else | ||
33 | int browser__show_help(const char *format, va_list ap); | ||
34 | struct ui_progress *ui_progress__new(const char *title, u64 total); | ||
35 | void ui_progress__update(struct ui_progress *self, u64 curr); | ||
36 | void ui_progress__delete(struct ui_progress *self); | ||
37 | #endif | ||
38 | |||
15 | #endif /* __PERF_DEBUG_H */ | 39 | #endif /* __PERF_DEBUG_H */ |
diff --git a/tools/perf/util/event.c b/tools/perf/util/event.c index 705ec63548b4..50771b5813ee 100644 --- a/tools/perf/util/event.c +++ b/tools/perf/util/event.c | |||
@@ -7,6 +7,23 @@ | |||
7 | #include "strlist.h" | 7 | #include "strlist.h" |
8 | #include "thread.h" | 8 | #include "thread.h" |
9 | 9 | ||
10 | const char *event__name[] = { | ||
11 | [0] = "TOTAL", | ||
12 | [PERF_RECORD_MMAP] = "MMAP", | ||
13 | [PERF_RECORD_LOST] = "LOST", | ||
14 | [PERF_RECORD_COMM] = "COMM", | ||
15 | [PERF_RECORD_EXIT] = "EXIT", | ||
16 | [PERF_RECORD_THROTTLE] = "THROTTLE", | ||
17 | [PERF_RECORD_UNTHROTTLE] = "UNTHROTTLE", | ||
18 | [PERF_RECORD_FORK] = "FORK", | ||
19 | [PERF_RECORD_READ] = "READ", | ||
20 | [PERF_RECORD_SAMPLE] = "SAMPLE", | ||
21 | [PERF_RECORD_HEADER_ATTR] = "ATTR", | ||
22 | [PERF_RECORD_HEADER_EVENT_TYPE] = "EVENT_TYPE", | ||
23 | [PERF_RECORD_HEADER_TRACING_DATA] = "TRACING_DATA", | ||
24 | [PERF_RECORD_HEADER_BUILD_ID] = "BUILD_ID", | ||
25 | }; | ||
26 | |||
10 | static pid_t event__synthesize_comm(pid_t pid, int full, | 27 | static pid_t event__synthesize_comm(pid_t pid, int full, |
11 | event__handler_t process, | 28 | event__handler_t process, |
12 | struct perf_session *session) | 29 | struct perf_session *session) |
@@ -112,7 +129,11 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid, | |||
112 | event_t ev = { | 129 | event_t ev = { |
113 | .header = { | 130 | .header = { |
114 | .type = PERF_RECORD_MMAP, | 131 | .type = PERF_RECORD_MMAP, |
115 | .misc = 0, /* Just like the kernel, see kernel/perf_event.c __perf_event_mmap */ | 132 | /* |
133 | * Just like the kernel, see __perf_event_mmap | ||
134 | * in kernel/perf_event.c | ||
135 | */ | ||
136 | .misc = PERF_RECORD_MISC_USER, | ||
116 | }, | 137 | }, |
117 | }; | 138 | }; |
118 | int n; | 139 | int n; |
@@ -130,6 +151,7 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid, | |||
130 | continue; | 151 | continue; |
131 | pbf += n + 3; | 152 | pbf += n + 3; |
132 | if (*pbf == 'x') { /* vm_exec */ | 153 | if (*pbf == 'x') { /* vm_exec */ |
154 | u64 vm_pgoff; | ||
133 | char *execname = strchr(bf, '/'); | 155 | char *execname = strchr(bf, '/'); |
134 | 156 | ||
135 | /* Catch VDSO */ | 157 | /* Catch VDSO */ |
@@ -139,6 +161,14 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid, | |||
139 | if (execname == NULL) | 161 | if (execname == NULL) |
140 | continue; | 162 | continue; |
141 | 163 | ||
164 | pbf += 3; | ||
165 | n = hex2u64(pbf, &vm_pgoff); | ||
166 | /* pgoff is in bytes, not pages */ | ||
167 | if (n >= 0) | ||
168 | ev.mmap.pgoff = vm_pgoff << getpagesize(); | ||
169 | else | ||
170 | ev.mmap.pgoff = 0; | ||
171 | |||
142 | size = strlen(execname); | 172 | size = strlen(execname); |
143 | execname[size - 1] = '\0'; /* Remove \n */ | 173 | execname[size - 1] = '\0'; /* Remove \n */ |
144 | memcpy(ev.mmap.filename, execname, size); | 174 | memcpy(ev.mmap.filename, execname, size); |
@@ -158,11 +188,23 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid, | |||
158 | } | 188 | } |
159 | 189 | ||
160 | int event__synthesize_modules(event__handler_t process, | 190 | int event__synthesize_modules(event__handler_t process, |
161 | struct perf_session *session) | 191 | struct perf_session *session, |
192 | struct machine *machine) | ||
162 | { | 193 | { |
163 | struct rb_node *nd; | 194 | struct rb_node *nd; |
195 | struct map_groups *kmaps = &machine->kmaps; | ||
196 | u16 misc; | ||
197 | |||
198 | /* | ||
199 | * kernel uses 0 for user space maps, see kernel/perf_event.c | ||
200 | * __perf_event_mmap | ||
201 | */ | ||
202 | if (machine__is_host(machine)) | ||
203 | misc = PERF_RECORD_MISC_KERNEL; | ||
204 | else | ||
205 | misc = PERF_RECORD_MISC_GUEST_KERNEL; | ||
164 | 206 | ||
165 | for (nd = rb_first(&session->kmaps.maps[MAP__FUNCTION]); | 207 | for (nd = rb_first(&kmaps->maps[MAP__FUNCTION]); |
166 | nd; nd = rb_next(nd)) { | 208 | nd; nd = rb_next(nd)) { |
167 | event_t ev; | 209 | event_t ev; |
168 | size_t size; | 210 | size_t size; |
@@ -173,12 +215,13 @@ int event__synthesize_modules(event__handler_t process, | |||
173 | 215 | ||
174 | size = ALIGN(pos->dso->long_name_len + 1, sizeof(u64)); | 216 | size = ALIGN(pos->dso->long_name_len + 1, sizeof(u64)); |
175 | memset(&ev, 0, sizeof(ev)); | 217 | memset(&ev, 0, sizeof(ev)); |
176 | ev.mmap.header.misc = 1; /* kernel uses 0 for user space maps, see kernel/perf_event.c __perf_event_mmap */ | 218 | ev.mmap.header.misc = misc; |
177 | ev.mmap.header.type = PERF_RECORD_MMAP; | 219 | ev.mmap.header.type = PERF_RECORD_MMAP; |
178 | ev.mmap.header.size = (sizeof(ev.mmap) - | 220 | ev.mmap.header.size = (sizeof(ev.mmap) - |
179 | (sizeof(ev.mmap.filename) - size)); | 221 | (sizeof(ev.mmap.filename) - size)); |
180 | ev.mmap.start = pos->start; | 222 | ev.mmap.start = pos->start; |
181 | ev.mmap.len = pos->end - pos->start; | 223 | ev.mmap.len = pos->end - pos->start; |
224 | ev.mmap.pid = machine->pid; | ||
182 | 225 | ||
183 | memcpy(ev.mmap.filename, pos->dso->long_name, | 226 | memcpy(ev.mmap.filename, pos->dso->long_name, |
184 | pos->dso->long_name_len + 1); | 227 | pos->dso->long_name_len + 1); |
@@ -241,13 +284,18 @@ static int find_symbol_cb(void *arg, const char *name, char type, u64 start) | |||
241 | 284 | ||
242 | int event__synthesize_kernel_mmap(event__handler_t process, | 285 | int event__synthesize_kernel_mmap(event__handler_t process, |
243 | struct perf_session *session, | 286 | struct perf_session *session, |
287 | struct machine *machine, | ||
244 | const char *symbol_name) | 288 | const char *symbol_name) |
245 | { | 289 | { |
246 | size_t size; | 290 | size_t size; |
291 | const char *filename, *mmap_name; | ||
292 | char path[PATH_MAX]; | ||
293 | char name_buff[PATH_MAX]; | ||
294 | struct map *map; | ||
295 | |||
247 | event_t ev = { | 296 | event_t ev = { |
248 | .header = { | 297 | .header = { |
249 | .type = PERF_RECORD_MMAP, | 298 | .type = PERF_RECORD_MMAP, |
250 | .misc = 1, /* kernel uses 0 for user space maps, see kernel/perf_event.c __perf_event_mmap */ | ||
251 | }, | 299 | }, |
252 | }; | 300 | }; |
253 | /* | 301 | /* |
@@ -257,16 +305,37 @@ int event__synthesize_kernel_mmap(event__handler_t process, | |||
257 | */ | 305 | */ |
258 | struct process_symbol_args args = { .name = symbol_name, }; | 306 | struct process_symbol_args args = { .name = symbol_name, }; |
259 | 307 | ||
260 | if (kallsyms__parse("/proc/kallsyms", &args, find_symbol_cb) <= 0) | 308 | mmap_name = machine__mmap_name(machine, name_buff, sizeof(name_buff)); |
309 | if (machine__is_host(machine)) { | ||
310 | /* | ||
311 | * kernel uses PERF_RECORD_MISC_USER for user space maps, | ||
312 | * see kernel/perf_event.c __perf_event_mmap | ||
313 | */ | ||
314 | ev.header.misc = PERF_RECORD_MISC_KERNEL; | ||
315 | filename = "/proc/kallsyms"; | ||
316 | } else { | ||
317 | ev.header.misc = PERF_RECORD_MISC_GUEST_KERNEL; | ||
318 | if (machine__is_default_guest(machine)) | ||
319 | filename = (char *) symbol_conf.default_guest_kallsyms; | ||
320 | else { | ||
321 | sprintf(path, "%s/proc/kallsyms", machine->root_dir); | ||
322 | filename = path; | ||
323 | } | ||
324 | } | ||
325 | |||
326 | if (kallsyms__parse(filename, &args, find_symbol_cb) <= 0) | ||
261 | return -ENOENT; | 327 | return -ENOENT; |
262 | 328 | ||
329 | map = machine->vmlinux_maps[MAP__FUNCTION]; | ||
263 | size = snprintf(ev.mmap.filename, sizeof(ev.mmap.filename), | 330 | size = snprintf(ev.mmap.filename, sizeof(ev.mmap.filename), |
264 | "[kernel.kallsyms.%s]", symbol_name) + 1; | 331 | "%s%s", mmap_name, symbol_name) + 1; |
265 | size = ALIGN(size, sizeof(u64)); | 332 | size = ALIGN(size, sizeof(u64)); |
266 | ev.mmap.header.size = (sizeof(ev.mmap) - (sizeof(ev.mmap.filename) - size)); | 333 | ev.mmap.header.size = (sizeof(ev.mmap) - |
334 | (sizeof(ev.mmap.filename) - size)); | ||
267 | ev.mmap.pgoff = args.start; | 335 | ev.mmap.pgoff = args.start; |
268 | ev.mmap.start = session->vmlinux_maps[MAP__FUNCTION]->start; | 336 | ev.mmap.start = map->start; |
269 | ev.mmap.len = session->vmlinux_maps[MAP__FUNCTION]->end - ev.mmap.start ; | 337 | ev.mmap.len = map->end - ev.mmap.start; |
338 | ev.mmap.pid = machine->pid; | ||
270 | 339 | ||
271 | return process(&ev, session); | 340 | return process(&ev, session); |
272 | } | 341 | } |
@@ -316,26 +385,54 @@ int event__process_comm(event_t *self, struct perf_session *session) | |||
316 | int event__process_lost(event_t *self, struct perf_session *session) | 385 | int event__process_lost(event_t *self, struct perf_session *session) |
317 | { | 386 | { |
318 | dump_printf(": id:%Ld: lost:%Ld\n", self->lost.id, self->lost.lost); | 387 | dump_printf(": id:%Ld: lost:%Ld\n", self->lost.id, self->lost.lost); |
319 | session->events_stats.lost += self->lost.lost; | 388 | session->hists.stats.total_lost += self->lost.lost; |
320 | return 0; | 389 | return 0; |
321 | } | 390 | } |
322 | 391 | ||
323 | int event__process_mmap(event_t *self, struct perf_session *session) | 392 | static void event_set_kernel_mmap_len(struct map **maps, event_t *self) |
393 | { | ||
394 | maps[MAP__FUNCTION]->start = self->mmap.start; | ||
395 | maps[MAP__FUNCTION]->end = self->mmap.start + self->mmap.len; | ||
396 | /* | ||
397 | * Be a bit paranoid here, some perf.data file came with | ||
398 | * a zero sized synthesized MMAP event for the kernel. | ||
399 | */ | ||
400 | if (maps[MAP__FUNCTION]->end == 0) | ||
401 | maps[MAP__FUNCTION]->end = ~0UL; | ||
402 | } | ||
403 | |||
404 | static int event__process_kernel_mmap(event_t *self, | ||
405 | struct perf_session *session) | ||
324 | { | 406 | { |
325 | struct thread *thread; | ||
326 | struct map *map; | 407 | struct map *map; |
408 | char kmmap_prefix[PATH_MAX]; | ||
409 | struct machine *machine; | ||
410 | enum dso_kernel_type kernel_type; | ||
411 | bool is_kernel_mmap; | ||
412 | |||
413 | machine = perf_session__findnew_machine(session, self->mmap.pid); | ||
414 | if (!machine) { | ||
415 | pr_err("Can't find id %d's machine\n", self->mmap.pid); | ||
416 | goto out_problem; | ||
417 | } | ||
327 | 418 | ||
328 | dump_printf(" %d/%d: [%#Lx(%#Lx) @ %#Lx]: %s\n", | 419 | machine__mmap_name(machine, kmmap_prefix, sizeof(kmmap_prefix)); |
329 | self->mmap.pid, self->mmap.tid, self->mmap.start, | 420 | if (machine__is_host(machine)) |
330 | self->mmap.len, self->mmap.pgoff, self->mmap.filename); | 421 | kernel_type = DSO_TYPE_KERNEL; |
422 | else | ||
423 | kernel_type = DSO_TYPE_GUEST_KERNEL; | ||
331 | 424 | ||
332 | if (self->mmap.pid == 0) { | 425 | is_kernel_mmap = memcmp(self->mmap.filename, |
333 | static const char kmmap_prefix[] = "[kernel.kallsyms."; | 426 | kmmap_prefix, |
427 | strlen(kmmap_prefix)) == 0; | ||
428 | if (self->mmap.filename[0] == '/' || | ||
429 | (!is_kernel_mmap && self->mmap.filename[0] == '[')) { | ||
334 | 430 | ||
335 | if (self->mmap.filename[0] == '/') { | 431 | char short_module_name[1024]; |
336 | char short_module_name[1024]; | 432 | char *name, *dot; |
337 | char *name = strrchr(self->mmap.filename, '/'), *dot; | ||
338 | 433 | ||
434 | if (self->mmap.filename[0] == '/') { | ||
435 | name = strrchr(self->mmap.filename, '/'); | ||
339 | if (name == NULL) | 436 | if (name == NULL) |
340 | goto out_problem; | 437 | goto out_problem; |
341 | 438 | ||
@@ -343,58 +440,84 @@ int event__process_mmap(event_t *self, struct perf_session *session) | |||
343 | dot = strrchr(name, '.'); | 440 | dot = strrchr(name, '.'); |
344 | if (dot == NULL) | 441 | if (dot == NULL) |
345 | goto out_problem; | 442 | goto out_problem; |
346 | |||
347 | snprintf(short_module_name, sizeof(short_module_name), | 443 | snprintf(short_module_name, sizeof(short_module_name), |
348 | "[%.*s]", (int)(dot - name), name); | 444 | "[%.*s]", (int)(dot - name), name); |
349 | strxfrchar(short_module_name, '-', '_'); | 445 | strxfrchar(short_module_name, '-', '_'); |
350 | 446 | } else | |
351 | map = perf_session__new_module_map(session, | 447 | strcpy(short_module_name, self->mmap.filename); |
352 | self->mmap.start, | 448 | |
353 | self->mmap.filename); | 449 | map = machine__new_module(machine, self->mmap.start, |
354 | if (map == NULL) | 450 | self->mmap.filename); |
355 | goto out_problem; | 451 | if (map == NULL) |
356 | 452 | goto out_problem; | |
357 | name = strdup(short_module_name); | 453 | |
358 | if (name == NULL) | 454 | name = strdup(short_module_name); |
359 | goto out_problem; | 455 | if (name == NULL) |
360 | 456 | goto out_problem; | |
361 | map->dso->short_name = name; | 457 | |
362 | map->end = map->start + self->mmap.len; | 458 | map->dso->short_name = name; |
363 | } else if (memcmp(self->mmap.filename, kmmap_prefix, | 459 | map->end = map->start + self->mmap.len; |
364 | sizeof(kmmap_prefix) - 1) == 0) { | 460 | } else if (is_kernel_mmap) { |
365 | const char *symbol_name = (self->mmap.filename + | 461 | const char *symbol_name = (self->mmap.filename + |
366 | sizeof(kmmap_prefix) - 1); | 462 | strlen(kmmap_prefix)); |
463 | /* | ||
464 | * Should be there already, from the build-id table in | ||
465 | * the header. | ||
466 | */ | ||
467 | struct dso *kernel = __dsos__findnew(&machine->kernel_dsos, | ||
468 | kmmap_prefix); | ||
469 | if (kernel == NULL) | ||
470 | goto out_problem; | ||
471 | |||
472 | kernel->kernel = kernel_type; | ||
473 | if (__machine__create_kernel_maps(machine, kernel) < 0) | ||
474 | goto out_problem; | ||
475 | |||
476 | event_set_kernel_mmap_len(machine->vmlinux_maps, self); | ||
477 | perf_session__set_kallsyms_ref_reloc_sym(machine->vmlinux_maps, | ||
478 | symbol_name, | ||
479 | self->mmap.pgoff); | ||
480 | if (machine__is_default_guest(machine)) { | ||
367 | /* | 481 | /* |
368 | * Should be there already, from the build-id table in | 482 | * preload dso of guest kernel and modules |
369 | * the header. | ||
370 | */ | 483 | */ |
371 | struct dso *kernel = __dsos__findnew(&dsos__kernel, | 484 | dso__load(kernel, machine->vmlinux_maps[MAP__FUNCTION], |
372 | "[kernel.kallsyms]"); | 485 | NULL); |
373 | if (kernel == NULL) | 486 | } |
374 | goto out_problem; | 487 | } |
375 | 488 | return 0; | |
376 | kernel->kernel = 1; | 489 | out_problem: |
377 | if (__perf_session__create_kernel_maps(session, kernel) < 0) | 490 | return -1; |
378 | goto out_problem; | 491 | } |
379 | 492 | ||
380 | session->vmlinux_maps[MAP__FUNCTION]->start = self->mmap.start; | 493 | int event__process_mmap(event_t *self, struct perf_session *session) |
381 | session->vmlinux_maps[MAP__FUNCTION]->end = self->mmap.start + self->mmap.len; | 494 | { |
382 | /* | 495 | struct machine *machine; |
383 | * Be a bit paranoid here, some perf.data file came with | 496 | struct thread *thread; |
384 | * a zero sized synthesized MMAP event for the kernel. | 497 | struct map *map; |
385 | */ | 498 | u8 cpumode = self->header.misc & PERF_RECORD_MISC_CPUMODE_MASK; |
386 | if (session->vmlinux_maps[MAP__FUNCTION]->end == 0) | 499 | int ret = 0; |
387 | session->vmlinux_maps[MAP__FUNCTION]->end = ~0UL; | ||
388 | 500 | ||
389 | perf_session__set_kallsyms_ref_reloc_sym(session, symbol_name, | 501 | dump_printf(" %d/%d: [%#Lx(%#Lx) @ %#Lx]: %s\n", |
390 | self->mmap.pgoff); | 502 | self->mmap.pid, self->mmap.tid, self->mmap.start, |
391 | } | 503 | self->mmap.len, self->mmap.pgoff, self->mmap.filename); |
504 | |||
505 | if (cpumode == PERF_RECORD_MISC_GUEST_KERNEL || | ||
506 | cpumode == PERF_RECORD_MISC_KERNEL) { | ||
507 | ret = event__process_kernel_mmap(self, session); | ||
508 | if (ret < 0) | ||
509 | goto out_problem; | ||
392 | return 0; | 510 | return 0; |
393 | } | 511 | } |
394 | 512 | ||
513 | machine = perf_session__find_host_machine(session); | ||
514 | if (machine == NULL) | ||
515 | goto out_problem; | ||
395 | thread = perf_session__findnew(session, self->mmap.pid); | 516 | thread = perf_session__findnew(session, self->mmap.pid); |
396 | map = map__new(&self->mmap, MAP__FUNCTION, | 517 | map = map__new(&machine->user_dsos, self->mmap.start, |
397 | session->cwd, session->cwdlen); | 518 | self->mmap.len, self->mmap.pgoff, |
519 | self->mmap.pid, self->mmap.filename, | ||
520 | MAP__FUNCTION, session->cwd, session->cwdlen); | ||
398 | 521 | ||
399 | if (thread == NULL || map == NULL) | 522 | if (thread == NULL || map == NULL) |
400 | goto out_problem; | 523 | goto out_problem; |
@@ -434,22 +557,56 @@ int event__process_task(event_t *self, struct perf_session *session) | |||
434 | 557 | ||
435 | void thread__find_addr_map(struct thread *self, | 558 | void thread__find_addr_map(struct thread *self, |
436 | struct perf_session *session, u8 cpumode, | 559 | struct perf_session *session, u8 cpumode, |
437 | enum map_type type, u64 addr, | 560 | enum map_type type, pid_t pid, u64 addr, |
438 | struct addr_location *al) | 561 | struct addr_location *al) |
439 | { | 562 | { |
440 | struct map_groups *mg = &self->mg; | 563 | struct map_groups *mg = &self->mg; |
564 | struct machine *machine = NULL; | ||
441 | 565 | ||
442 | al->thread = self; | 566 | al->thread = self; |
443 | al->addr = addr; | 567 | al->addr = addr; |
568 | al->cpumode = cpumode; | ||
569 | al->filtered = false; | ||
444 | 570 | ||
445 | if (cpumode == PERF_RECORD_MISC_KERNEL) { | 571 | if (cpumode == PERF_RECORD_MISC_KERNEL && perf_host) { |
446 | al->level = 'k'; | 572 | al->level = 'k'; |
447 | mg = &session->kmaps; | 573 | machine = perf_session__find_host_machine(session); |
448 | } else if (cpumode == PERF_RECORD_MISC_USER) | 574 | if (machine == NULL) { |
575 | al->map = NULL; | ||
576 | return; | ||
577 | } | ||
578 | mg = &machine->kmaps; | ||
579 | } else if (cpumode == PERF_RECORD_MISC_USER && perf_host) { | ||
449 | al->level = '.'; | 580 | al->level = '.'; |
450 | else { | 581 | machine = perf_session__find_host_machine(session); |
451 | al->level = 'H'; | 582 | } else if (cpumode == PERF_RECORD_MISC_GUEST_KERNEL && perf_guest) { |
583 | al->level = 'g'; | ||
584 | machine = perf_session__find_machine(session, pid); | ||
585 | if (machine == NULL) { | ||
586 | al->map = NULL; | ||
587 | return; | ||
588 | } | ||
589 | mg = &machine->kmaps; | ||
590 | } else { | ||
591 | /* | ||
592 | * 'u' means guest os user space. | ||
593 | * TODO: We don't support guest user space. Might support late. | ||
594 | */ | ||
595 | if (cpumode == PERF_RECORD_MISC_GUEST_USER && perf_guest) | ||
596 | al->level = 'u'; | ||
597 | else | ||
598 | al->level = 'H'; | ||
452 | al->map = NULL; | 599 | al->map = NULL; |
600 | |||
601 | if ((cpumode == PERF_RECORD_MISC_GUEST_USER || | ||
602 | cpumode == PERF_RECORD_MISC_GUEST_KERNEL) && | ||
603 | !perf_guest) | ||
604 | al->filtered = true; | ||
605 | if ((cpumode == PERF_RECORD_MISC_USER || | ||
606 | cpumode == PERF_RECORD_MISC_KERNEL) && | ||
607 | !perf_host) | ||
608 | al->filtered = true; | ||
609 | |||
453 | return; | 610 | return; |
454 | } | 611 | } |
455 | try_again: | 612 | try_again: |
@@ -464,8 +621,10 @@ try_again: | |||
464 | * "[vdso]" dso, but for now lets use the old trick of looking | 621 | * "[vdso]" dso, but for now lets use the old trick of looking |
465 | * in the whole kernel symbol list. | 622 | * in the whole kernel symbol list. |
466 | */ | 623 | */ |
467 | if ((long long)al->addr < 0 && mg != &session->kmaps) { | 624 | if ((long long)al->addr < 0 && |
468 | mg = &session->kmaps; | 625 | cpumode == PERF_RECORD_MISC_KERNEL && |
626 | machine && mg != &machine->kmaps) { | ||
627 | mg = &machine->kmaps; | ||
469 | goto try_again; | 628 | goto try_again; |
470 | } | 629 | } |
471 | } else | 630 | } else |
@@ -474,11 +633,11 @@ try_again: | |||
474 | 633 | ||
475 | void thread__find_addr_location(struct thread *self, | 634 | void thread__find_addr_location(struct thread *self, |
476 | struct perf_session *session, u8 cpumode, | 635 | struct perf_session *session, u8 cpumode, |
477 | enum map_type type, u64 addr, | 636 | enum map_type type, pid_t pid, u64 addr, |
478 | struct addr_location *al, | 637 | struct addr_location *al, |
479 | symbol_filter_t filter) | 638 | symbol_filter_t filter) |
480 | { | 639 | { |
481 | thread__find_addr_map(self, session, cpumode, type, addr, al); | 640 | thread__find_addr_map(self, session, cpumode, type, pid, addr, al); |
482 | if (al->map != NULL) | 641 | if (al->map != NULL) |
483 | al->sym = map__find_symbol(al->map, al->addr, filter); | 642 | al->sym = map__find_symbol(al->map, al->addr, filter); |
484 | else | 643 | else |
@@ -490,8 +649,10 @@ static void dso__calc_col_width(struct dso *self) | |||
490 | if (!symbol_conf.col_width_list_str && !symbol_conf.field_sep && | 649 | if (!symbol_conf.col_width_list_str && !symbol_conf.field_sep && |
491 | (!symbol_conf.dso_list || | 650 | (!symbol_conf.dso_list || |
492 | strlist__has_entry(symbol_conf.dso_list, self->name))) { | 651 | strlist__has_entry(symbol_conf.dso_list, self->name))) { |
493 | unsigned int slen = strlen(self->name); | 652 | u16 slen = self->short_name_len; |
494 | if (slen > dsos__col_width) | 653 | if (verbose) |
654 | slen = self->long_name_len; | ||
655 | if (dsos__col_width < slen) | ||
495 | dsos__col_width = slen; | 656 | dsos__col_width = slen; |
496 | } | 657 | } |
497 | 658 | ||
@@ -512,31 +673,55 @@ int event__preprocess_sample(const event_t *self, struct perf_session *session, | |||
512 | goto out_filtered; | 673 | goto out_filtered; |
513 | 674 | ||
514 | dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid); | 675 | dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid); |
676 | /* | ||
677 | * Have we already created the kernel maps for the host machine? | ||
678 | * | ||
679 | * This should have happened earlier, when we processed the kernel MMAP | ||
680 | * events, but for older perf.data files there was no such thing, so do | ||
681 | * it now. | ||
682 | */ | ||
683 | if (cpumode == PERF_RECORD_MISC_KERNEL && | ||
684 | session->host_machine.vmlinux_maps[MAP__FUNCTION] == NULL) | ||
685 | machine__create_kernel_maps(&session->host_machine); | ||
515 | 686 | ||
516 | thread__find_addr_location(thread, session, cpumode, MAP__FUNCTION, | 687 | thread__find_addr_map(thread, session, cpumode, MAP__FUNCTION, |
517 | self->ip.ip, al, filter); | 688 | self->ip.pid, self->ip.ip, al); |
518 | dump_printf(" ...... dso: %s\n", | 689 | dump_printf(" ...... dso: %s\n", |
519 | al->map ? al->map->dso->long_name : | 690 | al->map ? al->map->dso->long_name : |
520 | al->level == 'H' ? "[hypervisor]" : "<not found>"); | 691 | al->level == 'H' ? "[hypervisor]" : "<not found>"); |
521 | /* | 692 | al->sym = NULL; |
522 | * We have to do this here as we may have a dso with no symbol hit that | 693 | |
523 | * has a name longer than the ones with symbols sampled. | 694 | if (al->map) { |
524 | */ | 695 | if (symbol_conf.dso_list && |
525 | if (al->map && !sort_dso.elide && !al->map->dso->slen_calculated) | 696 | (!al->map || !al->map->dso || |
526 | dso__calc_col_width(al->map->dso); | 697 | !(strlist__has_entry(symbol_conf.dso_list, |
527 | 698 | al->map->dso->short_name) || | |
528 | if (symbol_conf.dso_list && | 699 | (al->map->dso->short_name != al->map->dso->long_name && |
529 | (!al->map || !al->map->dso || | 700 | strlist__has_entry(symbol_conf.dso_list, |
530 | !(strlist__has_entry(symbol_conf.dso_list, al->map->dso->short_name) || | 701 | al->map->dso->long_name))))) |
531 | (al->map->dso->short_name != al->map->dso->long_name && | 702 | goto out_filtered; |
532 | strlist__has_entry(symbol_conf.dso_list, al->map->dso->long_name))))) | 703 | /* |
533 | goto out_filtered; | 704 | * We have to do this here as we may have a dso with no symbol |
705 | * hit that has a name longer than the ones with symbols | ||
706 | * sampled. | ||
707 | */ | ||
708 | if (!sort_dso.elide && !al->map->dso->slen_calculated) | ||
709 | dso__calc_col_width(al->map->dso); | ||
710 | |||
711 | al->sym = map__find_symbol(al->map, al->addr, filter); | ||
712 | } else { | ||
713 | const unsigned int unresolved_col_width = BITS_PER_LONG / 4; | ||
714 | |||
715 | if (dsos__col_width < unresolved_col_width && | ||
716 | !symbol_conf.col_width_list_str && !symbol_conf.field_sep && | ||
717 | !symbol_conf.dso_list) | ||
718 | dsos__col_width = unresolved_col_width; | ||
719 | } | ||
534 | 720 | ||
535 | if (symbol_conf.sym_list && al->sym && | 721 | if (symbol_conf.sym_list && al->sym && |
536 | !strlist__has_entry(symbol_conf.sym_list, al->sym->name)) | 722 | !strlist__has_entry(symbol_conf.sym_list, al->sym->name)) |
537 | goto out_filtered; | 723 | goto out_filtered; |
538 | 724 | ||
539 | al->filtered = false; | ||
540 | return 0; | 725 | return 0; |
541 | 726 | ||
542 | out_filtered: | 727 | out_filtered: |
@@ -570,6 +755,7 @@ int event__parse_sample(event_t *event, u64 type, struct sample_data *data) | |||
570 | array++; | 755 | array++; |
571 | } | 756 | } |
572 | 757 | ||
758 | data->id = -1ULL; | ||
573 | if (type & PERF_SAMPLE_ID) { | 759 | if (type & PERF_SAMPLE_ID) { |
574 | data->id = *array; | 760 | data->id = *array; |
575 | array++; | 761 | array++; |
diff --git a/tools/perf/util/event.h b/tools/perf/util/event.h index a33b94952e34..8577085db067 100644 --- a/tools/perf/util/event.h +++ b/tools/perf/util/event.h | |||
@@ -68,21 +68,54 @@ struct sample_data { | |||
68 | u64 addr; | 68 | u64 addr; |
69 | u64 id; | 69 | u64 id; |
70 | u64 stream_id; | 70 | u64 stream_id; |
71 | u32 cpu; | ||
72 | u64 period; | 71 | u64 period; |
73 | struct ip_callchain *callchain; | 72 | u32 cpu; |
74 | u32 raw_size; | 73 | u32 raw_size; |
75 | void *raw_data; | 74 | void *raw_data; |
75 | struct ip_callchain *callchain; | ||
76 | }; | 76 | }; |
77 | 77 | ||
78 | #define BUILD_ID_SIZE 20 | 78 | #define BUILD_ID_SIZE 20 |
79 | 79 | ||
80 | struct build_id_event { | 80 | struct build_id_event { |
81 | struct perf_event_header header; | 81 | struct perf_event_header header; |
82 | pid_t pid; | ||
82 | u8 build_id[ALIGN(BUILD_ID_SIZE, sizeof(u64))]; | 83 | u8 build_id[ALIGN(BUILD_ID_SIZE, sizeof(u64))]; |
83 | char filename[]; | 84 | char filename[]; |
84 | }; | 85 | }; |
85 | 86 | ||
87 | enum perf_user_event_type { /* above any possible kernel type */ | ||
88 | PERF_RECORD_HEADER_ATTR = 64, | ||
89 | PERF_RECORD_HEADER_EVENT_TYPE = 65, | ||
90 | PERF_RECORD_HEADER_TRACING_DATA = 66, | ||
91 | PERF_RECORD_HEADER_BUILD_ID = 67, | ||
92 | PERF_RECORD_FINISHED_ROUND = 68, | ||
93 | PERF_RECORD_HEADER_MAX | ||
94 | }; | ||
95 | |||
96 | struct attr_event { | ||
97 | struct perf_event_header header; | ||
98 | struct perf_event_attr attr; | ||
99 | u64 id[]; | ||
100 | }; | ||
101 | |||
102 | #define MAX_EVENT_NAME 64 | ||
103 | |||
104 | struct perf_trace_event_type { | ||
105 | u64 event_id; | ||
106 | char name[MAX_EVENT_NAME]; | ||
107 | }; | ||
108 | |||
109 | struct event_type_event { | ||
110 | struct perf_event_header header; | ||
111 | struct perf_trace_event_type event_type; | ||
112 | }; | ||
113 | |||
114 | struct tracing_data_event { | ||
115 | struct perf_event_header header; | ||
116 | u32 size; | ||
117 | }; | ||
118 | |||
86 | typedef union event_union { | 119 | typedef union event_union { |
87 | struct perf_event_header header; | 120 | struct perf_event_header header; |
88 | struct ip_event ip; | 121 | struct ip_event ip; |
@@ -92,22 +125,12 @@ typedef union event_union { | |||
92 | struct lost_event lost; | 125 | struct lost_event lost; |
93 | struct read_event read; | 126 | struct read_event read; |
94 | struct sample_event sample; | 127 | struct sample_event sample; |
128 | struct attr_event attr; | ||
129 | struct event_type_event event_type; | ||
130 | struct tracing_data_event tracing_data; | ||
131 | struct build_id_event build_id; | ||
95 | } event_t; | 132 | } event_t; |
96 | 133 | ||
97 | struct events_stats { | ||
98 | u64 total; | ||
99 | u64 lost; | ||
100 | }; | ||
101 | |||
102 | struct event_stat_id { | ||
103 | struct rb_node rb_node; | ||
104 | struct rb_root hists; | ||
105 | struct events_stats stats; | ||
106 | u64 config; | ||
107 | u64 event_stream; | ||
108 | u32 type; | ||
109 | }; | ||
110 | |||
111 | void event__print_totals(void); | 134 | void event__print_totals(void); |
112 | 135 | ||
113 | struct perf_session; | 136 | struct perf_session; |
@@ -119,10 +142,13 @@ int event__synthesize_thread(pid_t pid, event__handler_t process, | |||
119 | void event__synthesize_threads(event__handler_t process, | 142 | void event__synthesize_threads(event__handler_t process, |
120 | struct perf_session *session); | 143 | struct perf_session *session); |
121 | int event__synthesize_kernel_mmap(event__handler_t process, | 144 | int event__synthesize_kernel_mmap(event__handler_t process, |
122 | struct perf_session *session, | 145 | struct perf_session *session, |
123 | const char *symbol_name); | 146 | struct machine *machine, |
147 | const char *symbol_name); | ||
148 | |||
124 | int event__synthesize_modules(event__handler_t process, | 149 | int event__synthesize_modules(event__handler_t process, |
125 | struct perf_session *session); | 150 | struct perf_session *session, |
151 | struct machine *machine); | ||
126 | 152 | ||
127 | int event__process_comm(event_t *self, struct perf_session *session); | 153 | int event__process_comm(event_t *self, struct perf_session *session); |
128 | int event__process_lost(event_t *self, struct perf_session *session); | 154 | int event__process_lost(event_t *self, struct perf_session *session); |
@@ -134,4 +160,6 @@ int event__preprocess_sample(const event_t *self, struct perf_session *session, | |||
134 | struct addr_location *al, symbol_filter_t filter); | 160 | struct addr_location *al, symbol_filter_t filter); |
135 | int event__parse_sample(event_t *event, u64 type, struct sample_data *data); | 161 | int event__parse_sample(event_t *event, u64 type, struct sample_data *data); |
136 | 162 | ||
163 | extern const char *event__name[]; | ||
164 | |||
137 | #endif /* __PERF_RECORD_H */ | 165 | #endif /* __PERF_RECORD_H */ |
diff --git a/tools/perf/util/header.c b/tools/perf/util/header.c index 6c9aa16ee51f..8847bec64c54 100644 --- a/tools/perf/util/header.c +++ b/tools/perf/util/header.c | |||
@@ -99,13 +99,6 @@ int perf_header__add_attr(struct perf_header *self, | |||
99 | return 0; | 99 | return 0; |
100 | } | 100 | } |
101 | 101 | ||
102 | #define MAX_EVENT_NAME 64 | ||
103 | |||
104 | struct perf_trace_event_type { | ||
105 | u64 event_id; | ||
106 | char name[MAX_EVENT_NAME]; | ||
107 | }; | ||
108 | |||
109 | static int event_count; | 102 | static int event_count; |
110 | static struct perf_trace_event_type *events; | 103 | static struct perf_trace_event_type *events; |
111 | 104 | ||
@@ -197,7 +190,8 @@ static int write_padded(int fd, const void *bf, size_t count, | |||
197 | continue; \ | 190 | continue; \ |
198 | else | 191 | else |
199 | 192 | ||
200 | static int __dsos__write_buildid_table(struct list_head *head, u16 misc, int fd) | 193 | static int __dsos__write_buildid_table(struct list_head *head, pid_t pid, |
194 | u16 misc, int fd) | ||
201 | { | 195 | { |
202 | struct dso *pos; | 196 | struct dso *pos; |
203 | 197 | ||
@@ -212,6 +206,7 @@ static int __dsos__write_buildid_table(struct list_head *head, u16 misc, int fd) | |||
212 | len = ALIGN(len, NAME_ALIGN); | 206 | len = ALIGN(len, NAME_ALIGN); |
213 | memset(&b, 0, sizeof(b)); | 207 | memset(&b, 0, sizeof(b)); |
214 | memcpy(&b.build_id, pos->build_id, sizeof(pos->build_id)); | 208 | memcpy(&b.build_id, pos->build_id, sizeof(pos->build_id)); |
209 | b.pid = pid; | ||
215 | b.header.misc = misc; | 210 | b.header.misc = misc; |
216 | b.header.size = sizeof(b) + len; | 211 | b.header.size = sizeof(b) + len; |
217 | err = do_write(fd, &b, sizeof(b)); | 212 | err = do_write(fd, &b, sizeof(b)); |
@@ -226,13 +221,32 @@ static int __dsos__write_buildid_table(struct list_head *head, u16 misc, int fd) | |||
226 | return 0; | 221 | return 0; |
227 | } | 222 | } |
228 | 223 | ||
229 | static int dsos__write_buildid_table(int fd) | 224 | static int dsos__write_buildid_table(struct perf_header *header, int fd) |
230 | { | 225 | { |
231 | int err = __dsos__write_buildid_table(&dsos__kernel, | 226 | struct perf_session *session = container_of(header, |
232 | PERF_RECORD_MISC_KERNEL, fd); | 227 | struct perf_session, header); |
233 | if (err == 0) | 228 | struct rb_node *nd; |
234 | err = __dsos__write_buildid_table(&dsos__user, | 229 | int err = 0; |
235 | PERF_RECORD_MISC_USER, fd); | 230 | u16 kmisc, umisc; |
231 | |||
232 | for (nd = rb_first(&session->machines); nd; nd = rb_next(nd)) { | ||
233 | struct machine *pos = rb_entry(nd, struct machine, rb_node); | ||
234 | if (machine__is_host(pos)) { | ||
235 | kmisc = PERF_RECORD_MISC_KERNEL; | ||
236 | umisc = PERF_RECORD_MISC_USER; | ||
237 | } else { | ||
238 | kmisc = PERF_RECORD_MISC_GUEST_KERNEL; | ||
239 | umisc = PERF_RECORD_MISC_GUEST_USER; | ||
240 | } | ||
241 | |||
242 | err = __dsos__write_buildid_table(&pos->kernel_dsos, pos->pid, | ||
243 | kmisc, fd); | ||
244 | if (err == 0) | ||
245 | err = __dsos__write_buildid_table(&pos->user_dsos, | ||
246 | pos->pid, umisc, fd); | ||
247 | if (err) | ||
248 | break; | ||
249 | } | ||
236 | return err; | 250 | return err; |
237 | } | 251 | } |
238 | 252 | ||
@@ -349,9 +363,12 @@ static int __dsos__cache_build_ids(struct list_head *head, const char *debugdir) | |||
349 | return err; | 363 | return err; |
350 | } | 364 | } |
351 | 365 | ||
352 | static int dsos__cache_build_ids(void) | 366 | static int dsos__cache_build_ids(struct perf_header *self) |
353 | { | 367 | { |
354 | int err_kernel, err_user; | 368 | struct perf_session *session = container_of(self, |
369 | struct perf_session, header); | ||
370 | struct rb_node *nd; | ||
371 | int ret = 0; | ||
355 | char debugdir[PATH_MAX]; | 372 | char debugdir[PATH_MAX]; |
356 | 373 | ||
357 | snprintf(debugdir, sizeof(debugdir), "%s/%s", getenv("HOME"), | 374 | snprintf(debugdir, sizeof(debugdir), "%s/%s", getenv("HOME"), |
@@ -360,9 +377,28 @@ static int dsos__cache_build_ids(void) | |||
360 | if (mkdir(debugdir, 0755) != 0 && errno != EEXIST) | 377 | if (mkdir(debugdir, 0755) != 0 && errno != EEXIST) |
361 | return -1; | 378 | return -1; |
362 | 379 | ||
363 | err_kernel = __dsos__cache_build_ids(&dsos__kernel, debugdir); | 380 | for (nd = rb_first(&session->machines); nd; nd = rb_next(nd)) { |
364 | err_user = __dsos__cache_build_ids(&dsos__user, debugdir); | 381 | struct machine *pos = rb_entry(nd, struct machine, rb_node); |
365 | return err_kernel || err_user ? -1 : 0; | 382 | ret |= __dsos__cache_build_ids(&pos->kernel_dsos, debugdir); |
383 | ret |= __dsos__cache_build_ids(&pos->user_dsos, debugdir); | ||
384 | } | ||
385 | return ret ? -1 : 0; | ||
386 | } | ||
387 | |||
388 | static bool dsos__read_build_ids(struct perf_header *self, bool with_hits) | ||
389 | { | ||
390 | bool ret = false; | ||
391 | struct perf_session *session = container_of(self, | ||
392 | struct perf_session, header); | ||
393 | struct rb_node *nd; | ||
394 | |||
395 | for (nd = rb_first(&session->machines); nd; nd = rb_next(nd)) { | ||
396 | struct machine *pos = rb_entry(nd, struct machine, rb_node); | ||
397 | ret |= __dsos__read_build_ids(&pos->kernel_dsos, with_hits); | ||
398 | ret |= __dsos__read_build_ids(&pos->user_dsos, with_hits); | ||
399 | } | ||
400 | |||
401 | return ret; | ||
366 | } | 402 | } |
367 | 403 | ||
368 | static int perf_header__adds_write(struct perf_header *self, int fd) | 404 | static int perf_header__adds_write(struct perf_header *self, int fd) |
@@ -373,7 +409,7 @@ static int perf_header__adds_write(struct perf_header *self, int fd) | |||
373 | u64 sec_start; | 409 | u64 sec_start; |
374 | int idx = 0, err; | 410 | int idx = 0, err; |
375 | 411 | ||
376 | if (dsos__read_build_ids(true)) | 412 | if (dsos__read_build_ids(self, true)) |
377 | perf_header__set_feat(self, HEADER_BUILD_ID); | 413 | perf_header__set_feat(self, HEADER_BUILD_ID); |
378 | 414 | ||
379 | nr_sections = bitmap_weight(self->adds_features, HEADER_FEAT_BITS); | 415 | nr_sections = bitmap_weight(self->adds_features, HEADER_FEAT_BITS); |
@@ -400,7 +436,6 @@ static int perf_header__adds_write(struct perf_header *self, int fd) | |||
400 | trace_sec->size = lseek(fd, 0, SEEK_CUR) - trace_sec->offset; | 436 | trace_sec->size = lseek(fd, 0, SEEK_CUR) - trace_sec->offset; |
401 | } | 437 | } |
402 | 438 | ||
403 | |||
404 | if (perf_header__has_feat(self, HEADER_BUILD_ID)) { | 439 | if (perf_header__has_feat(self, HEADER_BUILD_ID)) { |
405 | struct perf_file_section *buildid_sec; | 440 | struct perf_file_section *buildid_sec; |
406 | 441 | ||
@@ -408,14 +443,14 @@ static int perf_header__adds_write(struct perf_header *self, int fd) | |||
408 | 443 | ||
409 | /* Write build-ids */ | 444 | /* Write build-ids */ |
410 | buildid_sec->offset = lseek(fd, 0, SEEK_CUR); | 445 | buildid_sec->offset = lseek(fd, 0, SEEK_CUR); |
411 | err = dsos__write_buildid_table(fd); | 446 | err = dsos__write_buildid_table(self, fd); |
412 | if (err < 0) { | 447 | if (err < 0) { |
413 | pr_debug("failed to write buildid table\n"); | 448 | pr_debug("failed to write buildid table\n"); |
414 | goto out_free; | 449 | goto out_free; |
415 | } | 450 | } |
416 | buildid_sec->size = lseek(fd, 0, SEEK_CUR) - | 451 | buildid_sec->size = lseek(fd, 0, SEEK_CUR) - |
417 | buildid_sec->offset; | 452 | buildid_sec->offset; |
418 | dsos__cache_build_ids(); | 453 | dsos__cache_build_ids(self); |
419 | } | 454 | } |
420 | 455 | ||
421 | lseek(fd, sec_start, SEEK_SET); | 456 | lseek(fd, sec_start, SEEK_SET); |
@@ -427,6 +462,25 @@ out_free: | |||
427 | return err; | 462 | return err; |
428 | } | 463 | } |
429 | 464 | ||
465 | int perf_header__write_pipe(int fd) | ||
466 | { | ||
467 | struct perf_pipe_file_header f_header; | ||
468 | int err; | ||
469 | |||
470 | f_header = (struct perf_pipe_file_header){ | ||
471 | .magic = PERF_MAGIC, | ||
472 | .size = sizeof(f_header), | ||
473 | }; | ||
474 | |||
475 | err = do_write(fd, &f_header, sizeof(f_header)); | ||
476 | if (err < 0) { | ||
477 | pr_debug("failed to write perf pipe header\n"); | ||
478 | return err; | ||
479 | } | ||
480 | |||
481 | return 0; | ||
482 | } | ||
483 | |||
430 | int perf_header__write(struct perf_header *self, int fd, bool at_exit) | 484 | int perf_header__write(struct perf_header *self, int fd, bool at_exit) |
431 | { | 485 | { |
432 | struct perf_file_header f_header; | 486 | struct perf_file_header f_header; |
@@ -518,25 +572,10 @@ int perf_header__write(struct perf_header *self, int fd, bool at_exit) | |||
518 | return 0; | 572 | return 0; |
519 | } | 573 | } |
520 | 574 | ||
521 | static int do_read(int fd, void *buf, size_t size) | ||
522 | { | ||
523 | while (size) { | ||
524 | int ret = read(fd, buf, size); | ||
525 | |||
526 | if (ret <= 0) | ||
527 | return -1; | ||
528 | |||
529 | size -= ret; | ||
530 | buf += ret; | ||
531 | } | ||
532 | |||
533 | return 0; | ||
534 | } | ||
535 | |||
536 | static int perf_header__getbuffer64(struct perf_header *self, | 575 | static int perf_header__getbuffer64(struct perf_header *self, |
537 | int fd, void *buf, size_t size) | 576 | int fd, void *buf, size_t size) |
538 | { | 577 | { |
539 | if (do_read(fd, buf, size)) | 578 | if (do_read(fd, buf, size) <= 0) |
540 | return -1; | 579 | return -1; |
541 | 580 | ||
542 | if (self->needs_swap) | 581 | if (self->needs_swap) |
@@ -592,7 +631,7 @@ int perf_file_header__read(struct perf_file_header *self, | |||
592 | { | 631 | { |
593 | lseek(fd, 0, SEEK_SET); | 632 | lseek(fd, 0, SEEK_SET); |
594 | 633 | ||
595 | if (do_read(fd, self, sizeof(*self)) || | 634 | if (do_read(fd, self, sizeof(*self)) <= 0 || |
596 | memcmp(&self->magic, __perf_magic, sizeof(self->magic))) | 635 | memcmp(&self->magic, __perf_magic, sizeof(self->magic))) |
597 | return -1; | 636 | return -1; |
598 | 637 | ||
@@ -636,6 +675,93 @@ int perf_file_header__read(struct perf_file_header *self, | |||
636 | return 0; | 675 | return 0; |
637 | } | 676 | } |
638 | 677 | ||
678 | static int __event_process_build_id(struct build_id_event *bev, | ||
679 | char *filename, | ||
680 | struct perf_session *session) | ||
681 | { | ||
682 | int err = -1; | ||
683 | struct list_head *head; | ||
684 | struct machine *machine; | ||
685 | u16 misc; | ||
686 | struct dso *dso; | ||
687 | enum dso_kernel_type dso_type; | ||
688 | |||
689 | machine = perf_session__findnew_machine(session, bev->pid); | ||
690 | if (!machine) | ||
691 | goto out; | ||
692 | |||
693 | misc = bev->header.misc & PERF_RECORD_MISC_CPUMODE_MASK; | ||
694 | |||
695 | switch (misc) { | ||
696 | case PERF_RECORD_MISC_KERNEL: | ||
697 | dso_type = DSO_TYPE_KERNEL; | ||
698 | head = &machine->kernel_dsos; | ||
699 | break; | ||
700 | case PERF_RECORD_MISC_GUEST_KERNEL: | ||
701 | dso_type = DSO_TYPE_GUEST_KERNEL; | ||
702 | head = &machine->kernel_dsos; | ||
703 | break; | ||
704 | case PERF_RECORD_MISC_USER: | ||
705 | case PERF_RECORD_MISC_GUEST_USER: | ||
706 | dso_type = DSO_TYPE_USER; | ||
707 | head = &machine->user_dsos; | ||
708 | break; | ||
709 | default: | ||
710 | goto out; | ||
711 | } | ||
712 | |||
713 | dso = __dsos__findnew(head, filename); | ||
714 | if (dso != NULL) { | ||
715 | char sbuild_id[BUILD_ID_SIZE * 2 + 1]; | ||
716 | |||
717 | dso__set_build_id(dso, &bev->build_id); | ||
718 | |||
719 | if (filename[0] == '[') | ||
720 | dso->kernel = dso_type; | ||
721 | |||
722 | build_id__sprintf(dso->build_id, sizeof(dso->build_id), | ||
723 | sbuild_id); | ||
724 | pr_debug("build id event received for %s: %s\n", | ||
725 | dso->long_name, sbuild_id); | ||
726 | } | ||
727 | |||
728 | err = 0; | ||
729 | out: | ||
730 | return err; | ||
731 | } | ||
732 | |||
733 | static int perf_header__read_build_ids(struct perf_header *self, | ||
734 | int input, u64 offset, u64 size) | ||
735 | { | ||
736 | struct perf_session *session = container_of(self, | ||
737 | struct perf_session, header); | ||
738 | struct build_id_event bev; | ||
739 | char filename[PATH_MAX]; | ||
740 | u64 limit = offset + size; | ||
741 | int err = -1; | ||
742 | |||
743 | while (offset < limit) { | ||
744 | ssize_t len; | ||
745 | |||
746 | if (read(input, &bev, sizeof(bev)) != sizeof(bev)) | ||
747 | goto out; | ||
748 | |||
749 | if (self->needs_swap) | ||
750 | perf_event_header__bswap(&bev.header); | ||
751 | |||
752 | len = bev.header.size - sizeof(bev); | ||
753 | if (read(input, filename, len) != len) | ||
754 | goto out; | ||
755 | |||
756 | __event_process_build_id(&bev, filename, session); | ||
757 | |||
758 | offset += bev.header.size; | ||
759 | } | ||
760 | err = 0; | ||
761 | out: | ||
762 | return err; | ||
763 | } | ||
764 | |||
639 | static int perf_file_section__process(struct perf_file_section *self, | 765 | static int perf_file_section__process(struct perf_file_section *self, |
640 | struct perf_header *ph, | 766 | struct perf_header *ph, |
641 | int feat, int fd) | 767 | int feat, int fd) |
@@ -648,7 +774,7 @@ static int perf_file_section__process(struct perf_file_section *self, | |||
648 | 774 | ||
649 | switch (feat) { | 775 | switch (feat) { |
650 | case HEADER_TRACE_INFO: | 776 | case HEADER_TRACE_INFO: |
651 | trace_report(fd); | 777 | trace_report(fd, false); |
652 | break; | 778 | break; |
653 | 779 | ||
654 | case HEADER_BUILD_ID: | 780 | case HEADER_BUILD_ID: |
@@ -662,13 +788,56 @@ static int perf_file_section__process(struct perf_file_section *self, | |||
662 | return 0; | 788 | return 0; |
663 | } | 789 | } |
664 | 790 | ||
665 | int perf_header__read(struct perf_header *self, int fd) | 791 | static int perf_file_header__read_pipe(struct perf_pipe_file_header *self, |
792 | struct perf_header *ph, int fd, | ||
793 | bool repipe) | ||
794 | { | ||
795 | if (do_read(fd, self, sizeof(*self)) <= 0 || | ||
796 | memcmp(&self->magic, __perf_magic, sizeof(self->magic))) | ||
797 | return -1; | ||
798 | |||
799 | if (repipe && do_write(STDOUT_FILENO, self, sizeof(*self)) < 0) | ||
800 | return -1; | ||
801 | |||
802 | if (self->size != sizeof(*self)) { | ||
803 | u64 size = bswap_64(self->size); | ||
804 | |||
805 | if (size != sizeof(*self)) | ||
806 | return -1; | ||
807 | |||
808 | ph->needs_swap = true; | ||
809 | } | ||
810 | |||
811 | return 0; | ||
812 | } | ||
813 | |||
814 | static int perf_header__read_pipe(struct perf_session *session, int fd) | ||
666 | { | 815 | { |
816 | struct perf_header *self = &session->header; | ||
817 | struct perf_pipe_file_header f_header; | ||
818 | |||
819 | if (perf_file_header__read_pipe(&f_header, self, fd, | ||
820 | session->repipe) < 0) { | ||
821 | pr_debug("incompatible file format\n"); | ||
822 | return -EINVAL; | ||
823 | } | ||
824 | |||
825 | session->fd = fd; | ||
826 | |||
827 | return 0; | ||
828 | } | ||
829 | |||
830 | int perf_header__read(struct perf_session *session, int fd) | ||
831 | { | ||
832 | struct perf_header *self = &session->header; | ||
667 | struct perf_file_header f_header; | 833 | struct perf_file_header f_header; |
668 | struct perf_file_attr f_attr; | 834 | struct perf_file_attr f_attr; |
669 | u64 f_id; | 835 | u64 f_id; |
670 | int nr_attrs, nr_ids, i, j; | 836 | int nr_attrs, nr_ids, i, j; |
671 | 837 | ||
838 | if (session->fd_pipe) | ||
839 | return perf_header__read_pipe(session, fd); | ||
840 | |||
672 | if (perf_file_header__read(&f_header, self, fd) < 0) { | 841 | if (perf_file_header__read(&f_header, self, fd) < 0) { |
673 | pr_debug("incompatible file format\n"); | 842 | pr_debug("incompatible file format\n"); |
674 | return -EINVAL; | 843 | return -EINVAL; |
@@ -753,6 +922,14 @@ perf_header__find_attr(u64 id, struct perf_header *header) | |||
753 | { | 922 | { |
754 | int i; | 923 | int i; |
755 | 924 | ||
925 | /* | ||
926 | * We set id to -1 if the data file doesn't contain sample | ||
927 | * ids. Check for this and avoid walking through the entire | ||
928 | * list of ids which may be large. | ||
929 | */ | ||
930 | if (id == -1ULL) | ||
931 | return NULL; | ||
932 | |||
756 | for (i = 0; i < header->attrs; i++) { | 933 | for (i = 0; i < header->attrs; i++) { |
757 | struct perf_header_attr *attr = header->attr[i]; | 934 | struct perf_header_attr *attr = header->attr[i]; |
758 | int j; | 935 | int j; |
@@ -765,3 +942,231 @@ perf_header__find_attr(u64 id, struct perf_header *header) | |||
765 | 942 | ||
766 | return NULL; | 943 | return NULL; |
767 | } | 944 | } |
945 | |||
946 | int event__synthesize_attr(struct perf_event_attr *attr, u16 ids, u64 *id, | ||
947 | event__handler_t process, | ||
948 | struct perf_session *session) | ||
949 | { | ||
950 | event_t *ev; | ||
951 | size_t size; | ||
952 | int err; | ||
953 | |||
954 | size = sizeof(struct perf_event_attr); | ||
955 | size = ALIGN(size, sizeof(u64)); | ||
956 | size += sizeof(struct perf_event_header); | ||
957 | size += ids * sizeof(u64); | ||
958 | |||
959 | ev = malloc(size); | ||
960 | |||
961 | ev->attr.attr = *attr; | ||
962 | memcpy(ev->attr.id, id, ids * sizeof(u64)); | ||
963 | |||
964 | ev->attr.header.type = PERF_RECORD_HEADER_ATTR; | ||
965 | ev->attr.header.size = size; | ||
966 | |||
967 | err = process(ev, session); | ||
968 | |||
969 | free(ev); | ||
970 | |||
971 | return err; | ||
972 | } | ||
973 | |||
974 | int event__synthesize_attrs(struct perf_header *self, | ||
975 | event__handler_t process, | ||
976 | struct perf_session *session) | ||
977 | { | ||
978 | struct perf_header_attr *attr; | ||
979 | int i, err = 0; | ||
980 | |||
981 | for (i = 0; i < self->attrs; i++) { | ||
982 | attr = self->attr[i]; | ||
983 | |||
984 | err = event__synthesize_attr(&attr->attr, attr->ids, attr->id, | ||
985 | process, session); | ||
986 | if (err) { | ||
987 | pr_debug("failed to create perf header attribute\n"); | ||
988 | return err; | ||
989 | } | ||
990 | } | ||
991 | |||
992 | return err; | ||
993 | } | ||
994 | |||
995 | int event__process_attr(event_t *self, struct perf_session *session) | ||
996 | { | ||
997 | struct perf_header_attr *attr; | ||
998 | unsigned int i, ids, n_ids; | ||
999 | |||
1000 | attr = perf_header_attr__new(&self->attr.attr); | ||
1001 | if (attr == NULL) | ||
1002 | return -ENOMEM; | ||
1003 | |||
1004 | ids = self->header.size; | ||
1005 | ids -= (void *)&self->attr.id - (void *)self; | ||
1006 | n_ids = ids / sizeof(u64); | ||
1007 | |||
1008 | for (i = 0; i < n_ids; i++) { | ||
1009 | if (perf_header_attr__add_id(attr, self->attr.id[i]) < 0) { | ||
1010 | perf_header_attr__delete(attr); | ||
1011 | return -ENOMEM; | ||
1012 | } | ||
1013 | } | ||
1014 | |||
1015 | if (perf_header__add_attr(&session->header, attr) < 0) { | ||
1016 | perf_header_attr__delete(attr); | ||
1017 | return -ENOMEM; | ||
1018 | } | ||
1019 | |||
1020 | perf_session__update_sample_type(session); | ||
1021 | |||
1022 | return 0; | ||
1023 | } | ||
1024 | |||
1025 | int event__synthesize_event_type(u64 event_id, char *name, | ||
1026 | event__handler_t process, | ||
1027 | struct perf_session *session) | ||
1028 | { | ||
1029 | event_t ev; | ||
1030 | size_t size = 0; | ||
1031 | int err = 0; | ||
1032 | |||
1033 | memset(&ev, 0, sizeof(ev)); | ||
1034 | |||
1035 | ev.event_type.event_type.event_id = event_id; | ||
1036 | memset(ev.event_type.event_type.name, 0, MAX_EVENT_NAME); | ||
1037 | strncpy(ev.event_type.event_type.name, name, MAX_EVENT_NAME - 1); | ||
1038 | |||
1039 | ev.event_type.header.type = PERF_RECORD_HEADER_EVENT_TYPE; | ||
1040 | size = strlen(name); | ||
1041 | size = ALIGN(size, sizeof(u64)); | ||
1042 | ev.event_type.header.size = sizeof(ev.event_type) - | ||
1043 | (sizeof(ev.event_type.event_type.name) - size); | ||
1044 | |||
1045 | err = process(&ev, session); | ||
1046 | |||
1047 | return err; | ||
1048 | } | ||
1049 | |||
1050 | int event__synthesize_event_types(event__handler_t process, | ||
1051 | struct perf_session *session) | ||
1052 | { | ||
1053 | struct perf_trace_event_type *type; | ||
1054 | int i, err = 0; | ||
1055 | |||
1056 | for (i = 0; i < event_count; i++) { | ||
1057 | type = &events[i]; | ||
1058 | |||
1059 | err = event__synthesize_event_type(type->event_id, type->name, | ||
1060 | process, session); | ||
1061 | if (err) { | ||
1062 | pr_debug("failed to create perf header event type\n"); | ||
1063 | return err; | ||
1064 | } | ||
1065 | } | ||
1066 | |||
1067 | return err; | ||
1068 | } | ||
1069 | |||
1070 | int event__process_event_type(event_t *self, | ||
1071 | struct perf_session *session __unused) | ||
1072 | { | ||
1073 | if (perf_header__push_event(self->event_type.event_type.event_id, | ||
1074 | self->event_type.event_type.name) < 0) | ||
1075 | return -ENOMEM; | ||
1076 | |||
1077 | return 0; | ||
1078 | } | ||
1079 | |||
1080 | int event__synthesize_tracing_data(int fd, struct perf_event_attr *pattrs, | ||
1081 | int nb_events, | ||
1082 | event__handler_t process, | ||
1083 | struct perf_session *session __unused) | ||
1084 | { | ||
1085 | event_t ev; | ||
1086 | ssize_t size = 0, aligned_size = 0, padding; | ||
1087 | int err = 0; | ||
1088 | |||
1089 | memset(&ev, 0, sizeof(ev)); | ||
1090 | |||
1091 | ev.tracing_data.header.type = PERF_RECORD_HEADER_TRACING_DATA; | ||
1092 | size = read_tracing_data_size(fd, pattrs, nb_events); | ||
1093 | if (size <= 0) | ||
1094 | return size; | ||
1095 | aligned_size = ALIGN(size, sizeof(u64)); | ||
1096 | padding = aligned_size - size; | ||
1097 | ev.tracing_data.header.size = sizeof(ev.tracing_data); | ||
1098 | ev.tracing_data.size = aligned_size; | ||
1099 | |||
1100 | process(&ev, session); | ||
1101 | |||
1102 | err = read_tracing_data(fd, pattrs, nb_events); | ||
1103 | write_padded(fd, NULL, 0, padding); | ||
1104 | |||
1105 | return aligned_size; | ||
1106 | } | ||
1107 | |||
1108 | int event__process_tracing_data(event_t *self, | ||
1109 | struct perf_session *session) | ||
1110 | { | ||
1111 | ssize_t size_read, padding, size = self->tracing_data.size; | ||
1112 | off_t offset = lseek(session->fd, 0, SEEK_CUR); | ||
1113 | char buf[BUFSIZ]; | ||
1114 | |||
1115 | /* setup for reading amidst mmap */ | ||
1116 | lseek(session->fd, offset + sizeof(struct tracing_data_event), | ||
1117 | SEEK_SET); | ||
1118 | |||
1119 | size_read = trace_report(session->fd, session->repipe); | ||
1120 | |||
1121 | padding = ALIGN(size_read, sizeof(u64)) - size_read; | ||
1122 | |||
1123 | if (read(session->fd, buf, padding) < 0) | ||
1124 | die("reading input file"); | ||
1125 | if (session->repipe) { | ||
1126 | int retw = write(STDOUT_FILENO, buf, padding); | ||
1127 | if (retw <= 0 || retw != padding) | ||
1128 | die("repiping tracing data padding"); | ||
1129 | } | ||
1130 | |||
1131 | if (size_read + padding != size) | ||
1132 | die("tracing data size mismatch"); | ||
1133 | |||
1134 | return size_read + padding; | ||
1135 | } | ||
1136 | |||
1137 | int event__synthesize_build_id(struct dso *pos, u16 misc, | ||
1138 | event__handler_t process, | ||
1139 | struct machine *machine, | ||
1140 | struct perf_session *session) | ||
1141 | { | ||
1142 | event_t ev; | ||
1143 | size_t len; | ||
1144 | int err = 0; | ||
1145 | |||
1146 | if (!pos->hit) | ||
1147 | return err; | ||
1148 | |||
1149 | memset(&ev, 0, sizeof(ev)); | ||
1150 | |||
1151 | len = pos->long_name_len + 1; | ||
1152 | len = ALIGN(len, NAME_ALIGN); | ||
1153 | memcpy(&ev.build_id.build_id, pos->build_id, sizeof(pos->build_id)); | ||
1154 | ev.build_id.header.type = PERF_RECORD_HEADER_BUILD_ID; | ||
1155 | ev.build_id.header.misc = misc; | ||
1156 | ev.build_id.pid = machine->pid; | ||
1157 | ev.build_id.header.size = sizeof(ev.build_id) + len; | ||
1158 | memcpy(&ev.build_id.filename, pos->long_name, pos->long_name_len); | ||
1159 | |||
1160 | err = process(&ev, session); | ||
1161 | |||
1162 | return err; | ||
1163 | } | ||
1164 | |||
1165 | int event__process_build_id(event_t *self, | ||
1166 | struct perf_session *session) | ||
1167 | { | ||
1168 | __event_process_build_id(&self->build_id, | ||
1169 | self->build_id.filename, | ||
1170 | session); | ||
1171 | return 0; | ||
1172 | } | ||
diff --git a/tools/perf/util/header.h b/tools/perf/util/header.h index 82a6af72d4cc..402ac2454cf8 100644 --- a/tools/perf/util/header.h +++ b/tools/perf/util/header.h | |||
@@ -39,6 +39,11 @@ struct perf_file_header { | |||
39 | DECLARE_BITMAP(adds_features, HEADER_FEAT_BITS); | 39 | DECLARE_BITMAP(adds_features, HEADER_FEAT_BITS); |
40 | }; | 40 | }; |
41 | 41 | ||
42 | struct perf_pipe_file_header { | ||
43 | u64 magic; | ||
44 | u64 size; | ||
45 | }; | ||
46 | |||
42 | struct perf_header; | 47 | struct perf_header; |
43 | 48 | ||
44 | int perf_file_header__read(struct perf_file_header *self, | 49 | int perf_file_header__read(struct perf_file_header *self, |
@@ -47,21 +52,22 @@ int perf_file_header__read(struct perf_file_header *self, | |||
47 | struct perf_header { | 52 | struct perf_header { |
48 | int frozen; | 53 | int frozen; |
49 | int attrs, size; | 54 | int attrs, size; |
55 | bool needs_swap; | ||
50 | struct perf_header_attr **attr; | 56 | struct perf_header_attr **attr; |
51 | s64 attr_offset; | 57 | s64 attr_offset; |
52 | u64 data_offset; | 58 | u64 data_offset; |
53 | u64 data_size; | 59 | u64 data_size; |
54 | u64 event_offset; | 60 | u64 event_offset; |
55 | u64 event_size; | 61 | u64 event_size; |
56 | bool needs_swap; | ||
57 | DECLARE_BITMAP(adds_features, HEADER_FEAT_BITS); | 62 | DECLARE_BITMAP(adds_features, HEADER_FEAT_BITS); |
58 | }; | 63 | }; |
59 | 64 | ||
60 | int perf_header__init(struct perf_header *self); | 65 | int perf_header__init(struct perf_header *self); |
61 | void perf_header__exit(struct perf_header *self); | 66 | void perf_header__exit(struct perf_header *self); |
62 | 67 | ||
63 | int perf_header__read(struct perf_header *self, int fd); | 68 | int perf_header__read(struct perf_session *session, int fd); |
64 | int perf_header__write(struct perf_header *self, int fd, bool at_exit); | 69 | int perf_header__write(struct perf_header *self, int fd, bool at_exit); |
70 | int perf_header__write_pipe(int fd); | ||
65 | 71 | ||
66 | int perf_header__add_attr(struct perf_header *self, | 72 | int perf_header__add_attr(struct perf_header *self, |
67 | struct perf_header_attr *attr); | 73 | struct perf_header_attr *attr); |
@@ -89,4 +95,33 @@ int build_id_cache__add_s(const char *sbuild_id, const char *debugdir, | |||
89 | const char *name, bool is_kallsyms); | 95 | const char *name, bool is_kallsyms); |
90 | int build_id_cache__remove_s(const char *sbuild_id, const char *debugdir); | 96 | int build_id_cache__remove_s(const char *sbuild_id, const char *debugdir); |
91 | 97 | ||
98 | int event__synthesize_attr(struct perf_event_attr *attr, u16 ids, u64 *id, | ||
99 | event__handler_t process, | ||
100 | struct perf_session *session); | ||
101 | int event__synthesize_attrs(struct perf_header *self, | ||
102 | event__handler_t process, | ||
103 | struct perf_session *session); | ||
104 | int event__process_attr(event_t *self, struct perf_session *session); | ||
105 | |||
106 | int event__synthesize_event_type(u64 event_id, char *name, | ||
107 | event__handler_t process, | ||
108 | struct perf_session *session); | ||
109 | int event__synthesize_event_types(event__handler_t process, | ||
110 | struct perf_session *session); | ||
111 | int event__process_event_type(event_t *self, | ||
112 | struct perf_session *session); | ||
113 | |||
114 | int event__synthesize_tracing_data(int fd, struct perf_event_attr *pattrs, | ||
115 | int nb_events, | ||
116 | event__handler_t process, | ||
117 | struct perf_session *session); | ||
118 | int event__process_tracing_data(event_t *self, | ||
119 | struct perf_session *session); | ||
120 | |||
121 | int event__synthesize_build_id(struct dso *pos, u16 misc, | ||
122 | event__handler_t process, | ||
123 | struct machine *machine, | ||
124 | struct perf_session *session); | ||
125 | int event__process_build_id(event_t *self, struct perf_session *session); | ||
126 | |||
92 | #endif /* __PERF_HEADER_H */ | 127 | #endif /* __PERF_HEADER_H */ |
diff --git a/tools/perf/util/hist.c b/tools/perf/util/hist.c index 2be33c7dbf03..9a71c94f057a 100644 --- a/tools/perf/util/hist.c +++ b/tools/perf/util/hist.c | |||
@@ -1,3 +1,4 @@ | |||
1 | #include "util.h" | ||
1 | #include "hist.h" | 2 | #include "hist.h" |
2 | #include "session.h" | 3 | #include "session.h" |
3 | #include "sort.h" | 4 | #include "sort.h" |
@@ -8,25 +9,69 @@ struct callchain_param callchain_param = { | |||
8 | .min_percent = 0.5 | 9 | .min_percent = 0.5 |
9 | }; | 10 | }; |
10 | 11 | ||
12 | static void hist_entry__add_cpumode_period(struct hist_entry *self, | ||
13 | unsigned int cpumode, u64 period) | ||
14 | { | ||
15 | switch (cpumode) { | ||
16 | case PERF_RECORD_MISC_KERNEL: | ||
17 | self->period_sys += period; | ||
18 | break; | ||
19 | case PERF_RECORD_MISC_USER: | ||
20 | self->period_us += period; | ||
21 | break; | ||
22 | case PERF_RECORD_MISC_GUEST_KERNEL: | ||
23 | self->period_guest_sys += period; | ||
24 | break; | ||
25 | case PERF_RECORD_MISC_GUEST_USER: | ||
26 | self->period_guest_us += period; | ||
27 | break; | ||
28 | default: | ||
29 | break; | ||
30 | } | ||
31 | } | ||
32 | |||
11 | /* | 33 | /* |
12 | * histogram, sorted on item, collects counts | 34 | * histogram, sorted on item, collects periods |
13 | */ | 35 | */ |
14 | 36 | ||
15 | struct hist_entry *__perf_session__add_hist_entry(struct rb_root *hists, | 37 | static struct hist_entry *hist_entry__new(struct hist_entry *template) |
16 | struct addr_location *al, | 38 | { |
17 | struct symbol *sym_parent, | 39 | size_t callchain_size = symbol_conf.use_callchain ? sizeof(struct callchain_node) : 0; |
18 | u64 count, bool *hit) | 40 | struct hist_entry *self = malloc(sizeof(*self) + callchain_size); |
41 | |||
42 | if (self != NULL) { | ||
43 | *self = *template; | ||
44 | self->nr_events = 1; | ||
45 | if (symbol_conf.use_callchain) | ||
46 | callchain_init(self->callchain); | ||
47 | } | ||
48 | |||
49 | return self; | ||
50 | } | ||
51 | |||
52 | static void hists__inc_nr_entries(struct hists *self, struct hist_entry *entry) | ||
19 | { | 53 | { |
20 | struct rb_node **p = &hists->rb_node; | 54 | if (entry->ms.sym && self->max_sym_namelen < entry->ms.sym->namelen) |
55 | self->max_sym_namelen = entry->ms.sym->namelen; | ||
56 | ++self->nr_entries; | ||
57 | } | ||
58 | |||
59 | struct hist_entry *__hists__add_entry(struct hists *self, | ||
60 | struct addr_location *al, | ||
61 | struct symbol *sym_parent, u64 period) | ||
62 | { | ||
63 | struct rb_node **p = &self->entries.rb_node; | ||
21 | struct rb_node *parent = NULL; | 64 | struct rb_node *parent = NULL; |
22 | struct hist_entry *he; | 65 | struct hist_entry *he; |
23 | struct hist_entry entry = { | 66 | struct hist_entry entry = { |
24 | .thread = al->thread, | 67 | .thread = al->thread, |
25 | .map = al->map, | 68 | .ms = { |
26 | .sym = al->sym, | 69 | .map = al->map, |
70 | .sym = al->sym, | ||
71 | }, | ||
27 | .ip = al->addr, | 72 | .ip = al->addr, |
28 | .level = al->level, | 73 | .level = al->level, |
29 | .count = count, | 74 | .period = period, |
30 | .parent = sym_parent, | 75 | .parent = sym_parent, |
31 | }; | 76 | }; |
32 | int cmp; | 77 | int cmp; |
@@ -38,8 +83,9 @@ struct hist_entry *__perf_session__add_hist_entry(struct rb_root *hists, | |||
38 | cmp = hist_entry__cmp(&entry, he); | 83 | cmp = hist_entry__cmp(&entry, he); |
39 | 84 | ||
40 | if (!cmp) { | 85 | if (!cmp) { |
41 | *hit = true; | 86 | he->period += period; |
42 | return he; | 87 | ++he->nr_events; |
88 | goto out; | ||
43 | } | 89 | } |
44 | 90 | ||
45 | if (cmp < 0) | 91 | if (cmp < 0) |
@@ -48,13 +94,14 @@ struct hist_entry *__perf_session__add_hist_entry(struct rb_root *hists, | |||
48 | p = &(*p)->rb_right; | 94 | p = &(*p)->rb_right; |
49 | } | 95 | } |
50 | 96 | ||
51 | he = malloc(sizeof(*he)); | 97 | he = hist_entry__new(&entry); |
52 | if (!he) | 98 | if (!he) |
53 | return NULL; | 99 | return NULL; |
54 | *he = entry; | ||
55 | rb_link_node(&he->rb_node, parent, p); | 100 | rb_link_node(&he->rb_node, parent, p); |
56 | rb_insert_color(&he->rb_node, hists); | 101 | rb_insert_color(&he->rb_node, &self->entries); |
57 | *hit = false; | 102 | hists__inc_nr_entries(self, he); |
103 | out: | ||
104 | hist_entry__add_cpumode_period(he, al->cpumode, period); | ||
58 | return he; | 105 | return he; |
59 | } | 106 | } |
60 | 107 | ||
@@ -65,7 +112,7 @@ hist_entry__cmp(struct hist_entry *left, struct hist_entry *right) | |||
65 | int64_t cmp = 0; | 112 | int64_t cmp = 0; |
66 | 113 | ||
67 | list_for_each_entry(se, &hist_entry__sort_list, list) { | 114 | list_for_each_entry(se, &hist_entry__sort_list, list) { |
68 | cmp = se->cmp(left, right); | 115 | cmp = se->se_cmp(left, right); |
69 | if (cmp) | 116 | if (cmp) |
70 | break; | 117 | break; |
71 | } | 118 | } |
@@ -82,7 +129,7 @@ hist_entry__collapse(struct hist_entry *left, struct hist_entry *right) | |||
82 | list_for_each_entry(se, &hist_entry__sort_list, list) { | 129 | list_for_each_entry(se, &hist_entry__sort_list, list) { |
83 | int64_t (*f)(struct hist_entry *, struct hist_entry *); | 130 | int64_t (*f)(struct hist_entry *, struct hist_entry *); |
84 | 131 | ||
85 | f = se->collapse ?: se->cmp; | 132 | f = se->se_collapse ?: se->se_cmp; |
86 | 133 | ||
87 | cmp = f(left, right); | 134 | cmp = f(left, right); |
88 | if (cmp) | 135 | if (cmp) |
@@ -101,7 +148,7 @@ void hist_entry__free(struct hist_entry *he) | |||
101 | * collapse the histogram | 148 | * collapse the histogram |
102 | */ | 149 | */ |
103 | 150 | ||
104 | static void collapse__insert_entry(struct rb_root *root, struct hist_entry *he) | 151 | static bool collapse__insert_entry(struct rb_root *root, struct hist_entry *he) |
105 | { | 152 | { |
106 | struct rb_node **p = &root->rb_node; | 153 | struct rb_node **p = &root->rb_node; |
107 | struct rb_node *parent = NULL; | 154 | struct rb_node *parent = NULL; |
@@ -115,9 +162,9 @@ static void collapse__insert_entry(struct rb_root *root, struct hist_entry *he) | |||
115 | cmp = hist_entry__collapse(iter, he); | 162 | cmp = hist_entry__collapse(iter, he); |
116 | 163 | ||
117 | if (!cmp) { | 164 | if (!cmp) { |
118 | iter->count += he->count; | 165 | iter->period += he->period; |
119 | hist_entry__free(he); | 166 | hist_entry__free(he); |
120 | return; | 167 | return false; |
121 | } | 168 | } |
122 | 169 | ||
123 | if (cmp < 0) | 170 | if (cmp < 0) |
@@ -128,9 +175,10 @@ static void collapse__insert_entry(struct rb_root *root, struct hist_entry *he) | |||
128 | 175 | ||
129 | rb_link_node(&he->rb_node, parent, p); | 176 | rb_link_node(&he->rb_node, parent, p); |
130 | rb_insert_color(&he->rb_node, root); | 177 | rb_insert_color(&he->rb_node, root); |
178 | return true; | ||
131 | } | 179 | } |
132 | 180 | ||
133 | void perf_session__collapse_resort(struct rb_root *hists) | 181 | void hists__collapse_resort(struct hists *self) |
134 | { | 182 | { |
135 | struct rb_root tmp; | 183 | struct rb_root tmp; |
136 | struct rb_node *next; | 184 | struct rb_node *next; |
@@ -140,72 +188,77 @@ void perf_session__collapse_resort(struct rb_root *hists) | |||
140 | return; | 188 | return; |
141 | 189 | ||
142 | tmp = RB_ROOT; | 190 | tmp = RB_ROOT; |
143 | next = rb_first(hists); | 191 | next = rb_first(&self->entries); |
192 | self->nr_entries = 0; | ||
193 | self->max_sym_namelen = 0; | ||
144 | 194 | ||
145 | while (next) { | 195 | while (next) { |
146 | n = rb_entry(next, struct hist_entry, rb_node); | 196 | n = rb_entry(next, struct hist_entry, rb_node); |
147 | next = rb_next(&n->rb_node); | 197 | next = rb_next(&n->rb_node); |
148 | 198 | ||
149 | rb_erase(&n->rb_node, hists); | 199 | rb_erase(&n->rb_node, &self->entries); |
150 | collapse__insert_entry(&tmp, n); | 200 | if (collapse__insert_entry(&tmp, n)) |
201 | hists__inc_nr_entries(self, n); | ||
151 | } | 202 | } |
152 | 203 | ||
153 | *hists = tmp; | 204 | self->entries = tmp; |
154 | } | 205 | } |
155 | 206 | ||
156 | /* | 207 | /* |
157 | * reverse the map, sort on count. | 208 | * reverse the map, sort on period. |
158 | */ | 209 | */ |
159 | 210 | ||
160 | static void perf_session__insert_output_hist_entry(struct rb_root *root, | 211 | static void __hists__insert_output_entry(struct rb_root *entries, |
161 | struct hist_entry *he, | 212 | struct hist_entry *he, |
162 | u64 min_callchain_hits) | 213 | u64 min_callchain_hits) |
163 | { | 214 | { |
164 | struct rb_node **p = &root->rb_node; | 215 | struct rb_node **p = &entries->rb_node; |
165 | struct rb_node *parent = NULL; | 216 | struct rb_node *parent = NULL; |
166 | struct hist_entry *iter; | 217 | struct hist_entry *iter; |
167 | 218 | ||
168 | if (symbol_conf.use_callchain) | 219 | if (symbol_conf.use_callchain) |
169 | callchain_param.sort(&he->sorted_chain, &he->callchain, | 220 | callchain_param.sort(&he->sorted_chain, he->callchain, |
170 | min_callchain_hits, &callchain_param); | 221 | min_callchain_hits, &callchain_param); |
171 | 222 | ||
172 | while (*p != NULL) { | 223 | while (*p != NULL) { |
173 | parent = *p; | 224 | parent = *p; |
174 | iter = rb_entry(parent, struct hist_entry, rb_node); | 225 | iter = rb_entry(parent, struct hist_entry, rb_node); |
175 | 226 | ||
176 | if (he->count > iter->count) | 227 | if (he->period > iter->period) |
177 | p = &(*p)->rb_left; | 228 | p = &(*p)->rb_left; |
178 | else | 229 | else |
179 | p = &(*p)->rb_right; | 230 | p = &(*p)->rb_right; |
180 | } | 231 | } |
181 | 232 | ||
182 | rb_link_node(&he->rb_node, parent, p); | 233 | rb_link_node(&he->rb_node, parent, p); |
183 | rb_insert_color(&he->rb_node, root); | 234 | rb_insert_color(&he->rb_node, entries); |
184 | } | 235 | } |
185 | 236 | ||
186 | void perf_session__output_resort(struct rb_root *hists, u64 total_samples) | 237 | void hists__output_resort(struct hists *self) |
187 | { | 238 | { |
188 | struct rb_root tmp; | 239 | struct rb_root tmp; |
189 | struct rb_node *next; | 240 | struct rb_node *next; |
190 | struct hist_entry *n; | 241 | struct hist_entry *n; |
191 | u64 min_callchain_hits; | 242 | u64 min_callchain_hits; |
192 | 243 | ||
193 | min_callchain_hits = | 244 | min_callchain_hits = self->stats.total_period * (callchain_param.min_percent / 100); |
194 | total_samples * (callchain_param.min_percent / 100); | ||
195 | 245 | ||
196 | tmp = RB_ROOT; | 246 | tmp = RB_ROOT; |
197 | next = rb_first(hists); | 247 | next = rb_first(&self->entries); |
248 | |||
249 | self->nr_entries = 0; | ||
250 | self->max_sym_namelen = 0; | ||
198 | 251 | ||
199 | while (next) { | 252 | while (next) { |
200 | n = rb_entry(next, struct hist_entry, rb_node); | 253 | n = rb_entry(next, struct hist_entry, rb_node); |
201 | next = rb_next(&n->rb_node); | 254 | next = rb_next(&n->rb_node); |
202 | 255 | ||
203 | rb_erase(&n->rb_node, hists); | 256 | rb_erase(&n->rb_node, &self->entries); |
204 | perf_session__insert_output_hist_entry(&tmp, n, | 257 | __hists__insert_output_entry(&tmp, n, min_callchain_hits); |
205 | min_callchain_hits); | 258 | hists__inc_nr_entries(self, n); |
206 | } | 259 | } |
207 | 260 | ||
208 | *hists = tmp; | 261 | self->entries = tmp; |
209 | } | 262 | } |
210 | 263 | ||
211 | static size_t callchain__fprintf_left_margin(FILE *fp, int left_margin) | 264 | static size_t callchain__fprintf_left_margin(FILE *fp, int left_margin) |
@@ -237,7 +290,7 @@ static size_t ipchain__fprintf_graph_line(FILE *fp, int depth, int depth_mask, | |||
237 | } | 290 | } |
238 | 291 | ||
239 | static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain, | 292 | static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain, |
240 | int depth, int depth_mask, int count, | 293 | int depth, int depth_mask, int period, |
241 | u64 total_samples, int hits, | 294 | u64 total_samples, int hits, |
242 | int left_margin) | 295 | int left_margin) |
243 | { | 296 | { |
@@ -250,7 +303,7 @@ static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain, | |||
250 | ret += fprintf(fp, "|"); | 303 | ret += fprintf(fp, "|"); |
251 | else | 304 | else |
252 | ret += fprintf(fp, " "); | 305 | ret += fprintf(fp, " "); |
253 | if (!count && i == depth - 1) { | 306 | if (!period && i == depth - 1) { |
254 | double percent; | 307 | double percent; |
255 | 308 | ||
256 | percent = hits * 100.0 / total_samples; | 309 | percent = hits * 100.0 / total_samples; |
@@ -258,8 +311,8 @@ static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain, | |||
258 | } else | 311 | } else |
259 | ret += fprintf(fp, "%s", " "); | 312 | ret += fprintf(fp, "%s", " "); |
260 | } | 313 | } |
261 | if (chain->sym) | 314 | if (chain->ms.sym) |
262 | ret += fprintf(fp, "%s\n", chain->sym->name); | 315 | ret += fprintf(fp, "%s\n", chain->ms.sym->name); |
263 | else | 316 | else |
264 | ret += fprintf(fp, "%p\n", (void *)(long)chain->ip); | 317 | ret += fprintf(fp, "%p\n", (void *)(long)chain->ip); |
265 | 318 | ||
@@ -278,7 +331,7 @@ static void init_rem_hits(void) | |||
278 | } | 331 | } |
279 | 332 | ||
280 | strcpy(rem_sq_bracket->name, "[...]"); | 333 | strcpy(rem_sq_bracket->name, "[...]"); |
281 | rem_hits.sym = rem_sq_bracket; | 334 | rem_hits.ms.sym = rem_sq_bracket; |
282 | } | 335 | } |
283 | 336 | ||
284 | static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | 337 | static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self, |
@@ -293,6 +346,7 @@ static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | |||
293 | u64 remaining; | 346 | u64 remaining; |
294 | size_t ret = 0; | 347 | size_t ret = 0; |
295 | int i; | 348 | int i; |
349 | uint entries_printed = 0; | ||
296 | 350 | ||
297 | if (callchain_param.mode == CHAIN_GRAPH_REL) | 351 | if (callchain_param.mode == CHAIN_GRAPH_REL) |
298 | new_total = self->children_hit; | 352 | new_total = self->children_hit; |
@@ -328,8 +382,6 @@ static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | |||
328 | left_margin); | 382 | left_margin); |
329 | i = 0; | 383 | i = 0; |
330 | list_for_each_entry(chain, &child->val, list) { | 384 | list_for_each_entry(chain, &child->val, list) { |
331 | if (chain->ip >= PERF_CONTEXT_MAX) | ||
332 | continue; | ||
333 | ret += ipchain__fprintf_graph(fp, chain, depth, | 385 | ret += ipchain__fprintf_graph(fp, chain, depth, |
334 | new_depth_mask, i++, | 386 | new_depth_mask, i++, |
335 | new_total, | 387 | new_total, |
@@ -341,6 +393,8 @@ static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | |||
341 | new_depth_mask | (1 << depth), | 393 | new_depth_mask | (1 << depth), |
342 | left_margin); | 394 | left_margin); |
343 | node = next; | 395 | node = next; |
396 | if (++entries_printed == callchain_param.print_limit) | ||
397 | break; | ||
344 | } | 398 | } |
345 | 399 | ||
346 | if (callchain_param.mode == CHAIN_GRAPH_REL && | 400 | if (callchain_param.mode == CHAIN_GRAPH_REL && |
@@ -366,11 +420,9 @@ static size_t callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | |||
366 | bool printed = false; | 420 | bool printed = false; |
367 | int i = 0; | 421 | int i = 0; |
368 | int ret = 0; | 422 | int ret = 0; |
423 | u32 entries_printed = 0; | ||
369 | 424 | ||
370 | list_for_each_entry(chain, &self->val, list) { | 425 | list_for_each_entry(chain, &self->val, list) { |
371 | if (chain->ip >= PERF_CONTEXT_MAX) | ||
372 | continue; | ||
373 | |||
374 | if (!i++ && sort__first_dimension == SORT_SYM) | 426 | if (!i++ && sort__first_dimension == SORT_SYM) |
375 | continue; | 427 | continue; |
376 | 428 | ||
@@ -385,10 +437,13 @@ static size_t callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | |||
385 | } else | 437 | } else |
386 | ret += callchain__fprintf_left_margin(fp, left_margin); | 438 | ret += callchain__fprintf_left_margin(fp, left_margin); |
387 | 439 | ||
388 | if (chain->sym) | 440 | if (chain->ms.sym) |
389 | ret += fprintf(fp, " %s\n", chain->sym->name); | 441 | ret += fprintf(fp, " %s\n", chain->ms.sym->name); |
390 | else | 442 | else |
391 | ret += fprintf(fp, " %p\n", (void *)(long)chain->ip); | 443 | ret += fprintf(fp, " %p\n", (void *)(long)chain->ip); |
444 | |||
445 | if (++entries_printed == callchain_param.print_limit) | ||
446 | break; | ||
392 | } | 447 | } |
393 | 448 | ||
394 | ret += __callchain__fprintf_graph(fp, self, total_samples, 1, 1, left_margin); | 449 | ret += __callchain__fprintf_graph(fp, self, total_samples, 1, 1, left_margin); |
@@ -411,8 +466,8 @@ static size_t callchain__fprintf_flat(FILE *fp, struct callchain_node *self, | |||
411 | list_for_each_entry(chain, &self->val, list) { | 466 | list_for_each_entry(chain, &self->val, list) { |
412 | if (chain->ip >= PERF_CONTEXT_MAX) | 467 | if (chain->ip >= PERF_CONTEXT_MAX) |
413 | continue; | 468 | continue; |
414 | if (chain->sym) | 469 | if (chain->ms.sym) |
415 | ret += fprintf(fp, " %s\n", chain->sym->name); | 470 | ret += fprintf(fp, " %s\n", chain->ms.sym->name); |
416 | else | 471 | else |
417 | ret += fprintf(fp, " %p\n", | 472 | ret += fprintf(fp, " %p\n", |
418 | (void *)(long)chain->ip); | 473 | (void *)(long)chain->ip); |
@@ -427,6 +482,7 @@ static size_t hist_entry_callchain__fprintf(FILE *fp, struct hist_entry *self, | |||
427 | struct rb_node *rb_node; | 482 | struct rb_node *rb_node; |
428 | struct callchain_node *chain; | 483 | struct callchain_node *chain; |
429 | size_t ret = 0; | 484 | size_t ret = 0; |
485 | u32 entries_printed = 0; | ||
430 | 486 | ||
431 | rb_node = rb_first(&self->sorted_chain); | 487 | rb_node = rb_first(&self->sorted_chain); |
432 | while (rb_node) { | 488 | while (rb_node) { |
@@ -449,55 +505,88 @@ static size_t hist_entry_callchain__fprintf(FILE *fp, struct hist_entry *self, | |||
449 | break; | 505 | break; |
450 | } | 506 | } |
451 | ret += fprintf(fp, "\n"); | 507 | ret += fprintf(fp, "\n"); |
508 | if (++entries_printed == callchain_param.print_limit) | ||
509 | break; | ||
452 | rb_node = rb_next(rb_node); | 510 | rb_node = rb_next(rb_node); |
453 | } | 511 | } |
454 | 512 | ||
455 | return ret; | 513 | return ret; |
456 | } | 514 | } |
457 | 515 | ||
458 | static size_t hist_entry__fprintf(struct hist_entry *self, | 516 | int hist_entry__snprintf(struct hist_entry *self, char *s, size_t size, |
459 | struct perf_session *pair_session, | 517 | struct hists *pair_hists, bool show_displacement, |
460 | bool show_displacement, | 518 | long displacement, bool color, u64 session_total) |
461 | long displacement, FILE *fp, | ||
462 | u64 session_total) | ||
463 | { | 519 | { |
464 | struct sort_entry *se; | 520 | struct sort_entry *se; |
465 | u64 count, total; | 521 | u64 period, total, period_sys, period_us, period_guest_sys, period_guest_us; |
466 | const char *sep = symbol_conf.field_sep; | 522 | const char *sep = symbol_conf.field_sep; |
467 | size_t ret; | 523 | int ret; |
468 | 524 | ||
469 | if (symbol_conf.exclude_other && !self->parent) | 525 | if (symbol_conf.exclude_other && !self->parent) |
470 | return 0; | 526 | return 0; |
471 | 527 | ||
472 | if (pair_session) { | 528 | if (pair_hists) { |
473 | count = self->pair ? self->pair->count : 0; | 529 | period = self->pair ? self->pair->period : 0; |
474 | total = pair_session->events_stats.total; | 530 | total = pair_hists->stats.total_period; |
531 | period_sys = self->pair ? self->pair->period_sys : 0; | ||
532 | period_us = self->pair ? self->pair->period_us : 0; | ||
533 | period_guest_sys = self->pair ? self->pair->period_guest_sys : 0; | ||
534 | period_guest_us = self->pair ? self->pair->period_guest_us : 0; | ||
475 | } else { | 535 | } else { |
476 | count = self->count; | 536 | period = self->period; |
477 | total = session_total; | 537 | total = session_total; |
538 | period_sys = self->period_sys; | ||
539 | period_us = self->period_us; | ||
540 | period_guest_sys = self->period_guest_sys; | ||
541 | period_guest_us = self->period_guest_us; | ||
478 | } | 542 | } |
479 | 543 | ||
480 | if (total) | 544 | if (total) { |
481 | ret = percent_color_fprintf(fp, sep ? "%.2f" : " %6.2f%%", | 545 | if (color) |
482 | (count * 100.0) / total); | 546 | ret = percent_color_snprintf(s, size, |
483 | else | 547 | sep ? "%.2f" : " %6.2f%%", |
484 | ret = fprintf(fp, sep ? "%lld" : "%12lld ", count); | 548 | (period * 100.0) / total); |
549 | else | ||
550 | ret = snprintf(s, size, sep ? "%.2f" : " %6.2f%%", | ||
551 | (period * 100.0) / total); | ||
552 | if (symbol_conf.show_cpu_utilization) { | ||
553 | ret += percent_color_snprintf(s + ret, size - ret, | ||
554 | sep ? "%.2f" : " %6.2f%%", | ||
555 | (period_sys * 100.0) / total); | ||
556 | ret += percent_color_snprintf(s + ret, size - ret, | ||
557 | sep ? "%.2f" : " %6.2f%%", | ||
558 | (period_us * 100.0) / total); | ||
559 | if (perf_guest) { | ||
560 | ret += percent_color_snprintf(s + ret, | ||
561 | size - ret, | ||
562 | sep ? "%.2f" : " %6.2f%%", | ||
563 | (period_guest_sys * 100.0) / | ||
564 | total); | ||
565 | ret += percent_color_snprintf(s + ret, | ||
566 | size - ret, | ||
567 | sep ? "%.2f" : " %6.2f%%", | ||
568 | (period_guest_us * 100.0) / | ||
569 | total); | ||
570 | } | ||
571 | } | ||
572 | } else | ||
573 | ret = snprintf(s, size, sep ? "%lld" : "%12lld ", period); | ||
485 | 574 | ||
486 | if (symbol_conf.show_nr_samples) { | 575 | if (symbol_conf.show_nr_samples) { |
487 | if (sep) | 576 | if (sep) |
488 | fprintf(fp, "%c%lld", *sep, count); | 577 | ret += snprintf(s + ret, size - ret, "%c%lld", *sep, period); |
489 | else | 578 | else |
490 | fprintf(fp, "%11lld", count); | 579 | ret += snprintf(s + ret, size - ret, "%11lld", period); |
491 | } | 580 | } |
492 | 581 | ||
493 | if (pair_session) { | 582 | if (pair_hists) { |
494 | char bf[32]; | 583 | char bf[32]; |
495 | double old_percent = 0, new_percent = 0, diff; | 584 | double old_percent = 0, new_percent = 0, diff; |
496 | 585 | ||
497 | if (total > 0) | 586 | if (total > 0) |
498 | old_percent = (count * 100.0) / total; | 587 | old_percent = (period * 100.0) / total; |
499 | if (session_total > 0) | 588 | if (session_total > 0) |
500 | new_percent = (self->count * 100.0) / session_total; | 589 | new_percent = (self->period * 100.0) / session_total; |
501 | 590 | ||
502 | diff = new_percent - old_percent; | 591 | diff = new_percent - old_percent; |
503 | 592 | ||
@@ -507,9 +596,9 @@ static size_t hist_entry__fprintf(struct hist_entry *self, | |||
507 | snprintf(bf, sizeof(bf), " "); | 596 | snprintf(bf, sizeof(bf), " "); |
508 | 597 | ||
509 | if (sep) | 598 | if (sep) |
510 | ret += fprintf(fp, "%c%s", *sep, bf); | 599 | ret += snprintf(s + ret, size - ret, "%c%s", *sep, bf); |
511 | else | 600 | else |
512 | ret += fprintf(fp, "%11.11s", bf); | 601 | ret += snprintf(s + ret, size - ret, "%11.11s", bf); |
513 | 602 | ||
514 | if (show_displacement) { | 603 | if (show_displacement) { |
515 | if (displacement) | 604 | if (displacement) |
@@ -518,9 +607,9 @@ static size_t hist_entry__fprintf(struct hist_entry *self, | |||
518 | snprintf(bf, sizeof(bf), " "); | 607 | snprintf(bf, sizeof(bf), " "); |
519 | 608 | ||
520 | if (sep) | 609 | if (sep) |
521 | fprintf(fp, "%c%s", *sep, bf); | 610 | ret += snprintf(s + ret, size - ret, "%c%s", *sep, bf); |
522 | else | 611 | else |
523 | fprintf(fp, "%6.6s", bf); | 612 | ret += snprintf(s + ret, size - ret, "%6.6s", bf); |
524 | } | 613 | } |
525 | } | 614 | } |
526 | 615 | ||
@@ -528,33 +617,43 @@ static size_t hist_entry__fprintf(struct hist_entry *self, | |||
528 | if (se->elide) | 617 | if (se->elide) |
529 | continue; | 618 | continue; |
530 | 619 | ||
531 | fprintf(fp, "%s", sep ?: " "); | 620 | ret += snprintf(s + ret, size - ret, "%s", sep ?: " "); |
532 | ret += se->print(fp, self, se->width ? *se->width : 0); | 621 | ret += se->se_snprintf(self, s + ret, size - ret, |
622 | se->se_width ? *se->se_width : 0); | ||
533 | } | 623 | } |
534 | 624 | ||
535 | ret += fprintf(fp, "\n"); | 625 | return ret; |
626 | } | ||
536 | 627 | ||
537 | if (symbol_conf.use_callchain) { | 628 | int hist_entry__fprintf(struct hist_entry *self, struct hists *pair_hists, |
538 | int left_margin = 0; | 629 | bool show_displacement, long displacement, FILE *fp, |
630 | u64 session_total) | ||
631 | { | ||
632 | char bf[512]; | ||
633 | hist_entry__snprintf(self, bf, sizeof(bf), pair_hists, | ||
634 | show_displacement, displacement, | ||
635 | true, session_total); | ||
636 | return fprintf(fp, "%s\n", bf); | ||
637 | } | ||
539 | 638 | ||
540 | if (sort__first_dimension == SORT_COMM) { | 639 | static size_t hist_entry__fprintf_callchain(struct hist_entry *self, FILE *fp, |
541 | se = list_first_entry(&hist_entry__sort_list, typeof(*se), | 640 | u64 session_total) |
542 | list); | 641 | { |
543 | left_margin = se->width ? *se->width : 0; | 642 | int left_margin = 0; |
544 | left_margin -= thread__comm_len(self->thread); | ||
545 | } | ||
546 | 643 | ||
547 | hist_entry_callchain__fprintf(fp, self, session_total, | 644 | if (sort__first_dimension == SORT_COMM) { |
548 | left_margin); | 645 | struct sort_entry *se = list_first_entry(&hist_entry__sort_list, |
646 | typeof(*se), list); | ||
647 | left_margin = se->se_width ? *se->se_width : 0; | ||
648 | left_margin -= thread__comm_len(self->thread); | ||
549 | } | 649 | } |
550 | 650 | ||
551 | return ret; | 651 | return hist_entry_callchain__fprintf(fp, self, session_total, |
652 | left_margin); | ||
552 | } | 653 | } |
553 | 654 | ||
554 | size_t perf_session__fprintf_hists(struct rb_root *hists, | 655 | size_t hists__fprintf(struct hists *self, struct hists *pair, |
555 | struct perf_session *pair, | 656 | bool show_displacement, FILE *fp) |
556 | bool show_displacement, FILE *fp, | ||
557 | u64 session_total) | ||
558 | { | 657 | { |
559 | struct sort_entry *se; | 658 | struct sort_entry *se; |
560 | struct rb_node *nd; | 659 | struct rb_node *nd; |
@@ -563,7 +662,7 @@ size_t perf_session__fprintf_hists(struct rb_root *hists, | |||
563 | long displacement = 0; | 662 | long displacement = 0; |
564 | unsigned int width; | 663 | unsigned int width; |
565 | const char *sep = symbol_conf.field_sep; | 664 | const char *sep = symbol_conf.field_sep; |
566 | char *col_width = symbol_conf.col_width_list_str; | 665 | const char *col_width = symbol_conf.col_width_list_str; |
567 | 666 | ||
568 | init_rem_hits(); | 667 | init_rem_hits(); |
569 | 668 | ||
@@ -576,6 +675,24 @@ size_t perf_session__fprintf_hists(struct rb_root *hists, | |||
576 | fputs(" Samples ", fp); | 675 | fputs(" Samples ", fp); |
577 | } | 676 | } |
578 | 677 | ||
678 | if (symbol_conf.show_cpu_utilization) { | ||
679 | if (sep) { | ||
680 | ret += fprintf(fp, "%csys", *sep); | ||
681 | ret += fprintf(fp, "%cus", *sep); | ||
682 | if (perf_guest) { | ||
683 | ret += fprintf(fp, "%cguest sys", *sep); | ||
684 | ret += fprintf(fp, "%cguest us", *sep); | ||
685 | } | ||
686 | } else { | ||
687 | ret += fprintf(fp, " sys "); | ||
688 | ret += fprintf(fp, " us "); | ||
689 | if (perf_guest) { | ||
690 | ret += fprintf(fp, " guest sys "); | ||
691 | ret += fprintf(fp, " guest us "); | ||
692 | } | ||
693 | } | ||
694 | } | ||
695 | |||
579 | if (pair) { | 696 | if (pair) { |
580 | if (sep) | 697 | if (sep) |
581 | ret += fprintf(fp, "%cDelta", *sep); | 698 | ret += fprintf(fp, "%cDelta", *sep); |
@@ -594,22 +711,22 @@ size_t perf_session__fprintf_hists(struct rb_root *hists, | |||
594 | if (se->elide) | 711 | if (se->elide) |
595 | continue; | 712 | continue; |
596 | if (sep) { | 713 | if (sep) { |
597 | fprintf(fp, "%c%s", *sep, se->header); | 714 | fprintf(fp, "%c%s", *sep, se->se_header); |
598 | continue; | 715 | continue; |
599 | } | 716 | } |
600 | width = strlen(se->header); | 717 | width = strlen(se->se_header); |
601 | if (se->width) { | 718 | if (se->se_width) { |
602 | if (symbol_conf.col_width_list_str) { | 719 | if (symbol_conf.col_width_list_str) { |
603 | if (col_width) { | 720 | if (col_width) { |
604 | *se->width = atoi(col_width); | 721 | *se->se_width = atoi(col_width); |
605 | col_width = strchr(col_width, ','); | 722 | col_width = strchr(col_width, ','); |
606 | if (col_width) | 723 | if (col_width) |
607 | ++col_width; | 724 | ++col_width; |
608 | } | 725 | } |
609 | } | 726 | } |
610 | width = *se->width = max(*se->width, width); | 727 | width = *se->se_width = max(*se->se_width, width); |
611 | } | 728 | } |
612 | fprintf(fp, " %*s", width, se->header); | 729 | fprintf(fp, " %*s", width, se->se_header); |
613 | } | 730 | } |
614 | fprintf(fp, "\n"); | 731 | fprintf(fp, "\n"); |
615 | 732 | ||
@@ -631,10 +748,10 @@ size_t perf_session__fprintf_hists(struct rb_root *hists, | |||
631 | continue; | 748 | continue; |
632 | 749 | ||
633 | fprintf(fp, " "); | 750 | fprintf(fp, " "); |
634 | if (se->width) | 751 | if (se->se_width) |
635 | width = *se->width; | 752 | width = *se->se_width; |
636 | else | 753 | else |
637 | width = strlen(se->header); | 754 | width = strlen(se->se_header); |
638 | for (i = 0; i < width; i++) | 755 | for (i = 0; i < width; i++) |
639 | fprintf(fp, "."); | 756 | fprintf(fp, "."); |
640 | } | 757 | } |
@@ -642,7 +759,7 @@ size_t perf_session__fprintf_hists(struct rb_root *hists, | |||
642 | fprintf(fp, "\n#\n"); | 759 | fprintf(fp, "\n#\n"); |
643 | 760 | ||
644 | print_entries: | 761 | print_entries: |
645 | for (nd = rb_first(hists); nd; nd = rb_next(nd)) { | 762 | for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) { |
646 | struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node); | 763 | struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node); |
647 | 764 | ||
648 | if (show_displacement) { | 765 | if (show_displacement) { |
@@ -654,10 +771,14 @@ print_entries: | |||
654 | ++position; | 771 | ++position; |
655 | } | 772 | } |
656 | ret += hist_entry__fprintf(h, pair, show_displacement, | 773 | ret += hist_entry__fprintf(h, pair, show_displacement, |
657 | displacement, fp, session_total); | 774 | displacement, fp, self->stats.total_period); |
658 | if (h->map == NULL && verbose > 1) { | 775 | |
776 | if (symbol_conf.use_callchain) | ||
777 | ret += hist_entry__fprintf_callchain(h, fp, self->stats.total_period); | ||
778 | |||
779 | if (h->ms.map == NULL && verbose > 1) { | ||
659 | __map_groups__fprintf_maps(&h->thread->mg, | 780 | __map_groups__fprintf_maps(&h->thread->mg, |
660 | MAP__FUNCTION, fp); | 781 | MAP__FUNCTION, verbose, fp); |
661 | fprintf(fp, "%.10s end\n", graph_dotted_line); | 782 | fprintf(fp, "%.10s end\n", graph_dotted_line); |
662 | } | 783 | } |
663 | } | 784 | } |
@@ -666,3 +787,271 @@ print_entries: | |||
666 | 787 | ||
667 | return ret; | 788 | return ret; |
668 | } | 789 | } |
790 | |||
791 | enum hist_filter { | ||
792 | HIST_FILTER__DSO, | ||
793 | HIST_FILTER__THREAD, | ||
794 | }; | ||
795 | |||
796 | void hists__filter_by_dso(struct hists *self, const struct dso *dso) | ||
797 | { | ||
798 | struct rb_node *nd; | ||
799 | |||
800 | self->nr_entries = self->stats.total_period = 0; | ||
801 | self->stats.nr_events[PERF_RECORD_SAMPLE] = 0; | ||
802 | self->max_sym_namelen = 0; | ||
803 | |||
804 | for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) { | ||
805 | struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node); | ||
806 | |||
807 | if (symbol_conf.exclude_other && !h->parent) | ||
808 | continue; | ||
809 | |||
810 | if (dso != NULL && (h->ms.map == NULL || h->ms.map->dso != dso)) { | ||
811 | h->filtered |= (1 << HIST_FILTER__DSO); | ||
812 | continue; | ||
813 | } | ||
814 | |||
815 | h->filtered &= ~(1 << HIST_FILTER__DSO); | ||
816 | if (!h->filtered) { | ||
817 | ++self->nr_entries; | ||
818 | self->stats.total_period += h->period; | ||
819 | self->stats.nr_events[PERF_RECORD_SAMPLE] += h->nr_events; | ||
820 | if (h->ms.sym && | ||
821 | self->max_sym_namelen < h->ms.sym->namelen) | ||
822 | self->max_sym_namelen = h->ms.sym->namelen; | ||
823 | } | ||
824 | } | ||
825 | } | ||
826 | |||
827 | void hists__filter_by_thread(struct hists *self, const struct thread *thread) | ||
828 | { | ||
829 | struct rb_node *nd; | ||
830 | |||
831 | self->nr_entries = self->stats.total_period = 0; | ||
832 | self->stats.nr_events[PERF_RECORD_SAMPLE] = 0; | ||
833 | self->max_sym_namelen = 0; | ||
834 | |||
835 | for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) { | ||
836 | struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node); | ||
837 | |||
838 | if (thread != NULL && h->thread != thread) { | ||
839 | h->filtered |= (1 << HIST_FILTER__THREAD); | ||
840 | continue; | ||
841 | } | ||
842 | h->filtered &= ~(1 << HIST_FILTER__THREAD); | ||
843 | if (!h->filtered) { | ||
844 | ++self->nr_entries; | ||
845 | self->stats.total_period += h->period; | ||
846 | self->stats.nr_events[PERF_RECORD_SAMPLE] += h->nr_events; | ||
847 | if (h->ms.sym && | ||
848 | self->max_sym_namelen < h->ms.sym->namelen) | ||
849 | self->max_sym_namelen = h->ms.sym->namelen; | ||
850 | } | ||
851 | } | ||
852 | } | ||
853 | |||
854 | static int symbol__alloc_hist(struct symbol *self) | ||
855 | { | ||
856 | struct sym_priv *priv = symbol__priv(self); | ||
857 | const int size = (sizeof(*priv->hist) + | ||
858 | (self->end - self->start) * sizeof(u64)); | ||
859 | |||
860 | priv->hist = zalloc(size); | ||
861 | return priv->hist == NULL ? -1 : 0; | ||
862 | } | ||
863 | |||
864 | int hist_entry__inc_addr_samples(struct hist_entry *self, u64 ip) | ||
865 | { | ||
866 | unsigned int sym_size, offset; | ||
867 | struct symbol *sym = self->ms.sym; | ||
868 | struct sym_priv *priv; | ||
869 | struct sym_hist *h; | ||
870 | |||
871 | if (!sym || !self->ms.map) | ||
872 | return 0; | ||
873 | |||
874 | priv = symbol__priv(sym); | ||
875 | if (priv->hist == NULL && symbol__alloc_hist(sym) < 0) | ||
876 | return -ENOMEM; | ||
877 | |||
878 | sym_size = sym->end - sym->start; | ||
879 | offset = ip - sym->start; | ||
880 | |||
881 | pr_debug3("%s: ip=%#Lx\n", __func__, self->ms.map->unmap_ip(self->ms.map, ip)); | ||
882 | |||
883 | if (offset >= sym_size) | ||
884 | return 0; | ||
885 | |||
886 | h = priv->hist; | ||
887 | h->sum++; | ||
888 | h->ip[offset]++; | ||
889 | |||
890 | pr_debug3("%#Lx %s: period++ [ip: %#Lx, %#Lx] => %Ld\n", self->ms.sym->start, | ||
891 | self->ms.sym->name, ip, ip - self->ms.sym->start, h->ip[offset]); | ||
892 | return 0; | ||
893 | } | ||
894 | |||
895 | static struct objdump_line *objdump_line__new(s64 offset, char *line) | ||
896 | { | ||
897 | struct objdump_line *self = malloc(sizeof(*self)); | ||
898 | |||
899 | if (self != NULL) { | ||
900 | self->offset = offset; | ||
901 | self->line = line; | ||
902 | } | ||
903 | |||
904 | return self; | ||
905 | } | ||
906 | |||
907 | void objdump_line__free(struct objdump_line *self) | ||
908 | { | ||
909 | free(self->line); | ||
910 | free(self); | ||
911 | } | ||
912 | |||
913 | static void objdump__add_line(struct list_head *head, struct objdump_line *line) | ||
914 | { | ||
915 | list_add_tail(&line->node, head); | ||
916 | } | ||
917 | |||
918 | struct objdump_line *objdump__get_next_ip_line(struct list_head *head, | ||
919 | struct objdump_line *pos) | ||
920 | { | ||
921 | list_for_each_entry_continue(pos, head, node) | ||
922 | if (pos->offset >= 0) | ||
923 | return pos; | ||
924 | |||
925 | return NULL; | ||
926 | } | ||
927 | |||
928 | static int hist_entry__parse_objdump_line(struct hist_entry *self, FILE *file, | ||
929 | struct list_head *head) | ||
930 | { | ||
931 | struct symbol *sym = self->ms.sym; | ||
932 | struct objdump_line *objdump_line; | ||
933 | char *line = NULL, *tmp, *tmp2, *c; | ||
934 | size_t line_len; | ||
935 | s64 line_ip, offset = -1; | ||
936 | |||
937 | if (getline(&line, &line_len, file) < 0) | ||
938 | return -1; | ||
939 | |||
940 | if (!line) | ||
941 | return -1; | ||
942 | |||
943 | while (line_len != 0 && isspace(line[line_len - 1])) | ||
944 | line[--line_len] = '\0'; | ||
945 | |||
946 | c = strchr(line, '\n'); | ||
947 | if (c) | ||
948 | *c = 0; | ||
949 | |||
950 | line_ip = -1; | ||
951 | |||
952 | /* | ||
953 | * Strip leading spaces: | ||
954 | */ | ||
955 | tmp = line; | ||
956 | while (*tmp) { | ||
957 | if (*tmp != ' ') | ||
958 | break; | ||
959 | tmp++; | ||
960 | } | ||
961 | |||
962 | if (*tmp) { | ||
963 | /* | ||
964 | * Parse hexa addresses followed by ':' | ||
965 | */ | ||
966 | line_ip = strtoull(tmp, &tmp2, 16); | ||
967 | if (*tmp2 != ':') | ||
968 | line_ip = -1; | ||
969 | } | ||
970 | |||
971 | if (line_ip != -1) { | ||
972 | u64 start = map__rip_2objdump(self->ms.map, sym->start); | ||
973 | offset = line_ip - start; | ||
974 | } | ||
975 | |||
976 | objdump_line = objdump_line__new(offset, line); | ||
977 | if (objdump_line == NULL) { | ||
978 | free(line); | ||
979 | return -1; | ||
980 | } | ||
981 | objdump__add_line(head, objdump_line); | ||
982 | |||
983 | return 0; | ||
984 | } | ||
985 | |||
986 | int hist_entry__annotate(struct hist_entry *self, struct list_head *head) | ||
987 | { | ||
988 | struct symbol *sym = self->ms.sym; | ||
989 | struct map *map = self->ms.map; | ||
990 | struct dso *dso = map->dso; | ||
991 | const char *filename = dso->long_name; | ||
992 | char command[PATH_MAX * 2]; | ||
993 | FILE *file; | ||
994 | u64 len; | ||
995 | |||
996 | if (!filename) | ||
997 | return -1; | ||
998 | |||
999 | if (dso->origin == DSO__ORIG_KERNEL) { | ||
1000 | if (dso->annotate_warned) | ||
1001 | return 0; | ||
1002 | dso->annotate_warned = 1; | ||
1003 | pr_err("Can't annotate %s: No vmlinux file was found in the " | ||
1004 | "path:\n", sym->name); | ||
1005 | vmlinux_path__fprintf(stderr); | ||
1006 | return -1; | ||
1007 | } | ||
1008 | |||
1009 | pr_debug("%s: filename=%s, sym=%s, start=%#Lx, end=%#Lx\n", __func__, | ||
1010 | filename, sym->name, map->unmap_ip(map, sym->start), | ||
1011 | map->unmap_ip(map, sym->end)); | ||
1012 | |||
1013 | len = sym->end - sym->start; | ||
1014 | |||
1015 | pr_debug("annotating [%p] %30s : [%p] %30s\n", | ||
1016 | dso, dso->long_name, sym, sym->name); | ||
1017 | |||
1018 | snprintf(command, sizeof(command), | ||
1019 | "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s|expand", | ||
1020 | map__rip_2objdump(map, sym->start), | ||
1021 | map__rip_2objdump(map, sym->end), | ||
1022 | filename, filename); | ||
1023 | |||
1024 | pr_debug("Executing: %s\n", command); | ||
1025 | |||
1026 | file = popen(command, "r"); | ||
1027 | if (!file) | ||
1028 | return -1; | ||
1029 | |||
1030 | while (!feof(file)) | ||
1031 | if (hist_entry__parse_objdump_line(self, file, head) < 0) | ||
1032 | break; | ||
1033 | |||
1034 | pclose(file); | ||
1035 | return 0; | ||
1036 | } | ||
1037 | |||
1038 | void hists__inc_nr_events(struct hists *self, u32 type) | ||
1039 | { | ||
1040 | ++self->stats.nr_events[0]; | ||
1041 | ++self->stats.nr_events[type]; | ||
1042 | } | ||
1043 | |||
1044 | size_t hists__fprintf_nr_events(struct hists *self, FILE *fp) | ||
1045 | { | ||
1046 | int i; | ||
1047 | size_t ret = 0; | ||
1048 | |||
1049 | for (i = 0; i < PERF_RECORD_HEADER_MAX; ++i) { | ||
1050 | if (!event__name[i]) | ||
1051 | continue; | ||
1052 | ret += fprintf(fp, "%10s events: %10d\n", | ||
1053 | event__name[i], self->stats.nr_events[i]); | ||
1054 | } | ||
1055 | |||
1056 | return ret; | ||
1057 | } | ||
diff --git a/tools/perf/util/hist.h b/tools/perf/util/hist.h index 16f360cce5bf..6f17dcd8412c 100644 --- a/tools/perf/util/hist.h +++ b/tools/perf/util/hist.h | |||
@@ -6,24 +6,104 @@ | |||
6 | 6 | ||
7 | extern struct callchain_param callchain_param; | 7 | extern struct callchain_param callchain_param; |
8 | 8 | ||
9 | struct perf_session; | ||
10 | struct hist_entry; | 9 | struct hist_entry; |
11 | struct addr_location; | 10 | struct addr_location; |
12 | struct symbol; | 11 | struct symbol; |
13 | struct rb_root; | 12 | struct rb_root; |
14 | 13 | ||
15 | struct hist_entry *__perf_session__add_hist_entry(struct rb_root *hists, | 14 | struct objdump_line { |
16 | struct addr_location *al, | 15 | struct list_head node; |
17 | struct symbol *parent, | 16 | s64 offset; |
18 | u64 count, bool *hit); | 17 | char *line; |
18 | }; | ||
19 | |||
20 | void objdump_line__free(struct objdump_line *self); | ||
21 | struct objdump_line *objdump__get_next_ip_line(struct list_head *head, | ||
22 | struct objdump_line *pos); | ||
23 | |||
24 | struct sym_hist { | ||
25 | u64 sum; | ||
26 | u64 ip[0]; | ||
27 | }; | ||
28 | |||
29 | struct sym_ext { | ||
30 | struct rb_node node; | ||
31 | double percent; | ||
32 | char *path; | ||
33 | }; | ||
34 | |||
35 | struct sym_priv { | ||
36 | struct sym_hist *hist; | ||
37 | struct sym_ext *ext; | ||
38 | }; | ||
39 | |||
40 | /* | ||
41 | * The kernel collects the number of events it couldn't send in a stretch and | ||
42 | * when possible sends this number in a PERF_RECORD_LOST event. The number of | ||
43 | * such "chunks" of lost events is stored in .nr_events[PERF_EVENT_LOST] while | ||
44 | * total_lost tells exactly how many events the kernel in fact lost, i.e. it is | ||
45 | * the sum of all struct lost_event.lost fields reported. | ||
46 | * | ||
47 | * The total_period is needed because by default auto-freq is used, so | ||
48 | * multipling nr_events[PERF_EVENT_SAMPLE] by a frequency isn't possible to get | ||
49 | * the total number of low level events, it is necessary to to sum all struct | ||
50 | * sample_event.period and stash the result in total_period. | ||
51 | */ | ||
52 | struct events_stats { | ||
53 | u64 total_period; | ||
54 | u64 total_lost; | ||
55 | u32 nr_events[PERF_RECORD_HEADER_MAX]; | ||
56 | u32 nr_unknown_events; | ||
57 | }; | ||
58 | |||
59 | struct hists { | ||
60 | struct rb_node rb_node; | ||
61 | struct rb_root entries; | ||
62 | u64 nr_entries; | ||
63 | struct events_stats stats; | ||
64 | u64 config; | ||
65 | u64 event_stream; | ||
66 | u32 type; | ||
67 | u32 max_sym_namelen; | ||
68 | }; | ||
69 | |||
70 | struct hist_entry *__hists__add_entry(struct hists *self, | ||
71 | struct addr_location *al, | ||
72 | struct symbol *parent, u64 period); | ||
19 | extern int64_t hist_entry__cmp(struct hist_entry *, struct hist_entry *); | 73 | extern int64_t hist_entry__cmp(struct hist_entry *, struct hist_entry *); |
20 | extern int64_t hist_entry__collapse(struct hist_entry *, struct hist_entry *); | 74 | extern int64_t hist_entry__collapse(struct hist_entry *, struct hist_entry *); |
75 | int hist_entry__fprintf(struct hist_entry *self, struct hists *pair_hists, | ||
76 | bool show_displacement, long displacement, FILE *fp, | ||
77 | u64 total); | ||
78 | int hist_entry__snprintf(struct hist_entry *self, char *bf, size_t size, | ||
79 | struct hists *pair_hists, bool show_displacement, | ||
80 | long displacement, bool color, u64 total); | ||
21 | void hist_entry__free(struct hist_entry *); | 81 | void hist_entry__free(struct hist_entry *); |
22 | 82 | ||
23 | void perf_session__output_resort(struct rb_root *hists, u64 total_samples); | 83 | void hists__output_resort(struct hists *self); |
24 | void perf_session__collapse_resort(struct rb_root *hists); | 84 | void hists__collapse_resort(struct hists *self); |
25 | size_t perf_session__fprintf_hists(struct rb_root *hists, | 85 | |
26 | struct perf_session *pair, | 86 | void hists__inc_nr_events(struct hists *self, u32 type); |
27 | bool show_displacement, FILE *fp, | 87 | size_t hists__fprintf_nr_events(struct hists *self, FILE *fp); |
28 | u64 session_total); | 88 | |
89 | size_t hists__fprintf(struct hists *self, struct hists *pair, | ||
90 | bool show_displacement, FILE *fp); | ||
91 | |||
92 | int hist_entry__inc_addr_samples(struct hist_entry *self, u64 ip); | ||
93 | int hist_entry__annotate(struct hist_entry *self, struct list_head *head); | ||
94 | |||
95 | void hists__filter_by_dso(struct hists *self, const struct dso *dso); | ||
96 | void hists__filter_by_thread(struct hists *self, const struct thread *thread); | ||
97 | |||
98 | #ifdef NO_NEWT_SUPPORT | ||
99 | static inline int hists__browse(struct hists *self __used, | ||
100 | const char *helpline __used, | ||
101 | const char *input_name __used) | ||
102 | { | ||
103 | return 0; | ||
104 | } | ||
105 | #else | ||
106 | int hists__browse(struct hists *self, const char *helpline, | ||
107 | const char *input_name); | ||
108 | #endif | ||
29 | #endif /* __PERF_HIST_H */ | 109 | #endif /* __PERF_HIST_H */ |
diff --git a/tools/perf/util/hweight.c b/tools/perf/util/hweight.c new file mode 100644 index 000000000000..5c1d0d099f0d --- /dev/null +++ b/tools/perf/util/hweight.c | |||
@@ -0,0 +1,31 @@ | |||
1 | #include <linux/bitops.h> | ||
2 | |||
3 | /** | ||
4 | * hweightN - returns the hamming weight of a N-bit word | ||
5 | * @x: the word to weigh | ||
6 | * | ||
7 | * The Hamming Weight of a number is the total number of bits set in it. | ||
8 | */ | ||
9 | |||
10 | unsigned int hweight32(unsigned int w) | ||
11 | { | ||
12 | unsigned int res = w - ((w >> 1) & 0x55555555); | ||
13 | res = (res & 0x33333333) + ((res >> 2) & 0x33333333); | ||
14 | res = (res + (res >> 4)) & 0x0F0F0F0F; | ||
15 | res = res + (res >> 8); | ||
16 | return (res + (res >> 16)) & 0x000000FF; | ||
17 | } | ||
18 | |||
19 | unsigned long hweight64(__u64 w) | ||
20 | { | ||
21 | #if BITS_PER_LONG == 32 | ||
22 | return hweight32((unsigned int)(w >> 32)) + hweight32((unsigned int)w); | ||
23 | #elif BITS_PER_LONG == 64 | ||
24 | __u64 res = w - ((w >> 1) & 0x5555555555555555ul); | ||
25 | res = (res & 0x3333333333333333ul) + ((res >> 2) & 0x3333333333333333ul); | ||
26 | res = (res + (res >> 4)) & 0x0F0F0F0F0F0F0F0Ful; | ||
27 | res = res + (res >> 8); | ||
28 | res = res + (res >> 16); | ||
29 | return (res + (res >> 32)) & 0x00000000000000FFul; | ||
30 | #endif | ||
31 | } | ||
diff --git a/tools/perf/util/include/asm/bitops.h b/tools/perf/util/include/asm/bitops.h deleted file mode 100644 index 58e9817ffae0..000000000000 --- a/tools/perf/util/include/asm/bitops.h +++ /dev/null | |||
@@ -1,18 +0,0 @@ | |||
1 | #ifndef _PERF_ASM_BITOPS_H_ | ||
2 | #define _PERF_ASM_BITOPS_H_ | ||
3 | |||
4 | #include <sys/types.h> | ||
5 | #include "../../types.h" | ||
6 | #include <linux/compiler.h> | ||
7 | |||
8 | /* CHECKME: Not sure both always match */ | ||
9 | #define BITS_PER_LONG __WORDSIZE | ||
10 | |||
11 | #include "../../../../include/asm-generic/bitops/__fls.h" | ||
12 | #include "../../../../include/asm-generic/bitops/fls.h" | ||
13 | #include "../../../../include/asm-generic/bitops/fls64.h" | ||
14 | #include "../../../../include/asm-generic/bitops/__ffs.h" | ||
15 | #include "../../../../include/asm-generic/bitops/ffz.h" | ||
16 | #include "../../../../include/asm-generic/bitops/hweight.h" | ||
17 | |||
18 | #endif | ||
diff --git a/tools/perf/util/include/asm/hweight.h b/tools/perf/util/include/asm/hweight.h new file mode 100644 index 000000000000..36cf26d434a5 --- /dev/null +++ b/tools/perf/util/include/asm/hweight.h | |||
@@ -0,0 +1,8 @@ | |||
1 | #ifndef PERF_HWEIGHT_H | ||
2 | #define PERF_HWEIGHT_H | ||
3 | |||
4 | #include <linux/types.h> | ||
5 | unsigned int hweight32(unsigned int w); | ||
6 | unsigned long hweight64(__u64 w); | ||
7 | |||
8 | #endif /* PERF_HWEIGHT_H */ | ||
diff --git a/tools/perf/util/include/dwarf-regs.h b/tools/perf/util/include/dwarf-regs.h new file mode 100644 index 000000000000..cf6727e99c44 --- /dev/null +++ b/tools/perf/util/include/dwarf-regs.h | |||
@@ -0,0 +1,8 @@ | |||
1 | #ifndef _PERF_DWARF_REGS_H_ | ||
2 | #define _PERF_DWARF_REGS_H_ | ||
3 | |||
4 | #ifdef DWARF_SUPPORT | ||
5 | const char *get_arch_regstr(unsigned int n); | ||
6 | #endif | ||
7 | |||
8 | #endif | ||
diff --git a/tools/perf/util/include/linux/bitmap.h b/tools/perf/util/include/linux/bitmap.h index 94507639a8c4..eda4416efa0a 100644 --- a/tools/perf/util/include/linux/bitmap.h +++ b/tools/perf/util/include/linux/bitmap.h | |||
@@ -1,3 +1,35 @@ | |||
1 | #include "../../../../include/linux/bitmap.h" | 1 | #ifndef _PERF_BITOPS_H |
2 | #include "../../../../include/asm-generic/bitops/find.h" | 2 | #define _PERF_BITOPS_H |
3 | #include <linux/errno.h> | 3 | |
4 | #include <string.h> | ||
5 | #include <linux/bitops.h> | ||
6 | |||
7 | int __bitmap_weight(const unsigned long *bitmap, int bits); | ||
8 | |||
9 | #define BITMAP_LAST_WORD_MASK(nbits) \ | ||
10 | ( \ | ||
11 | ((nbits) % BITS_PER_LONG) ? \ | ||
12 | (1UL<<((nbits) % BITS_PER_LONG))-1 : ~0UL \ | ||
13 | ) | ||
14 | |||
15 | #define small_const_nbits(nbits) \ | ||
16 | (__builtin_constant_p(nbits) && (nbits) <= BITS_PER_LONG) | ||
17 | |||
18 | static inline void bitmap_zero(unsigned long *dst, int nbits) | ||
19 | { | ||
20 | if (small_const_nbits(nbits)) | ||
21 | *dst = 0UL; | ||
22 | else { | ||
23 | int len = BITS_TO_LONGS(nbits) * sizeof(unsigned long); | ||
24 | memset(dst, 0, len); | ||
25 | } | ||
26 | } | ||
27 | |||
28 | static inline int bitmap_weight(const unsigned long *src, int nbits) | ||
29 | { | ||
30 | if (small_const_nbits(nbits)) | ||
31 | return hweight_long(*src & BITMAP_LAST_WORD_MASK(nbits)); | ||
32 | return __bitmap_weight(src, nbits); | ||
33 | } | ||
34 | |||
35 | #endif /* _PERF_BITOPS_H */ | ||
diff --git a/tools/perf/util/include/linux/bitops.h b/tools/perf/util/include/linux/bitops.h index 8d63116e9435..bb4ac2e05385 100644 --- a/tools/perf/util/include/linux/bitops.h +++ b/tools/perf/util/include/linux/bitops.h | |||
@@ -1,13 +1,12 @@ | |||
1 | #ifndef _PERF_LINUX_BITOPS_H_ | 1 | #ifndef _PERF_LINUX_BITOPS_H_ |
2 | #define _PERF_LINUX_BITOPS_H_ | 2 | #define _PERF_LINUX_BITOPS_H_ |
3 | 3 | ||
4 | #define __KERNEL__ | 4 | #include <linux/kernel.h> |
5 | #include <asm/hweight.h> | ||
5 | 6 | ||
6 | #define CONFIG_GENERIC_FIND_NEXT_BIT | 7 | #define BITS_PER_LONG __WORDSIZE |
7 | #define CONFIG_GENERIC_FIND_FIRST_BIT | 8 | #define BITS_PER_BYTE 8 |
8 | #include "../../../../include/linux/bitops.h" | 9 | #define BITS_TO_LONGS(nr) DIV_ROUND_UP(nr, BITS_PER_BYTE * sizeof(long)) |
9 | |||
10 | #undef __KERNEL__ | ||
11 | 10 | ||
12 | static inline void set_bit(int nr, unsigned long *addr) | 11 | static inline void set_bit(int nr, unsigned long *addr) |
13 | { | 12 | { |
@@ -20,10 +19,9 @@ static __always_inline int test_bit(unsigned int nr, const unsigned long *addr) | |||
20 | (((unsigned long *)addr)[nr / BITS_PER_LONG])) != 0; | 19 | (((unsigned long *)addr)[nr / BITS_PER_LONG])) != 0; |
21 | } | 20 | } |
22 | 21 | ||
23 | unsigned long generic_find_next_zero_le_bit(const unsigned long *addr, unsigned | 22 | static inline unsigned long hweight_long(unsigned long w) |
24 | long size, unsigned long offset); | 23 | { |
25 | 24 | return sizeof(w) == 4 ? hweight32(w) : hweight64(w); | |
26 | unsigned long generic_find_next_le_bit(const unsigned long *addr, unsigned | 25 | } |
27 | long size, unsigned long offset); | ||
28 | 26 | ||
29 | #endif | 27 | #endif |
diff --git a/tools/perf/util/include/linux/compiler.h b/tools/perf/util/include/linux/compiler.h index dfb0713ed47f..791f9dd27ebf 100644 --- a/tools/perf/util/include/linux/compiler.h +++ b/tools/perf/util/include/linux/compiler.h | |||
@@ -7,4 +7,6 @@ | |||
7 | #define __user | 7 | #define __user |
8 | #define __attribute_const__ | 8 | #define __attribute_const__ |
9 | 9 | ||
10 | #define __used __attribute__((__unused__)) | ||
11 | |||
10 | #endif | 12 | #endif |
diff --git a/tools/perf/util/include/linux/kernel.h b/tools/perf/util/include/linux/kernel.h index f2611655ab51..1eb804fd3fbf 100644 --- a/tools/perf/util/include/linux/kernel.h +++ b/tools/perf/util/include/linux/kernel.h | |||
@@ -28,6 +28,8 @@ | |||
28 | (type *)((char *)__mptr - offsetof(type, member)); }) | 28 | (type *)((char *)__mptr - offsetof(type, member)); }) |
29 | #endif | 29 | #endif |
30 | 30 | ||
31 | #define BUILD_BUG_ON_ZERO(e) (sizeof(struct { int:-!!(e); })) | ||
32 | |||
31 | #ifndef max | 33 | #ifndef max |
32 | #define max(x, y) ({ \ | 34 | #define max(x, y) ({ \ |
33 | typeof(x) _max1 = (x); \ | 35 | typeof(x) _max1 = (x); \ |
@@ -85,16 +87,19 @@ simple_strtoul(const char *nptr, char **endptr, int base) | |||
85 | return strtoul(nptr, endptr, base); | 87 | return strtoul(nptr, endptr, base); |
86 | } | 88 | } |
87 | 89 | ||
90 | int eprintf(int level, | ||
91 | const char *fmt, ...) __attribute__((format(printf, 2, 3))); | ||
92 | |||
88 | #ifndef pr_fmt | 93 | #ifndef pr_fmt |
89 | #define pr_fmt(fmt) fmt | 94 | #define pr_fmt(fmt) fmt |
90 | #endif | 95 | #endif |
91 | 96 | ||
92 | #define pr_err(fmt, ...) \ | 97 | #define pr_err(fmt, ...) \ |
93 | do { fprintf(stderr, pr_fmt(fmt), ##__VA_ARGS__); } while (0) | 98 | eprintf(0, pr_fmt(fmt), ##__VA_ARGS__) |
94 | #define pr_warning(fmt, ...) \ | 99 | #define pr_warning(fmt, ...) \ |
95 | do { fprintf(stderr, pr_fmt(fmt), ##__VA_ARGS__); } while (0) | 100 | eprintf(0, pr_fmt(fmt), ##__VA_ARGS__) |
96 | #define pr_info(fmt, ...) \ | 101 | #define pr_info(fmt, ...) \ |
97 | do { fprintf(stderr, pr_fmt(fmt), ##__VA_ARGS__); } while (0) | 102 | eprintf(0, pr_fmt(fmt), ##__VA_ARGS__) |
98 | #define pr_debug(fmt, ...) \ | 103 | #define pr_debug(fmt, ...) \ |
99 | eprintf(1, pr_fmt(fmt), ##__VA_ARGS__) | 104 | eprintf(1, pr_fmt(fmt), ##__VA_ARGS__) |
100 | #define pr_debugN(n, fmt, ...) \ | 105 | #define pr_debugN(n, fmt, ...) \ |
diff --git a/tools/perf/util/map.c b/tools/perf/util/map.c index e509cd59c67d..e672f2fef65b 100644 --- a/tools/perf/util/map.c +++ b/tools/perf/util/map.c | |||
@@ -1,9 +1,11 @@ | |||
1 | #include "event.h" | ||
2 | #include "symbol.h" | 1 | #include "symbol.h" |
2 | #include <errno.h> | ||
3 | #include <limits.h> | ||
3 | #include <stdlib.h> | 4 | #include <stdlib.h> |
4 | #include <string.h> | 5 | #include <string.h> |
5 | #include <stdio.h> | 6 | #include <stdio.h> |
6 | #include "debug.h" | 7 | #include <unistd.h> |
8 | #include "map.h" | ||
7 | 9 | ||
8 | const char *map_type__name[MAP__NR_TYPES] = { | 10 | const char *map_type__name[MAP__NR_TYPES] = { |
9 | [MAP__FUNCTION] = "Functions", | 11 | [MAP__FUNCTION] = "Functions", |
@@ -36,15 +38,16 @@ void map__init(struct map *self, enum map_type type, | |||
36 | self->map_ip = map__map_ip; | 38 | self->map_ip = map__map_ip; |
37 | self->unmap_ip = map__unmap_ip; | 39 | self->unmap_ip = map__unmap_ip; |
38 | RB_CLEAR_NODE(&self->rb_node); | 40 | RB_CLEAR_NODE(&self->rb_node); |
41 | self->groups = NULL; | ||
39 | } | 42 | } |
40 | 43 | ||
41 | struct map *map__new(struct mmap_event *event, enum map_type type, | 44 | struct map *map__new(struct list_head *dsos__list, u64 start, u64 len, |
42 | char *cwd, int cwdlen) | 45 | u64 pgoff, u32 pid, char *filename, |
46 | enum map_type type, char *cwd, int cwdlen) | ||
43 | { | 47 | { |
44 | struct map *self = malloc(sizeof(*self)); | 48 | struct map *self = malloc(sizeof(*self)); |
45 | 49 | ||
46 | if (self != NULL) { | 50 | if (self != NULL) { |
47 | const char *filename = event->filename; | ||
48 | char newfilename[PATH_MAX]; | 51 | char newfilename[PATH_MAX]; |
49 | struct dso *dso; | 52 | struct dso *dso; |
50 | int anon; | 53 | int anon; |
@@ -62,16 +65,15 @@ struct map *map__new(struct mmap_event *event, enum map_type type, | |||
62 | anon = is_anon_memory(filename); | 65 | anon = is_anon_memory(filename); |
63 | 66 | ||
64 | if (anon) { | 67 | if (anon) { |
65 | snprintf(newfilename, sizeof(newfilename), "/tmp/perf-%d.map", event->pid); | 68 | snprintf(newfilename, sizeof(newfilename), "/tmp/perf-%d.map", pid); |
66 | filename = newfilename; | 69 | filename = newfilename; |
67 | } | 70 | } |
68 | 71 | ||
69 | dso = dsos__findnew(filename); | 72 | dso = __dsos__findnew(dsos__list, filename); |
70 | if (dso == NULL) | 73 | if (dso == NULL) |
71 | goto out_delete; | 74 | goto out_delete; |
72 | 75 | ||
73 | map__init(self, type, event->start, event->start + event->len, | 76 | map__init(self, type, start, start + len, pgoff, dso); |
74 | event->pgoff, dso); | ||
75 | 77 | ||
76 | if (anon) { | 78 | if (anon) { |
77 | set_identity: | 79 | set_identity: |
@@ -235,3 +237,392 @@ u64 map__objdump_2ip(struct map *map, u64 addr) | |||
235 | map->unmap_ip(map, addr); /* RIP -> IP */ | 237 | map->unmap_ip(map, addr); /* RIP -> IP */ |
236 | return ip; | 238 | return ip; |
237 | } | 239 | } |
240 | |||
241 | void map_groups__init(struct map_groups *self) | ||
242 | { | ||
243 | int i; | ||
244 | for (i = 0; i < MAP__NR_TYPES; ++i) { | ||
245 | self->maps[i] = RB_ROOT; | ||
246 | INIT_LIST_HEAD(&self->removed_maps[i]); | ||
247 | } | ||
248 | self->machine = NULL; | ||
249 | } | ||
250 | |||
251 | void map_groups__flush(struct map_groups *self) | ||
252 | { | ||
253 | int type; | ||
254 | |||
255 | for (type = 0; type < MAP__NR_TYPES; type++) { | ||
256 | struct rb_root *root = &self->maps[type]; | ||
257 | struct rb_node *next = rb_first(root); | ||
258 | |||
259 | while (next) { | ||
260 | struct map *pos = rb_entry(next, struct map, rb_node); | ||
261 | next = rb_next(&pos->rb_node); | ||
262 | rb_erase(&pos->rb_node, root); | ||
263 | /* | ||
264 | * We may have references to this map, for | ||
265 | * instance in some hist_entry instances, so | ||
266 | * just move them to a separate list. | ||
267 | */ | ||
268 | list_add_tail(&pos->node, &self->removed_maps[pos->type]); | ||
269 | } | ||
270 | } | ||
271 | } | ||
272 | |||
273 | struct symbol *map_groups__find_symbol(struct map_groups *self, | ||
274 | enum map_type type, u64 addr, | ||
275 | struct map **mapp, | ||
276 | symbol_filter_t filter) | ||
277 | { | ||
278 | struct map *map = map_groups__find(self, type, addr); | ||
279 | |||
280 | if (map != NULL) { | ||
281 | if (mapp != NULL) | ||
282 | *mapp = map; | ||
283 | return map__find_symbol(map, map->map_ip(map, addr), filter); | ||
284 | } | ||
285 | |||
286 | return NULL; | ||
287 | } | ||
288 | |||
289 | struct symbol *map_groups__find_symbol_by_name(struct map_groups *self, | ||
290 | enum map_type type, | ||
291 | const char *name, | ||
292 | struct map **mapp, | ||
293 | symbol_filter_t filter) | ||
294 | { | ||
295 | struct rb_node *nd; | ||
296 | |||
297 | for (nd = rb_first(&self->maps[type]); nd; nd = rb_next(nd)) { | ||
298 | struct map *pos = rb_entry(nd, struct map, rb_node); | ||
299 | struct symbol *sym = map__find_symbol_by_name(pos, name, filter); | ||
300 | |||
301 | if (sym == NULL) | ||
302 | continue; | ||
303 | if (mapp != NULL) | ||
304 | *mapp = pos; | ||
305 | return sym; | ||
306 | } | ||
307 | |||
308 | return NULL; | ||
309 | } | ||
310 | |||
311 | size_t __map_groups__fprintf_maps(struct map_groups *self, | ||
312 | enum map_type type, int verbose, FILE *fp) | ||
313 | { | ||
314 | size_t printed = fprintf(fp, "%s:\n", map_type__name[type]); | ||
315 | struct rb_node *nd; | ||
316 | |||
317 | for (nd = rb_first(&self->maps[type]); nd; nd = rb_next(nd)) { | ||
318 | struct map *pos = rb_entry(nd, struct map, rb_node); | ||
319 | printed += fprintf(fp, "Map:"); | ||
320 | printed += map__fprintf(pos, fp); | ||
321 | if (verbose > 2) { | ||
322 | printed += dso__fprintf(pos->dso, type, fp); | ||
323 | printed += fprintf(fp, "--\n"); | ||
324 | } | ||
325 | } | ||
326 | |||
327 | return printed; | ||
328 | } | ||
329 | |||
330 | size_t map_groups__fprintf_maps(struct map_groups *self, int verbose, FILE *fp) | ||
331 | { | ||
332 | size_t printed = 0, i; | ||
333 | for (i = 0; i < MAP__NR_TYPES; ++i) | ||
334 | printed += __map_groups__fprintf_maps(self, i, verbose, fp); | ||
335 | return printed; | ||
336 | } | ||
337 | |||
338 | static size_t __map_groups__fprintf_removed_maps(struct map_groups *self, | ||
339 | enum map_type type, | ||
340 | int verbose, FILE *fp) | ||
341 | { | ||
342 | struct map *pos; | ||
343 | size_t printed = 0; | ||
344 | |||
345 | list_for_each_entry(pos, &self->removed_maps[type], node) { | ||
346 | printed += fprintf(fp, "Map:"); | ||
347 | printed += map__fprintf(pos, fp); | ||
348 | if (verbose > 1) { | ||
349 | printed += dso__fprintf(pos->dso, type, fp); | ||
350 | printed += fprintf(fp, "--\n"); | ||
351 | } | ||
352 | } | ||
353 | return printed; | ||
354 | } | ||
355 | |||
356 | static size_t map_groups__fprintf_removed_maps(struct map_groups *self, | ||
357 | int verbose, FILE *fp) | ||
358 | { | ||
359 | size_t printed = 0, i; | ||
360 | for (i = 0; i < MAP__NR_TYPES; ++i) | ||
361 | printed += __map_groups__fprintf_removed_maps(self, i, verbose, fp); | ||
362 | return printed; | ||
363 | } | ||
364 | |||
365 | size_t map_groups__fprintf(struct map_groups *self, int verbose, FILE *fp) | ||
366 | { | ||
367 | size_t printed = map_groups__fprintf_maps(self, verbose, fp); | ||
368 | printed += fprintf(fp, "Removed maps:\n"); | ||
369 | return printed + map_groups__fprintf_removed_maps(self, verbose, fp); | ||
370 | } | ||
371 | |||
372 | int map_groups__fixup_overlappings(struct map_groups *self, struct map *map, | ||
373 | int verbose, FILE *fp) | ||
374 | { | ||
375 | struct rb_root *root = &self->maps[map->type]; | ||
376 | struct rb_node *next = rb_first(root); | ||
377 | |||
378 | while (next) { | ||
379 | struct map *pos = rb_entry(next, struct map, rb_node); | ||
380 | next = rb_next(&pos->rb_node); | ||
381 | |||
382 | if (!map__overlap(pos, map)) | ||
383 | continue; | ||
384 | |||
385 | if (verbose >= 2) { | ||
386 | fputs("overlapping maps:\n", fp); | ||
387 | map__fprintf(map, fp); | ||
388 | map__fprintf(pos, fp); | ||
389 | } | ||
390 | |||
391 | rb_erase(&pos->rb_node, root); | ||
392 | /* | ||
393 | * We may have references to this map, for instance in some | ||
394 | * hist_entry instances, so just move them to a separate | ||
395 | * list. | ||
396 | */ | ||
397 | list_add_tail(&pos->node, &self->removed_maps[map->type]); | ||
398 | /* | ||
399 | * Now check if we need to create new maps for areas not | ||
400 | * overlapped by the new map: | ||
401 | */ | ||
402 | if (map->start > pos->start) { | ||
403 | struct map *before = map__clone(pos); | ||
404 | |||
405 | if (before == NULL) | ||
406 | return -ENOMEM; | ||
407 | |||
408 | before->end = map->start - 1; | ||
409 | map_groups__insert(self, before); | ||
410 | if (verbose >= 2) | ||
411 | map__fprintf(before, fp); | ||
412 | } | ||
413 | |||
414 | if (map->end < pos->end) { | ||
415 | struct map *after = map__clone(pos); | ||
416 | |||
417 | if (after == NULL) | ||
418 | return -ENOMEM; | ||
419 | |||
420 | after->start = map->end + 1; | ||
421 | map_groups__insert(self, after); | ||
422 | if (verbose >= 2) | ||
423 | map__fprintf(after, fp); | ||
424 | } | ||
425 | } | ||
426 | |||
427 | return 0; | ||
428 | } | ||
429 | |||
430 | /* | ||
431 | * XXX This should not really _copy_ te maps, but refcount them. | ||
432 | */ | ||
433 | int map_groups__clone(struct map_groups *self, | ||
434 | struct map_groups *parent, enum map_type type) | ||
435 | { | ||
436 | struct rb_node *nd; | ||
437 | for (nd = rb_first(&parent->maps[type]); nd; nd = rb_next(nd)) { | ||
438 | struct map *map = rb_entry(nd, struct map, rb_node); | ||
439 | struct map *new = map__clone(map); | ||
440 | if (new == NULL) | ||
441 | return -ENOMEM; | ||
442 | map_groups__insert(self, new); | ||
443 | } | ||
444 | return 0; | ||
445 | } | ||
446 | |||
447 | static u64 map__reloc_map_ip(struct map *map, u64 ip) | ||
448 | { | ||
449 | return ip + (s64)map->pgoff; | ||
450 | } | ||
451 | |||
452 | static u64 map__reloc_unmap_ip(struct map *map, u64 ip) | ||
453 | { | ||
454 | return ip - (s64)map->pgoff; | ||
455 | } | ||
456 | |||
457 | void map__reloc_vmlinux(struct map *self) | ||
458 | { | ||
459 | struct kmap *kmap = map__kmap(self); | ||
460 | s64 reloc; | ||
461 | |||
462 | if (!kmap->ref_reloc_sym || !kmap->ref_reloc_sym->unrelocated_addr) | ||
463 | return; | ||
464 | |||
465 | reloc = (kmap->ref_reloc_sym->unrelocated_addr - | ||
466 | kmap->ref_reloc_sym->addr); | ||
467 | |||
468 | if (!reloc) | ||
469 | return; | ||
470 | |||
471 | self->map_ip = map__reloc_map_ip; | ||
472 | self->unmap_ip = map__reloc_unmap_ip; | ||
473 | self->pgoff = reloc; | ||
474 | } | ||
475 | |||
476 | void maps__insert(struct rb_root *maps, struct map *map) | ||
477 | { | ||
478 | struct rb_node **p = &maps->rb_node; | ||
479 | struct rb_node *parent = NULL; | ||
480 | const u64 ip = map->start; | ||
481 | struct map *m; | ||
482 | |||
483 | while (*p != NULL) { | ||
484 | parent = *p; | ||
485 | m = rb_entry(parent, struct map, rb_node); | ||
486 | if (ip < m->start) | ||
487 | p = &(*p)->rb_left; | ||
488 | else | ||
489 | p = &(*p)->rb_right; | ||
490 | } | ||
491 | |||
492 | rb_link_node(&map->rb_node, parent, p); | ||
493 | rb_insert_color(&map->rb_node, maps); | ||
494 | } | ||
495 | |||
496 | struct map *maps__find(struct rb_root *maps, u64 ip) | ||
497 | { | ||
498 | struct rb_node **p = &maps->rb_node; | ||
499 | struct rb_node *parent = NULL; | ||
500 | struct map *m; | ||
501 | |||
502 | while (*p != NULL) { | ||
503 | parent = *p; | ||
504 | m = rb_entry(parent, struct map, rb_node); | ||
505 | if (ip < m->start) | ||
506 | p = &(*p)->rb_left; | ||
507 | else if (ip > m->end) | ||
508 | p = &(*p)->rb_right; | ||
509 | else | ||
510 | return m; | ||
511 | } | ||
512 | |||
513 | return NULL; | ||
514 | } | ||
515 | |||
516 | int machine__init(struct machine *self, const char *root_dir, pid_t pid) | ||
517 | { | ||
518 | map_groups__init(&self->kmaps); | ||
519 | RB_CLEAR_NODE(&self->rb_node); | ||
520 | INIT_LIST_HEAD(&self->user_dsos); | ||
521 | INIT_LIST_HEAD(&self->kernel_dsos); | ||
522 | |||
523 | self->kmaps.machine = self; | ||
524 | self->pid = pid; | ||
525 | self->root_dir = strdup(root_dir); | ||
526 | return self->root_dir == NULL ? -ENOMEM : 0; | ||
527 | } | ||
528 | |||
529 | struct machine *machines__add(struct rb_root *self, pid_t pid, | ||
530 | const char *root_dir) | ||
531 | { | ||
532 | struct rb_node **p = &self->rb_node; | ||
533 | struct rb_node *parent = NULL; | ||
534 | struct machine *pos, *machine = malloc(sizeof(*machine)); | ||
535 | |||
536 | if (!machine) | ||
537 | return NULL; | ||
538 | |||
539 | if (machine__init(machine, root_dir, pid) != 0) { | ||
540 | free(machine); | ||
541 | return NULL; | ||
542 | } | ||
543 | |||
544 | while (*p != NULL) { | ||
545 | parent = *p; | ||
546 | pos = rb_entry(parent, struct machine, rb_node); | ||
547 | if (pid < pos->pid) | ||
548 | p = &(*p)->rb_left; | ||
549 | else | ||
550 | p = &(*p)->rb_right; | ||
551 | } | ||
552 | |||
553 | rb_link_node(&machine->rb_node, parent, p); | ||
554 | rb_insert_color(&machine->rb_node, self); | ||
555 | |||
556 | return machine; | ||
557 | } | ||
558 | |||
559 | struct machine *machines__find(struct rb_root *self, pid_t pid) | ||
560 | { | ||
561 | struct rb_node **p = &self->rb_node; | ||
562 | struct rb_node *parent = NULL; | ||
563 | struct machine *machine; | ||
564 | struct machine *default_machine = NULL; | ||
565 | |||
566 | while (*p != NULL) { | ||
567 | parent = *p; | ||
568 | machine = rb_entry(parent, struct machine, rb_node); | ||
569 | if (pid < machine->pid) | ||
570 | p = &(*p)->rb_left; | ||
571 | else if (pid > machine->pid) | ||
572 | p = &(*p)->rb_right; | ||
573 | else | ||
574 | return machine; | ||
575 | if (!machine->pid) | ||
576 | default_machine = machine; | ||
577 | } | ||
578 | |||
579 | return default_machine; | ||
580 | } | ||
581 | |||
582 | struct machine *machines__findnew(struct rb_root *self, pid_t pid) | ||
583 | { | ||
584 | char path[PATH_MAX]; | ||
585 | const char *root_dir; | ||
586 | struct machine *machine = machines__find(self, pid); | ||
587 | |||
588 | if (!machine || machine->pid != pid) { | ||
589 | if (pid == HOST_KERNEL_ID || pid == DEFAULT_GUEST_KERNEL_ID) | ||
590 | root_dir = ""; | ||
591 | else { | ||
592 | if (!symbol_conf.guestmount) | ||
593 | goto out; | ||
594 | sprintf(path, "%s/%d", symbol_conf.guestmount, pid); | ||
595 | if (access(path, R_OK)) { | ||
596 | pr_err("Can't access file %s\n", path); | ||
597 | goto out; | ||
598 | } | ||
599 | root_dir = path; | ||
600 | } | ||
601 | machine = machines__add(self, pid, root_dir); | ||
602 | } | ||
603 | |||
604 | out: | ||
605 | return machine; | ||
606 | } | ||
607 | |||
608 | void machines__process(struct rb_root *self, machine__process_t process, void *data) | ||
609 | { | ||
610 | struct rb_node *nd; | ||
611 | |||
612 | for (nd = rb_first(self); nd; nd = rb_next(nd)) { | ||
613 | struct machine *pos = rb_entry(nd, struct machine, rb_node); | ||
614 | process(pos, data); | ||
615 | } | ||
616 | } | ||
617 | |||
618 | char *machine__mmap_name(struct machine *self, char *bf, size_t size) | ||
619 | { | ||
620 | if (machine__is_host(self)) | ||
621 | snprintf(bf, size, "[%s]", "kernel.kallsyms"); | ||
622 | else if (machine__is_default_guest(self)) | ||
623 | snprintf(bf, size, "[%s]", "guest.kernel.kallsyms"); | ||
624 | else | ||
625 | snprintf(bf, size, "[%s.%d]", "guest.kernel.kallsyms", self->pid); | ||
626 | |||
627 | return bf; | ||
628 | } | ||
diff --git a/tools/perf/util/map.h b/tools/perf/util/map.h index b756368076c6..f39134512829 100644 --- a/tools/perf/util/map.h +++ b/tools/perf/util/map.h | |||
@@ -4,7 +4,9 @@ | |||
4 | #include <linux/compiler.h> | 4 | #include <linux/compiler.h> |
5 | #include <linux/list.h> | 5 | #include <linux/list.h> |
6 | #include <linux/rbtree.h> | 6 | #include <linux/rbtree.h> |
7 | #include <linux/types.h> | 7 | #include <stdio.h> |
8 | #include <stdbool.h> | ||
9 | #include "types.h" | ||
8 | 10 | ||
9 | enum map_type { | 11 | enum map_type { |
10 | MAP__FUNCTION = 0, | 12 | MAP__FUNCTION = 0, |
@@ -18,6 +20,7 @@ extern const char *map_type__name[MAP__NR_TYPES]; | |||
18 | struct dso; | 20 | struct dso; |
19 | struct ref_reloc_sym; | 21 | struct ref_reloc_sym; |
20 | struct map_groups; | 22 | struct map_groups; |
23 | struct machine; | ||
21 | 24 | ||
22 | struct map { | 25 | struct map { |
23 | union { | 26 | union { |
@@ -27,6 +30,7 @@ struct map { | |||
27 | u64 start; | 30 | u64 start; |
28 | u64 end; | 31 | u64 end; |
29 | enum map_type type; | 32 | enum map_type type; |
33 | u32 priv; | ||
30 | u64 pgoff; | 34 | u64 pgoff; |
31 | 35 | ||
32 | /* ip -> dso rip */ | 36 | /* ip -> dso rip */ |
@@ -35,6 +39,7 @@ struct map { | |||
35 | u64 (*unmap_ip)(struct map *, u64); | 39 | u64 (*unmap_ip)(struct map *, u64); |
36 | 40 | ||
37 | struct dso *dso; | 41 | struct dso *dso; |
42 | struct map_groups *groups; | ||
38 | }; | 43 | }; |
39 | 44 | ||
40 | struct kmap { | 45 | struct kmap { |
@@ -42,6 +47,32 @@ struct kmap { | |||
42 | struct map_groups *kmaps; | 47 | struct map_groups *kmaps; |
43 | }; | 48 | }; |
44 | 49 | ||
50 | struct map_groups { | ||
51 | struct rb_root maps[MAP__NR_TYPES]; | ||
52 | struct list_head removed_maps[MAP__NR_TYPES]; | ||
53 | struct machine *machine; | ||
54 | }; | ||
55 | |||
56 | /* Native host kernel uses -1 as pid index in machine */ | ||
57 | #define HOST_KERNEL_ID (-1) | ||
58 | #define DEFAULT_GUEST_KERNEL_ID (0) | ||
59 | |||
60 | struct machine { | ||
61 | struct rb_node rb_node; | ||
62 | pid_t pid; | ||
63 | char *root_dir; | ||
64 | struct list_head user_dsos; | ||
65 | struct list_head kernel_dsos; | ||
66 | struct map_groups kmaps; | ||
67 | struct map *vmlinux_maps[MAP__NR_TYPES]; | ||
68 | }; | ||
69 | |||
70 | static inline | ||
71 | struct map *machine__kernel_map(struct machine *self, enum map_type type) | ||
72 | { | ||
73 | return self->vmlinux_maps[type]; | ||
74 | } | ||
75 | |||
45 | static inline struct kmap *map__kmap(struct map *self) | 76 | static inline struct kmap *map__kmap(struct map *self) |
46 | { | 77 | { |
47 | return (struct kmap *)(self + 1); | 78 | return (struct kmap *)(self + 1); |
@@ -68,14 +99,14 @@ u64 map__rip_2objdump(struct map *map, u64 rip); | |||
68 | u64 map__objdump_2ip(struct map *map, u64 addr); | 99 | u64 map__objdump_2ip(struct map *map, u64 addr); |
69 | 100 | ||
70 | struct symbol; | 101 | struct symbol; |
71 | struct mmap_event; | ||
72 | 102 | ||
73 | typedef int (*symbol_filter_t)(struct map *map, struct symbol *sym); | 103 | typedef int (*symbol_filter_t)(struct map *map, struct symbol *sym); |
74 | 104 | ||
75 | void map__init(struct map *self, enum map_type type, | 105 | void map__init(struct map *self, enum map_type type, |
76 | u64 start, u64 end, u64 pgoff, struct dso *dso); | 106 | u64 start, u64 end, u64 pgoff, struct dso *dso); |
77 | struct map *map__new(struct mmap_event *event, enum map_type, | 107 | struct map *map__new(struct list_head *dsos__list, u64 start, u64 len, |
78 | char *cwd, int cwdlen); | 108 | u64 pgoff, u32 pid, char *filename, |
109 | enum map_type type, char *cwd, int cwdlen); | ||
79 | void map__delete(struct map *self); | 110 | void map__delete(struct map *self); |
80 | struct map *map__clone(struct map *self); | 111 | struct map *map__clone(struct map *self); |
81 | int map__overlap(struct map *l, struct map *r); | 112 | int map__overlap(struct map *l, struct map *r); |
@@ -91,4 +122,96 @@ void map__fixup_end(struct map *self); | |||
91 | 122 | ||
92 | void map__reloc_vmlinux(struct map *self); | 123 | void map__reloc_vmlinux(struct map *self); |
93 | 124 | ||
125 | size_t __map_groups__fprintf_maps(struct map_groups *self, | ||
126 | enum map_type type, int verbose, FILE *fp); | ||
127 | void maps__insert(struct rb_root *maps, struct map *map); | ||
128 | struct map *maps__find(struct rb_root *maps, u64 addr); | ||
129 | void map_groups__init(struct map_groups *self); | ||
130 | int map_groups__clone(struct map_groups *self, | ||
131 | struct map_groups *parent, enum map_type type); | ||
132 | size_t map_groups__fprintf(struct map_groups *self, int verbose, FILE *fp); | ||
133 | size_t map_groups__fprintf_maps(struct map_groups *self, int verbose, FILE *fp); | ||
134 | |||
135 | typedef void (*machine__process_t)(struct machine *self, void *data); | ||
136 | |||
137 | void machines__process(struct rb_root *self, machine__process_t process, void *data); | ||
138 | struct machine *machines__add(struct rb_root *self, pid_t pid, | ||
139 | const char *root_dir); | ||
140 | struct machine *machines__find_host(struct rb_root *self); | ||
141 | struct machine *machines__find(struct rb_root *self, pid_t pid); | ||
142 | struct machine *machines__findnew(struct rb_root *self, pid_t pid); | ||
143 | char *machine__mmap_name(struct machine *self, char *bf, size_t size); | ||
144 | int machine__init(struct machine *self, const char *root_dir, pid_t pid); | ||
145 | |||
146 | /* | ||
147 | * Default guest kernel is defined by parameter --guestkallsyms | ||
148 | * and --guestmodules | ||
149 | */ | ||
150 | static inline bool machine__is_default_guest(struct machine *self) | ||
151 | { | ||
152 | return self ? self->pid == DEFAULT_GUEST_KERNEL_ID : false; | ||
153 | } | ||
154 | |||
155 | static inline bool machine__is_host(struct machine *self) | ||
156 | { | ||
157 | return self ? self->pid == HOST_KERNEL_ID : false; | ||
158 | } | ||
159 | |||
160 | static inline void map_groups__insert(struct map_groups *self, struct map *map) | ||
161 | { | ||
162 | maps__insert(&self->maps[map->type], map); | ||
163 | map->groups = self; | ||
164 | } | ||
165 | |||
166 | static inline struct map *map_groups__find(struct map_groups *self, | ||
167 | enum map_type type, u64 addr) | ||
168 | { | ||
169 | return maps__find(&self->maps[type], addr); | ||
170 | } | ||
171 | |||
172 | struct symbol *map_groups__find_symbol(struct map_groups *self, | ||
173 | enum map_type type, u64 addr, | ||
174 | struct map **mapp, | ||
175 | symbol_filter_t filter); | ||
176 | |||
177 | struct symbol *map_groups__find_symbol_by_name(struct map_groups *self, | ||
178 | enum map_type type, | ||
179 | const char *name, | ||
180 | struct map **mapp, | ||
181 | symbol_filter_t filter); | ||
182 | |||
183 | static inline | ||
184 | struct symbol *machine__find_kernel_symbol(struct machine *self, | ||
185 | enum map_type type, u64 addr, | ||
186 | struct map **mapp, | ||
187 | symbol_filter_t filter) | ||
188 | { | ||
189 | return map_groups__find_symbol(&self->kmaps, type, addr, mapp, filter); | ||
190 | } | ||
191 | |||
192 | static inline | ||
193 | struct symbol *machine__find_kernel_function(struct machine *self, u64 addr, | ||
194 | struct map **mapp, | ||
195 | symbol_filter_t filter) | ||
196 | { | ||
197 | return machine__find_kernel_symbol(self, MAP__FUNCTION, addr, mapp, filter); | ||
198 | } | ||
199 | |||
200 | static inline | ||
201 | struct symbol *map_groups__find_function_by_name(struct map_groups *self, | ||
202 | const char *name, struct map **mapp, | ||
203 | symbol_filter_t filter) | ||
204 | { | ||
205 | return map_groups__find_symbol_by_name(self, MAP__FUNCTION, name, mapp, filter); | ||
206 | } | ||
207 | |||
208 | int map_groups__fixup_overlappings(struct map_groups *self, struct map *map, | ||
209 | int verbose, FILE *fp); | ||
210 | |||
211 | struct map *map_groups__find_by_name(struct map_groups *self, | ||
212 | enum map_type type, const char *name); | ||
213 | struct map *machine__new_module(struct machine *self, u64 start, const char *filename); | ||
214 | |||
215 | void map_groups__flush(struct map_groups *self); | ||
216 | |||
94 | #endif /* __PERF_MAP_H */ | 217 | #endif /* __PERF_MAP_H */ |
diff --git a/tools/perf/util/newt.c b/tools/perf/util/newt.c new file mode 100644 index 000000000000..ccb7c5bb269e --- /dev/null +++ b/tools/perf/util/newt.c | |||
@@ -0,0 +1,1084 @@ | |||
1 | #define _GNU_SOURCE | ||
2 | #include <stdio.h> | ||
3 | #undef _GNU_SOURCE | ||
4 | |||
5 | #include <slang.h> | ||
6 | #include <stdlib.h> | ||
7 | #include <newt.h> | ||
8 | #include <sys/ttydefaults.h> | ||
9 | |||
10 | #include "cache.h" | ||
11 | #include "hist.h" | ||
12 | #include "pstack.h" | ||
13 | #include "session.h" | ||
14 | #include "sort.h" | ||
15 | #include "symbol.h" | ||
16 | |||
17 | #if SLANG_VERSION < 20104 | ||
18 | #define slsmg_printf(msg, args...) SLsmg_printf((char *)msg, ##args) | ||
19 | #define slsmg_write_nstring(msg, len) SLsmg_write_nstring((char *)msg, len) | ||
20 | #define sltt_set_color(obj, name, fg, bg) SLtt_set_color(obj,(char *)name,\ | ||
21 | (char *)fg, (char *)bg) | ||
22 | #else | ||
23 | #define slsmg_printf SLsmg_printf | ||
24 | #define slsmg_write_nstring SLsmg_write_nstring | ||
25 | #define sltt_set_color SLtt_set_color | ||
26 | #endif | ||
27 | |||
28 | struct ui_progress { | ||
29 | newtComponent form, scale; | ||
30 | }; | ||
31 | |||
32 | struct ui_progress *ui_progress__new(const char *title, u64 total) | ||
33 | { | ||
34 | struct ui_progress *self = malloc(sizeof(*self)); | ||
35 | |||
36 | if (self != NULL) { | ||
37 | int cols; | ||
38 | newtGetScreenSize(&cols, NULL); | ||
39 | cols -= 4; | ||
40 | newtCenteredWindow(cols, 1, title); | ||
41 | self->form = newtForm(NULL, NULL, 0); | ||
42 | if (self->form == NULL) | ||
43 | goto out_free_self; | ||
44 | self->scale = newtScale(0, 0, cols, total); | ||
45 | if (self->scale == NULL) | ||
46 | goto out_free_form; | ||
47 | newtFormAddComponent(self->form, self->scale); | ||
48 | newtRefresh(); | ||
49 | } | ||
50 | |||
51 | return self; | ||
52 | |||
53 | out_free_form: | ||
54 | newtFormDestroy(self->form); | ||
55 | out_free_self: | ||
56 | free(self); | ||
57 | return NULL; | ||
58 | } | ||
59 | |||
60 | void ui_progress__update(struct ui_progress *self, u64 curr) | ||
61 | { | ||
62 | newtScaleSet(self->scale, curr); | ||
63 | newtRefresh(); | ||
64 | } | ||
65 | |||
66 | void ui_progress__delete(struct ui_progress *self) | ||
67 | { | ||
68 | newtFormDestroy(self->form); | ||
69 | newtPopWindow(); | ||
70 | free(self); | ||
71 | } | ||
72 | |||
73 | static void ui_helpline__pop(void) | ||
74 | { | ||
75 | newtPopHelpLine(); | ||
76 | } | ||
77 | |||
78 | static void ui_helpline__push(const char *msg) | ||
79 | { | ||
80 | newtPushHelpLine(msg); | ||
81 | } | ||
82 | |||
83 | static void ui_helpline__vpush(const char *fmt, va_list ap) | ||
84 | { | ||
85 | char *s; | ||
86 | |||
87 | if (vasprintf(&s, fmt, ap) < 0) | ||
88 | vfprintf(stderr, fmt, ap); | ||
89 | else { | ||
90 | ui_helpline__push(s); | ||
91 | free(s); | ||
92 | } | ||
93 | } | ||
94 | |||
95 | static void ui_helpline__fpush(const char *fmt, ...) | ||
96 | { | ||
97 | va_list ap; | ||
98 | |||
99 | va_start(ap, fmt); | ||
100 | ui_helpline__vpush(fmt, ap); | ||
101 | va_end(ap); | ||
102 | } | ||
103 | |||
104 | static void ui_helpline__puts(const char *msg) | ||
105 | { | ||
106 | ui_helpline__pop(); | ||
107 | ui_helpline__push(msg); | ||
108 | } | ||
109 | |||
110 | static char browser__last_msg[1024]; | ||
111 | |||
112 | int browser__show_help(const char *format, va_list ap) | ||
113 | { | ||
114 | int ret; | ||
115 | static int backlog; | ||
116 | |||
117 | ret = vsnprintf(browser__last_msg + backlog, | ||
118 | sizeof(browser__last_msg) - backlog, format, ap); | ||
119 | backlog += ret; | ||
120 | |||
121 | if (browser__last_msg[backlog - 1] == '\n') { | ||
122 | ui_helpline__puts(browser__last_msg); | ||
123 | newtRefresh(); | ||
124 | backlog = 0; | ||
125 | } | ||
126 | |||
127 | return ret; | ||
128 | } | ||
129 | |||
130 | static void newt_form__set_exit_keys(newtComponent self) | ||
131 | { | ||
132 | newtFormAddHotKey(self, NEWT_KEY_LEFT); | ||
133 | newtFormAddHotKey(self, NEWT_KEY_ESCAPE); | ||
134 | newtFormAddHotKey(self, 'Q'); | ||
135 | newtFormAddHotKey(self, 'q'); | ||
136 | newtFormAddHotKey(self, CTRL('c')); | ||
137 | } | ||
138 | |||
139 | static newtComponent newt_form__new(void) | ||
140 | { | ||
141 | newtComponent self = newtForm(NULL, NULL, 0); | ||
142 | if (self) | ||
143 | newt_form__set_exit_keys(self); | ||
144 | return self; | ||
145 | } | ||
146 | |||
147 | static int popup_menu(int argc, char * const argv[]) | ||
148 | { | ||
149 | struct newtExitStruct es; | ||
150 | int i, rc = -1, max_len = 5; | ||
151 | newtComponent listbox, form = newt_form__new(); | ||
152 | |||
153 | if (form == NULL) | ||
154 | return -1; | ||
155 | |||
156 | listbox = newtListbox(0, 0, argc, NEWT_FLAG_RETURNEXIT); | ||
157 | if (listbox == NULL) | ||
158 | goto out_destroy_form; | ||
159 | |||
160 | newtFormAddComponent(form, listbox); | ||
161 | |||
162 | for (i = 0; i < argc; ++i) { | ||
163 | int len = strlen(argv[i]); | ||
164 | if (len > max_len) | ||
165 | max_len = len; | ||
166 | if (newtListboxAddEntry(listbox, argv[i], (void *)(long)i)) | ||
167 | goto out_destroy_form; | ||
168 | } | ||
169 | |||
170 | newtCenteredWindow(max_len, argc, NULL); | ||
171 | newtFormRun(form, &es); | ||
172 | rc = newtListboxGetCurrent(listbox) - NULL; | ||
173 | if (es.reason == NEWT_EXIT_HOTKEY) | ||
174 | rc = -1; | ||
175 | newtPopWindow(); | ||
176 | out_destroy_form: | ||
177 | newtFormDestroy(form); | ||
178 | return rc; | ||
179 | } | ||
180 | |||
181 | static int ui__help_window(const char *text) | ||
182 | { | ||
183 | struct newtExitStruct es; | ||
184 | newtComponent tb, form = newt_form__new(); | ||
185 | int rc = -1; | ||
186 | int max_len = 0, nr_lines = 0; | ||
187 | const char *t; | ||
188 | |||
189 | if (form == NULL) | ||
190 | return -1; | ||
191 | |||
192 | t = text; | ||
193 | while (1) { | ||
194 | const char *sep = strchr(t, '\n'); | ||
195 | int len; | ||
196 | |||
197 | if (sep == NULL) | ||
198 | sep = strchr(t, '\0'); | ||
199 | len = sep - t; | ||
200 | if (max_len < len) | ||
201 | max_len = len; | ||
202 | ++nr_lines; | ||
203 | if (*sep == '\0') | ||
204 | break; | ||
205 | t = sep + 1; | ||
206 | } | ||
207 | |||
208 | tb = newtTextbox(0, 0, max_len, nr_lines, 0); | ||
209 | if (tb == NULL) | ||
210 | goto out_destroy_form; | ||
211 | |||
212 | newtTextboxSetText(tb, text); | ||
213 | newtFormAddComponent(form, tb); | ||
214 | newtCenteredWindow(max_len, nr_lines, NULL); | ||
215 | newtFormRun(form, &es); | ||
216 | newtPopWindow(); | ||
217 | rc = 0; | ||
218 | out_destroy_form: | ||
219 | newtFormDestroy(form); | ||
220 | return rc; | ||
221 | } | ||
222 | |||
223 | static bool dialog_yesno(const char *msg) | ||
224 | { | ||
225 | /* newtWinChoice should really be accepting const char pointers... */ | ||
226 | char yes[] = "Yes", no[] = "No"; | ||
227 | return newtWinChoice(NULL, yes, no, (char *)msg) == 1; | ||
228 | } | ||
229 | |||
230 | #define HE_COLORSET_TOP 50 | ||
231 | #define HE_COLORSET_MEDIUM 51 | ||
232 | #define HE_COLORSET_NORMAL 52 | ||
233 | #define HE_COLORSET_SELECTED 53 | ||
234 | #define HE_COLORSET_CODE 54 | ||
235 | |||
236 | static int ui_browser__percent_color(double percent, bool current) | ||
237 | { | ||
238 | if (current) | ||
239 | return HE_COLORSET_SELECTED; | ||
240 | if (percent >= MIN_RED) | ||
241 | return HE_COLORSET_TOP; | ||
242 | if (percent >= MIN_GREEN) | ||
243 | return HE_COLORSET_MEDIUM; | ||
244 | return HE_COLORSET_NORMAL; | ||
245 | } | ||
246 | |||
247 | struct ui_browser { | ||
248 | newtComponent form, sb; | ||
249 | u64 index, first_visible_entry_idx; | ||
250 | void *first_visible_entry, *entries; | ||
251 | u16 top, left, width, height; | ||
252 | void *priv; | ||
253 | u32 nr_entries; | ||
254 | }; | ||
255 | |||
256 | static void ui_browser__refresh_dimensions(struct ui_browser *self) | ||
257 | { | ||
258 | int cols, rows; | ||
259 | newtGetScreenSize(&cols, &rows); | ||
260 | |||
261 | if (self->width > cols - 4) | ||
262 | self->width = cols - 4; | ||
263 | self->height = rows - 5; | ||
264 | if (self->height > self->nr_entries) | ||
265 | self->height = self->nr_entries; | ||
266 | self->top = (rows - self->height) / 2; | ||
267 | self->left = (cols - self->width) / 2; | ||
268 | } | ||
269 | |||
270 | static void ui_browser__reset_index(struct ui_browser *self) | ||
271 | { | ||
272 | self->index = self->first_visible_entry_idx = 0; | ||
273 | self->first_visible_entry = NULL; | ||
274 | } | ||
275 | |||
276 | static int objdump_line__show(struct objdump_line *self, struct list_head *head, | ||
277 | int width, struct hist_entry *he, int len, | ||
278 | bool current_entry) | ||
279 | { | ||
280 | if (self->offset != -1) { | ||
281 | struct symbol *sym = he->ms.sym; | ||
282 | unsigned int hits = 0; | ||
283 | double percent = 0.0; | ||
284 | int color; | ||
285 | struct sym_priv *priv = symbol__priv(sym); | ||
286 | struct sym_ext *sym_ext = priv->ext; | ||
287 | struct sym_hist *h = priv->hist; | ||
288 | s64 offset = self->offset; | ||
289 | struct objdump_line *next = objdump__get_next_ip_line(head, self); | ||
290 | |||
291 | while (offset < (s64)len && | ||
292 | (next == NULL || offset < next->offset)) { | ||
293 | if (sym_ext) { | ||
294 | percent += sym_ext[offset].percent; | ||
295 | } else | ||
296 | hits += h->ip[offset]; | ||
297 | |||
298 | ++offset; | ||
299 | } | ||
300 | |||
301 | if (sym_ext == NULL && h->sum) | ||
302 | percent = 100.0 * hits / h->sum; | ||
303 | |||
304 | color = ui_browser__percent_color(percent, current_entry); | ||
305 | SLsmg_set_color(color); | ||
306 | slsmg_printf(" %7.2f ", percent); | ||
307 | if (!current_entry) | ||
308 | SLsmg_set_color(HE_COLORSET_CODE); | ||
309 | } else { | ||
310 | int color = ui_browser__percent_color(0, current_entry); | ||
311 | SLsmg_set_color(color); | ||
312 | slsmg_write_nstring(" ", 9); | ||
313 | } | ||
314 | |||
315 | SLsmg_write_char(':'); | ||
316 | slsmg_write_nstring(" ", 8); | ||
317 | if (!*self->line) | ||
318 | slsmg_write_nstring(" ", width - 18); | ||
319 | else | ||
320 | slsmg_write_nstring(self->line, width - 18); | ||
321 | |||
322 | return 0; | ||
323 | } | ||
324 | |||
325 | static int ui_browser__refresh_entries(struct ui_browser *self) | ||
326 | { | ||
327 | struct objdump_line *pos; | ||
328 | struct list_head *head = self->entries; | ||
329 | struct hist_entry *he = self->priv; | ||
330 | int row = 0; | ||
331 | int len = he->ms.sym->end - he->ms.sym->start; | ||
332 | |||
333 | if (self->first_visible_entry == NULL || self->first_visible_entry == self->entries) | ||
334 | self->first_visible_entry = head->next; | ||
335 | |||
336 | pos = list_entry(self->first_visible_entry, struct objdump_line, node); | ||
337 | |||
338 | list_for_each_entry_from(pos, head, node) { | ||
339 | bool current_entry = (self->first_visible_entry_idx + row) == self->index; | ||
340 | SLsmg_gotorc(self->top + row, self->left); | ||
341 | objdump_line__show(pos, head, self->width, | ||
342 | he, len, current_entry); | ||
343 | if (++row == self->height) | ||
344 | break; | ||
345 | } | ||
346 | |||
347 | SLsmg_set_color(HE_COLORSET_NORMAL); | ||
348 | SLsmg_fill_region(self->top + row, self->left, | ||
349 | self->height - row, self->width, ' '); | ||
350 | |||
351 | return 0; | ||
352 | } | ||
353 | |||
354 | static int ui_browser__run(struct ui_browser *self, const char *title, | ||
355 | struct newtExitStruct *es) | ||
356 | { | ||
357 | if (self->form) { | ||
358 | newtFormDestroy(self->form); | ||
359 | newtPopWindow(); | ||
360 | } | ||
361 | |||
362 | ui_browser__refresh_dimensions(self); | ||
363 | newtCenteredWindow(self->width + 2, self->height, title); | ||
364 | self->form = newt_form__new(); | ||
365 | if (self->form == NULL) | ||
366 | return -1; | ||
367 | |||
368 | self->sb = newtVerticalScrollbar(self->width + 1, 0, self->height, | ||
369 | HE_COLORSET_NORMAL, | ||
370 | HE_COLORSET_SELECTED); | ||
371 | if (self->sb == NULL) | ||
372 | return -1; | ||
373 | |||
374 | newtFormAddHotKey(self->form, NEWT_KEY_UP); | ||
375 | newtFormAddHotKey(self->form, NEWT_KEY_DOWN); | ||
376 | newtFormAddHotKey(self->form, NEWT_KEY_PGUP); | ||
377 | newtFormAddHotKey(self->form, NEWT_KEY_PGDN); | ||
378 | newtFormAddHotKey(self->form, NEWT_KEY_HOME); | ||
379 | newtFormAddHotKey(self->form, NEWT_KEY_END); | ||
380 | |||
381 | if (ui_browser__refresh_entries(self) < 0) | ||
382 | return -1; | ||
383 | newtFormAddComponent(self->form, self->sb); | ||
384 | |||
385 | while (1) { | ||
386 | unsigned int offset; | ||
387 | |||
388 | newtFormRun(self->form, es); | ||
389 | |||
390 | if (es->reason != NEWT_EXIT_HOTKEY) | ||
391 | break; | ||
392 | switch (es->u.key) { | ||
393 | case NEWT_KEY_DOWN: | ||
394 | if (self->index == self->nr_entries - 1) | ||
395 | break; | ||
396 | ++self->index; | ||
397 | if (self->index == self->first_visible_entry_idx + self->height) { | ||
398 | struct list_head *pos = self->first_visible_entry; | ||
399 | ++self->first_visible_entry_idx; | ||
400 | self->first_visible_entry = pos->next; | ||
401 | } | ||
402 | break; | ||
403 | case NEWT_KEY_UP: | ||
404 | if (self->index == 0) | ||
405 | break; | ||
406 | --self->index; | ||
407 | if (self->index < self->first_visible_entry_idx) { | ||
408 | struct list_head *pos = self->first_visible_entry; | ||
409 | --self->first_visible_entry_idx; | ||
410 | self->first_visible_entry = pos->prev; | ||
411 | } | ||
412 | break; | ||
413 | case NEWT_KEY_PGDN: | ||
414 | if (self->first_visible_entry_idx + self->height > self->nr_entries - 1) | ||
415 | break; | ||
416 | |||
417 | offset = self->height; | ||
418 | if (self->index + offset > self->nr_entries - 1) | ||
419 | offset = self->nr_entries - 1 - self->index; | ||
420 | self->index += offset; | ||
421 | self->first_visible_entry_idx += offset; | ||
422 | |||
423 | while (offset--) { | ||
424 | struct list_head *pos = self->first_visible_entry; | ||
425 | self->first_visible_entry = pos->next; | ||
426 | } | ||
427 | |||
428 | break; | ||
429 | case NEWT_KEY_PGUP: | ||
430 | if (self->first_visible_entry_idx == 0) | ||
431 | break; | ||
432 | |||
433 | if (self->first_visible_entry_idx < self->height) | ||
434 | offset = self->first_visible_entry_idx; | ||
435 | else | ||
436 | offset = self->height; | ||
437 | |||
438 | self->index -= offset; | ||
439 | self->first_visible_entry_idx -= offset; | ||
440 | |||
441 | while (offset--) { | ||
442 | struct list_head *pos = self->first_visible_entry; | ||
443 | self->first_visible_entry = pos->prev; | ||
444 | } | ||
445 | break; | ||
446 | case NEWT_KEY_HOME: | ||
447 | ui_browser__reset_index(self); | ||
448 | break; | ||
449 | case NEWT_KEY_END: { | ||
450 | struct list_head *head = self->entries; | ||
451 | offset = self->height - 1; | ||
452 | |||
453 | if (offset > self->nr_entries) | ||
454 | offset = self->nr_entries; | ||
455 | |||
456 | self->index = self->first_visible_entry_idx = self->nr_entries - 1 - offset; | ||
457 | self->first_visible_entry = head->prev; | ||
458 | while (offset-- != 0) { | ||
459 | struct list_head *pos = self->first_visible_entry; | ||
460 | self->first_visible_entry = pos->prev; | ||
461 | } | ||
462 | } | ||
463 | break; | ||
464 | case NEWT_KEY_ESCAPE: | ||
465 | case NEWT_KEY_LEFT: | ||
466 | case CTRL('c'): | ||
467 | case 'Q': | ||
468 | case 'q': | ||
469 | return 0; | ||
470 | default: | ||
471 | continue; | ||
472 | } | ||
473 | if (ui_browser__refresh_entries(self) < 0) | ||
474 | return -1; | ||
475 | } | ||
476 | return 0; | ||
477 | } | ||
478 | |||
479 | /* | ||
480 | * When debugging newt problems it was useful to be able to "unroll" | ||
481 | * the calls to newtCheckBoxTreeAdd{Array,Item}, so that we can generate | ||
482 | * a source file with the sequence of calls to these methods, to then | ||
483 | * tweak the arrays to get the intended results, so I'm keeping this code | ||
484 | * here, may be useful again in the future. | ||
485 | */ | ||
486 | #undef NEWT_DEBUG | ||
487 | |||
488 | static void newt_checkbox_tree__add(newtComponent tree, const char *str, | ||
489 | void *priv, int *indexes) | ||
490 | { | ||
491 | #ifdef NEWT_DEBUG | ||
492 | /* Print the newtCheckboxTreeAddArray to tinker with its index arrays */ | ||
493 | int i = 0, len = 40 - strlen(str); | ||
494 | |||
495 | fprintf(stderr, | ||
496 | "\tnewtCheckboxTreeAddItem(tree, %*.*s\"%s\", (void *)%p, 0, ", | ||
497 | len, len, " ", str, priv); | ||
498 | while (indexes[i] != NEWT_ARG_LAST) { | ||
499 | if (indexes[i] != NEWT_ARG_APPEND) | ||
500 | fprintf(stderr, " %d,", indexes[i]); | ||
501 | else | ||
502 | fprintf(stderr, " %s,", "NEWT_ARG_APPEND"); | ||
503 | ++i; | ||
504 | } | ||
505 | fprintf(stderr, " %s", " NEWT_ARG_LAST);\n"); | ||
506 | fflush(stderr); | ||
507 | #endif | ||
508 | newtCheckboxTreeAddArray(tree, str, priv, 0, indexes); | ||
509 | } | ||
510 | |||
511 | static char *callchain_list__sym_name(struct callchain_list *self, | ||
512 | char *bf, size_t bfsize) | ||
513 | { | ||
514 | if (self->ms.sym) | ||
515 | return self->ms.sym->name; | ||
516 | |||
517 | snprintf(bf, bfsize, "%#Lx", self->ip); | ||
518 | return bf; | ||
519 | } | ||
520 | |||
521 | static void __callchain__append_graph_browser(struct callchain_node *self, | ||
522 | newtComponent tree, u64 total, | ||
523 | int *indexes, int depth) | ||
524 | { | ||
525 | struct rb_node *node; | ||
526 | u64 new_total, remaining; | ||
527 | int idx = 0; | ||
528 | |||
529 | if (callchain_param.mode == CHAIN_GRAPH_REL) | ||
530 | new_total = self->children_hit; | ||
531 | else | ||
532 | new_total = total; | ||
533 | |||
534 | remaining = new_total; | ||
535 | node = rb_first(&self->rb_root); | ||
536 | while (node) { | ||
537 | struct callchain_node *child = rb_entry(node, struct callchain_node, rb_node); | ||
538 | struct rb_node *next = rb_next(node); | ||
539 | u64 cumul = cumul_hits(child); | ||
540 | struct callchain_list *chain; | ||
541 | int first = true, printed = 0; | ||
542 | int chain_idx = -1; | ||
543 | remaining -= cumul; | ||
544 | |||
545 | indexes[depth] = NEWT_ARG_APPEND; | ||
546 | indexes[depth + 1] = NEWT_ARG_LAST; | ||
547 | |||
548 | list_for_each_entry(chain, &child->val, list) { | ||
549 | char ipstr[BITS_PER_LONG / 4 + 1], | ||
550 | *alloc_str = NULL; | ||
551 | const char *str = callchain_list__sym_name(chain, ipstr, sizeof(ipstr)); | ||
552 | |||
553 | if (first) { | ||
554 | double percent = cumul * 100.0 / new_total; | ||
555 | |||
556 | first = false; | ||
557 | if (asprintf(&alloc_str, "%2.2f%% %s", percent, str) < 0) | ||
558 | str = "Not enough memory!"; | ||
559 | else | ||
560 | str = alloc_str; | ||
561 | } else { | ||
562 | indexes[depth] = idx; | ||
563 | indexes[depth + 1] = NEWT_ARG_APPEND; | ||
564 | indexes[depth + 2] = NEWT_ARG_LAST; | ||
565 | ++chain_idx; | ||
566 | } | ||
567 | newt_checkbox_tree__add(tree, str, &chain->ms, indexes); | ||
568 | free(alloc_str); | ||
569 | ++printed; | ||
570 | } | ||
571 | |||
572 | indexes[depth] = idx; | ||
573 | if (chain_idx != -1) | ||
574 | indexes[depth + 1] = chain_idx; | ||
575 | if (printed != 0) | ||
576 | ++idx; | ||
577 | __callchain__append_graph_browser(child, tree, new_total, indexes, | ||
578 | depth + (chain_idx != -1 ? 2 : 1)); | ||
579 | node = next; | ||
580 | } | ||
581 | } | ||
582 | |||
583 | static void callchain__append_graph_browser(struct callchain_node *self, | ||
584 | newtComponent tree, u64 total, | ||
585 | int *indexes, int parent_idx) | ||
586 | { | ||
587 | struct callchain_list *chain; | ||
588 | int i = 0; | ||
589 | |||
590 | indexes[1] = NEWT_ARG_APPEND; | ||
591 | indexes[2] = NEWT_ARG_LAST; | ||
592 | |||
593 | list_for_each_entry(chain, &self->val, list) { | ||
594 | char ipstr[BITS_PER_LONG / 4 + 1], *str; | ||
595 | |||
596 | if (chain->ip >= PERF_CONTEXT_MAX) | ||
597 | continue; | ||
598 | |||
599 | if (!i++ && sort__first_dimension == SORT_SYM) | ||
600 | continue; | ||
601 | |||
602 | str = callchain_list__sym_name(chain, ipstr, sizeof(ipstr)); | ||
603 | newt_checkbox_tree__add(tree, str, &chain->ms, indexes); | ||
604 | } | ||
605 | |||
606 | indexes[1] = parent_idx; | ||
607 | indexes[2] = NEWT_ARG_APPEND; | ||
608 | indexes[3] = NEWT_ARG_LAST; | ||
609 | __callchain__append_graph_browser(self, tree, total, indexes, 2); | ||
610 | } | ||
611 | |||
612 | static void hist_entry__append_callchain_browser(struct hist_entry *self, | ||
613 | newtComponent tree, u64 total, int parent_idx) | ||
614 | { | ||
615 | struct rb_node *rb_node; | ||
616 | int indexes[1024] = { [0] = parent_idx, }; | ||
617 | int idx = 0; | ||
618 | struct callchain_node *chain; | ||
619 | |||
620 | rb_node = rb_first(&self->sorted_chain); | ||
621 | while (rb_node) { | ||
622 | chain = rb_entry(rb_node, struct callchain_node, rb_node); | ||
623 | switch (callchain_param.mode) { | ||
624 | case CHAIN_FLAT: | ||
625 | break; | ||
626 | case CHAIN_GRAPH_ABS: /* falldown */ | ||
627 | case CHAIN_GRAPH_REL: | ||
628 | callchain__append_graph_browser(chain, tree, total, indexes, idx++); | ||
629 | break; | ||
630 | case CHAIN_NONE: | ||
631 | default: | ||
632 | break; | ||
633 | } | ||
634 | rb_node = rb_next(rb_node); | ||
635 | } | ||
636 | } | ||
637 | |||
638 | static size_t hist_entry__append_browser(struct hist_entry *self, | ||
639 | newtComponent tree, u64 total) | ||
640 | { | ||
641 | char s[256]; | ||
642 | size_t ret; | ||
643 | |||
644 | if (symbol_conf.exclude_other && !self->parent) | ||
645 | return 0; | ||
646 | |||
647 | ret = hist_entry__snprintf(self, s, sizeof(s), NULL, | ||
648 | false, 0, false, total); | ||
649 | if (symbol_conf.use_callchain) { | ||
650 | int indexes[2]; | ||
651 | |||
652 | indexes[0] = NEWT_ARG_APPEND; | ||
653 | indexes[1] = NEWT_ARG_LAST; | ||
654 | newt_checkbox_tree__add(tree, s, &self->ms, indexes); | ||
655 | } else | ||
656 | newtListboxAppendEntry(tree, s, &self->ms); | ||
657 | |||
658 | return ret; | ||
659 | } | ||
660 | |||
661 | static void hist_entry__annotate_browser(struct hist_entry *self) | ||
662 | { | ||
663 | struct ui_browser browser; | ||
664 | struct newtExitStruct es; | ||
665 | struct objdump_line *pos, *n; | ||
666 | LIST_HEAD(head); | ||
667 | |||
668 | if (self->ms.sym == NULL) | ||
669 | return; | ||
670 | |||
671 | if (hist_entry__annotate(self, &head) < 0) | ||
672 | return; | ||
673 | |||
674 | ui_helpline__push("Press <- or ESC to exit"); | ||
675 | |||
676 | memset(&browser, 0, sizeof(browser)); | ||
677 | browser.entries = &head; | ||
678 | browser.priv = self; | ||
679 | list_for_each_entry(pos, &head, node) { | ||
680 | size_t line_len = strlen(pos->line); | ||
681 | if (browser.width < line_len) | ||
682 | browser.width = line_len; | ||
683 | ++browser.nr_entries; | ||
684 | } | ||
685 | |||
686 | browser.width += 18; /* Percentage */ | ||
687 | ui_browser__run(&browser, self->ms.sym->name, &es); | ||
688 | newtFormDestroy(browser.form); | ||
689 | newtPopWindow(); | ||
690 | list_for_each_entry_safe(pos, n, &head, node) { | ||
691 | list_del(&pos->node); | ||
692 | objdump_line__free(pos); | ||
693 | } | ||
694 | ui_helpline__pop(); | ||
695 | } | ||
696 | |||
697 | static const void *newt__symbol_tree_get_current(newtComponent self) | ||
698 | { | ||
699 | if (symbol_conf.use_callchain) | ||
700 | return newtCheckboxTreeGetCurrent(self); | ||
701 | return newtListboxGetCurrent(self); | ||
702 | } | ||
703 | |||
704 | static void hist_browser__selection(newtComponent self, void *data) | ||
705 | { | ||
706 | const struct map_symbol **symbol_ptr = data; | ||
707 | *symbol_ptr = newt__symbol_tree_get_current(self); | ||
708 | } | ||
709 | |||
710 | struct hist_browser { | ||
711 | newtComponent form, tree; | ||
712 | const struct map_symbol *selection; | ||
713 | }; | ||
714 | |||
715 | static struct hist_browser *hist_browser__new(void) | ||
716 | { | ||
717 | struct hist_browser *self = malloc(sizeof(*self)); | ||
718 | |||
719 | if (self != NULL) | ||
720 | self->form = NULL; | ||
721 | |||
722 | return self; | ||
723 | } | ||
724 | |||
725 | static void hist_browser__delete(struct hist_browser *self) | ||
726 | { | ||
727 | newtFormDestroy(self->form); | ||
728 | newtPopWindow(); | ||
729 | free(self); | ||
730 | } | ||
731 | |||
732 | static int hist_browser__populate(struct hist_browser *self, struct hists *hists, | ||
733 | const char *title) | ||
734 | { | ||
735 | int max_len = 0, idx, cols, rows; | ||
736 | struct ui_progress *progress; | ||
737 | struct rb_node *nd; | ||
738 | u64 curr_hist = 0; | ||
739 | char seq[] = ".", unit; | ||
740 | char str[256]; | ||
741 | unsigned long nr_events = hists->stats.nr_events[PERF_RECORD_SAMPLE]; | ||
742 | |||
743 | if (self->form) { | ||
744 | newtFormDestroy(self->form); | ||
745 | newtPopWindow(); | ||
746 | } | ||
747 | |||
748 | nr_events = convert_unit(nr_events, &unit); | ||
749 | snprintf(str, sizeof(str), "Events: %lu%c ", | ||
750 | nr_events, unit); | ||
751 | newtDrawRootText(0, 0, str); | ||
752 | |||
753 | newtGetScreenSize(NULL, &rows); | ||
754 | |||
755 | if (symbol_conf.use_callchain) | ||
756 | self->tree = newtCheckboxTreeMulti(0, 0, rows - 5, seq, | ||
757 | NEWT_FLAG_SCROLL); | ||
758 | else | ||
759 | self->tree = newtListbox(0, 0, rows - 5, | ||
760 | (NEWT_FLAG_SCROLL | | ||
761 | NEWT_FLAG_RETURNEXIT)); | ||
762 | |||
763 | newtComponentAddCallback(self->tree, hist_browser__selection, | ||
764 | &self->selection); | ||
765 | |||
766 | progress = ui_progress__new("Adding entries to the browser...", | ||
767 | hists->nr_entries); | ||
768 | if (progress == NULL) | ||
769 | return -1; | ||
770 | |||
771 | idx = 0; | ||
772 | for (nd = rb_first(&hists->entries); nd; nd = rb_next(nd)) { | ||
773 | struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node); | ||
774 | int len; | ||
775 | |||
776 | if (h->filtered) | ||
777 | continue; | ||
778 | |||
779 | len = hist_entry__append_browser(h, self->tree, hists->stats.total_period); | ||
780 | if (len > max_len) | ||
781 | max_len = len; | ||
782 | if (symbol_conf.use_callchain) | ||
783 | hist_entry__append_callchain_browser(h, self->tree, | ||
784 | hists->stats.total_period, idx++); | ||
785 | ++curr_hist; | ||
786 | if (curr_hist % 5) | ||
787 | ui_progress__update(progress, curr_hist); | ||
788 | } | ||
789 | |||
790 | ui_progress__delete(progress); | ||
791 | |||
792 | newtGetScreenSize(&cols, &rows); | ||
793 | |||
794 | if (max_len > cols) | ||
795 | max_len = cols - 3; | ||
796 | |||
797 | if (!symbol_conf.use_callchain) | ||
798 | newtListboxSetWidth(self->tree, max_len); | ||
799 | |||
800 | newtCenteredWindow(max_len + (symbol_conf.use_callchain ? 5 : 0), | ||
801 | rows - 5, title); | ||
802 | self->form = newt_form__new(); | ||
803 | if (self->form == NULL) | ||
804 | return -1; | ||
805 | |||
806 | newtFormAddHotKey(self->form, 'A'); | ||
807 | newtFormAddHotKey(self->form, 'a'); | ||
808 | newtFormAddHotKey(self->form, 'D'); | ||
809 | newtFormAddHotKey(self->form, 'd'); | ||
810 | newtFormAddHotKey(self->form, 'T'); | ||
811 | newtFormAddHotKey(self->form, 't'); | ||
812 | newtFormAddHotKey(self->form, '?'); | ||
813 | newtFormAddHotKey(self->form, 'H'); | ||
814 | newtFormAddHotKey(self->form, 'h'); | ||
815 | newtFormAddHotKey(self->form, NEWT_KEY_F1); | ||
816 | newtFormAddHotKey(self->form, NEWT_KEY_RIGHT); | ||
817 | newtFormAddComponents(self->form, self->tree, NULL); | ||
818 | self->selection = newt__symbol_tree_get_current(self->tree); | ||
819 | |||
820 | return 0; | ||
821 | } | ||
822 | |||
823 | static struct hist_entry *hist_browser__selected_entry(struct hist_browser *self) | ||
824 | { | ||
825 | int *indexes; | ||
826 | |||
827 | if (!symbol_conf.use_callchain) | ||
828 | goto out; | ||
829 | |||
830 | indexes = newtCheckboxTreeFindItem(self->tree, (void *)self->selection); | ||
831 | if (indexes) { | ||
832 | bool is_hist_entry = indexes[1] == NEWT_ARG_LAST; | ||
833 | free(indexes); | ||
834 | if (is_hist_entry) | ||
835 | goto out; | ||
836 | } | ||
837 | return NULL; | ||
838 | out: | ||
839 | return container_of(self->selection, struct hist_entry, ms); | ||
840 | } | ||
841 | |||
842 | static struct thread *hist_browser__selected_thread(struct hist_browser *self) | ||
843 | { | ||
844 | struct hist_entry *he = hist_browser__selected_entry(self); | ||
845 | return he ? he->thread : NULL; | ||
846 | } | ||
847 | |||
848 | static int hist_browser__title(char *bf, size_t size, const char *input_name, | ||
849 | const struct dso *dso, const struct thread *thread) | ||
850 | { | ||
851 | int printed = 0; | ||
852 | |||
853 | if (thread) | ||
854 | printed += snprintf(bf + printed, size - printed, | ||
855 | "Thread: %s(%d)", | ||
856 | (thread->comm_set ? thread->comm : ""), | ||
857 | thread->pid); | ||
858 | if (dso) | ||
859 | printed += snprintf(bf + printed, size - printed, | ||
860 | "%sDSO: %s", thread ? " " : "", | ||
861 | dso->short_name); | ||
862 | return printed ?: snprintf(bf, size, "Report: %s", input_name); | ||
863 | } | ||
864 | |||
865 | int hists__browse(struct hists *self, const char *helpline, const char *input_name) | ||
866 | { | ||
867 | struct hist_browser *browser = hist_browser__new(); | ||
868 | struct pstack *fstack = pstack__new(2); | ||
869 | const struct thread *thread_filter = NULL; | ||
870 | const struct dso *dso_filter = NULL; | ||
871 | struct newtExitStruct es; | ||
872 | char msg[160]; | ||
873 | int err = -1; | ||
874 | |||
875 | if (browser == NULL) | ||
876 | return -1; | ||
877 | |||
878 | fstack = pstack__new(2); | ||
879 | if (fstack == NULL) | ||
880 | goto out; | ||
881 | |||
882 | ui_helpline__push(helpline); | ||
883 | |||
884 | hist_browser__title(msg, sizeof(msg), input_name, | ||
885 | dso_filter, thread_filter); | ||
886 | if (hist_browser__populate(browser, self, msg) < 0) | ||
887 | goto out_free_stack; | ||
888 | |||
889 | while (1) { | ||
890 | const struct thread *thread; | ||
891 | const struct dso *dso; | ||
892 | char *options[16]; | ||
893 | int nr_options = 0, choice = 0, i, | ||
894 | annotate = -2, zoom_dso = -2, zoom_thread = -2; | ||
895 | |||
896 | newtFormRun(browser->form, &es); | ||
897 | |||
898 | thread = hist_browser__selected_thread(browser); | ||
899 | dso = browser->selection->map ? browser->selection->map->dso : NULL; | ||
900 | |||
901 | if (es.reason == NEWT_EXIT_HOTKEY) { | ||
902 | if (es.u.key == NEWT_KEY_F1) | ||
903 | goto do_help; | ||
904 | |||
905 | switch (toupper(es.u.key)) { | ||
906 | case 'A': | ||
907 | goto do_annotate; | ||
908 | case 'D': | ||
909 | goto zoom_dso; | ||
910 | case 'T': | ||
911 | goto zoom_thread; | ||
912 | case 'H': | ||
913 | case '?': | ||
914 | do_help: | ||
915 | ui__help_window("-> Zoom into DSO/Threads & Annotate current symbol\n" | ||
916 | "<- Zoom out\n" | ||
917 | "a Annotate current symbol\n" | ||
918 | "h/?/F1 Show this window\n" | ||
919 | "d Zoom into current DSO\n" | ||
920 | "t Zoom into current Thread\n" | ||
921 | "q/CTRL+C Exit browser"); | ||
922 | continue; | ||
923 | default:; | ||
924 | } | ||
925 | if (toupper(es.u.key) == 'Q' || | ||
926 | es.u.key == CTRL('c')) | ||
927 | break; | ||
928 | if (es.u.key == NEWT_KEY_ESCAPE) { | ||
929 | if (dialog_yesno("Do you really want to exit?")) | ||
930 | break; | ||
931 | else | ||
932 | continue; | ||
933 | } | ||
934 | |||
935 | if (es.u.key == NEWT_KEY_LEFT) { | ||
936 | const void *top; | ||
937 | |||
938 | if (pstack__empty(fstack)) | ||
939 | continue; | ||
940 | top = pstack__pop(fstack); | ||
941 | if (top == &dso_filter) | ||
942 | goto zoom_out_dso; | ||
943 | if (top == &thread_filter) | ||
944 | goto zoom_out_thread; | ||
945 | continue; | ||
946 | } | ||
947 | } | ||
948 | |||
949 | if (browser->selection->sym != NULL && | ||
950 | asprintf(&options[nr_options], "Annotate %s", | ||
951 | browser->selection->sym->name) > 0) | ||
952 | annotate = nr_options++; | ||
953 | |||
954 | if (thread != NULL && | ||
955 | asprintf(&options[nr_options], "Zoom %s %s(%d) thread", | ||
956 | (thread_filter ? "out of" : "into"), | ||
957 | (thread->comm_set ? thread->comm : ""), | ||
958 | thread->pid) > 0) | ||
959 | zoom_thread = nr_options++; | ||
960 | |||
961 | if (dso != NULL && | ||
962 | asprintf(&options[nr_options], "Zoom %s %s DSO", | ||
963 | (dso_filter ? "out of" : "into"), | ||
964 | (dso->kernel ? "the Kernel" : dso->short_name)) > 0) | ||
965 | zoom_dso = nr_options++; | ||
966 | |||
967 | options[nr_options++] = (char *)"Exit"; | ||
968 | |||
969 | choice = popup_menu(nr_options, options); | ||
970 | |||
971 | for (i = 0; i < nr_options - 1; ++i) | ||
972 | free(options[i]); | ||
973 | |||
974 | if (choice == nr_options - 1) | ||
975 | break; | ||
976 | |||
977 | if (choice == -1) | ||
978 | continue; | ||
979 | |||
980 | if (choice == annotate) { | ||
981 | struct hist_entry *he; | ||
982 | do_annotate: | ||
983 | if (browser->selection->map->dso->origin == DSO__ORIG_KERNEL) { | ||
984 | ui_helpline__puts("No vmlinux file found, can't " | ||
985 | "annotate with just a " | ||
986 | "kallsyms file"); | ||
987 | continue; | ||
988 | } | ||
989 | |||
990 | he = hist_browser__selected_entry(browser); | ||
991 | if (he == NULL) | ||
992 | continue; | ||
993 | |||
994 | hist_entry__annotate_browser(he); | ||
995 | } else if (choice == zoom_dso) { | ||
996 | zoom_dso: | ||
997 | if (dso_filter) { | ||
998 | pstack__remove(fstack, &dso_filter); | ||
999 | zoom_out_dso: | ||
1000 | ui_helpline__pop(); | ||
1001 | dso_filter = NULL; | ||
1002 | } else { | ||
1003 | if (dso == NULL) | ||
1004 | continue; | ||
1005 | ui_helpline__fpush("To zoom out press <- or -> + \"Zoom out of %s DSO\"", | ||
1006 | dso->kernel ? "the Kernel" : dso->short_name); | ||
1007 | dso_filter = dso; | ||
1008 | pstack__push(fstack, &dso_filter); | ||
1009 | } | ||
1010 | hists__filter_by_dso(self, dso_filter); | ||
1011 | hist_browser__title(msg, sizeof(msg), input_name, | ||
1012 | dso_filter, thread_filter); | ||
1013 | if (hist_browser__populate(browser, self, msg) < 0) | ||
1014 | goto out; | ||
1015 | } else if (choice == zoom_thread) { | ||
1016 | zoom_thread: | ||
1017 | if (thread_filter) { | ||
1018 | pstack__remove(fstack, &thread_filter); | ||
1019 | zoom_out_thread: | ||
1020 | ui_helpline__pop(); | ||
1021 | thread_filter = NULL; | ||
1022 | } else { | ||
1023 | ui_helpline__fpush("To zoom out press <- or -> + \"Zoom out of %s(%d) thread\"", | ||
1024 | thread->comm_set ? thread->comm : "", | ||
1025 | thread->pid); | ||
1026 | thread_filter = thread; | ||
1027 | pstack__push(fstack, &thread_filter); | ||
1028 | } | ||
1029 | hists__filter_by_thread(self, thread_filter); | ||
1030 | hist_browser__title(msg, sizeof(msg), input_name, | ||
1031 | dso_filter, thread_filter); | ||
1032 | if (hist_browser__populate(browser, self, msg) < 0) | ||
1033 | goto out; | ||
1034 | } | ||
1035 | } | ||
1036 | err = 0; | ||
1037 | out_free_stack: | ||
1038 | pstack__delete(fstack); | ||
1039 | out: | ||
1040 | hist_browser__delete(browser); | ||
1041 | return err; | ||
1042 | } | ||
1043 | |||
1044 | static struct newtPercentTreeColors { | ||
1045 | const char *topColorFg, *topColorBg; | ||
1046 | const char *mediumColorFg, *mediumColorBg; | ||
1047 | const char *normalColorFg, *normalColorBg; | ||
1048 | const char *selColorFg, *selColorBg; | ||
1049 | const char *codeColorFg, *codeColorBg; | ||
1050 | } defaultPercentTreeColors = { | ||
1051 | "red", "lightgray", | ||
1052 | "green", "lightgray", | ||
1053 | "black", "lightgray", | ||
1054 | "lightgray", "magenta", | ||
1055 | "blue", "lightgray", | ||
1056 | }; | ||
1057 | |||
1058 | void setup_browser(void) | ||
1059 | { | ||
1060 | struct newtPercentTreeColors *c = &defaultPercentTreeColors; | ||
1061 | if (!isatty(1)) | ||
1062 | return; | ||
1063 | |||
1064 | use_browser = true; | ||
1065 | newtInit(); | ||
1066 | newtCls(); | ||
1067 | ui_helpline__puts(" "); | ||
1068 | sltt_set_color(HE_COLORSET_TOP, NULL, c->topColorFg, c->topColorBg); | ||
1069 | sltt_set_color(HE_COLORSET_MEDIUM, NULL, c->mediumColorFg, c->mediumColorBg); | ||
1070 | sltt_set_color(HE_COLORSET_NORMAL, NULL, c->normalColorFg, c->normalColorBg); | ||
1071 | sltt_set_color(HE_COLORSET_SELECTED, NULL, c->selColorFg, c->selColorBg); | ||
1072 | sltt_set_color(HE_COLORSET_CODE, NULL, c->codeColorFg, c->codeColorBg); | ||
1073 | } | ||
1074 | |||
1075 | void exit_browser(bool wait_for_ok) | ||
1076 | { | ||
1077 | if (use_browser) { | ||
1078 | if (wait_for_ok) { | ||
1079 | char title[] = "Fatal Error", ok[] = "Ok"; | ||
1080 | newtWinMessage(title, ok, browser__last_msg); | ||
1081 | } | ||
1082 | newtFinished(); | ||
1083 | } | ||
1084 | } | ||
diff --git a/tools/perf/util/parse-events.c b/tools/perf/util/parse-events.c index 05d0c5c2030c..9bf0f402ca73 100644 --- a/tools/perf/util/parse-events.c +++ b/tools/perf/util/parse-events.c | |||
@@ -5,6 +5,7 @@ | |||
5 | #include "parse-events.h" | 5 | #include "parse-events.h" |
6 | #include "exec_cmd.h" | 6 | #include "exec_cmd.h" |
7 | #include "string.h" | 7 | #include "string.h" |
8 | #include "symbol.h" | ||
8 | #include "cache.h" | 9 | #include "cache.h" |
9 | #include "header.h" | 10 | #include "header.h" |
10 | #include "debugfs.h" | 11 | #include "debugfs.h" |
@@ -409,7 +410,6 @@ static enum event_result | |||
409 | parse_single_tracepoint_event(char *sys_name, | 410 | parse_single_tracepoint_event(char *sys_name, |
410 | const char *evt_name, | 411 | const char *evt_name, |
411 | unsigned int evt_length, | 412 | unsigned int evt_length, |
412 | char *flags, | ||
413 | struct perf_event_attr *attr, | 413 | struct perf_event_attr *attr, |
414 | const char **strp) | 414 | const char **strp) |
415 | { | 415 | { |
@@ -418,14 +418,6 @@ parse_single_tracepoint_event(char *sys_name, | |||
418 | u64 id; | 418 | u64 id; |
419 | int fd; | 419 | int fd; |
420 | 420 | ||
421 | if (flags) { | ||
422 | if (!strncmp(flags, "record", strlen(flags))) { | ||
423 | attr->sample_type |= PERF_SAMPLE_RAW; | ||
424 | attr->sample_type |= PERF_SAMPLE_TIME; | ||
425 | attr->sample_type |= PERF_SAMPLE_CPU; | ||
426 | } | ||
427 | } | ||
428 | |||
429 | snprintf(evt_path, MAXPATHLEN, "%s/%s/%s/id", debugfs_path, | 421 | snprintf(evt_path, MAXPATHLEN, "%s/%s/%s/id", debugfs_path, |
430 | sys_name, evt_name); | 422 | sys_name, evt_name); |
431 | 423 | ||
@@ -444,6 +436,13 @@ parse_single_tracepoint_event(char *sys_name, | |||
444 | attr->type = PERF_TYPE_TRACEPOINT; | 436 | attr->type = PERF_TYPE_TRACEPOINT; |
445 | *strp = evt_name + evt_length; | 437 | *strp = evt_name + evt_length; |
446 | 438 | ||
439 | attr->sample_type |= PERF_SAMPLE_RAW; | ||
440 | attr->sample_type |= PERF_SAMPLE_TIME; | ||
441 | attr->sample_type |= PERF_SAMPLE_CPU; | ||
442 | |||
443 | attr->sample_period = 1; | ||
444 | |||
445 | |||
447 | return EVT_HANDLED; | 446 | return EVT_HANDLED; |
448 | } | 447 | } |
449 | 448 | ||
@@ -532,8 +531,7 @@ static enum event_result parse_tracepoint_event(const char **strp, | |||
532 | flags); | 531 | flags); |
533 | } else | 532 | } else |
534 | return parse_single_tracepoint_event(sys_name, evt_name, | 533 | return parse_single_tracepoint_event(sys_name, evt_name, |
535 | evt_length, flags, | 534 | evt_length, attr, strp); |
536 | attr, strp); | ||
537 | } | 535 | } |
538 | 536 | ||
539 | static enum event_result | 537 | static enum event_result |
@@ -690,19 +688,29 @@ static enum event_result | |||
690 | parse_event_modifier(const char **strp, struct perf_event_attr *attr) | 688 | parse_event_modifier(const char **strp, struct perf_event_attr *attr) |
691 | { | 689 | { |
692 | const char *str = *strp; | 690 | const char *str = *strp; |
693 | int eu = 1, ek = 1, eh = 1; | 691 | int exclude = 0; |
692 | int eu = 0, ek = 0, eh = 0, precise = 0; | ||
694 | 693 | ||
695 | if (*str++ != ':') | 694 | if (*str++ != ':') |
696 | return 0; | 695 | return 0; |
697 | while (*str) { | 696 | while (*str) { |
698 | if (*str == 'u') | 697 | if (*str == 'u') { |
698 | if (!exclude) | ||
699 | exclude = eu = ek = eh = 1; | ||
699 | eu = 0; | 700 | eu = 0; |
700 | else if (*str == 'k') | 701 | } else if (*str == 'k') { |
702 | if (!exclude) | ||
703 | exclude = eu = ek = eh = 1; | ||
701 | ek = 0; | 704 | ek = 0; |
702 | else if (*str == 'h') | 705 | } else if (*str == 'h') { |
706 | if (!exclude) | ||
707 | exclude = eu = ek = eh = 1; | ||
703 | eh = 0; | 708 | eh = 0; |
704 | else | 709 | } else if (*str == 'p') { |
710 | precise++; | ||
711 | } else | ||
705 | break; | 712 | break; |
713 | |||
706 | ++str; | 714 | ++str; |
707 | } | 715 | } |
708 | if (str >= *strp + 2) { | 716 | if (str >= *strp + 2) { |
@@ -710,6 +718,7 @@ parse_event_modifier(const char **strp, struct perf_event_attr *attr) | |||
710 | attr->exclude_user = eu; | 718 | attr->exclude_user = eu; |
711 | attr->exclude_kernel = ek; | 719 | attr->exclude_kernel = ek; |
712 | attr->exclude_hv = eh; | 720 | attr->exclude_hv = eh; |
721 | attr->precise_ip = precise; | ||
713 | return 1; | 722 | return 1; |
714 | } | 723 | } |
715 | return 0; | 724 | return 0; |
@@ -934,7 +943,8 @@ void print_events(void) | |||
934 | 943 | ||
935 | printf("\n"); | 944 | printf("\n"); |
936 | printf(" %-42s [%s]\n", | 945 | printf(" %-42s [%s]\n", |
937 | "rNNN", event_type_descriptors[PERF_TYPE_RAW]); | 946 | "rNNN (see 'perf list --help' on how to encode it)", |
947 | event_type_descriptors[PERF_TYPE_RAW]); | ||
938 | printf("\n"); | 948 | printf("\n"); |
939 | 949 | ||
940 | printf(" %-42s [%s]\n", | 950 | printf(" %-42s [%s]\n", |
diff --git a/tools/perf/util/parse-events.h b/tools/perf/util/parse-events.h index b8c1f64bc935..fc4ab3fe877a 100644 --- a/tools/perf/util/parse-events.h +++ b/tools/perf/util/parse-events.h | |||
@@ -13,6 +13,7 @@ struct tracepoint_path { | |||
13 | }; | 13 | }; |
14 | 14 | ||
15 | extern struct tracepoint_path *tracepoint_id_to_path(u64 config); | 15 | extern struct tracepoint_path *tracepoint_id_to_path(u64 config); |
16 | extern bool have_tracepoints(struct perf_event_attr *pattrs, int nb_events); | ||
16 | 17 | ||
17 | extern int nr_counters; | 18 | extern int nr_counters; |
18 | 19 | ||
diff --git a/tools/perf/util/parse-options.c b/tools/perf/util/parse-options.c index efebd5b476b3..99d02aa57dbf 100644 --- a/tools/perf/util/parse-options.c +++ b/tools/perf/util/parse-options.c | |||
@@ -49,8 +49,9 @@ static int get_value(struct parse_opt_ctx_t *p, | |||
49 | break; | 49 | break; |
50 | /* FALLTHROUGH */ | 50 | /* FALLTHROUGH */ |
51 | case OPTION_BOOLEAN: | 51 | case OPTION_BOOLEAN: |
52 | case OPTION_INCR: | ||
52 | case OPTION_BIT: | 53 | case OPTION_BIT: |
53 | case OPTION_SET_INT: | 54 | case OPTION_SET_UINT: |
54 | case OPTION_SET_PTR: | 55 | case OPTION_SET_PTR: |
55 | return opterror(opt, "takes no value", flags); | 56 | return opterror(opt, "takes no value", flags); |
56 | case OPTION_END: | 57 | case OPTION_END: |
@@ -58,7 +59,9 @@ static int get_value(struct parse_opt_ctx_t *p, | |||
58 | case OPTION_GROUP: | 59 | case OPTION_GROUP: |
59 | case OPTION_STRING: | 60 | case OPTION_STRING: |
60 | case OPTION_INTEGER: | 61 | case OPTION_INTEGER: |
62 | case OPTION_UINTEGER: | ||
61 | case OPTION_LONG: | 63 | case OPTION_LONG: |
64 | case OPTION_U64: | ||
62 | default: | 65 | default: |
63 | break; | 66 | break; |
64 | } | 67 | } |
@@ -73,11 +76,15 @@ static int get_value(struct parse_opt_ctx_t *p, | |||
73 | return 0; | 76 | return 0; |
74 | 77 | ||
75 | case OPTION_BOOLEAN: | 78 | case OPTION_BOOLEAN: |
79 | *(bool *)opt->value = unset ? false : true; | ||
80 | return 0; | ||
81 | |||
82 | case OPTION_INCR: | ||
76 | *(int *)opt->value = unset ? 0 : *(int *)opt->value + 1; | 83 | *(int *)opt->value = unset ? 0 : *(int *)opt->value + 1; |
77 | return 0; | 84 | return 0; |
78 | 85 | ||
79 | case OPTION_SET_INT: | 86 | case OPTION_SET_UINT: |
80 | *(int *)opt->value = unset ? 0 : opt->defval; | 87 | *(unsigned int *)opt->value = unset ? 0 : opt->defval; |
81 | return 0; | 88 | return 0; |
82 | 89 | ||
83 | case OPTION_SET_PTR: | 90 | case OPTION_SET_PTR: |
@@ -120,6 +127,22 @@ static int get_value(struct parse_opt_ctx_t *p, | |||
120 | return opterror(opt, "expects a numerical value", flags); | 127 | return opterror(opt, "expects a numerical value", flags); |
121 | return 0; | 128 | return 0; |
122 | 129 | ||
130 | case OPTION_UINTEGER: | ||
131 | if (unset) { | ||
132 | *(unsigned int *)opt->value = 0; | ||
133 | return 0; | ||
134 | } | ||
135 | if (opt->flags & PARSE_OPT_OPTARG && !p->opt) { | ||
136 | *(unsigned int *)opt->value = opt->defval; | ||
137 | return 0; | ||
138 | } | ||
139 | if (get_arg(p, opt, flags, &arg)) | ||
140 | return -1; | ||
141 | *(unsigned int *)opt->value = strtol(arg, (char **)&s, 10); | ||
142 | if (*s) | ||
143 | return opterror(opt, "expects a numerical value", flags); | ||
144 | return 0; | ||
145 | |||
123 | case OPTION_LONG: | 146 | case OPTION_LONG: |
124 | if (unset) { | 147 | if (unset) { |
125 | *(long *)opt->value = 0; | 148 | *(long *)opt->value = 0; |
@@ -136,6 +159,22 @@ static int get_value(struct parse_opt_ctx_t *p, | |||
136 | return opterror(opt, "expects a numerical value", flags); | 159 | return opterror(opt, "expects a numerical value", flags); |
137 | return 0; | 160 | return 0; |
138 | 161 | ||
162 | case OPTION_U64: | ||
163 | if (unset) { | ||
164 | *(u64 *)opt->value = 0; | ||
165 | return 0; | ||
166 | } | ||
167 | if (opt->flags & PARSE_OPT_OPTARG && !p->opt) { | ||
168 | *(u64 *)opt->value = opt->defval; | ||
169 | return 0; | ||
170 | } | ||
171 | if (get_arg(p, opt, flags, &arg)) | ||
172 | return -1; | ||
173 | *(u64 *)opt->value = strtoull(arg, (char **)&s, 10); | ||
174 | if (*s) | ||
175 | return opterror(opt, "expects a numerical value", flags); | ||
176 | return 0; | ||
177 | |||
139 | case OPTION_END: | 178 | case OPTION_END: |
140 | case OPTION_ARGUMENT: | 179 | case OPTION_ARGUMENT: |
141 | case OPTION_GROUP: | 180 | case OPTION_GROUP: |
@@ -441,7 +480,10 @@ int usage_with_options_internal(const char * const *usagestr, | |||
441 | switch (opts->type) { | 480 | switch (opts->type) { |
442 | case OPTION_ARGUMENT: | 481 | case OPTION_ARGUMENT: |
443 | break; | 482 | break; |
483 | case OPTION_LONG: | ||
484 | case OPTION_U64: | ||
444 | case OPTION_INTEGER: | 485 | case OPTION_INTEGER: |
486 | case OPTION_UINTEGER: | ||
445 | if (opts->flags & PARSE_OPT_OPTARG) | 487 | if (opts->flags & PARSE_OPT_OPTARG) |
446 | if (opts->long_name) | 488 | if (opts->long_name) |
447 | pos += fprintf(stderr, "[=<n>]"); | 489 | pos += fprintf(stderr, "[=<n>]"); |
@@ -473,14 +515,14 @@ int usage_with_options_internal(const char * const *usagestr, | |||
473 | pos += fprintf(stderr, " ..."); | 515 | pos += fprintf(stderr, " ..."); |
474 | } | 516 | } |
475 | break; | 517 | break; |
476 | default: /* OPTION_{BIT,BOOLEAN,SET_INT,SET_PTR} */ | 518 | default: /* OPTION_{BIT,BOOLEAN,SET_UINT,SET_PTR} */ |
477 | case OPTION_END: | 519 | case OPTION_END: |
478 | case OPTION_GROUP: | 520 | case OPTION_GROUP: |
479 | case OPTION_BIT: | 521 | case OPTION_BIT: |
480 | case OPTION_BOOLEAN: | 522 | case OPTION_BOOLEAN: |
481 | case OPTION_SET_INT: | 523 | case OPTION_INCR: |
524 | case OPTION_SET_UINT: | ||
482 | case OPTION_SET_PTR: | 525 | case OPTION_SET_PTR: |
483 | case OPTION_LONG: | ||
484 | break; | 526 | break; |
485 | } | 527 | } |
486 | 528 | ||
@@ -500,6 +542,7 @@ int usage_with_options_internal(const char * const *usagestr, | |||
500 | void usage_with_options(const char * const *usagestr, | 542 | void usage_with_options(const char * const *usagestr, |
501 | const struct option *opts) | 543 | const struct option *opts) |
502 | { | 544 | { |
545 | exit_browser(false); | ||
503 | usage_with_options_internal(usagestr, opts, 0); | 546 | usage_with_options_internal(usagestr, opts, 0); |
504 | exit(129); | 547 | exit(129); |
505 | } | 548 | } |
diff --git a/tools/perf/util/parse-options.h b/tools/perf/util/parse-options.h index 948805af43c2..c7d72dce54b2 100644 --- a/tools/perf/util/parse-options.h +++ b/tools/perf/util/parse-options.h | |||
@@ -1,6 +1,9 @@ | |||
1 | #ifndef __PERF_PARSE_OPTIONS_H | 1 | #ifndef __PERF_PARSE_OPTIONS_H |
2 | #define __PERF_PARSE_OPTIONS_H | 2 | #define __PERF_PARSE_OPTIONS_H |
3 | 3 | ||
4 | #include <linux/kernel.h> | ||
5 | #include <stdbool.h> | ||
6 | |||
4 | enum parse_opt_type { | 7 | enum parse_opt_type { |
5 | /* special types */ | 8 | /* special types */ |
6 | OPTION_END, | 9 | OPTION_END, |
@@ -8,14 +11,17 @@ enum parse_opt_type { | |||
8 | OPTION_GROUP, | 11 | OPTION_GROUP, |
9 | /* options with no arguments */ | 12 | /* options with no arguments */ |
10 | OPTION_BIT, | 13 | OPTION_BIT, |
11 | OPTION_BOOLEAN, /* _INCR would have been a better name */ | 14 | OPTION_BOOLEAN, |
12 | OPTION_SET_INT, | 15 | OPTION_INCR, |
16 | OPTION_SET_UINT, | ||
13 | OPTION_SET_PTR, | 17 | OPTION_SET_PTR, |
14 | /* options with arguments (usually) */ | 18 | /* options with arguments (usually) */ |
15 | OPTION_STRING, | 19 | OPTION_STRING, |
16 | OPTION_INTEGER, | 20 | OPTION_INTEGER, |
17 | OPTION_LONG, | 21 | OPTION_LONG, |
18 | OPTION_CALLBACK, | 22 | OPTION_CALLBACK, |
23 | OPTION_U64, | ||
24 | OPTION_UINTEGER, | ||
19 | }; | 25 | }; |
20 | 26 | ||
21 | enum parse_opt_flags { | 27 | enum parse_opt_flags { |
@@ -73,7 +79,7 @@ typedef int parse_opt_cb(const struct option *, const char *arg, int unset); | |||
73 | * | 79 | * |
74 | * `defval`:: | 80 | * `defval`:: |
75 | * default value to fill (*->value) with for PARSE_OPT_OPTARG. | 81 | * default value to fill (*->value) with for PARSE_OPT_OPTARG. |
76 | * OPTION_{BIT,SET_INT,SET_PTR} store the {mask,integer,pointer} to put in | 82 | * OPTION_{BIT,SET_UINT,SET_PTR} store the {mask,integer,pointer} to put in |
77 | * the value when met. | 83 | * the value when met. |
78 | * CALLBACKS can use it like they want. | 84 | * CALLBACKS can use it like they want. |
79 | */ | 85 | */ |
@@ -90,16 +96,21 @@ struct option { | |||
90 | intptr_t defval; | 96 | intptr_t defval; |
91 | }; | 97 | }; |
92 | 98 | ||
99 | #define check_vtype(v, type) ( BUILD_BUG_ON_ZERO(!__builtin_types_compatible_p(typeof(v), type)) + v ) | ||
100 | |||
93 | #define OPT_END() { .type = OPTION_END } | 101 | #define OPT_END() { .type = OPTION_END } |
94 | #define OPT_ARGUMENT(l, h) { .type = OPTION_ARGUMENT, .long_name = (l), .help = (h) } | 102 | #define OPT_ARGUMENT(l, h) { .type = OPTION_ARGUMENT, .long_name = (l), .help = (h) } |
95 | #define OPT_GROUP(h) { .type = OPTION_GROUP, .help = (h) } | 103 | #define OPT_GROUP(h) { .type = OPTION_GROUP, .help = (h) } |
96 | #define OPT_BIT(s, l, v, h, b) { .type = OPTION_BIT, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (b) } | 104 | #define OPT_BIT(s, l, v, h, b) { .type = OPTION_BIT, .short_name = (s), .long_name = (l), .value = check_vtype(v, int *), .help = (h), .defval = (b) } |
97 | #define OPT_BOOLEAN(s, l, v, h) { .type = OPTION_BOOLEAN, .short_name = (s), .long_name = (l), .value = (v), .help = (h) } | 105 | #define OPT_BOOLEAN(s, l, v, h) { .type = OPTION_BOOLEAN, .short_name = (s), .long_name = (l), .value = check_vtype(v, bool *), .help = (h) } |
98 | #define OPT_SET_INT(s, l, v, h, i) { .type = OPTION_SET_INT, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (i) } | 106 | #define OPT_INCR(s, l, v, h) { .type = OPTION_INCR, .short_name = (s), .long_name = (l), .value = check_vtype(v, int *), .help = (h) } |
107 | #define OPT_SET_UINT(s, l, v, h, i) { .type = OPTION_SET_UINT, .short_name = (s), .long_name = (l), .value = check_vtype(v, unsigned int *), .help = (h), .defval = (i) } | ||
99 | #define OPT_SET_PTR(s, l, v, h, p) { .type = OPTION_SET_PTR, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (p) } | 108 | #define OPT_SET_PTR(s, l, v, h, p) { .type = OPTION_SET_PTR, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (p) } |
100 | #define OPT_INTEGER(s, l, v, h) { .type = OPTION_INTEGER, .short_name = (s), .long_name = (l), .value = (v), .help = (h) } | 109 | #define OPT_INTEGER(s, l, v, h) { .type = OPTION_INTEGER, .short_name = (s), .long_name = (l), .value = check_vtype(v, int *), .help = (h) } |
101 | #define OPT_LONG(s, l, v, h) { .type = OPTION_LONG, .short_name = (s), .long_name = (l), .value = (v), .help = (h) } | 110 | #define OPT_UINTEGER(s, l, v, h) { .type = OPTION_UINTEGER, .short_name = (s), .long_name = (l), .value = check_vtype(v, unsigned int *), .help = (h) } |
102 | #define OPT_STRING(s, l, v, a, h) { .type = OPTION_STRING, .short_name = (s), .long_name = (l), .value = (v), (a), .help = (h) } | 111 | #define OPT_LONG(s, l, v, h) { .type = OPTION_LONG, .short_name = (s), .long_name = (l), .value = check_vtype(v, long *), .help = (h) } |
112 | #define OPT_U64(s, l, v, h) { .type = OPTION_U64, .short_name = (s), .long_name = (l), .value = check_vtype(v, u64 *), .help = (h) } | ||
113 | #define OPT_STRING(s, l, v, a, h) { .type = OPTION_STRING, .short_name = (s), .long_name = (l), .value = check_vtype(v, const char **), (a), .help = (h) } | ||
103 | #define OPT_DATE(s, l, v, h) \ | 114 | #define OPT_DATE(s, l, v, h) \ |
104 | { .type = OPTION_CALLBACK, .short_name = (s), .long_name = (l), .value = (v), .argh = "time", .help = (h), .callback = parse_opt_approxidate_cb } | 115 | { .type = OPTION_CALLBACK, .short_name = (s), .long_name = (l), .value = (v), .argh = "time", .help = (h), .callback = parse_opt_approxidate_cb } |
105 | #define OPT_CALLBACK(s, l, v, a, h, f) \ | 116 | #define OPT_CALLBACK(s, l, v, a, h, f) \ |
diff --git a/tools/perf/util/probe-event.c b/tools/perf/util/probe-event.c index 7c004b6ef24f..914c67095d96 100644 --- a/tools/perf/util/probe-event.c +++ b/tools/perf/util/probe-event.c | |||
@@ -33,20 +33,27 @@ | |||
33 | #include <limits.h> | 33 | #include <limits.h> |
34 | 34 | ||
35 | #undef _GNU_SOURCE | 35 | #undef _GNU_SOURCE |
36 | #include "util.h" | ||
36 | #include "event.h" | 37 | #include "event.h" |
37 | #include "string.h" | 38 | #include "string.h" |
38 | #include "strlist.h" | 39 | #include "strlist.h" |
39 | #include "debug.h" | 40 | #include "debug.h" |
40 | #include "cache.h" | 41 | #include "cache.h" |
41 | #include "color.h" | 42 | #include "color.h" |
42 | #include "parse-events.h" /* For debugfs_path */ | 43 | #include "symbol.h" |
44 | #include "thread.h" | ||
45 | #include "debugfs.h" | ||
46 | #include "trace-event.h" /* For __unused */ | ||
43 | #include "probe-event.h" | 47 | #include "probe-event.h" |
48 | #include "probe-finder.h" | ||
44 | 49 | ||
45 | #define MAX_CMDLEN 256 | 50 | #define MAX_CMDLEN 256 |
46 | #define MAX_PROBE_ARGS 128 | 51 | #define MAX_PROBE_ARGS 128 |
47 | #define PERFPROBE_GROUP "probe" | 52 | #define PERFPROBE_GROUP "probe" |
48 | 53 | ||
49 | #define semantic_error(msg ...) die("Semantic error :" msg) | 54 | bool probe_event_dry_run; /* Dry run flag */ |
55 | |||
56 | #define semantic_error(msg ...) pr_err("Semantic error :" msg) | ||
50 | 57 | ||
51 | /* If there is no space to write, returns -E2BIG. */ | 58 | /* If there is no space to write, returns -E2BIG. */ |
52 | static int e_snprintf(char *str, size_t size, const char *format, ...) | 59 | static int e_snprintf(char *str, size_t size, const char *format, ...) |
@@ -64,7 +71,275 @@ static int e_snprintf(char *str, size_t size, const char *format, ...) | |||
64 | return ret; | 71 | return ret; |
65 | } | 72 | } |
66 | 73 | ||
67 | void parse_line_range_desc(const char *arg, struct line_range *lr) | 74 | static char *synthesize_perf_probe_point(struct perf_probe_point *pp); |
75 | static struct machine machine; | ||
76 | |||
77 | /* Initialize symbol maps and path of vmlinux */ | ||
78 | static int init_vmlinux(void) | ||
79 | { | ||
80 | struct dso *kernel; | ||
81 | int ret; | ||
82 | |||
83 | symbol_conf.sort_by_name = true; | ||
84 | if (symbol_conf.vmlinux_name == NULL) | ||
85 | symbol_conf.try_vmlinux_path = true; | ||
86 | else | ||
87 | pr_debug("Use vmlinux: %s\n", symbol_conf.vmlinux_name); | ||
88 | ret = symbol__init(); | ||
89 | if (ret < 0) { | ||
90 | pr_debug("Failed to init symbol map.\n"); | ||
91 | goto out; | ||
92 | } | ||
93 | |||
94 | ret = machine__init(&machine, "/", 0); | ||
95 | if (ret < 0) | ||
96 | goto out; | ||
97 | |||
98 | kernel = dso__new_kernel(symbol_conf.vmlinux_name); | ||
99 | if (kernel == NULL) | ||
100 | die("Failed to create kernel dso."); | ||
101 | |||
102 | ret = __machine__create_kernel_maps(&machine, kernel); | ||
103 | if (ret < 0) | ||
104 | pr_debug("Failed to create kernel maps.\n"); | ||
105 | |||
106 | out: | ||
107 | if (ret < 0) | ||
108 | pr_warning("Failed to init vmlinux path.\n"); | ||
109 | return ret; | ||
110 | } | ||
111 | |||
112 | #ifdef DWARF_SUPPORT | ||
113 | static int open_vmlinux(void) | ||
114 | { | ||
115 | if (map__load(machine.vmlinux_maps[MAP__FUNCTION], NULL) < 0) { | ||
116 | pr_debug("Failed to load kernel map.\n"); | ||
117 | return -EINVAL; | ||
118 | } | ||
119 | pr_debug("Try to open %s\n", machine.vmlinux_maps[MAP__FUNCTION]->dso->long_name); | ||
120 | return open(machine.vmlinux_maps[MAP__FUNCTION]->dso->long_name, O_RDONLY); | ||
121 | } | ||
122 | |||
123 | /* Convert trace point to probe point with debuginfo */ | ||
124 | static int convert_to_perf_probe_point(struct kprobe_trace_point *tp, | ||
125 | struct perf_probe_point *pp) | ||
126 | { | ||
127 | struct symbol *sym; | ||
128 | int fd, ret = -ENOENT; | ||
129 | |||
130 | sym = map__find_symbol_by_name(machine.vmlinux_maps[MAP__FUNCTION], | ||
131 | tp->symbol, NULL); | ||
132 | if (sym) { | ||
133 | fd = open_vmlinux(); | ||
134 | if (fd >= 0) { | ||
135 | ret = find_perf_probe_point(fd, | ||
136 | sym->start + tp->offset, pp); | ||
137 | close(fd); | ||
138 | } | ||
139 | } | ||
140 | if (ret <= 0) { | ||
141 | pr_debug("Failed to find corresponding probes from " | ||
142 | "debuginfo. Use kprobe event information.\n"); | ||
143 | pp->function = strdup(tp->symbol); | ||
144 | if (pp->function == NULL) | ||
145 | return -ENOMEM; | ||
146 | pp->offset = tp->offset; | ||
147 | } | ||
148 | pp->retprobe = tp->retprobe; | ||
149 | |||
150 | return 0; | ||
151 | } | ||
152 | |||
153 | /* Try to find perf_probe_event with debuginfo */ | ||
154 | static int try_to_find_kprobe_trace_events(struct perf_probe_event *pev, | ||
155 | struct kprobe_trace_event **tevs, | ||
156 | int max_tevs) | ||
157 | { | ||
158 | bool need_dwarf = perf_probe_event_need_dwarf(pev); | ||
159 | int fd, ntevs; | ||
160 | |||
161 | fd = open_vmlinux(); | ||
162 | if (fd < 0) { | ||
163 | if (need_dwarf) { | ||
164 | pr_warning("Failed to open debuginfo file.\n"); | ||
165 | return fd; | ||
166 | } | ||
167 | pr_debug("Could not open vmlinux. Try to use symbols.\n"); | ||
168 | return 0; | ||
169 | } | ||
170 | |||
171 | /* Searching trace events corresponding to probe event */ | ||
172 | ntevs = find_kprobe_trace_events(fd, pev, tevs, max_tevs); | ||
173 | close(fd); | ||
174 | |||
175 | if (ntevs > 0) { /* Succeeded to find trace events */ | ||
176 | pr_debug("find %d kprobe_trace_events.\n", ntevs); | ||
177 | return ntevs; | ||
178 | } | ||
179 | |||
180 | if (ntevs == 0) { /* No error but failed to find probe point. */ | ||
181 | pr_warning("Probe point '%s' not found.\n", | ||
182 | synthesize_perf_probe_point(&pev->point)); | ||
183 | return -ENOENT; | ||
184 | } | ||
185 | /* Error path : ntevs < 0 */ | ||
186 | pr_debug("An error occurred in debuginfo analysis (%d).\n", ntevs); | ||
187 | if (ntevs == -EBADF) { | ||
188 | pr_warning("Warning: No dwarf info found in the vmlinux - " | ||
189 | "please rebuild kernel with CONFIG_DEBUG_INFO=y.\n"); | ||
190 | if (!need_dwarf) { | ||
191 | pr_debug("Trying to use symbols.\nn"); | ||
192 | return 0; | ||
193 | } | ||
194 | } | ||
195 | return ntevs; | ||
196 | } | ||
197 | |||
198 | #define LINEBUF_SIZE 256 | ||
199 | #define NR_ADDITIONAL_LINES 2 | ||
200 | |||
201 | static int show_one_line(FILE *fp, int l, bool skip, bool show_num) | ||
202 | { | ||
203 | char buf[LINEBUF_SIZE]; | ||
204 | const char *color = PERF_COLOR_BLUE; | ||
205 | |||
206 | if (fgets(buf, LINEBUF_SIZE, fp) == NULL) | ||
207 | goto error; | ||
208 | if (!skip) { | ||
209 | if (show_num) | ||
210 | fprintf(stdout, "%7d %s", l, buf); | ||
211 | else | ||
212 | color_fprintf(stdout, color, " %s", buf); | ||
213 | } | ||
214 | |||
215 | while (strlen(buf) == LINEBUF_SIZE - 1 && | ||
216 | buf[LINEBUF_SIZE - 2] != '\n') { | ||
217 | if (fgets(buf, LINEBUF_SIZE, fp) == NULL) | ||
218 | goto error; | ||
219 | if (!skip) { | ||
220 | if (show_num) | ||
221 | fprintf(stdout, "%s", buf); | ||
222 | else | ||
223 | color_fprintf(stdout, color, "%s", buf); | ||
224 | } | ||
225 | } | ||
226 | |||
227 | return 0; | ||
228 | error: | ||
229 | if (feof(fp)) | ||
230 | pr_warning("Source file is shorter than expected.\n"); | ||
231 | else | ||
232 | pr_warning("File read error: %s\n", strerror(errno)); | ||
233 | |||
234 | return -1; | ||
235 | } | ||
236 | |||
237 | /* | ||
238 | * Show line-range always requires debuginfo to find source file and | ||
239 | * line number. | ||
240 | */ | ||
241 | int show_line_range(struct line_range *lr) | ||
242 | { | ||
243 | int l = 1; | ||
244 | struct line_node *ln; | ||
245 | FILE *fp; | ||
246 | int fd, ret; | ||
247 | |||
248 | /* Search a line range */ | ||
249 | ret = init_vmlinux(); | ||
250 | if (ret < 0) | ||
251 | return ret; | ||
252 | |||
253 | fd = open_vmlinux(); | ||
254 | if (fd < 0) { | ||
255 | pr_warning("Failed to open debuginfo file.\n"); | ||
256 | return fd; | ||
257 | } | ||
258 | |||
259 | ret = find_line_range(fd, lr); | ||
260 | close(fd); | ||
261 | if (ret == 0) { | ||
262 | pr_warning("Specified source line is not found.\n"); | ||
263 | return -ENOENT; | ||
264 | } else if (ret < 0) { | ||
265 | pr_warning("Debuginfo analysis failed. (%d)\n", ret); | ||
266 | return ret; | ||
267 | } | ||
268 | |||
269 | setup_pager(); | ||
270 | |||
271 | if (lr->function) | ||
272 | fprintf(stdout, "<%s:%d>\n", lr->function, | ||
273 | lr->start - lr->offset); | ||
274 | else | ||
275 | fprintf(stdout, "<%s:%d>\n", lr->file, lr->start); | ||
276 | |||
277 | fp = fopen(lr->path, "r"); | ||
278 | if (fp == NULL) { | ||
279 | pr_warning("Failed to open %s: %s\n", lr->path, | ||
280 | strerror(errno)); | ||
281 | return -errno; | ||
282 | } | ||
283 | /* Skip to starting line number */ | ||
284 | while (l < lr->start && ret >= 0) | ||
285 | ret = show_one_line(fp, l++, true, false); | ||
286 | if (ret < 0) | ||
287 | goto end; | ||
288 | |||
289 | list_for_each_entry(ln, &lr->line_list, list) { | ||
290 | while (ln->line > l && ret >= 0) | ||
291 | ret = show_one_line(fp, (l++) - lr->offset, | ||
292 | false, false); | ||
293 | if (ret >= 0) | ||
294 | ret = show_one_line(fp, (l++) - lr->offset, | ||
295 | false, true); | ||
296 | if (ret < 0) | ||
297 | goto end; | ||
298 | } | ||
299 | |||
300 | if (lr->end == INT_MAX) | ||
301 | lr->end = l + NR_ADDITIONAL_LINES; | ||
302 | while (l <= lr->end && !feof(fp) && ret >= 0) | ||
303 | ret = show_one_line(fp, (l++) - lr->offset, false, false); | ||
304 | end: | ||
305 | fclose(fp); | ||
306 | return ret; | ||
307 | } | ||
308 | |||
309 | #else /* !DWARF_SUPPORT */ | ||
310 | |||
311 | static int convert_to_perf_probe_point(struct kprobe_trace_point *tp, | ||
312 | struct perf_probe_point *pp) | ||
313 | { | ||
314 | pp->function = strdup(tp->symbol); | ||
315 | if (pp->function == NULL) | ||
316 | return -ENOMEM; | ||
317 | pp->offset = tp->offset; | ||
318 | pp->retprobe = tp->retprobe; | ||
319 | |||
320 | return 0; | ||
321 | } | ||
322 | |||
323 | static int try_to_find_kprobe_trace_events(struct perf_probe_event *pev, | ||
324 | struct kprobe_trace_event **tevs __unused, | ||
325 | int max_tevs __unused) | ||
326 | { | ||
327 | if (perf_probe_event_need_dwarf(pev)) { | ||
328 | pr_warning("Debuginfo-analysis is not supported.\n"); | ||
329 | return -ENOSYS; | ||
330 | } | ||
331 | return 0; | ||
332 | } | ||
333 | |||
334 | int show_line_range(struct line_range *lr __unused) | ||
335 | { | ||
336 | pr_warning("Debuginfo-analysis is not supported.\n"); | ||
337 | return -ENOSYS; | ||
338 | } | ||
339 | |||
340 | #endif | ||
341 | |||
342 | int parse_line_range_desc(const char *arg, struct line_range *lr) | ||
68 | { | 343 | { |
69 | const char *ptr; | 344 | const char *ptr; |
70 | char *tmp; | 345 | char *tmp; |
@@ -75,29 +350,45 @@ void parse_line_range_desc(const char *arg, struct line_range *lr) | |||
75 | */ | 350 | */ |
76 | ptr = strchr(arg, ':'); | 351 | ptr = strchr(arg, ':'); |
77 | if (ptr) { | 352 | if (ptr) { |
78 | lr->start = (unsigned int)strtoul(ptr + 1, &tmp, 0); | 353 | lr->start = (int)strtoul(ptr + 1, &tmp, 0); |
79 | if (*tmp == '+') | 354 | if (*tmp == '+') { |
80 | lr->end = lr->start + (unsigned int)strtoul(tmp + 1, | 355 | lr->end = lr->start + (int)strtoul(tmp + 1, &tmp, 0); |
81 | &tmp, 0); | 356 | lr->end--; /* |
82 | else if (*tmp == '-') | 357 | * Adjust the number of lines here. |
83 | lr->end = (unsigned int)strtoul(tmp + 1, &tmp, 0); | 358 | * If the number of lines == 1, the |
359 | * the end of line should be equal to | ||
360 | * the start of line. | ||
361 | */ | ||
362 | } else if (*tmp == '-') | ||
363 | lr->end = (int)strtoul(tmp + 1, &tmp, 0); | ||
84 | else | 364 | else |
85 | lr->end = 0; | 365 | lr->end = INT_MAX; |
86 | pr_debug("Line range is %u to %u\n", lr->start, lr->end); | 366 | pr_debug("Line range is %d to %d\n", lr->start, lr->end); |
87 | if (lr->end && lr->start > lr->end) | 367 | if (lr->start > lr->end) { |
88 | semantic_error("Start line must be smaller" | 368 | semantic_error("Start line must be smaller" |
89 | " than end line."); | 369 | " than end line.\n"); |
90 | if (*tmp != '\0') | 370 | return -EINVAL; |
91 | semantic_error("Tailing with invalid character '%d'.", | 371 | } |
372 | if (*tmp != '\0') { | ||
373 | semantic_error("Tailing with invalid character '%d'.\n", | ||
92 | *tmp); | 374 | *tmp); |
375 | return -EINVAL; | ||
376 | } | ||
93 | tmp = strndup(arg, (ptr - arg)); | 377 | tmp = strndup(arg, (ptr - arg)); |
94 | } else | 378 | } else { |
95 | tmp = strdup(arg); | 379 | tmp = strdup(arg); |
380 | lr->end = INT_MAX; | ||
381 | } | ||
382 | |||
383 | if (tmp == NULL) | ||
384 | return -ENOMEM; | ||
96 | 385 | ||
97 | if (strchr(tmp, '.')) | 386 | if (strchr(tmp, '.')) |
98 | lr->file = tmp; | 387 | lr->file = tmp; |
99 | else | 388 | else |
100 | lr->function = tmp; | 389 | lr->function = tmp; |
390 | |||
391 | return 0; | ||
101 | } | 392 | } |
102 | 393 | ||
103 | /* Check the name is good for event/group */ | 394 | /* Check the name is good for event/group */ |
@@ -113,8 +404,9 @@ static bool check_event_name(const char *name) | |||
113 | } | 404 | } |
114 | 405 | ||
115 | /* Parse probepoint definition. */ | 406 | /* Parse probepoint definition. */ |
116 | static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp) | 407 | static int parse_perf_probe_point(char *arg, struct perf_probe_event *pev) |
117 | { | 408 | { |
409 | struct perf_probe_point *pp = &pev->point; | ||
118 | char *ptr, *tmp; | 410 | char *ptr, *tmp; |
119 | char c, nc = 0; | 411 | char c, nc = 0; |
120 | /* | 412 | /* |
@@ -129,13 +421,19 @@ static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp) | |||
129 | if (ptr && *ptr == '=') { /* Event name */ | 421 | if (ptr && *ptr == '=') { /* Event name */ |
130 | *ptr = '\0'; | 422 | *ptr = '\0'; |
131 | tmp = ptr + 1; | 423 | tmp = ptr + 1; |
132 | ptr = strchr(arg, ':'); | 424 | if (strchr(arg, ':')) { |
133 | if (ptr) /* Group name is not supported yet. */ | 425 | semantic_error("Group name is not supported yet.\n"); |
134 | semantic_error("Group name is not supported yet."); | 426 | return -ENOTSUP; |
135 | if (!check_event_name(arg)) | 427 | } |
428 | if (!check_event_name(arg)) { | ||
136 | semantic_error("%s is bad for event name -it must " | 429 | semantic_error("%s is bad for event name -it must " |
137 | "follow C symbol-naming rule.", arg); | 430 | "follow C symbol-naming rule.\n", arg); |
138 | pp->event = strdup(arg); | 431 | return -EINVAL; |
432 | } | ||
433 | pev->event = strdup(arg); | ||
434 | if (pev->event == NULL) | ||
435 | return -ENOMEM; | ||
436 | pev->group = NULL; | ||
139 | arg = tmp; | 437 | arg = tmp; |
140 | } | 438 | } |
141 | 439 | ||
@@ -145,12 +443,15 @@ static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp) | |||
145 | *ptr++ = '\0'; | 443 | *ptr++ = '\0'; |
146 | } | 444 | } |
147 | 445 | ||
446 | tmp = strdup(arg); | ||
447 | if (tmp == NULL) | ||
448 | return -ENOMEM; | ||
449 | |||
148 | /* Check arg is function or file and copy it */ | 450 | /* Check arg is function or file and copy it */ |
149 | if (strchr(arg, '.')) /* File */ | 451 | if (strchr(tmp, '.')) /* File */ |
150 | pp->file = strdup(arg); | 452 | pp->file = tmp; |
151 | else /* Function */ | 453 | else /* Function */ |
152 | pp->function = strdup(arg); | 454 | pp->function = tmp; |
153 | DIE_IF(pp->file == NULL && pp->function == NULL); | ||
154 | 455 | ||
155 | /* Parse other options */ | 456 | /* Parse other options */ |
156 | while (ptr) { | 457 | while (ptr) { |
@@ -158,6 +459,8 @@ static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp) | |||
158 | c = nc; | 459 | c = nc; |
159 | if (c == ';') { /* Lazy pattern must be the last part */ | 460 | if (c == ';') { /* Lazy pattern must be the last part */ |
160 | pp->lazy_line = strdup(arg); | 461 | pp->lazy_line = strdup(arg); |
462 | if (pp->lazy_line == NULL) | ||
463 | return -ENOMEM; | ||
161 | break; | 464 | break; |
162 | } | 465 | } |
163 | ptr = strpbrk(arg, ";:+@%"); | 466 | ptr = strpbrk(arg, ";:+@%"); |
@@ -168,266 +471,658 @@ static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp) | |||
168 | switch (c) { | 471 | switch (c) { |
169 | case ':': /* Line number */ | 472 | case ':': /* Line number */ |
170 | pp->line = strtoul(arg, &tmp, 0); | 473 | pp->line = strtoul(arg, &tmp, 0); |
171 | if (*tmp != '\0') | 474 | if (*tmp != '\0') { |
172 | semantic_error("There is non-digit char" | 475 | semantic_error("There is non-digit char" |
173 | " in line number."); | 476 | " in line number.\n"); |
477 | return -EINVAL; | ||
478 | } | ||
174 | break; | 479 | break; |
175 | case '+': /* Byte offset from a symbol */ | 480 | case '+': /* Byte offset from a symbol */ |
176 | pp->offset = strtoul(arg, &tmp, 0); | 481 | pp->offset = strtoul(arg, &tmp, 0); |
177 | if (*tmp != '\0') | 482 | if (*tmp != '\0') { |
178 | semantic_error("There is non-digit character" | 483 | semantic_error("There is non-digit character" |
179 | " in offset."); | 484 | " in offset.\n"); |
485 | return -EINVAL; | ||
486 | } | ||
180 | break; | 487 | break; |
181 | case '@': /* File name */ | 488 | case '@': /* File name */ |
182 | if (pp->file) | 489 | if (pp->file) { |
183 | semantic_error("SRC@SRC is not allowed."); | 490 | semantic_error("SRC@SRC is not allowed.\n"); |
491 | return -EINVAL; | ||
492 | } | ||
184 | pp->file = strdup(arg); | 493 | pp->file = strdup(arg); |
185 | DIE_IF(pp->file == NULL); | 494 | if (pp->file == NULL) |
495 | return -ENOMEM; | ||
186 | break; | 496 | break; |
187 | case '%': /* Probe places */ | 497 | case '%': /* Probe places */ |
188 | if (strcmp(arg, "return") == 0) { | 498 | if (strcmp(arg, "return") == 0) { |
189 | pp->retprobe = 1; | 499 | pp->retprobe = 1; |
190 | } else /* Others not supported yet */ | 500 | } else { /* Others not supported yet */ |
191 | semantic_error("%%%s is not supported.", arg); | 501 | semantic_error("%%%s is not supported.\n", arg); |
502 | return -ENOTSUP; | ||
503 | } | ||
192 | break; | 504 | break; |
193 | default: | 505 | default: /* Buggy case */ |
194 | DIE_IF("Program has a bug."); | 506 | pr_err("This program has a bug at %s:%d.\n", |
507 | __FILE__, __LINE__); | ||
508 | return -ENOTSUP; | ||
195 | break; | 509 | break; |
196 | } | 510 | } |
197 | } | 511 | } |
198 | 512 | ||
199 | /* Exclusion check */ | 513 | /* Exclusion check */ |
200 | if (pp->lazy_line && pp->line) | 514 | if (pp->lazy_line && pp->line) { |
201 | semantic_error("Lazy pattern can't be used with line number."); | 515 | semantic_error("Lazy pattern can't be used with line number."); |
516 | return -EINVAL; | ||
517 | } | ||
202 | 518 | ||
203 | if (pp->lazy_line && pp->offset) | 519 | if (pp->lazy_line && pp->offset) { |
204 | semantic_error("Lazy pattern can't be used with offset."); | 520 | semantic_error("Lazy pattern can't be used with offset."); |
521 | return -EINVAL; | ||
522 | } | ||
205 | 523 | ||
206 | if (pp->line && pp->offset) | 524 | if (pp->line && pp->offset) { |
207 | semantic_error("Offset can't be used with line number."); | 525 | semantic_error("Offset can't be used with line number."); |
526 | return -EINVAL; | ||
527 | } | ||
208 | 528 | ||
209 | if (!pp->line && !pp->lazy_line && pp->file && !pp->function) | 529 | if (!pp->line && !pp->lazy_line && pp->file && !pp->function) { |
210 | semantic_error("File always requires line number or " | 530 | semantic_error("File always requires line number or " |
211 | "lazy pattern."); | 531 | "lazy pattern."); |
532 | return -EINVAL; | ||
533 | } | ||
212 | 534 | ||
213 | if (pp->offset && !pp->function) | 535 | if (pp->offset && !pp->function) { |
214 | semantic_error("Offset requires an entry function."); | 536 | semantic_error("Offset requires an entry function."); |
537 | return -EINVAL; | ||
538 | } | ||
215 | 539 | ||
216 | if (pp->retprobe && !pp->function) | 540 | if (pp->retprobe && !pp->function) { |
217 | semantic_error("Return probe requires an entry function."); | 541 | semantic_error("Return probe requires an entry function."); |
542 | return -EINVAL; | ||
543 | } | ||
218 | 544 | ||
219 | if ((pp->offset || pp->line || pp->lazy_line) && pp->retprobe) | 545 | if ((pp->offset || pp->line || pp->lazy_line) && pp->retprobe) { |
220 | semantic_error("Offset/Line/Lazy pattern can't be used with " | 546 | semantic_error("Offset/Line/Lazy pattern can't be used with " |
221 | "return probe."); | 547 | "return probe."); |
548 | return -EINVAL; | ||
549 | } | ||
222 | 550 | ||
223 | pr_debug("symbol:%s file:%s line:%d offset:%d return:%d lazy:%s\n", | 551 | pr_debug("symbol:%s file:%s line:%d offset:%lu return:%d lazy:%s\n", |
224 | pp->function, pp->file, pp->line, pp->offset, pp->retprobe, | 552 | pp->function, pp->file, pp->line, pp->offset, pp->retprobe, |
225 | pp->lazy_line); | 553 | pp->lazy_line); |
554 | return 0; | ||
226 | } | 555 | } |
227 | 556 | ||
228 | /* Parse perf-probe event definition */ | 557 | /* Parse perf-probe event argument */ |
229 | void parse_perf_probe_event(const char *str, struct probe_point *pp, | 558 | static int parse_perf_probe_arg(char *str, struct perf_probe_arg *arg) |
230 | bool *need_dwarf) | ||
231 | { | 559 | { |
232 | char **argv; | 560 | char *tmp; |
233 | int argc, i; | 561 | struct perf_probe_arg_field **fieldp; |
562 | |||
563 | pr_debug("parsing arg: %s into ", str); | ||
234 | 564 | ||
235 | *need_dwarf = false; | 565 | tmp = strchr(str, '='); |
566 | if (tmp) { | ||
567 | arg->name = strndup(str, tmp - str); | ||
568 | if (arg->name == NULL) | ||
569 | return -ENOMEM; | ||
570 | pr_debug("name:%s ", arg->name); | ||
571 | str = tmp + 1; | ||
572 | } | ||
236 | 573 | ||
237 | argv = argv_split(str, &argc); | 574 | tmp = strchr(str, ':'); |
238 | if (!argv) | 575 | if (tmp) { /* Type setting */ |
239 | die("argv_split failed."); | 576 | *tmp = '\0'; |
240 | if (argc > MAX_PROBE_ARGS + 1) | 577 | arg->type = strdup(tmp + 1); |
241 | semantic_error("Too many arguments"); | 578 | if (arg->type == NULL) |
579 | return -ENOMEM; | ||
580 | pr_debug("type:%s ", arg->type); | ||
581 | } | ||
242 | 582 | ||
583 | tmp = strpbrk(str, "-."); | ||
584 | if (!is_c_varname(str) || !tmp) { | ||
585 | /* A variable, register, symbol or special value */ | ||
586 | arg->var = strdup(str); | ||
587 | if (arg->var == NULL) | ||
588 | return -ENOMEM; | ||
589 | pr_debug("%s\n", arg->var); | ||
590 | return 0; | ||
591 | } | ||
592 | |||
593 | /* Structure fields */ | ||
594 | arg->var = strndup(str, tmp - str); | ||
595 | if (arg->var == NULL) | ||
596 | return -ENOMEM; | ||
597 | pr_debug("%s, ", arg->var); | ||
598 | fieldp = &arg->field; | ||
599 | |||
600 | do { | ||
601 | *fieldp = zalloc(sizeof(struct perf_probe_arg_field)); | ||
602 | if (*fieldp == NULL) | ||
603 | return -ENOMEM; | ||
604 | if (*tmp == '.') { | ||
605 | str = tmp + 1; | ||
606 | (*fieldp)->ref = false; | ||
607 | } else if (tmp[1] == '>') { | ||
608 | str = tmp + 2; | ||
609 | (*fieldp)->ref = true; | ||
610 | } else { | ||
611 | semantic_error("Argument parse error: %s\n", str); | ||
612 | return -EINVAL; | ||
613 | } | ||
614 | |||
615 | tmp = strpbrk(str, "-."); | ||
616 | if (tmp) { | ||
617 | (*fieldp)->name = strndup(str, tmp - str); | ||
618 | if ((*fieldp)->name == NULL) | ||
619 | return -ENOMEM; | ||
620 | pr_debug("%s(%d), ", (*fieldp)->name, (*fieldp)->ref); | ||
621 | fieldp = &(*fieldp)->next; | ||
622 | } | ||
623 | } while (tmp); | ||
624 | (*fieldp)->name = strdup(str); | ||
625 | if ((*fieldp)->name == NULL) | ||
626 | return -ENOMEM; | ||
627 | pr_debug("%s(%d)\n", (*fieldp)->name, (*fieldp)->ref); | ||
628 | |||
629 | /* If no name is specified, set the last field name */ | ||
630 | if (!arg->name) { | ||
631 | arg->name = strdup((*fieldp)->name); | ||
632 | if (arg->name == NULL) | ||
633 | return -ENOMEM; | ||
634 | } | ||
635 | return 0; | ||
636 | } | ||
637 | |||
638 | /* Parse perf-probe event command */ | ||
639 | int parse_perf_probe_command(const char *cmd, struct perf_probe_event *pev) | ||
640 | { | ||
641 | char **argv; | ||
642 | int argc, i, ret = 0; | ||
643 | |||
644 | argv = argv_split(cmd, &argc); | ||
645 | if (!argv) { | ||
646 | pr_debug("Failed to split arguments.\n"); | ||
647 | return -ENOMEM; | ||
648 | } | ||
649 | if (argc - 1 > MAX_PROBE_ARGS) { | ||
650 | semantic_error("Too many probe arguments (%d).\n", argc - 1); | ||
651 | ret = -ERANGE; | ||
652 | goto out; | ||
653 | } | ||
243 | /* Parse probe point */ | 654 | /* Parse probe point */ |
244 | parse_perf_probe_probepoint(argv[0], pp); | 655 | ret = parse_perf_probe_point(argv[0], pev); |
245 | if (pp->file || pp->line || pp->lazy_line) | 656 | if (ret < 0) |
246 | *need_dwarf = true; | 657 | goto out; |
247 | 658 | ||
248 | /* Copy arguments and ensure return probe has no C argument */ | 659 | /* Copy arguments and ensure return probe has no C argument */ |
249 | pp->nr_args = argc - 1; | 660 | pev->nargs = argc - 1; |
250 | pp->args = zalloc(sizeof(char *) * pp->nr_args); | 661 | pev->args = zalloc(sizeof(struct perf_probe_arg) * pev->nargs); |
251 | for (i = 0; i < pp->nr_args; i++) { | 662 | if (pev->args == NULL) { |
252 | pp->args[i] = strdup(argv[i + 1]); | 663 | ret = -ENOMEM; |
253 | if (!pp->args[i]) | 664 | goto out; |
254 | die("Failed to copy argument."); | 665 | } |
255 | if (is_c_varname(pp->args[i])) { | 666 | for (i = 0; i < pev->nargs && ret >= 0; i++) { |
256 | if (pp->retprobe) | 667 | ret = parse_perf_probe_arg(argv[i + 1], &pev->args[i]); |
257 | semantic_error("You can't specify local" | 668 | if (ret >= 0 && |
258 | " variable for kretprobe"); | 669 | is_c_varname(pev->args[i].var) && pev->point.retprobe) { |
259 | *need_dwarf = true; | 670 | semantic_error("You can't specify local variable for" |
671 | " kretprobe.\n"); | ||
672 | ret = -EINVAL; | ||
260 | } | 673 | } |
261 | } | 674 | } |
262 | 675 | out: | |
263 | argv_free(argv); | 676 | argv_free(argv); |
677 | |||
678 | return ret; | ||
679 | } | ||
680 | |||
681 | /* Return true if this perf_probe_event requires debuginfo */ | ||
682 | bool perf_probe_event_need_dwarf(struct perf_probe_event *pev) | ||
683 | { | ||
684 | int i; | ||
685 | |||
686 | if (pev->point.file || pev->point.line || pev->point.lazy_line) | ||
687 | return true; | ||
688 | |||
689 | for (i = 0; i < pev->nargs; i++) | ||
690 | if (is_c_varname(pev->args[i].var)) | ||
691 | return true; | ||
692 | |||
693 | return false; | ||
264 | } | 694 | } |
265 | 695 | ||
266 | /* Parse kprobe_events event into struct probe_point */ | 696 | /* Parse kprobe_events event into struct probe_point */ |
267 | void parse_trace_kprobe_event(const char *str, struct probe_point *pp) | 697 | int parse_kprobe_trace_command(const char *cmd, struct kprobe_trace_event *tev) |
268 | { | 698 | { |
699 | struct kprobe_trace_point *tp = &tev->point; | ||
269 | char pr; | 700 | char pr; |
270 | char *p; | 701 | char *p; |
271 | int ret, i, argc; | 702 | int ret, i, argc; |
272 | char **argv; | 703 | char **argv; |
273 | 704 | ||
274 | pr_debug("Parsing kprobe_events: %s\n", str); | 705 | pr_debug("Parsing kprobe_events: %s\n", cmd); |
275 | argv = argv_split(str, &argc); | 706 | argv = argv_split(cmd, &argc); |
276 | if (!argv) | 707 | if (!argv) { |
277 | die("argv_split failed."); | 708 | pr_debug("Failed to split arguments.\n"); |
278 | if (argc < 2) | 709 | return -ENOMEM; |
279 | semantic_error("Too less arguments."); | 710 | } |
711 | if (argc < 2) { | ||
712 | semantic_error("Too few probe arguments.\n"); | ||
713 | ret = -ERANGE; | ||
714 | goto out; | ||
715 | } | ||
280 | 716 | ||
281 | /* Scan event and group name. */ | 717 | /* Scan event and group name. */ |
282 | ret = sscanf(argv[0], "%c:%a[^/ \t]/%a[^ \t]", | 718 | ret = sscanf(argv[0], "%c:%a[^/ \t]/%a[^ \t]", |
283 | &pr, (float *)(void *)&pp->group, | 719 | &pr, (float *)(void *)&tev->group, |
284 | (float *)(void *)&pp->event); | 720 | (float *)(void *)&tev->event); |
285 | if (ret != 3) | 721 | if (ret != 3) { |
286 | semantic_error("Failed to parse event name: %s", argv[0]); | 722 | semantic_error("Failed to parse event name: %s\n", argv[0]); |
287 | pr_debug("Group:%s Event:%s probe:%c\n", pp->group, pp->event, pr); | 723 | ret = -EINVAL; |
724 | goto out; | ||
725 | } | ||
726 | pr_debug("Group:%s Event:%s probe:%c\n", tev->group, tev->event, pr); | ||
288 | 727 | ||
289 | pp->retprobe = (pr == 'r'); | 728 | tp->retprobe = (pr == 'r'); |
290 | 729 | ||
291 | /* Scan function name and offset */ | 730 | /* Scan function name and offset */ |
292 | ret = sscanf(argv[1], "%a[^+]+%d", (float *)(void *)&pp->function, | 731 | ret = sscanf(argv[1], "%a[^+]+%lu", (float *)(void *)&tp->symbol, |
293 | &pp->offset); | 732 | &tp->offset); |
294 | if (ret == 1) | 733 | if (ret == 1) |
295 | pp->offset = 0; | 734 | tp->offset = 0; |
296 | |||
297 | /* kprobe_events doesn't have this information */ | ||
298 | pp->line = 0; | ||
299 | pp->file = NULL; | ||
300 | 735 | ||
301 | pp->nr_args = argc - 2; | 736 | tev->nargs = argc - 2; |
302 | pp->args = zalloc(sizeof(char *) * pp->nr_args); | 737 | tev->args = zalloc(sizeof(struct kprobe_trace_arg) * tev->nargs); |
303 | for (i = 0; i < pp->nr_args; i++) { | 738 | if (tev->args == NULL) { |
739 | ret = -ENOMEM; | ||
740 | goto out; | ||
741 | } | ||
742 | for (i = 0; i < tev->nargs; i++) { | ||
304 | p = strchr(argv[i + 2], '='); | 743 | p = strchr(argv[i + 2], '='); |
305 | if (p) /* We don't need which register is assigned. */ | 744 | if (p) /* We don't need which register is assigned. */ |
306 | *p = '\0'; | 745 | *p++ = '\0'; |
307 | pp->args[i] = strdup(argv[i + 2]); | 746 | else |
308 | if (!pp->args[i]) | 747 | p = argv[i + 2]; |
309 | die("Failed to copy argument."); | 748 | tev->args[i].name = strdup(argv[i + 2]); |
749 | /* TODO: parse regs and offset */ | ||
750 | tev->args[i].value = strdup(p); | ||
751 | if (tev->args[i].name == NULL || tev->args[i].value == NULL) { | ||
752 | ret = -ENOMEM; | ||
753 | goto out; | ||
754 | } | ||
310 | } | 755 | } |
311 | 756 | ret = 0; | |
757 | out: | ||
312 | argv_free(argv); | 758 | argv_free(argv); |
759 | return ret; | ||
313 | } | 760 | } |
314 | 761 | ||
315 | /* Synthesize only probe point (not argument) */ | 762 | /* Compose only probe arg */ |
316 | int synthesize_perf_probe_point(struct probe_point *pp) | 763 | int synthesize_perf_probe_arg(struct perf_probe_arg *pa, char *buf, size_t len) |
317 | { | 764 | { |
318 | char *buf; | 765 | struct perf_probe_arg_field *field = pa->field; |
319 | char offs[64] = "", line[64] = ""; | ||
320 | int ret; | 766 | int ret; |
767 | char *tmp = buf; | ||
321 | 768 | ||
322 | pp->probes[0] = buf = zalloc(MAX_CMDLEN); | 769 | if (pa->name && pa->var) |
323 | pp->found = 1; | 770 | ret = e_snprintf(tmp, len, "%s=%s", pa->name, pa->var); |
324 | if (!buf) | 771 | else |
325 | die("Failed to allocate memory by zalloc."); | 772 | ret = e_snprintf(tmp, len, "%s", pa->name ? pa->name : pa->var); |
773 | if (ret <= 0) | ||
774 | goto error; | ||
775 | tmp += ret; | ||
776 | len -= ret; | ||
777 | |||
778 | while (field) { | ||
779 | ret = e_snprintf(tmp, len, "%s%s", field->ref ? "->" : ".", | ||
780 | field->name); | ||
781 | if (ret <= 0) | ||
782 | goto error; | ||
783 | tmp += ret; | ||
784 | len -= ret; | ||
785 | field = field->next; | ||
786 | } | ||
787 | |||
788 | if (pa->type) { | ||
789 | ret = e_snprintf(tmp, len, ":%s", pa->type); | ||
790 | if (ret <= 0) | ||
791 | goto error; | ||
792 | tmp += ret; | ||
793 | len -= ret; | ||
794 | } | ||
795 | |||
796 | return tmp - buf; | ||
797 | error: | ||
798 | pr_debug("Failed to synthesize perf probe argument: %s", | ||
799 | strerror(-ret)); | ||
800 | return ret; | ||
801 | } | ||
802 | |||
803 | /* Compose only probe point (not argument) */ | ||
804 | static char *synthesize_perf_probe_point(struct perf_probe_point *pp) | ||
805 | { | ||
806 | char *buf, *tmp; | ||
807 | char offs[32] = "", line[32] = "", file[32] = ""; | ||
808 | int ret, len; | ||
809 | |||
810 | buf = zalloc(MAX_CMDLEN); | ||
811 | if (buf == NULL) { | ||
812 | ret = -ENOMEM; | ||
813 | goto error; | ||
814 | } | ||
326 | if (pp->offset) { | 815 | if (pp->offset) { |
327 | ret = e_snprintf(offs, 64, "+%d", pp->offset); | 816 | ret = e_snprintf(offs, 32, "+%lu", pp->offset); |
328 | if (ret <= 0) | 817 | if (ret <= 0) |
329 | goto error; | 818 | goto error; |
330 | } | 819 | } |
331 | if (pp->line) { | 820 | if (pp->line) { |
332 | ret = e_snprintf(line, 64, ":%d", pp->line); | 821 | ret = e_snprintf(line, 32, ":%d", pp->line); |
822 | if (ret <= 0) | ||
823 | goto error; | ||
824 | } | ||
825 | if (pp->file) { | ||
826 | len = strlen(pp->file) - 31; | ||
827 | if (len < 0) | ||
828 | len = 0; | ||
829 | tmp = strchr(pp->file + len, '/'); | ||
830 | if (!tmp) | ||
831 | tmp = pp->file + len; | ||
832 | ret = e_snprintf(file, 32, "@%s", tmp + 1); | ||
333 | if (ret <= 0) | 833 | if (ret <= 0) |
334 | goto error; | 834 | goto error; |
335 | } | 835 | } |
336 | 836 | ||
337 | if (pp->function) | 837 | if (pp->function) |
338 | ret = e_snprintf(buf, MAX_CMDLEN, "%s%s%s%s", pp->function, | 838 | ret = e_snprintf(buf, MAX_CMDLEN, "%s%s%s%s%s", pp->function, |
339 | offs, pp->retprobe ? "%return" : "", line); | 839 | offs, pp->retprobe ? "%return" : "", line, |
840 | file); | ||
340 | else | 841 | else |
341 | ret = e_snprintf(buf, MAX_CMDLEN, "%s%s", pp->file, line); | 842 | ret = e_snprintf(buf, MAX_CMDLEN, "%s%s", file, line); |
342 | if (ret <= 0) { | 843 | if (ret <= 0) |
844 | goto error; | ||
845 | |||
846 | return buf; | ||
343 | error: | 847 | error: |
344 | free(pp->probes[0]); | 848 | pr_debug("Failed to synthesize perf probe point: %s", |
345 | pp->probes[0] = NULL; | 849 | strerror(-ret)); |
346 | pp->found = 0; | 850 | if (buf) |
347 | } | 851 | free(buf); |
348 | return ret; | 852 | return NULL; |
349 | } | 853 | } |
350 | 854 | ||
351 | int synthesize_perf_probe_event(struct probe_point *pp) | 855 | #if 0 |
856 | char *synthesize_perf_probe_command(struct perf_probe_event *pev) | ||
352 | { | 857 | { |
353 | char *buf; | 858 | char *buf; |
354 | int i, len, ret; | 859 | int i, len, ret; |
355 | 860 | ||
356 | len = synthesize_perf_probe_point(pp); | 861 | buf = synthesize_perf_probe_point(&pev->point); |
357 | if (len < 0) | 862 | if (!buf) |
358 | return 0; | 863 | return NULL; |
359 | 864 | ||
360 | buf = pp->probes[0]; | 865 | len = strlen(buf); |
361 | for (i = 0; i < pp->nr_args; i++) { | 866 | for (i = 0; i < pev->nargs; i++) { |
362 | ret = e_snprintf(&buf[len], MAX_CMDLEN - len, " %s", | 867 | ret = e_snprintf(&buf[len], MAX_CMDLEN - len, " %s", |
363 | pp->args[i]); | 868 | pev->args[i].name); |
364 | if (ret <= 0) | 869 | if (ret <= 0) { |
365 | goto error; | 870 | free(buf); |
871 | return NULL; | ||
872 | } | ||
366 | len += ret; | 873 | len += ret; |
367 | } | 874 | } |
368 | pp->found = 1; | ||
369 | 875 | ||
370 | return pp->found; | 876 | return buf; |
371 | error: | 877 | } |
372 | free(pp->probes[0]); | 878 | #endif |
373 | pp->probes[0] = NULL; | 879 | |
880 | static int __synthesize_kprobe_trace_arg_ref(struct kprobe_trace_arg_ref *ref, | ||
881 | char **buf, size_t *buflen, | ||
882 | int depth) | ||
883 | { | ||
884 | int ret; | ||
885 | if (ref->next) { | ||
886 | depth = __synthesize_kprobe_trace_arg_ref(ref->next, buf, | ||
887 | buflen, depth + 1); | ||
888 | if (depth < 0) | ||
889 | goto out; | ||
890 | } | ||
891 | |||
892 | ret = e_snprintf(*buf, *buflen, "%+ld(", ref->offset); | ||
893 | if (ret < 0) | ||
894 | depth = ret; | ||
895 | else { | ||
896 | *buf += ret; | ||
897 | *buflen -= ret; | ||
898 | } | ||
899 | out: | ||
900 | return depth; | ||
374 | 901 | ||
375 | return ret; | ||
376 | } | 902 | } |
377 | 903 | ||
378 | int synthesize_trace_kprobe_event(struct probe_point *pp) | 904 | static int synthesize_kprobe_trace_arg(struct kprobe_trace_arg *arg, |
905 | char *buf, size_t buflen) | ||
379 | { | 906 | { |
907 | int ret, depth = 0; | ||
908 | char *tmp = buf; | ||
909 | |||
910 | /* Argument name or separator */ | ||
911 | if (arg->name) | ||
912 | ret = e_snprintf(buf, buflen, " %s=", arg->name); | ||
913 | else | ||
914 | ret = e_snprintf(buf, buflen, " "); | ||
915 | if (ret < 0) | ||
916 | return ret; | ||
917 | buf += ret; | ||
918 | buflen -= ret; | ||
919 | |||
920 | /* Dereferencing arguments */ | ||
921 | if (arg->ref) { | ||
922 | depth = __synthesize_kprobe_trace_arg_ref(arg->ref, &buf, | ||
923 | &buflen, 1); | ||
924 | if (depth < 0) | ||
925 | return depth; | ||
926 | } | ||
927 | |||
928 | /* Print argument value */ | ||
929 | ret = e_snprintf(buf, buflen, "%s", arg->value); | ||
930 | if (ret < 0) | ||
931 | return ret; | ||
932 | buf += ret; | ||
933 | buflen -= ret; | ||
934 | |||
935 | /* Closing */ | ||
936 | while (depth--) { | ||
937 | ret = e_snprintf(buf, buflen, ")"); | ||
938 | if (ret < 0) | ||
939 | return ret; | ||
940 | buf += ret; | ||
941 | buflen -= ret; | ||
942 | } | ||
943 | /* Print argument type */ | ||
944 | if (arg->type) { | ||
945 | ret = e_snprintf(buf, buflen, ":%s", arg->type); | ||
946 | if (ret <= 0) | ||
947 | return ret; | ||
948 | buf += ret; | ||
949 | } | ||
950 | |||
951 | return buf - tmp; | ||
952 | } | ||
953 | |||
954 | char *synthesize_kprobe_trace_command(struct kprobe_trace_event *tev) | ||
955 | { | ||
956 | struct kprobe_trace_point *tp = &tev->point; | ||
380 | char *buf; | 957 | char *buf; |
381 | int i, len, ret; | 958 | int i, len, ret; |
382 | 959 | ||
383 | pp->probes[0] = buf = zalloc(MAX_CMDLEN); | 960 | buf = zalloc(MAX_CMDLEN); |
384 | if (!buf) | 961 | if (buf == NULL) |
385 | die("Failed to allocate memory by zalloc."); | 962 | return NULL; |
386 | ret = e_snprintf(buf, MAX_CMDLEN, "%s+%d", pp->function, pp->offset); | 963 | |
387 | if (ret <= 0) | 964 | len = e_snprintf(buf, MAX_CMDLEN, "%c:%s/%s %s+%lu", |
965 | tp->retprobe ? 'r' : 'p', | ||
966 | tev->group, tev->event, | ||
967 | tp->symbol, tp->offset); | ||
968 | if (len <= 0) | ||
388 | goto error; | 969 | goto error; |
389 | len = ret; | ||
390 | 970 | ||
391 | for (i = 0; i < pp->nr_args; i++) { | 971 | for (i = 0; i < tev->nargs; i++) { |
392 | ret = e_snprintf(&buf[len], MAX_CMDLEN - len, " %s", | 972 | ret = synthesize_kprobe_trace_arg(&tev->args[i], buf + len, |
393 | pp->args[i]); | 973 | MAX_CMDLEN - len); |
394 | if (ret <= 0) | 974 | if (ret <= 0) |
395 | goto error; | 975 | goto error; |
396 | len += ret; | 976 | len += ret; |
397 | } | 977 | } |
398 | pp->found = 1; | ||
399 | 978 | ||
400 | return pp->found; | 979 | return buf; |
401 | error: | 980 | error: |
402 | free(pp->probes[0]); | 981 | free(buf); |
403 | pp->probes[0] = NULL; | 982 | return NULL; |
983 | } | ||
984 | |||
985 | int convert_to_perf_probe_event(struct kprobe_trace_event *tev, | ||
986 | struct perf_probe_event *pev) | ||
987 | { | ||
988 | char buf[64] = ""; | ||
989 | int i, ret; | ||
990 | |||
991 | /* Convert event/group name */ | ||
992 | pev->event = strdup(tev->event); | ||
993 | pev->group = strdup(tev->group); | ||
994 | if (pev->event == NULL || pev->group == NULL) | ||
995 | return -ENOMEM; | ||
996 | |||
997 | /* Convert trace_point to probe_point */ | ||
998 | ret = convert_to_perf_probe_point(&tev->point, &pev->point); | ||
999 | if (ret < 0) | ||
1000 | return ret; | ||
1001 | |||
1002 | /* Convert trace_arg to probe_arg */ | ||
1003 | pev->nargs = tev->nargs; | ||
1004 | pev->args = zalloc(sizeof(struct perf_probe_arg) * pev->nargs); | ||
1005 | if (pev->args == NULL) | ||
1006 | return -ENOMEM; | ||
1007 | for (i = 0; i < tev->nargs && ret >= 0; i++) { | ||
1008 | if (tev->args[i].name) | ||
1009 | pev->args[i].name = strdup(tev->args[i].name); | ||
1010 | else { | ||
1011 | ret = synthesize_kprobe_trace_arg(&tev->args[i], | ||
1012 | buf, 64); | ||
1013 | pev->args[i].name = strdup(buf); | ||
1014 | } | ||
1015 | if (pev->args[i].name == NULL && ret >= 0) | ||
1016 | ret = -ENOMEM; | ||
1017 | } | ||
1018 | |||
1019 | if (ret < 0) | ||
1020 | clear_perf_probe_event(pev); | ||
404 | 1021 | ||
405 | return ret; | 1022 | return ret; |
406 | } | 1023 | } |
407 | 1024 | ||
408 | static int open_kprobe_events(int flags, int mode) | 1025 | void clear_perf_probe_event(struct perf_probe_event *pev) |
1026 | { | ||
1027 | struct perf_probe_point *pp = &pev->point; | ||
1028 | struct perf_probe_arg_field *field, *next; | ||
1029 | int i; | ||
1030 | |||
1031 | if (pev->event) | ||
1032 | free(pev->event); | ||
1033 | if (pev->group) | ||
1034 | free(pev->group); | ||
1035 | if (pp->file) | ||
1036 | free(pp->file); | ||
1037 | if (pp->function) | ||
1038 | free(pp->function); | ||
1039 | if (pp->lazy_line) | ||
1040 | free(pp->lazy_line); | ||
1041 | for (i = 0; i < pev->nargs; i++) { | ||
1042 | if (pev->args[i].name) | ||
1043 | free(pev->args[i].name); | ||
1044 | if (pev->args[i].var) | ||
1045 | free(pev->args[i].var); | ||
1046 | if (pev->args[i].type) | ||
1047 | free(pev->args[i].type); | ||
1048 | field = pev->args[i].field; | ||
1049 | while (field) { | ||
1050 | next = field->next; | ||
1051 | if (field->name) | ||
1052 | free(field->name); | ||
1053 | free(field); | ||
1054 | field = next; | ||
1055 | } | ||
1056 | } | ||
1057 | if (pev->args) | ||
1058 | free(pev->args); | ||
1059 | memset(pev, 0, sizeof(*pev)); | ||
1060 | } | ||
1061 | |||
1062 | void clear_kprobe_trace_event(struct kprobe_trace_event *tev) | ||
1063 | { | ||
1064 | struct kprobe_trace_arg_ref *ref, *next; | ||
1065 | int i; | ||
1066 | |||
1067 | if (tev->event) | ||
1068 | free(tev->event); | ||
1069 | if (tev->group) | ||
1070 | free(tev->group); | ||
1071 | if (tev->point.symbol) | ||
1072 | free(tev->point.symbol); | ||
1073 | for (i = 0; i < tev->nargs; i++) { | ||
1074 | if (tev->args[i].name) | ||
1075 | free(tev->args[i].name); | ||
1076 | if (tev->args[i].value) | ||
1077 | free(tev->args[i].value); | ||
1078 | if (tev->args[i].type) | ||
1079 | free(tev->args[i].type); | ||
1080 | ref = tev->args[i].ref; | ||
1081 | while (ref) { | ||
1082 | next = ref->next; | ||
1083 | free(ref); | ||
1084 | ref = next; | ||
1085 | } | ||
1086 | } | ||
1087 | if (tev->args) | ||
1088 | free(tev->args); | ||
1089 | memset(tev, 0, sizeof(*tev)); | ||
1090 | } | ||
1091 | |||
1092 | static int open_kprobe_events(bool readwrite) | ||
409 | { | 1093 | { |
410 | char buf[PATH_MAX]; | 1094 | char buf[PATH_MAX]; |
1095 | const char *__debugfs; | ||
411 | int ret; | 1096 | int ret; |
412 | 1097 | ||
413 | ret = e_snprintf(buf, PATH_MAX, "%s/../kprobe_events", debugfs_path); | 1098 | __debugfs = debugfs_find_mountpoint(); |
414 | if (ret < 0) | 1099 | if (__debugfs == NULL) { |
415 | die("Failed to make kprobe_events path."); | 1100 | pr_warning("Debugfs is not mounted.\n"); |
1101 | return -ENOENT; | ||
1102 | } | ||
1103 | |||
1104 | ret = e_snprintf(buf, PATH_MAX, "%stracing/kprobe_events", __debugfs); | ||
1105 | if (ret >= 0) { | ||
1106 | pr_debug("Opening %s write=%d\n", buf, readwrite); | ||
1107 | if (readwrite && !probe_event_dry_run) | ||
1108 | ret = open(buf, O_RDWR, O_APPEND); | ||
1109 | else | ||
1110 | ret = open(buf, O_RDONLY, 0); | ||
1111 | } | ||
416 | 1112 | ||
417 | ret = open(buf, flags, mode); | ||
418 | if (ret < 0) { | 1113 | if (ret < 0) { |
419 | if (errno == ENOENT) | 1114 | if (errno == ENOENT) |
420 | die("kprobe_events file does not exist -" | 1115 | pr_warning("kprobe_events file does not exist - please" |
421 | " please rebuild with CONFIG_KPROBE_EVENT."); | 1116 | " rebuild kernel with CONFIG_KPROBE_EVENT.\n"); |
422 | else | 1117 | else |
423 | die("Could not open kprobe_events file: %s", | 1118 | pr_warning("Failed to open kprobe_events file: %s\n", |
424 | strerror(errno)); | 1119 | strerror(errno)); |
425 | } | 1120 | } |
426 | return ret; | 1121 | return ret; |
427 | } | 1122 | } |
428 | 1123 | ||
429 | /* Get raw string list of current kprobe_events */ | 1124 | /* Get raw string list of current kprobe_events */ |
430 | static struct strlist *get_trace_kprobe_event_rawlist(int fd) | 1125 | static struct strlist *get_kprobe_trace_command_rawlist(int fd) |
431 | { | 1126 | { |
432 | int ret, idx; | 1127 | int ret, idx; |
433 | FILE *fp; | 1128 | FILE *fp; |
@@ -447,271 +1142,486 @@ static struct strlist *get_trace_kprobe_event_rawlist(int fd) | |||
447 | if (p[idx] == '\n') | 1142 | if (p[idx] == '\n') |
448 | p[idx] = '\0'; | 1143 | p[idx] = '\0'; |
449 | ret = strlist__add(sl, buf); | 1144 | ret = strlist__add(sl, buf); |
450 | if (ret < 0) | 1145 | if (ret < 0) { |
451 | die("strlist__add failed: %s", strerror(-ret)); | 1146 | pr_debug("strlist__add failed: %s\n", strerror(-ret)); |
1147 | strlist__delete(sl); | ||
1148 | return NULL; | ||
1149 | } | ||
452 | } | 1150 | } |
453 | fclose(fp); | 1151 | fclose(fp); |
454 | 1152 | ||
455 | return sl; | 1153 | return sl; |
456 | } | 1154 | } |
457 | 1155 | ||
458 | /* Free and zero clear probe_point */ | ||
459 | static void clear_probe_point(struct probe_point *pp) | ||
460 | { | ||
461 | int i; | ||
462 | |||
463 | if (pp->event) | ||
464 | free(pp->event); | ||
465 | if (pp->group) | ||
466 | free(pp->group); | ||
467 | if (pp->function) | ||
468 | free(pp->function); | ||
469 | if (pp->file) | ||
470 | free(pp->file); | ||
471 | if (pp->lazy_line) | ||
472 | free(pp->lazy_line); | ||
473 | for (i = 0; i < pp->nr_args; i++) | ||
474 | free(pp->args[i]); | ||
475 | if (pp->args) | ||
476 | free(pp->args); | ||
477 | for (i = 0; i < pp->found; i++) | ||
478 | free(pp->probes[i]); | ||
479 | memset(pp, 0, sizeof(*pp)); | ||
480 | } | ||
481 | |||
482 | /* Show an event */ | 1156 | /* Show an event */ |
483 | static void show_perf_probe_event(const char *event, const char *place, | 1157 | static int show_perf_probe_event(struct perf_probe_event *pev) |
484 | struct probe_point *pp) | ||
485 | { | 1158 | { |
486 | int i, ret; | 1159 | int i, ret; |
487 | char buf[128]; | 1160 | char buf[128]; |
1161 | char *place; | ||
1162 | |||
1163 | /* Synthesize only event probe point */ | ||
1164 | place = synthesize_perf_probe_point(&pev->point); | ||
1165 | if (!place) | ||
1166 | return -EINVAL; | ||
488 | 1167 | ||
489 | ret = e_snprintf(buf, 128, "%s:%s", pp->group, event); | 1168 | ret = e_snprintf(buf, 128, "%s:%s", pev->group, pev->event); |
490 | if (ret < 0) | 1169 | if (ret < 0) |
491 | die("Failed to copy event: %s", strerror(-ret)); | 1170 | return ret; |
492 | printf(" %-40s (on %s", buf, place); | 1171 | |
1172 | printf(" %-20s (on %s", buf, place); | ||
493 | 1173 | ||
494 | if (pp->nr_args > 0) { | 1174 | if (pev->nargs > 0) { |
495 | printf(" with"); | 1175 | printf(" with"); |
496 | for (i = 0; i < pp->nr_args; i++) | 1176 | for (i = 0; i < pev->nargs; i++) { |
497 | printf(" %s", pp->args[i]); | 1177 | ret = synthesize_perf_probe_arg(&pev->args[i], |
1178 | buf, 128); | ||
1179 | if (ret < 0) | ||
1180 | break; | ||
1181 | printf(" %s", buf); | ||
1182 | } | ||
498 | } | 1183 | } |
499 | printf(")\n"); | 1184 | printf(")\n"); |
1185 | free(place); | ||
1186 | return ret; | ||
500 | } | 1187 | } |
501 | 1188 | ||
502 | /* List up current perf-probe events */ | 1189 | /* List up current perf-probe events */ |
503 | void show_perf_probe_events(void) | 1190 | int show_perf_probe_events(void) |
504 | { | 1191 | { |
505 | int fd; | 1192 | int fd, ret; |
506 | struct probe_point pp; | 1193 | struct kprobe_trace_event tev; |
1194 | struct perf_probe_event pev; | ||
507 | struct strlist *rawlist; | 1195 | struct strlist *rawlist; |
508 | struct str_node *ent; | 1196 | struct str_node *ent; |
509 | 1197 | ||
510 | setup_pager(); | 1198 | setup_pager(); |
511 | memset(&pp, 0, sizeof(pp)); | 1199 | ret = init_vmlinux(); |
1200 | if (ret < 0) | ||
1201 | return ret; | ||
1202 | |||
1203 | memset(&tev, 0, sizeof(tev)); | ||
1204 | memset(&pev, 0, sizeof(pev)); | ||
512 | 1205 | ||
513 | fd = open_kprobe_events(O_RDONLY, 0); | 1206 | fd = open_kprobe_events(false); |
514 | rawlist = get_trace_kprobe_event_rawlist(fd); | 1207 | if (fd < 0) |
1208 | return fd; | ||
1209 | |||
1210 | rawlist = get_kprobe_trace_command_rawlist(fd); | ||
515 | close(fd); | 1211 | close(fd); |
1212 | if (!rawlist) | ||
1213 | return -ENOENT; | ||
516 | 1214 | ||
517 | strlist__for_each(ent, rawlist) { | 1215 | strlist__for_each(ent, rawlist) { |
518 | parse_trace_kprobe_event(ent->s, &pp); | 1216 | ret = parse_kprobe_trace_command(ent->s, &tev); |
519 | /* Synthesize only event probe point */ | 1217 | if (ret >= 0) { |
520 | synthesize_perf_probe_point(&pp); | 1218 | ret = convert_to_perf_probe_event(&tev, &pev); |
521 | /* Show an event */ | 1219 | if (ret >= 0) |
522 | show_perf_probe_event(pp.event, pp.probes[0], &pp); | 1220 | ret = show_perf_probe_event(&pev); |
523 | clear_probe_point(&pp); | 1221 | } |
1222 | clear_perf_probe_event(&pev); | ||
1223 | clear_kprobe_trace_event(&tev); | ||
1224 | if (ret < 0) | ||
1225 | break; | ||
524 | } | 1226 | } |
525 | |||
526 | strlist__delete(rawlist); | 1227 | strlist__delete(rawlist); |
1228 | |||
1229 | return ret; | ||
527 | } | 1230 | } |
528 | 1231 | ||
529 | /* Get current perf-probe event names */ | 1232 | /* Get current perf-probe event names */ |
530 | static struct strlist *get_perf_event_names(int fd, bool include_group) | 1233 | static struct strlist *get_kprobe_trace_event_names(int fd, bool include_group) |
531 | { | 1234 | { |
532 | char buf[128]; | 1235 | char buf[128]; |
533 | struct strlist *sl, *rawlist; | 1236 | struct strlist *sl, *rawlist; |
534 | struct str_node *ent; | 1237 | struct str_node *ent; |
535 | struct probe_point pp; | 1238 | struct kprobe_trace_event tev; |
1239 | int ret = 0; | ||
536 | 1240 | ||
537 | memset(&pp, 0, sizeof(pp)); | 1241 | memset(&tev, 0, sizeof(tev)); |
538 | rawlist = get_trace_kprobe_event_rawlist(fd); | ||
539 | 1242 | ||
1243 | rawlist = get_kprobe_trace_command_rawlist(fd); | ||
540 | sl = strlist__new(true, NULL); | 1244 | sl = strlist__new(true, NULL); |
541 | strlist__for_each(ent, rawlist) { | 1245 | strlist__for_each(ent, rawlist) { |
542 | parse_trace_kprobe_event(ent->s, &pp); | 1246 | ret = parse_kprobe_trace_command(ent->s, &tev); |
1247 | if (ret < 0) | ||
1248 | break; | ||
543 | if (include_group) { | 1249 | if (include_group) { |
544 | if (e_snprintf(buf, 128, "%s:%s", pp.group, | 1250 | ret = e_snprintf(buf, 128, "%s:%s", tev.group, |
545 | pp.event) < 0) | 1251 | tev.event); |
546 | die("Failed to copy group:event name."); | 1252 | if (ret >= 0) |
547 | strlist__add(sl, buf); | 1253 | ret = strlist__add(sl, buf); |
548 | } else | 1254 | } else |
549 | strlist__add(sl, pp.event); | 1255 | ret = strlist__add(sl, tev.event); |
550 | clear_probe_point(&pp); | 1256 | clear_kprobe_trace_event(&tev); |
1257 | if (ret < 0) | ||
1258 | break; | ||
551 | } | 1259 | } |
552 | |||
553 | strlist__delete(rawlist); | 1260 | strlist__delete(rawlist); |
554 | 1261 | ||
1262 | if (ret < 0) { | ||
1263 | strlist__delete(sl); | ||
1264 | return NULL; | ||
1265 | } | ||
555 | return sl; | 1266 | return sl; |
556 | } | 1267 | } |
557 | 1268 | ||
558 | static void write_trace_kprobe_event(int fd, const char *buf) | 1269 | static int write_kprobe_trace_event(int fd, struct kprobe_trace_event *tev) |
559 | { | 1270 | { |
560 | int ret; | 1271 | int ret = 0; |
1272 | char *buf = synthesize_kprobe_trace_command(tev); | ||
1273 | |||
1274 | if (!buf) { | ||
1275 | pr_debug("Failed to synthesize kprobe trace event.\n"); | ||
1276 | return -EINVAL; | ||
1277 | } | ||
561 | 1278 | ||
562 | pr_debug("Writing event: %s\n", buf); | 1279 | pr_debug("Writing event: %s\n", buf); |
563 | ret = write(fd, buf, strlen(buf)); | 1280 | if (!probe_event_dry_run) { |
564 | if (ret <= 0) | 1281 | ret = write(fd, buf, strlen(buf)); |
565 | die("Failed to write event: %s", strerror(errno)); | 1282 | if (ret <= 0) |
1283 | pr_warning("Failed to write event: %s\n", | ||
1284 | strerror(errno)); | ||
1285 | } | ||
1286 | free(buf); | ||
1287 | return ret; | ||
566 | } | 1288 | } |
567 | 1289 | ||
568 | static void get_new_event_name(char *buf, size_t len, const char *base, | 1290 | static int get_new_event_name(char *buf, size_t len, const char *base, |
569 | struct strlist *namelist, bool allow_suffix) | 1291 | struct strlist *namelist, bool allow_suffix) |
570 | { | 1292 | { |
571 | int i, ret; | 1293 | int i, ret; |
572 | 1294 | ||
573 | /* Try no suffix */ | 1295 | /* Try no suffix */ |
574 | ret = e_snprintf(buf, len, "%s", base); | 1296 | ret = e_snprintf(buf, len, "%s", base); |
575 | if (ret < 0) | 1297 | if (ret < 0) { |
576 | die("snprintf() failed: %s", strerror(-ret)); | 1298 | pr_debug("snprintf() failed: %s\n", strerror(-ret)); |
1299 | return ret; | ||
1300 | } | ||
577 | if (!strlist__has_entry(namelist, buf)) | 1301 | if (!strlist__has_entry(namelist, buf)) |
578 | return; | 1302 | return 0; |
579 | 1303 | ||
580 | if (!allow_suffix) { | 1304 | if (!allow_suffix) { |
581 | pr_warning("Error: event \"%s\" already exists. " | 1305 | pr_warning("Error: event \"%s\" already exists. " |
582 | "(Use -f to force duplicates.)\n", base); | 1306 | "(Use -f to force duplicates.)\n", base); |
583 | die("Can't add new event."); | 1307 | return -EEXIST; |
584 | } | 1308 | } |
585 | 1309 | ||
586 | /* Try to add suffix */ | 1310 | /* Try to add suffix */ |
587 | for (i = 1; i < MAX_EVENT_INDEX; i++) { | 1311 | for (i = 1; i < MAX_EVENT_INDEX; i++) { |
588 | ret = e_snprintf(buf, len, "%s_%d", base, i); | 1312 | ret = e_snprintf(buf, len, "%s_%d", base, i); |
589 | if (ret < 0) | 1313 | if (ret < 0) { |
590 | die("snprintf() failed: %s", strerror(-ret)); | 1314 | pr_debug("snprintf() failed: %s\n", strerror(-ret)); |
1315 | return ret; | ||
1316 | } | ||
591 | if (!strlist__has_entry(namelist, buf)) | 1317 | if (!strlist__has_entry(namelist, buf)) |
592 | break; | 1318 | break; |
593 | } | 1319 | } |
594 | if (i == MAX_EVENT_INDEX) | 1320 | if (i == MAX_EVENT_INDEX) { |
595 | die("Too many events are on the same function."); | 1321 | pr_warning("Too many events are on the same function.\n"); |
1322 | ret = -ERANGE; | ||
1323 | } | ||
1324 | |||
1325 | return ret; | ||
596 | } | 1326 | } |
597 | 1327 | ||
598 | void add_trace_kprobe_events(struct probe_point *probes, int nr_probes, | 1328 | static int __add_kprobe_trace_events(struct perf_probe_event *pev, |
599 | bool force_add) | 1329 | struct kprobe_trace_event *tevs, |
1330 | int ntevs, bool allow_suffix) | ||
600 | { | 1331 | { |
601 | int i, j, fd; | 1332 | int i, fd, ret; |
602 | struct probe_point *pp; | 1333 | struct kprobe_trace_event *tev = NULL; |
603 | char buf[MAX_CMDLEN]; | 1334 | char buf[64]; |
604 | char event[64]; | 1335 | const char *event, *group; |
605 | struct strlist *namelist; | 1336 | struct strlist *namelist; |
606 | bool allow_suffix; | ||
607 | 1337 | ||
608 | fd = open_kprobe_events(O_RDWR, O_APPEND); | 1338 | fd = open_kprobe_events(true); |
1339 | if (fd < 0) | ||
1340 | return fd; | ||
609 | /* Get current event names */ | 1341 | /* Get current event names */ |
610 | namelist = get_perf_event_names(fd, false); | 1342 | namelist = get_kprobe_trace_event_names(fd, false); |
611 | 1343 | if (!namelist) { | |
612 | for (j = 0; j < nr_probes; j++) { | 1344 | pr_debug("Failed to get current event list.\n"); |
613 | pp = probes + j; | 1345 | return -EIO; |
614 | if (!pp->event) | 1346 | } |
615 | pp->event = strdup(pp->function); | 1347 | |
616 | if (!pp->group) | 1348 | ret = 0; |
617 | pp->group = strdup(PERFPROBE_GROUP); | 1349 | printf("Add new event%s\n", (ntevs > 1) ? "s:" : ":"); |
618 | DIE_IF(!pp->event || !pp->group); | 1350 | for (i = 0; i < ntevs; i++) { |
619 | /* If force_add is true, suffix search is allowed */ | 1351 | tev = &tevs[i]; |
620 | allow_suffix = force_add; | 1352 | if (pev->event) |
621 | for (i = 0; i < pp->found; i++) { | 1353 | event = pev->event; |
622 | /* Get an unused new event name */ | 1354 | else |
623 | get_new_event_name(event, 64, pp->event, namelist, | 1355 | if (pev->point.function) |
624 | allow_suffix); | 1356 | event = pev->point.function; |
625 | snprintf(buf, MAX_CMDLEN, "%c:%s/%s %s\n", | 1357 | else |
626 | pp->retprobe ? 'r' : 'p', | 1358 | event = tev->point.symbol; |
627 | pp->group, event, | 1359 | if (pev->group) |
628 | pp->probes[i]); | 1360 | group = pev->group; |
629 | write_trace_kprobe_event(fd, buf); | 1361 | else |
630 | printf("Added new event:\n"); | 1362 | group = PERFPROBE_GROUP; |
631 | /* Get the first parameter (probe-point) */ | 1363 | |
632 | sscanf(pp->probes[i], "%s", buf); | 1364 | /* Get an unused new event name */ |
633 | show_perf_probe_event(event, buf, pp); | 1365 | ret = get_new_event_name(buf, 64, event, |
634 | /* Add added event name to namelist */ | 1366 | namelist, allow_suffix); |
635 | strlist__add(namelist, event); | 1367 | if (ret < 0) |
636 | /* | 1368 | break; |
637 | * Probes after the first probe which comes from same | 1369 | event = buf; |
638 | * user input are always allowed to add suffix, because | 1370 | |
639 | * there might be several addresses corresponding to | 1371 | tev->event = strdup(event); |
640 | * one code line. | 1372 | tev->group = strdup(group); |
641 | */ | 1373 | if (tev->event == NULL || tev->group == NULL) { |
642 | allow_suffix = true; | 1374 | ret = -ENOMEM; |
1375 | break; | ||
643 | } | 1376 | } |
1377 | ret = write_kprobe_trace_event(fd, tev); | ||
1378 | if (ret < 0) | ||
1379 | break; | ||
1380 | /* Add added event name to namelist */ | ||
1381 | strlist__add(namelist, event); | ||
1382 | |||
1383 | /* Trick here - save current event/group */ | ||
1384 | event = pev->event; | ||
1385 | group = pev->group; | ||
1386 | pev->event = tev->event; | ||
1387 | pev->group = tev->group; | ||
1388 | show_perf_probe_event(pev); | ||
1389 | /* Trick here - restore current event/group */ | ||
1390 | pev->event = (char *)event; | ||
1391 | pev->group = (char *)group; | ||
1392 | |||
1393 | /* | ||
1394 | * Probes after the first probe which comes from same | ||
1395 | * user input are always allowed to add suffix, because | ||
1396 | * there might be several addresses corresponding to | ||
1397 | * one code line. | ||
1398 | */ | ||
1399 | allow_suffix = true; | ||
1400 | } | ||
1401 | |||
1402 | if (ret >= 0) { | ||
1403 | /* Show how to use the event. */ | ||
1404 | printf("\nYou can now use it on all perf tools, such as:\n\n"); | ||
1405 | printf("\tperf record -e %s:%s -aR sleep 1\n\n", tev->group, | ||
1406 | tev->event); | ||
644 | } | 1407 | } |
645 | /* Show how to use the event. */ | ||
646 | printf("\nYou can now use it on all perf tools, such as:\n\n"); | ||
647 | printf("\tperf record -e %s:%s -a sleep 1\n\n", PERFPROBE_GROUP, event); | ||
648 | 1408 | ||
649 | strlist__delete(namelist); | 1409 | strlist__delete(namelist); |
650 | close(fd); | 1410 | close(fd); |
1411 | return ret; | ||
1412 | } | ||
1413 | |||
1414 | static int convert_to_kprobe_trace_events(struct perf_probe_event *pev, | ||
1415 | struct kprobe_trace_event **tevs, | ||
1416 | int max_tevs) | ||
1417 | { | ||
1418 | struct symbol *sym; | ||
1419 | int ret = 0, i; | ||
1420 | struct kprobe_trace_event *tev; | ||
1421 | |||
1422 | /* Convert perf_probe_event with debuginfo */ | ||
1423 | ret = try_to_find_kprobe_trace_events(pev, tevs, max_tevs); | ||
1424 | if (ret != 0) | ||
1425 | return ret; | ||
1426 | |||
1427 | /* Allocate trace event buffer */ | ||
1428 | tev = *tevs = zalloc(sizeof(struct kprobe_trace_event)); | ||
1429 | if (tev == NULL) | ||
1430 | return -ENOMEM; | ||
1431 | |||
1432 | /* Copy parameters */ | ||
1433 | tev->point.symbol = strdup(pev->point.function); | ||
1434 | if (tev->point.symbol == NULL) { | ||
1435 | ret = -ENOMEM; | ||
1436 | goto error; | ||
1437 | } | ||
1438 | tev->point.offset = pev->point.offset; | ||
1439 | tev->nargs = pev->nargs; | ||
1440 | if (tev->nargs) { | ||
1441 | tev->args = zalloc(sizeof(struct kprobe_trace_arg) | ||
1442 | * tev->nargs); | ||
1443 | if (tev->args == NULL) { | ||
1444 | ret = -ENOMEM; | ||
1445 | goto error; | ||
1446 | } | ||
1447 | for (i = 0; i < tev->nargs; i++) { | ||
1448 | if (pev->args[i].name) { | ||
1449 | tev->args[i].name = strdup(pev->args[i].name); | ||
1450 | if (tev->args[i].name == NULL) { | ||
1451 | ret = -ENOMEM; | ||
1452 | goto error; | ||
1453 | } | ||
1454 | } | ||
1455 | tev->args[i].value = strdup(pev->args[i].var); | ||
1456 | if (tev->args[i].value == NULL) { | ||
1457 | ret = -ENOMEM; | ||
1458 | goto error; | ||
1459 | } | ||
1460 | if (pev->args[i].type) { | ||
1461 | tev->args[i].type = strdup(pev->args[i].type); | ||
1462 | if (tev->args[i].type == NULL) { | ||
1463 | ret = -ENOMEM; | ||
1464 | goto error; | ||
1465 | } | ||
1466 | } | ||
1467 | } | ||
1468 | } | ||
1469 | |||
1470 | /* Currently just checking function name from symbol map */ | ||
1471 | sym = map__find_symbol_by_name(machine.vmlinux_maps[MAP__FUNCTION], | ||
1472 | tev->point.symbol, NULL); | ||
1473 | if (!sym) { | ||
1474 | pr_warning("Kernel symbol \'%s\' not found.\n", | ||
1475 | tev->point.symbol); | ||
1476 | ret = -ENOENT; | ||
1477 | goto error; | ||
1478 | } | ||
1479 | |||
1480 | return 1; | ||
1481 | error: | ||
1482 | clear_kprobe_trace_event(tev); | ||
1483 | free(tev); | ||
1484 | *tevs = NULL; | ||
1485 | return ret; | ||
1486 | } | ||
1487 | |||
1488 | struct __event_package { | ||
1489 | struct perf_probe_event *pev; | ||
1490 | struct kprobe_trace_event *tevs; | ||
1491 | int ntevs; | ||
1492 | }; | ||
1493 | |||
1494 | int add_perf_probe_events(struct perf_probe_event *pevs, int npevs, | ||
1495 | bool force_add, int max_tevs) | ||
1496 | { | ||
1497 | int i, j, ret; | ||
1498 | struct __event_package *pkgs; | ||
1499 | |||
1500 | pkgs = zalloc(sizeof(struct __event_package) * npevs); | ||
1501 | if (pkgs == NULL) | ||
1502 | return -ENOMEM; | ||
1503 | |||
1504 | /* Init vmlinux path */ | ||
1505 | ret = init_vmlinux(); | ||
1506 | if (ret < 0) | ||
1507 | return ret; | ||
1508 | |||
1509 | /* Loop 1: convert all events */ | ||
1510 | for (i = 0; i < npevs; i++) { | ||
1511 | pkgs[i].pev = &pevs[i]; | ||
1512 | /* Convert with or without debuginfo */ | ||
1513 | ret = convert_to_kprobe_trace_events(pkgs[i].pev, | ||
1514 | &pkgs[i].tevs, max_tevs); | ||
1515 | if (ret < 0) | ||
1516 | goto end; | ||
1517 | pkgs[i].ntevs = ret; | ||
1518 | } | ||
1519 | |||
1520 | /* Loop 2: add all events */ | ||
1521 | for (i = 0; i < npevs && ret >= 0; i++) | ||
1522 | ret = __add_kprobe_trace_events(pkgs[i].pev, pkgs[i].tevs, | ||
1523 | pkgs[i].ntevs, force_add); | ||
1524 | end: | ||
1525 | /* Loop 3: cleanup trace events */ | ||
1526 | for (i = 0; i < npevs; i++) | ||
1527 | for (j = 0; j < pkgs[i].ntevs; j++) | ||
1528 | clear_kprobe_trace_event(&pkgs[i].tevs[j]); | ||
1529 | |||
1530 | return ret; | ||
651 | } | 1531 | } |
652 | 1532 | ||
653 | static void __del_trace_kprobe_event(int fd, struct str_node *ent) | 1533 | static int __del_trace_kprobe_event(int fd, struct str_node *ent) |
654 | { | 1534 | { |
655 | char *p; | 1535 | char *p; |
656 | char buf[128]; | 1536 | char buf[128]; |
1537 | int ret; | ||
657 | 1538 | ||
658 | /* Convert from perf-probe event to trace-kprobe event */ | 1539 | /* Convert from perf-probe event to trace-kprobe event */ |
659 | if (e_snprintf(buf, 128, "-:%s", ent->s) < 0) | 1540 | ret = e_snprintf(buf, 128, "-:%s", ent->s); |
660 | die("Failed to copy event."); | 1541 | if (ret < 0) |
1542 | goto error; | ||
1543 | |||
661 | p = strchr(buf + 2, ':'); | 1544 | p = strchr(buf + 2, ':'); |
662 | if (!p) | 1545 | if (!p) { |
663 | die("Internal error: %s should have ':' but not.", ent->s); | 1546 | pr_debug("Internal error: %s should have ':' but not.\n", |
1547 | ent->s); | ||
1548 | ret = -ENOTSUP; | ||
1549 | goto error; | ||
1550 | } | ||
664 | *p = '/'; | 1551 | *p = '/'; |
665 | 1552 | ||
666 | write_trace_kprobe_event(fd, buf); | 1553 | pr_debug("Writing event: %s\n", buf); |
1554 | ret = write(fd, buf, strlen(buf)); | ||
1555 | if (ret < 0) | ||
1556 | goto error; | ||
1557 | |||
667 | printf("Remove event: %s\n", ent->s); | 1558 | printf("Remove event: %s\n", ent->s); |
1559 | return 0; | ||
1560 | error: | ||
1561 | pr_warning("Failed to delete event: %s\n", strerror(-ret)); | ||
1562 | return ret; | ||
668 | } | 1563 | } |
669 | 1564 | ||
670 | static void del_trace_kprobe_event(int fd, const char *group, | 1565 | static int del_trace_kprobe_event(int fd, const char *group, |
671 | const char *event, struct strlist *namelist) | 1566 | const char *event, struct strlist *namelist) |
672 | { | 1567 | { |
673 | char buf[128]; | 1568 | char buf[128]; |
674 | struct str_node *ent, *n; | 1569 | struct str_node *ent, *n; |
675 | int found = 0; | 1570 | int found = 0, ret = 0; |
676 | 1571 | ||
677 | if (e_snprintf(buf, 128, "%s:%s", group, event) < 0) | 1572 | ret = e_snprintf(buf, 128, "%s:%s", group, event); |
678 | die("Failed to copy event."); | 1573 | if (ret < 0) { |
1574 | pr_err("Failed to copy event."); | ||
1575 | return ret; | ||
1576 | } | ||
679 | 1577 | ||
680 | if (strpbrk(buf, "*?")) { /* Glob-exp */ | 1578 | if (strpbrk(buf, "*?")) { /* Glob-exp */ |
681 | strlist__for_each_safe(ent, n, namelist) | 1579 | strlist__for_each_safe(ent, n, namelist) |
682 | if (strglobmatch(ent->s, buf)) { | 1580 | if (strglobmatch(ent->s, buf)) { |
683 | found++; | 1581 | found++; |
684 | __del_trace_kprobe_event(fd, ent); | 1582 | ret = __del_trace_kprobe_event(fd, ent); |
1583 | if (ret < 0) | ||
1584 | break; | ||
685 | strlist__remove(namelist, ent); | 1585 | strlist__remove(namelist, ent); |
686 | } | 1586 | } |
687 | } else { | 1587 | } else { |
688 | ent = strlist__find(namelist, buf); | 1588 | ent = strlist__find(namelist, buf); |
689 | if (ent) { | 1589 | if (ent) { |
690 | found++; | 1590 | found++; |
691 | __del_trace_kprobe_event(fd, ent); | 1591 | ret = __del_trace_kprobe_event(fd, ent); |
692 | strlist__remove(namelist, ent); | 1592 | if (ret >= 0) |
1593 | strlist__remove(namelist, ent); | ||
693 | } | 1594 | } |
694 | } | 1595 | } |
695 | if (found == 0) | 1596 | if (found == 0 && ret >= 0) |
696 | pr_info("Info: event \"%s\" does not exist, could not remove it.\n", buf); | 1597 | pr_info("Info: Event \"%s\" does not exist.\n", buf); |
1598 | |||
1599 | return ret; | ||
697 | } | 1600 | } |
698 | 1601 | ||
699 | void del_trace_kprobe_events(struct strlist *dellist) | 1602 | int del_perf_probe_events(struct strlist *dellist) |
700 | { | 1603 | { |
701 | int fd; | 1604 | int fd, ret = 0; |
702 | const char *group, *event; | 1605 | const char *group, *event; |
703 | char *p, *str; | 1606 | char *p, *str; |
704 | struct str_node *ent; | 1607 | struct str_node *ent; |
705 | struct strlist *namelist; | 1608 | struct strlist *namelist; |
706 | 1609 | ||
707 | fd = open_kprobe_events(O_RDWR, O_APPEND); | 1610 | fd = open_kprobe_events(true); |
1611 | if (fd < 0) | ||
1612 | return fd; | ||
1613 | |||
708 | /* Get current event names */ | 1614 | /* Get current event names */ |
709 | namelist = get_perf_event_names(fd, true); | 1615 | namelist = get_kprobe_trace_event_names(fd, true); |
1616 | if (namelist == NULL) | ||
1617 | return -EINVAL; | ||
710 | 1618 | ||
711 | strlist__for_each(ent, dellist) { | 1619 | strlist__for_each(ent, dellist) { |
712 | str = strdup(ent->s); | 1620 | str = strdup(ent->s); |
713 | if (!str) | 1621 | if (str == NULL) { |
714 | die("Failed to copy event."); | 1622 | ret = -ENOMEM; |
1623 | break; | ||
1624 | } | ||
715 | pr_debug("Parsing: %s\n", str); | 1625 | pr_debug("Parsing: %s\n", str); |
716 | p = strchr(str, ':'); | 1626 | p = strchr(str, ':'); |
717 | if (p) { | 1627 | if (p) { |
@@ -723,80 +1633,14 @@ void del_trace_kprobe_events(struct strlist *dellist) | |||
723 | event = str; | 1633 | event = str; |
724 | } | 1634 | } |
725 | pr_debug("Group: %s, Event: %s\n", group, event); | 1635 | pr_debug("Group: %s, Event: %s\n", group, event); |
726 | del_trace_kprobe_event(fd, group, event, namelist); | 1636 | ret = del_trace_kprobe_event(fd, group, event, namelist); |
727 | free(str); | 1637 | free(str); |
1638 | if (ret < 0) | ||
1639 | break; | ||
728 | } | 1640 | } |
729 | strlist__delete(namelist); | 1641 | strlist__delete(namelist); |
730 | close(fd); | 1642 | close(fd); |
731 | } | ||
732 | 1643 | ||
733 | #define LINEBUF_SIZE 256 | 1644 | return ret; |
734 | #define NR_ADDITIONAL_LINES 2 | ||
735 | |||
736 | static void show_one_line(FILE *fp, unsigned int l, bool skip, bool show_num) | ||
737 | { | ||
738 | char buf[LINEBUF_SIZE]; | ||
739 | const char *color = PERF_COLOR_BLUE; | ||
740 | |||
741 | if (fgets(buf, LINEBUF_SIZE, fp) == NULL) | ||
742 | goto error; | ||
743 | if (!skip) { | ||
744 | if (show_num) | ||
745 | fprintf(stdout, "%7u %s", l, buf); | ||
746 | else | ||
747 | color_fprintf(stdout, color, " %s", buf); | ||
748 | } | ||
749 | |||
750 | while (strlen(buf) == LINEBUF_SIZE - 1 && | ||
751 | buf[LINEBUF_SIZE - 2] != '\n') { | ||
752 | if (fgets(buf, LINEBUF_SIZE, fp) == NULL) | ||
753 | goto error; | ||
754 | if (!skip) { | ||
755 | if (show_num) | ||
756 | fprintf(stdout, "%s", buf); | ||
757 | else | ||
758 | color_fprintf(stdout, color, "%s", buf); | ||
759 | } | ||
760 | } | ||
761 | return; | ||
762 | error: | ||
763 | if (feof(fp)) | ||
764 | die("Source file is shorter than expected."); | ||
765 | else | ||
766 | die("File read error: %s", strerror(errno)); | ||
767 | } | 1645 | } |
768 | 1646 | ||
769 | void show_line_range(struct line_range *lr) | ||
770 | { | ||
771 | unsigned int l = 1; | ||
772 | struct line_node *ln; | ||
773 | FILE *fp; | ||
774 | |||
775 | setup_pager(); | ||
776 | |||
777 | if (lr->function) | ||
778 | fprintf(stdout, "<%s:%d>\n", lr->function, | ||
779 | lr->start - lr->offset); | ||
780 | else | ||
781 | fprintf(stdout, "<%s:%d>\n", lr->file, lr->start); | ||
782 | |||
783 | fp = fopen(lr->path, "r"); | ||
784 | if (fp == NULL) | ||
785 | die("Failed to open %s: %s", lr->path, strerror(errno)); | ||
786 | /* Skip to starting line number */ | ||
787 | while (l < lr->start) | ||
788 | show_one_line(fp, l++, true, false); | ||
789 | |||
790 | list_for_each_entry(ln, &lr->line_list, list) { | ||
791 | while (ln->line > l) | ||
792 | show_one_line(fp, (l++) - lr->offset, false, false); | ||
793 | show_one_line(fp, (l++) - lr->offset, false, true); | ||
794 | } | ||
795 | |||
796 | if (lr->end == INT_MAX) | ||
797 | lr->end = l + NR_ADDITIONAL_LINES; | ||
798 | while (l < lr->end && !feof(fp)) | ||
799 | show_one_line(fp, (l++) - lr->offset, false, false); | ||
800 | |||
801 | fclose(fp); | ||
802 | } | ||
diff --git a/tools/perf/util/probe-event.h b/tools/perf/util/probe-event.h index 711287d4baea..e9db1a214ca4 100644 --- a/tools/perf/util/probe-event.h +++ b/tools/perf/util/probe-event.h | |||
@@ -2,21 +2,125 @@ | |||
2 | #define _PROBE_EVENT_H | 2 | #define _PROBE_EVENT_H |
3 | 3 | ||
4 | #include <stdbool.h> | 4 | #include <stdbool.h> |
5 | #include "probe-finder.h" | ||
6 | #include "strlist.h" | 5 | #include "strlist.h" |
7 | 6 | ||
8 | extern void parse_line_range_desc(const char *arg, struct line_range *lr); | 7 | extern bool probe_event_dry_run; |
9 | extern void parse_perf_probe_event(const char *str, struct probe_point *pp, | 8 | |
10 | bool *need_dwarf); | 9 | /* kprobe-tracer tracing point */ |
11 | extern int synthesize_perf_probe_point(struct probe_point *pp); | 10 | struct kprobe_trace_point { |
12 | extern int synthesize_perf_probe_event(struct probe_point *pp); | 11 | char *symbol; /* Base symbol */ |
13 | extern void parse_trace_kprobe_event(const char *str, struct probe_point *pp); | 12 | unsigned long offset; /* Offset from symbol */ |
14 | extern int synthesize_trace_kprobe_event(struct probe_point *pp); | 13 | bool retprobe; /* Return probe flag */ |
15 | extern void add_trace_kprobe_events(struct probe_point *probes, int nr_probes, | 14 | }; |
16 | bool force_add); | 15 | |
17 | extern void del_trace_kprobe_events(struct strlist *dellist); | 16 | /* kprobe-tracer tracing argument referencing offset */ |
18 | extern void show_perf_probe_events(void); | 17 | struct kprobe_trace_arg_ref { |
19 | extern void show_line_range(struct line_range *lr); | 18 | struct kprobe_trace_arg_ref *next; /* Next reference */ |
19 | long offset; /* Offset value */ | ||
20 | }; | ||
21 | |||
22 | /* kprobe-tracer tracing argument */ | ||
23 | struct kprobe_trace_arg { | ||
24 | char *name; /* Argument name */ | ||
25 | char *value; /* Base value */ | ||
26 | char *type; /* Type name */ | ||
27 | struct kprobe_trace_arg_ref *ref; /* Referencing offset */ | ||
28 | }; | ||
29 | |||
30 | /* kprobe-tracer tracing event (point + arg) */ | ||
31 | struct kprobe_trace_event { | ||
32 | char *event; /* Event name */ | ||
33 | char *group; /* Group name */ | ||
34 | struct kprobe_trace_point point; /* Trace point */ | ||
35 | int nargs; /* Number of args */ | ||
36 | struct kprobe_trace_arg *args; /* Arguments */ | ||
37 | }; | ||
38 | |||
39 | /* Perf probe probing point */ | ||
40 | struct perf_probe_point { | ||
41 | char *file; /* File path */ | ||
42 | char *function; /* Function name */ | ||
43 | int line; /* Line number */ | ||
44 | bool retprobe; /* Return probe flag */ | ||
45 | char *lazy_line; /* Lazy matching pattern */ | ||
46 | unsigned long offset; /* Offset from function entry */ | ||
47 | }; | ||
48 | |||
49 | /* Perf probe probing argument field chain */ | ||
50 | struct perf_probe_arg_field { | ||
51 | struct perf_probe_arg_field *next; /* Next field */ | ||
52 | char *name; /* Name of the field */ | ||
53 | bool ref; /* Referencing flag */ | ||
54 | }; | ||
55 | |||
56 | /* Perf probe probing argument */ | ||
57 | struct perf_probe_arg { | ||
58 | char *name; /* Argument name */ | ||
59 | char *var; /* Variable name */ | ||
60 | char *type; /* Type name */ | ||
61 | struct perf_probe_arg_field *field; /* Structure fields */ | ||
62 | }; | ||
63 | |||
64 | /* Perf probe probing event (point + arg) */ | ||
65 | struct perf_probe_event { | ||
66 | char *event; /* Event name */ | ||
67 | char *group; /* Group name */ | ||
68 | struct perf_probe_point point; /* Probe point */ | ||
69 | int nargs; /* Number of arguments */ | ||
70 | struct perf_probe_arg *args; /* Arguments */ | ||
71 | }; | ||
72 | |||
73 | |||
74 | /* Line number container */ | ||
75 | struct line_node { | ||
76 | struct list_head list; | ||
77 | int line; | ||
78 | }; | ||
79 | |||
80 | /* Line range */ | ||
81 | struct line_range { | ||
82 | char *file; /* File name */ | ||
83 | char *function; /* Function name */ | ||
84 | int start; /* Start line number */ | ||
85 | int end; /* End line number */ | ||
86 | int offset; /* Start line offset */ | ||
87 | char *path; /* Real path name */ | ||
88 | struct list_head line_list; /* Visible lines */ | ||
89 | }; | ||
90 | |||
91 | /* Command string to events */ | ||
92 | extern int parse_perf_probe_command(const char *cmd, | ||
93 | struct perf_probe_event *pev); | ||
94 | extern int parse_kprobe_trace_command(const char *cmd, | ||
95 | struct kprobe_trace_event *tev); | ||
96 | |||
97 | /* Events to command string */ | ||
98 | extern char *synthesize_perf_probe_command(struct perf_probe_event *pev); | ||
99 | extern char *synthesize_kprobe_trace_command(struct kprobe_trace_event *tev); | ||
100 | extern int synthesize_perf_probe_arg(struct perf_probe_arg *pa, char *buf, | ||
101 | size_t len); | ||
102 | |||
103 | /* Check the perf_probe_event needs debuginfo */ | ||
104 | extern bool perf_probe_event_need_dwarf(struct perf_probe_event *pev); | ||
105 | |||
106 | /* Convert from kprobe_trace_event to perf_probe_event */ | ||
107 | extern int convert_to_perf_probe_event(struct kprobe_trace_event *tev, | ||
108 | struct perf_probe_event *pev); | ||
109 | |||
110 | /* Release event contents */ | ||
111 | extern void clear_perf_probe_event(struct perf_probe_event *pev); | ||
112 | extern void clear_kprobe_trace_event(struct kprobe_trace_event *tev); | ||
113 | |||
114 | /* Command string to line-range */ | ||
115 | extern int parse_line_range_desc(const char *cmd, struct line_range *lr); | ||
116 | |||
117 | |||
118 | extern int add_perf_probe_events(struct perf_probe_event *pevs, int npevs, | ||
119 | bool force_add, int max_probe_points); | ||
120 | extern int del_perf_probe_events(struct strlist *dellist); | ||
121 | extern int show_perf_probe_events(void); | ||
122 | extern int show_line_range(struct line_range *lr); | ||
123 | |||
20 | 124 | ||
21 | /* Maximum index number of event-name postfix */ | 125 | /* Maximum index number of event-name postfix */ |
22 | #define MAX_EVENT_INDEX 1024 | 126 | #define MAX_EVENT_INDEX 1024 |
diff --git a/tools/perf/util/probe-finder.c b/tools/perf/util/probe-finder.c index c171a243d05b..562b1443e785 100644 --- a/tools/perf/util/probe-finder.c +++ b/tools/perf/util/probe-finder.c | |||
@@ -31,6 +31,7 @@ | |||
31 | #include <string.h> | 31 | #include <string.h> |
32 | #include <stdarg.h> | 32 | #include <stdarg.h> |
33 | #include <ctype.h> | 33 | #include <ctype.h> |
34 | #include <dwarf-regs.h> | ||
34 | 35 | ||
35 | #include "string.h" | 36 | #include "string.h" |
36 | #include "event.h" | 37 | #include "event.h" |
@@ -38,57 +39,8 @@ | |||
38 | #include "util.h" | 39 | #include "util.h" |
39 | #include "probe-finder.h" | 40 | #include "probe-finder.h" |
40 | 41 | ||
41 | 42 | /* Kprobe tracer basic type is up to u64 */ | |
42 | /* | 43 | #define MAX_BASIC_TYPE_BITS 64 |
43 | * Generic dwarf analysis helpers | ||
44 | */ | ||
45 | |||
46 | #define X86_32_MAX_REGS 8 | ||
47 | const char *x86_32_regs_table[X86_32_MAX_REGS] = { | ||
48 | "%ax", | ||
49 | "%cx", | ||
50 | "%dx", | ||
51 | "%bx", | ||
52 | "$stack", /* Stack address instead of %sp */ | ||
53 | "%bp", | ||
54 | "%si", | ||
55 | "%di", | ||
56 | }; | ||
57 | |||
58 | #define X86_64_MAX_REGS 16 | ||
59 | const char *x86_64_regs_table[X86_64_MAX_REGS] = { | ||
60 | "%ax", | ||
61 | "%dx", | ||
62 | "%cx", | ||
63 | "%bx", | ||
64 | "%si", | ||
65 | "%di", | ||
66 | "%bp", | ||
67 | "%sp", | ||
68 | "%r8", | ||
69 | "%r9", | ||
70 | "%r10", | ||
71 | "%r11", | ||
72 | "%r12", | ||
73 | "%r13", | ||
74 | "%r14", | ||
75 | "%r15", | ||
76 | }; | ||
77 | |||
78 | /* TODO: switching by dwarf address size */ | ||
79 | #ifdef __x86_64__ | ||
80 | #define ARCH_MAX_REGS X86_64_MAX_REGS | ||
81 | #define arch_regs_table x86_64_regs_table | ||
82 | #else | ||
83 | #define ARCH_MAX_REGS X86_32_MAX_REGS | ||
84 | #define arch_regs_table x86_32_regs_table | ||
85 | #endif | ||
86 | |||
87 | /* Return architecture dependent register string (for kprobe-tracer) */ | ||
88 | static const char *get_arch_regstr(unsigned int n) | ||
89 | { | ||
90 | return (n <= ARCH_MAX_REGS) ? arch_regs_table[n] : NULL; | ||
91 | } | ||
92 | 44 | ||
93 | /* | 45 | /* |
94 | * Compare the tail of two strings. | 46 | * Compare the tail of two strings. |
@@ -108,7 +60,7 @@ static int strtailcmp(const char *s1, const char *s2) | |||
108 | /* Line number list operations */ | 60 | /* Line number list operations */ |
109 | 61 | ||
110 | /* Add a line to line number list */ | 62 | /* Add a line to line number list */ |
111 | static void line_list__add_line(struct list_head *head, unsigned int line) | 63 | static int line_list__add_line(struct list_head *head, int line) |
112 | { | 64 | { |
113 | struct line_node *ln; | 65 | struct line_node *ln; |
114 | struct list_head *p; | 66 | struct list_head *p; |
@@ -119,21 +71,23 @@ static void line_list__add_line(struct list_head *head, unsigned int line) | |||
119 | p = &ln->list; | 71 | p = &ln->list; |
120 | goto found; | 72 | goto found; |
121 | } else if (ln->line == line) /* Already exist */ | 73 | } else if (ln->line == line) /* Already exist */ |
122 | return ; | 74 | return 1; |
123 | } | 75 | } |
124 | /* List is empty, or the smallest entry */ | 76 | /* List is empty, or the smallest entry */ |
125 | p = head; | 77 | p = head; |
126 | found: | 78 | found: |
127 | pr_debug("line list: add a line %u\n", line); | 79 | pr_debug("line list: add a line %u\n", line); |
128 | ln = zalloc(sizeof(struct line_node)); | 80 | ln = zalloc(sizeof(struct line_node)); |
129 | DIE_IF(ln == NULL); | 81 | if (ln == NULL) |
82 | return -ENOMEM; | ||
130 | ln->line = line; | 83 | ln->line = line; |
131 | INIT_LIST_HEAD(&ln->list); | 84 | INIT_LIST_HEAD(&ln->list); |
132 | list_add(&ln->list, p); | 85 | list_add(&ln->list, p); |
86 | return 0; | ||
133 | } | 87 | } |
134 | 88 | ||
135 | /* Check if the line in line number list */ | 89 | /* Check if the line in line number list */ |
136 | static int line_list__has_line(struct list_head *head, unsigned int line) | 90 | static int line_list__has_line(struct list_head *head, int line) |
137 | { | 91 | { |
138 | struct line_node *ln; | 92 | struct line_node *ln; |
139 | 93 | ||
@@ -184,9 +138,129 @@ static const char *cu_find_realpath(Dwarf_Die *cu_die, const char *fname) | |||
184 | if (strtailcmp(src, fname) == 0) | 138 | if (strtailcmp(src, fname) == 0) |
185 | break; | 139 | break; |
186 | } | 140 | } |
141 | if (i == nfiles) | ||
142 | return NULL; | ||
187 | return src; | 143 | return src; |
188 | } | 144 | } |
189 | 145 | ||
146 | /* Compare diename and tname */ | ||
147 | static bool die_compare_name(Dwarf_Die *dw_die, const char *tname) | ||
148 | { | ||
149 | const char *name; | ||
150 | name = dwarf_diename(dw_die); | ||
151 | return name ? strcmp(tname, name) : -1; | ||
152 | } | ||
153 | |||
154 | /* Get type die, but skip qualifiers and typedef */ | ||
155 | static Dwarf_Die *die_get_real_type(Dwarf_Die *vr_die, Dwarf_Die *die_mem) | ||
156 | { | ||
157 | Dwarf_Attribute attr; | ||
158 | int tag; | ||
159 | |||
160 | do { | ||
161 | if (dwarf_attr(vr_die, DW_AT_type, &attr) == NULL || | ||
162 | dwarf_formref_die(&attr, die_mem) == NULL) | ||
163 | return NULL; | ||
164 | |||
165 | tag = dwarf_tag(die_mem); | ||
166 | vr_die = die_mem; | ||
167 | } while (tag == DW_TAG_const_type || | ||
168 | tag == DW_TAG_restrict_type || | ||
169 | tag == DW_TAG_volatile_type || | ||
170 | tag == DW_TAG_shared_type || | ||
171 | tag == DW_TAG_typedef); | ||
172 | |||
173 | return die_mem; | ||
174 | } | ||
175 | |||
176 | static bool die_is_signed_type(Dwarf_Die *tp_die) | ||
177 | { | ||
178 | Dwarf_Attribute attr; | ||
179 | Dwarf_Word ret; | ||
180 | |||
181 | if (dwarf_attr(tp_die, DW_AT_encoding, &attr) == NULL || | ||
182 | dwarf_formudata(&attr, &ret) != 0) | ||
183 | return false; | ||
184 | |||
185 | return (ret == DW_ATE_signed_char || ret == DW_ATE_signed || | ||
186 | ret == DW_ATE_signed_fixed); | ||
187 | } | ||
188 | |||
189 | static int die_get_byte_size(Dwarf_Die *tp_die) | ||
190 | { | ||
191 | Dwarf_Attribute attr; | ||
192 | Dwarf_Word ret; | ||
193 | |||
194 | if (dwarf_attr(tp_die, DW_AT_byte_size, &attr) == NULL || | ||
195 | dwarf_formudata(&attr, &ret) != 0) | ||
196 | return 0; | ||
197 | |||
198 | return (int)ret; | ||
199 | } | ||
200 | |||
201 | /* Get data_member_location offset */ | ||
202 | static int die_get_data_member_location(Dwarf_Die *mb_die, Dwarf_Word *offs) | ||
203 | { | ||
204 | Dwarf_Attribute attr; | ||
205 | Dwarf_Op *expr; | ||
206 | size_t nexpr; | ||
207 | int ret; | ||
208 | |||
209 | if (dwarf_attr(mb_die, DW_AT_data_member_location, &attr) == NULL) | ||
210 | return -ENOENT; | ||
211 | |||
212 | if (dwarf_formudata(&attr, offs) != 0) { | ||
213 | /* DW_AT_data_member_location should be DW_OP_plus_uconst */ | ||
214 | ret = dwarf_getlocation(&attr, &expr, &nexpr); | ||
215 | if (ret < 0 || nexpr == 0) | ||
216 | return -ENOENT; | ||
217 | |||
218 | if (expr[0].atom != DW_OP_plus_uconst || nexpr != 1) { | ||
219 | pr_debug("Unable to get offset:Unexpected OP %x (%zd)\n", | ||
220 | expr[0].atom, nexpr); | ||
221 | return -ENOTSUP; | ||
222 | } | ||
223 | *offs = (Dwarf_Word)expr[0].number; | ||
224 | } | ||
225 | return 0; | ||
226 | } | ||
227 | |||
228 | /* Return values for die_find callbacks */ | ||
229 | enum { | ||
230 | DIE_FIND_CB_FOUND = 0, /* End of Search */ | ||
231 | DIE_FIND_CB_CHILD = 1, /* Search only children */ | ||
232 | DIE_FIND_CB_SIBLING = 2, /* Search only siblings */ | ||
233 | DIE_FIND_CB_CONTINUE = 3, /* Search children and siblings */ | ||
234 | }; | ||
235 | |||
236 | /* Search a child die */ | ||
237 | static Dwarf_Die *die_find_child(Dwarf_Die *rt_die, | ||
238 | int (*callback)(Dwarf_Die *, void *), | ||
239 | void *data, Dwarf_Die *die_mem) | ||
240 | { | ||
241 | Dwarf_Die child_die; | ||
242 | int ret; | ||
243 | |||
244 | ret = dwarf_child(rt_die, die_mem); | ||
245 | if (ret != 0) | ||
246 | return NULL; | ||
247 | |||
248 | do { | ||
249 | ret = callback(die_mem, data); | ||
250 | if (ret == DIE_FIND_CB_FOUND) | ||
251 | return die_mem; | ||
252 | |||
253 | if ((ret & DIE_FIND_CB_CHILD) && | ||
254 | die_find_child(die_mem, callback, data, &child_die)) { | ||
255 | memcpy(die_mem, &child_die, sizeof(Dwarf_Die)); | ||
256 | return die_mem; | ||
257 | } | ||
258 | } while ((ret & DIE_FIND_CB_SIBLING) && | ||
259 | dwarf_siblingof(die_mem, die_mem) == 0); | ||
260 | |||
261 | return NULL; | ||
262 | } | ||
263 | |||
190 | struct __addr_die_search_param { | 264 | struct __addr_die_search_param { |
191 | Dwarf_Addr addr; | 265 | Dwarf_Addr addr; |
192 | Dwarf_Die *die_mem; | 266 | Dwarf_Die *die_mem; |
@@ -205,8 +279,8 @@ static int __die_search_func_cb(Dwarf_Die *fn_die, void *data) | |||
205 | } | 279 | } |
206 | 280 | ||
207 | /* Search a real subprogram including this line, */ | 281 | /* Search a real subprogram including this line, */ |
208 | static Dwarf_Die *die_get_real_subprogram(Dwarf_Die *cu_die, Dwarf_Addr addr, | 282 | static Dwarf_Die *die_find_real_subprogram(Dwarf_Die *cu_die, Dwarf_Addr addr, |
209 | Dwarf_Die *die_mem) | 283 | Dwarf_Die *die_mem) |
210 | { | 284 | { |
211 | struct __addr_die_search_param ad; | 285 | struct __addr_die_search_param ad; |
212 | ad.addr = addr; | 286 | ad.addr = addr; |
@@ -218,77 +292,64 @@ static Dwarf_Die *die_get_real_subprogram(Dwarf_Die *cu_die, Dwarf_Addr addr, | |||
218 | return die_mem; | 292 | return die_mem; |
219 | } | 293 | } |
220 | 294 | ||
221 | /* Similar to dwarf_getfuncs, but returns inlined_subroutine if exists. */ | 295 | /* die_find callback for inline function search */ |
222 | static Dwarf_Die *die_get_inlinefunc(Dwarf_Die *sp_die, Dwarf_Addr addr, | 296 | static int __die_find_inline_cb(Dwarf_Die *die_mem, void *data) |
223 | Dwarf_Die *die_mem) | ||
224 | { | 297 | { |
225 | Dwarf_Die child_die; | 298 | Dwarf_Addr *addr = data; |
226 | int ret; | ||
227 | 299 | ||
228 | ret = dwarf_child(sp_die, die_mem); | 300 | if (dwarf_tag(die_mem) == DW_TAG_inlined_subroutine && |
229 | if (ret != 0) | 301 | dwarf_haspc(die_mem, *addr)) |
230 | return NULL; | 302 | return DIE_FIND_CB_FOUND; |
231 | 303 | ||
232 | do { | 304 | return DIE_FIND_CB_CONTINUE; |
233 | if (dwarf_tag(die_mem) == DW_TAG_inlined_subroutine && | ||
234 | dwarf_haspc(die_mem, addr)) | ||
235 | return die_mem; | ||
236 | |||
237 | if (die_get_inlinefunc(die_mem, addr, &child_die)) { | ||
238 | memcpy(die_mem, &child_die, sizeof(Dwarf_Die)); | ||
239 | return die_mem; | ||
240 | } | ||
241 | } while (dwarf_siblingof(die_mem, die_mem) == 0); | ||
242 | |||
243 | return NULL; | ||
244 | } | 305 | } |
245 | 306 | ||
246 | /* Compare diename and tname */ | 307 | /* Similar to dwarf_getfuncs, but returns inlined_subroutine if exists. */ |
247 | static bool die_compare_name(Dwarf_Die *dw_die, const char *tname) | 308 | static Dwarf_Die *die_find_inlinefunc(Dwarf_Die *sp_die, Dwarf_Addr addr, |
309 | Dwarf_Die *die_mem) | ||
248 | { | 310 | { |
249 | const char *name; | 311 | return die_find_child(sp_die, __die_find_inline_cb, &addr, die_mem); |
250 | name = dwarf_diename(dw_die); | ||
251 | DIE_IF(name == NULL); | ||
252 | return strcmp(tname, name); | ||
253 | } | 312 | } |
254 | 313 | ||
255 | /* Get entry pc(or low pc, 1st entry of ranges) of the die */ | 314 | static int __die_find_variable_cb(Dwarf_Die *die_mem, void *data) |
256 | static Dwarf_Addr die_get_entrypc(Dwarf_Die *dw_die) | ||
257 | { | 315 | { |
258 | Dwarf_Addr epc; | 316 | const char *name = data; |
259 | int ret; | 317 | int tag; |
260 | 318 | ||
261 | ret = dwarf_entrypc(dw_die, &epc); | 319 | tag = dwarf_tag(die_mem); |
262 | DIE_IF(ret == -1); | 320 | if ((tag == DW_TAG_formal_parameter || |
263 | return epc; | 321 | tag == DW_TAG_variable) && |
322 | (die_compare_name(die_mem, name) == 0)) | ||
323 | return DIE_FIND_CB_FOUND; | ||
324 | |||
325 | return DIE_FIND_CB_CONTINUE; | ||
264 | } | 326 | } |
265 | 327 | ||
266 | /* Get a variable die */ | 328 | /* Find a variable called 'name' */ |
267 | static Dwarf_Die *die_find_variable(Dwarf_Die *sp_die, const char *name, | 329 | static Dwarf_Die *die_find_variable(Dwarf_Die *sp_die, const char *name, |
268 | Dwarf_Die *die_mem) | 330 | Dwarf_Die *die_mem) |
269 | { | 331 | { |
270 | Dwarf_Die child_die; | 332 | return die_find_child(sp_die, __die_find_variable_cb, (void *)name, |
271 | int tag; | 333 | die_mem); |
272 | int ret; | 334 | } |
273 | 335 | ||
274 | ret = dwarf_child(sp_die, die_mem); | 336 | static int __die_find_member_cb(Dwarf_Die *die_mem, void *data) |
275 | if (ret != 0) | 337 | { |
276 | return NULL; | 338 | const char *name = data; |
277 | 339 | ||
278 | do { | 340 | if ((dwarf_tag(die_mem) == DW_TAG_member) && |
279 | tag = dwarf_tag(die_mem); | 341 | (die_compare_name(die_mem, name) == 0)) |
280 | if ((tag == DW_TAG_formal_parameter || | 342 | return DIE_FIND_CB_FOUND; |
281 | tag == DW_TAG_variable) && | ||
282 | (die_compare_name(die_mem, name) == 0)) | ||
283 | return die_mem; | ||
284 | 343 | ||
285 | if (die_find_variable(die_mem, name, &child_die)) { | 344 | return DIE_FIND_CB_SIBLING; |
286 | memcpy(die_mem, &child_die, sizeof(Dwarf_Die)); | 345 | } |
287 | return die_mem; | ||
288 | } | ||
289 | } while (dwarf_siblingof(die_mem, die_mem) == 0); | ||
290 | 346 | ||
291 | return NULL; | 347 | /* Find a member called 'name' */ |
348 | static Dwarf_Die *die_find_member(Dwarf_Die *st_die, const char *name, | ||
349 | Dwarf_Die *die_mem) | ||
350 | { | ||
351 | return die_find_child(st_die, __die_find_member_cb, (void *)name, | ||
352 | die_mem); | ||
292 | } | 353 | } |
293 | 354 | ||
294 | /* | 355 | /* |
@@ -296,19 +357,22 @@ static Dwarf_Die *die_find_variable(Dwarf_Die *sp_die, const char *name, | |||
296 | */ | 357 | */ |
297 | 358 | ||
298 | /* Show a location */ | 359 | /* Show a location */ |
299 | static void show_location(Dwarf_Op *op, struct probe_finder *pf) | 360 | static int convert_location(Dwarf_Op *op, struct probe_finder *pf) |
300 | { | 361 | { |
301 | unsigned int regn; | 362 | unsigned int regn; |
302 | Dwarf_Word offs = 0; | 363 | Dwarf_Word offs = 0; |
303 | int deref = 0, ret; | 364 | bool ref = false; |
304 | const char *regs; | 365 | const char *regs; |
366 | struct kprobe_trace_arg *tvar = pf->tvar; | ||
305 | 367 | ||
306 | /* TODO: support CFA */ | ||
307 | /* If this is based on frame buffer, set the offset */ | 368 | /* If this is based on frame buffer, set the offset */ |
308 | if (op->atom == DW_OP_fbreg) { | 369 | if (op->atom == DW_OP_fbreg) { |
309 | if (pf->fb_ops == NULL) | 370 | if (pf->fb_ops == NULL) { |
310 | die("The attribute of frame base is not supported.\n"); | 371 | pr_warning("The attribute of frame base is not " |
311 | deref = 1; | 372 | "supported.\n"); |
373 | return -ENOTSUP; | ||
374 | } | ||
375 | ref = true; | ||
312 | offs = op->number; | 376 | offs = op->number; |
313 | op = &pf->fb_ops[0]; | 377 | op = &pf->fb_ops[0]; |
314 | } | 378 | } |
@@ -316,35 +380,164 @@ static void show_location(Dwarf_Op *op, struct probe_finder *pf) | |||
316 | if (op->atom >= DW_OP_breg0 && op->atom <= DW_OP_breg31) { | 380 | if (op->atom >= DW_OP_breg0 && op->atom <= DW_OP_breg31) { |
317 | regn = op->atom - DW_OP_breg0; | 381 | regn = op->atom - DW_OP_breg0; |
318 | offs += op->number; | 382 | offs += op->number; |
319 | deref = 1; | 383 | ref = true; |
320 | } else if (op->atom >= DW_OP_reg0 && op->atom <= DW_OP_reg31) { | 384 | } else if (op->atom >= DW_OP_reg0 && op->atom <= DW_OP_reg31) { |
321 | regn = op->atom - DW_OP_reg0; | 385 | regn = op->atom - DW_OP_reg0; |
322 | } else if (op->atom == DW_OP_bregx) { | 386 | } else if (op->atom == DW_OP_bregx) { |
323 | regn = op->number; | 387 | regn = op->number; |
324 | offs += op->number2; | 388 | offs += op->number2; |
325 | deref = 1; | 389 | ref = true; |
326 | } else if (op->atom == DW_OP_regx) { | 390 | } else if (op->atom == DW_OP_regx) { |
327 | regn = op->number; | 391 | regn = op->number; |
328 | } else | 392 | } else { |
329 | die("DW_OP %d is not supported.", op->atom); | 393 | pr_warning("DW_OP %x is not supported.\n", op->atom); |
394 | return -ENOTSUP; | ||
395 | } | ||
330 | 396 | ||
331 | regs = get_arch_regstr(regn); | 397 | regs = get_arch_regstr(regn); |
332 | if (!regs) | 398 | if (!regs) { |
333 | die("%u exceeds max register number.", regn); | 399 | pr_warning("Mapping for DWARF register number %u missing on this architecture.", regn); |
400 | return -ERANGE; | ||
401 | } | ||
402 | |||
403 | tvar->value = strdup(regs); | ||
404 | if (tvar->value == NULL) | ||
405 | return -ENOMEM; | ||
406 | |||
407 | if (ref) { | ||
408 | tvar->ref = zalloc(sizeof(struct kprobe_trace_arg_ref)); | ||
409 | if (tvar->ref == NULL) | ||
410 | return -ENOMEM; | ||
411 | tvar->ref->offset = (long)offs; | ||
412 | } | ||
413 | return 0; | ||
414 | } | ||
415 | |||
416 | static int convert_variable_type(Dwarf_Die *vr_die, | ||
417 | struct kprobe_trace_arg *targ) | ||
418 | { | ||
419 | Dwarf_Die type; | ||
420 | char buf[16]; | ||
421 | int ret; | ||
422 | |||
423 | if (die_get_real_type(vr_die, &type) == NULL) { | ||
424 | pr_warning("Failed to get a type information of %s.\n", | ||
425 | dwarf_diename(vr_die)); | ||
426 | return -ENOENT; | ||
427 | } | ||
428 | |||
429 | ret = die_get_byte_size(&type) * 8; | ||
430 | if (ret) { | ||
431 | /* Check the bitwidth */ | ||
432 | if (ret > MAX_BASIC_TYPE_BITS) { | ||
433 | pr_info("%s exceeds max-bitwidth." | ||
434 | " Cut down to %d bits.\n", | ||
435 | dwarf_diename(&type), MAX_BASIC_TYPE_BITS); | ||
436 | ret = MAX_BASIC_TYPE_BITS; | ||
437 | } | ||
438 | |||
439 | ret = snprintf(buf, 16, "%c%d", | ||
440 | die_is_signed_type(&type) ? 's' : 'u', ret); | ||
441 | if (ret < 0 || ret >= 16) { | ||
442 | if (ret >= 16) | ||
443 | ret = -E2BIG; | ||
444 | pr_warning("Failed to convert variable type: %s\n", | ||
445 | strerror(-ret)); | ||
446 | return ret; | ||
447 | } | ||
448 | targ->type = strdup(buf); | ||
449 | if (targ->type == NULL) | ||
450 | return -ENOMEM; | ||
451 | } | ||
452 | return 0; | ||
453 | } | ||
454 | |||
455 | static int convert_variable_fields(Dwarf_Die *vr_die, const char *varname, | ||
456 | struct perf_probe_arg_field *field, | ||
457 | struct kprobe_trace_arg_ref **ref_ptr, | ||
458 | Dwarf_Die *die_mem) | ||
459 | { | ||
460 | struct kprobe_trace_arg_ref *ref = *ref_ptr; | ||
461 | Dwarf_Die type; | ||
462 | Dwarf_Word offs; | ||
463 | int ret; | ||
464 | |||
465 | pr_debug("converting %s in %s\n", field->name, varname); | ||
466 | if (die_get_real_type(vr_die, &type) == NULL) { | ||
467 | pr_warning("Failed to get the type of %s.\n", varname); | ||
468 | return -ENOENT; | ||
469 | } | ||
470 | |||
471 | /* Check the pointer and dereference */ | ||
472 | if (dwarf_tag(&type) == DW_TAG_pointer_type) { | ||
473 | if (!field->ref) { | ||
474 | pr_err("Semantic error: %s must be referred by '->'\n", | ||
475 | field->name); | ||
476 | return -EINVAL; | ||
477 | } | ||
478 | /* Get the type pointed by this pointer */ | ||
479 | if (die_get_real_type(&type, &type) == NULL) { | ||
480 | pr_warning("Failed to get the type of %s.\n", varname); | ||
481 | return -ENOENT; | ||
482 | } | ||
483 | /* Verify it is a data structure */ | ||
484 | if (dwarf_tag(&type) != DW_TAG_structure_type) { | ||
485 | pr_warning("%s is not a data structure.\n", varname); | ||
486 | return -EINVAL; | ||
487 | } | ||
488 | |||
489 | ref = zalloc(sizeof(struct kprobe_trace_arg_ref)); | ||
490 | if (ref == NULL) | ||
491 | return -ENOMEM; | ||
492 | if (*ref_ptr) | ||
493 | (*ref_ptr)->next = ref; | ||
494 | else | ||
495 | *ref_ptr = ref; | ||
496 | } else { | ||
497 | /* Verify it is a data structure */ | ||
498 | if (dwarf_tag(&type) != DW_TAG_structure_type) { | ||
499 | pr_warning("%s is not a data structure.\n", varname); | ||
500 | return -EINVAL; | ||
501 | } | ||
502 | if (field->ref) { | ||
503 | pr_err("Semantic error: %s must be referred by '.'\n", | ||
504 | field->name); | ||
505 | return -EINVAL; | ||
506 | } | ||
507 | if (!ref) { | ||
508 | pr_warning("Structure on a register is not " | ||
509 | "supported yet.\n"); | ||
510 | return -ENOTSUP; | ||
511 | } | ||
512 | } | ||
513 | |||
514 | if (die_find_member(&type, field->name, die_mem) == NULL) { | ||
515 | pr_warning("%s(tyep:%s) has no member %s.\n", varname, | ||
516 | dwarf_diename(&type), field->name); | ||
517 | return -EINVAL; | ||
518 | } | ||
334 | 519 | ||
335 | if (deref) | 520 | /* Get the offset of the field */ |
336 | ret = snprintf(pf->buf, pf->len, " %s=%+jd(%s)", | 521 | ret = die_get_data_member_location(die_mem, &offs); |
337 | pf->var, (intmax_t)offs, regs); | 522 | if (ret < 0) { |
523 | pr_warning("Failed to get the offset of %s.\n", field->name); | ||
524 | return ret; | ||
525 | } | ||
526 | ref->offset += (long)offs; | ||
527 | |||
528 | /* Converting next field */ | ||
529 | if (field->next) | ||
530 | return convert_variable_fields(die_mem, field->name, | ||
531 | field->next, &ref, die_mem); | ||
338 | else | 532 | else |
339 | ret = snprintf(pf->buf, pf->len, " %s=%s", pf->var, regs); | 533 | return 0; |
340 | DIE_IF(ret < 0); | ||
341 | DIE_IF(ret >= pf->len); | ||
342 | } | 534 | } |
343 | 535 | ||
344 | /* Show a variables in kprobe event format */ | 536 | /* Show a variables in kprobe event format */ |
345 | static void show_variable(Dwarf_Die *vr_die, struct probe_finder *pf) | 537 | static int convert_variable(Dwarf_Die *vr_die, struct probe_finder *pf) |
346 | { | 538 | { |
347 | Dwarf_Attribute attr; | 539 | Dwarf_Attribute attr; |
540 | Dwarf_Die die_mem; | ||
348 | Dwarf_Op *expr; | 541 | Dwarf_Op *expr; |
349 | size_t nexpr; | 542 | size_t nexpr; |
350 | int ret; | 543 | int ret; |
@@ -356,142 +549,191 @@ static void show_variable(Dwarf_Die *vr_die, struct probe_finder *pf) | |||
356 | if (ret <= 0 || nexpr == 0) | 549 | if (ret <= 0 || nexpr == 0) |
357 | goto error; | 550 | goto error; |
358 | 551 | ||
359 | show_location(expr, pf); | 552 | ret = convert_location(expr, pf); |
553 | if (ret == 0 && pf->pvar->field) { | ||
554 | ret = convert_variable_fields(vr_die, pf->pvar->var, | ||
555 | pf->pvar->field, &pf->tvar->ref, | ||
556 | &die_mem); | ||
557 | vr_die = &die_mem; | ||
558 | } | ||
559 | if (ret == 0) { | ||
560 | if (pf->pvar->type) { | ||
561 | pf->tvar->type = strdup(pf->pvar->type); | ||
562 | if (pf->tvar->type == NULL) | ||
563 | ret = -ENOMEM; | ||
564 | } else | ||
565 | ret = convert_variable_type(vr_die, pf->tvar); | ||
566 | } | ||
360 | /* *expr will be cached in libdw. Don't free it. */ | 567 | /* *expr will be cached in libdw. Don't free it. */ |
361 | return ; | 568 | return ret; |
362 | error: | 569 | error: |
363 | /* TODO: Support const_value */ | 570 | /* TODO: Support const_value */ |
364 | die("Failed to find the location of %s at this address.\n" | 571 | pr_err("Failed to find the location of %s at this address.\n" |
365 | " Perhaps, it has been optimized out.", pf->var); | 572 | " Perhaps, it has been optimized out.\n", pf->pvar->var); |
573 | return -ENOENT; | ||
366 | } | 574 | } |
367 | 575 | ||
368 | /* Find a variable in a subprogram die */ | 576 | /* Find a variable in a subprogram die */ |
369 | static void find_variable(Dwarf_Die *sp_die, struct probe_finder *pf) | 577 | static int find_variable(Dwarf_Die *sp_die, struct probe_finder *pf) |
370 | { | 578 | { |
371 | int ret; | ||
372 | Dwarf_Die vr_die; | 579 | Dwarf_Die vr_die; |
580 | char buf[32], *ptr; | ||
581 | int ret; | ||
373 | 582 | ||
374 | /* TODO: Support struct members and arrays */ | 583 | /* TODO: Support arrays */ |
375 | if (!is_c_varname(pf->var)) { | 584 | if (pf->pvar->name) |
376 | /* Output raw parameters */ | 585 | pf->tvar->name = strdup(pf->pvar->name); |
377 | ret = snprintf(pf->buf, pf->len, " %s", pf->var); | 586 | else { |
378 | DIE_IF(ret < 0); | 587 | ret = synthesize_perf_probe_arg(pf->pvar, buf, 32); |
379 | DIE_IF(ret >= pf->len); | 588 | if (ret < 0) |
380 | return ; | 589 | return ret; |
590 | ptr = strchr(buf, ':'); /* Change type separator to _ */ | ||
591 | if (ptr) | ||
592 | *ptr = '_'; | ||
593 | pf->tvar->name = strdup(buf); | ||
594 | } | ||
595 | if (pf->tvar->name == NULL) | ||
596 | return -ENOMEM; | ||
597 | |||
598 | if (!is_c_varname(pf->pvar->var)) { | ||
599 | /* Copy raw parameters */ | ||
600 | pf->tvar->value = strdup(pf->pvar->var); | ||
601 | if (pf->tvar->value == NULL) | ||
602 | return -ENOMEM; | ||
603 | else | ||
604 | return 0; | ||
381 | } | 605 | } |
382 | 606 | ||
383 | pr_debug("Searching '%s' variable in context.\n", pf->var); | 607 | pr_debug("Searching '%s' variable in context.\n", |
608 | pf->pvar->var); | ||
384 | /* Search child die for local variables and parameters. */ | 609 | /* Search child die for local variables and parameters. */ |
385 | if (!die_find_variable(sp_die, pf->var, &vr_die)) | 610 | if (!die_find_variable(sp_die, pf->pvar->var, &vr_die)) { |
386 | die("Failed to find '%s' in this function.", pf->var); | 611 | pr_warning("Failed to find '%s' in this function.\n", |
387 | 612 | pf->pvar->var); | |
388 | show_variable(&vr_die, pf); | 613 | return -ENOENT; |
614 | } | ||
615 | return convert_variable(&vr_die, pf); | ||
389 | } | 616 | } |
390 | 617 | ||
391 | /* Show a probe point to output buffer */ | 618 | /* Show a probe point to output buffer */ |
392 | static void show_probe_point(Dwarf_Die *sp_die, struct probe_finder *pf) | 619 | static int convert_probe_point(Dwarf_Die *sp_die, struct probe_finder *pf) |
393 | { | 620 | { |
394 | struct probe_point *pp = pf->pp; | 621 | struct kprobe_trace_event *tev; |
395 | Dwarf_Addr eaddr; | 622 | Dwarf_Addr eaddr; |
396 | Dwarf_Die die_mem; | 623 | Dwarf_Die die_mem; |
397 | const char *name; | 624 | const char *name; |
398 | char tmp[MAX_PROBE_BUFFER]; | 625 | int ret, i; |
399 | int ret, i, len; | ||
400 | Dwarf_Attribute fb_attr; | 626 | Dwarf_Attribute fb_attr; |
401 | size_t nops; | 627 | size_t nops; |
402 | 628 | ||
629 | if (pf->ntevs == pf->max_tevs) { | ||
630 | pr_warning("Too many( > %d) probe point found.\n", | ||
631 | pf->max_tevs); | ||
632 | return -ERANGE; | ||
633 | } | ||
634 | tev = &pf->tevs[pf->ntevs++]; | ||
635 | |||
403 | /* If no real subprogram, find a real one */ | 636 | /* If no real subprogram, find a real one */ |
404 | if (!sp_die || dwarf_tag(sp_die) != DW_TAG_subprogram) { | 637 | if (!sp_die || dwarf_tag(sp_die) != DW_TAG_subprogram) { |
405 | sp_die = die_get_real_subprogram(&pf->cu_die, | 638 | sp_die = die_find_real_subprogram(&pf->cu_die, |
406 | pf->addr, &die_mem); | 639 | pf->addr, &die_mem); |
407 | if (!sp_die) | 640 | if (!sp_die) { |
408 | die("Probe point is not found in subprograms."); | 641 | pr_warning("Failed to find probe point in any " |
642 | "functions.\n"); | ||
643 | return -ENOENT; | ||
644 | } | ||
409 | } | 645 | } |
410 | 646 | ||
411 | /* Output name of probe point */ | 647 | /* Copy the name of probe point */ |
412 | name = dwarf_diename(sp_die); | 648 | name = dwarf_diename(sp_die); |
413 | if (name) { | 649 | if (name) { |
414 | dwarf_entrypc(sp_die, &eaddr); | 650 | if (dwarf_entrypc(sp_die, &eaddr) != 0) { |
415 | ret = snprintf(tmp, MAX_PROBE_BUFFER, "%s+%lu", name, | 651 | pr_warning("Failed to get entry pc of %s\n", |
416 | (unsigned long)(pf->addr - eaddr)); | 652 | dwarf_diename(sp_die)); |
417 | /* Copy the function name if possible */ | 653 | return -ENOENT; |
418 | if (!pp->function) { | ||
419 | pp->function = strdup(name); | ||
420 | pp->offset = (size_t)(pf->addr - eaddr); | ||
421 | } | 654 | } |
422 | } else { | 655 | tev->point.symbol = strdup(name); |
656 | if (tev->point.symbol == NULL) | ||
657 | return -ENOMEM; | ||
658 | tev->point.offset = (unsigned long)(pf->addr - eaddr); | ||
659 | } else | ||
423 | /* This function has no name. */ | 660 | /* This function has no name. */ |
424 | ret = snprintf(tmp, MAX_PROBE_BUFFER, "0x%jx", | 661 | tev->point.offset = (unsigned long)pf->addr; |
425 | (uintmax_t)pf->addr); | 662 | |
426 | if (!pp->function) { | 663 | pr_debug("Probe point found: %s+%lu\n", tev->point.symbol, |
427 | /* TODO: Use _stext */ | 664 | tev->point.offset); |
428 | pp->function = strdup(""); | ||
429 | pp->offset = (size_t)pf->addr; | ||
430 | } | ||
431 | } | ||
432 | DIE_IF(ret < 0); | ||
433 | DIE_IF(ret >= MAX_PROBE_BUFFER); | ||
434 | len = ret; | ||
435 | pr_debug("Probe point found: %s\n", tmp); | ||
436 | 665 | ||
437 | /* Get the frame base attribute/ops */ | 666 | /* Get the frame base attribute/ops */ |
438 | dwarf_attr(sp_die, DW_AT_frame_base, &fb_attr); | 667 | dwarf_attr(sp_die, DW_AT_frame_base, &fb_attr); |
439 | ret = dwarf_getlocation_addr(&fb_attr, pf->addr, &pf->fb_ops, &nops, 1); | 668 | ret = dwarf_getlocation_addr(&fb_attr, pf->addr, &pf->fb_ops, &nops, 1); |
440 | if (ret <= 0 || nops == 0) | 669 | if (ret <= 0 || nops == 0) { |
441 | pf->fb_ops = NULL; | 670 | pf->fb_ops = NULL; |
671 | } else if (nops == 1 && pf->fb_ops[0].atom == DW_OP_call_frame_cfa && | ||
672 | pf->cfi != NULL) { | ||
673 | Dwarf_Frame *frame; | ||
674 | if (dwarf_cfi_addrframe(pf->cfi, pf->addr, &frame) != 0 || | ||
675 | dwarf_frame_cfa(frame, &pf->fb_ops, &nops) != 0) { | ||
676 | pr_warning("Failed to get CFA on 0x%jx\n", | ||
677 | (uintmax_t)pf->addr); | ||
678 | return -ENOENT; | ||
679 | } | ||
680 | } | ||
442 | 681 | ||
443 | /* Find each argument */ | 682 | /* Find each argument */ |
444 | /* TODO: use dwarf_cfi_addrframe */ | 683 | tev->nargs = pf->pev->nargs; |
445 | for (i = 0; i < pp->nr_args; i++) { | 684 | tev->args = zalloc(sizeof(struct kprobe_trace_arg) * tev->nargs); |
446 | pf->var = pp->args[i]; | 685 | if (tev->args == NULL) |
447 | pf->buf = &tmp[len]; | 686 | return -ENOMEM; |
448 | pf->len = MAX_PROBE_BUFFER - len; | 687 | for (i = 0; i < pf->pev->nargs; i++) { |
449 | find_variable(sp_die, pf); | 688 | pf->pvar = &pf->pev->args[i]; |
450 | len += strlen(pf->buf); | 689 | pf->tvar = &tev->args[i]; |
690 | ret = find_variable(sp_die, pf); | ||
691 | if (ret != 0) | ||
692 | return ret; | ||
451 | } | 693 | } |
452 | 694 | ||
453 | /* *pf->fb_ops will be cached in libdw. Don't free it. */ | 695 | /* *pf->fb_ops will be cached in libdw. Don't free it. */ |
454 | pf->fb_ops = NULL; | 696 | pf->fb_ops = NULL; |
455 | 697 | return 0; | |
456 | if (pp->found == MAX_PROBES) | ||
457 | die("Too many( > %d) probe point found.\n", MAX_PROBES); | ||
458 | |||
459 | pp->probes[pp->found] = strdup(tmp); | ||
460 | pp->found++; | ||
461 | } | 698 | } |
462 | 699 | ||
463 | /* Find probe point from its line number */ | 700 | /* Find probe point from its line number */ |
464 | static void find_probe_point_by_line(struct probe_finder *pf) | 701 | static int find_probe_point_by_line(struct probe_finder *pf) |
465 | { | 702 | { |
466 | Dwarf_Lines *lines; | 703 | Dwarf_Lines *lines; |
467 | Dwarf_Line *line; | 704 | Dwarf_Line *line; |
468 | size_t nlines, i; | 705 | size_t nlines, i; |
469 | Dwarf_Addr addr; | 706 | Dwarf_Addr addr; |
470 | int lineno; | 707 | int lineno; |
471 | int ret; | 708 | int ret = 0; |
472 | 709 | ||
473 | ret = dwarf_getsrclines(&pf->cu_die, &lines, &nlines); | 710 | if (dwarf_getsrclines(&pf->cu_die, &lines, &nlines) != 0) { |
474 | DIE_IF(ret != 0); | 711 | pr_warning("No source lines found in this CU.\n"); |
712 | return -ENOENT; | ||
713 | } | ||
475 | 714 | ||
476 | for (i = 0; i < nlines; i++) { | 715 | for (i = 0; i < nlines && ret == 0; i++) { |
477 | line = dwarf_onesrcline(lines, i); | 716 | line = dwarf_onesrcline(lines, i); |
478 | dwarf_lineno(line, &lineno); | 717 | if (dwarf_lineno(line, &lineno) != 0 || |
479 | if (lineno != pf->lno) | 718 | lineno != pf->lno) |
480 | continue; | 719 | continue; |
481 | 720 | ||
482 | /* TODO: Get fileno from line, but how? */ | 721 | /* TODO: Get fileno from line, but how? */ |
483 | if (strtailcmp(dwarf_linesrc(line, NULL, NULL), pf->fname) != 0) | 722 | if (strtailcmp(dwarf_linesrc(line, NULL, NULL), pf->fname) != 0) |
484 | continue; | 723 | continue; |
485 | 724 | ||
486 | ret = dwarf_lineaddr(line, &addr); | 725 | if (dwarf_lineaddr(line, &addr) != 0) { |
487 | DIE_IF(ret != 0); | 726 | pr_warning("Failed to get the address of the line.\n"); |
727 | return -ENOENT; | ||
728 | } | ||
488 | pr_debug("Probe line found: line[%d]:%d addr:0x%jx\n", | 729 | pr_debug("Probe line found: line[%d]:%d addr:0x%jx\n", |
489 | (int)i, lineno, (uintmax_t)addr); | 730 | (int)i, lineno, (uintmax_t)addr); |
490 | pf->addr = addr; | 731 | pf->addr = addr; |
491 | 732 | ||
492 | show_probe_point(NULL, pf); | 733 | ret = convert_probe_point(NULL, pf); |
493 | /* Continuing, because target line might be inlined. */ | 734 | /* Continuing, because target line might be inlined. */ |
494 | } | 735 | } |
736 | return ret; | ||
495 | } | 737 | } |
496 | 738 | ||
497 | /* Find lines which match lazy pattern */ | 739 | /* Find lines which match lazy pattern */ |
@@ -499,16 +741,27 @@ static int find_lazy_match_lines(struct list_head *head, | |||
499 | const char *fname, const char *pat) | 741 | const char *fname, const char *pat) |
500 | { | 742 | { |
501 | char *fbuf, *p1, *p2; | 743 | char *fbuf, *p1, *p2; |
502 | int fd, line, nlines = 0; | 744 | int fd, ret, line, nlines = 0; |
503 | struct stat st; | 745 | struct stat st; |
504 | 746 | ||
505 | fd = open(fname, O_RDONLY); | 747 | fd = open(fname, O_RDONLY); |
506 | if (fd < 0) | 748 | if (fd < 0) { |
507 | die("failed to open %s", fname); | 749 | pr_warning("Failed to open %s: %s\n", fname, strerror(-fd)); |
508 | DIE_IF(fstat(fd, &st) < 0); | 750 | return fd; |
509 | fbuf = malloc(st.st_size + 2); | 751 | } |
510 | DIE_IF(fbuf == NULL); | 752 | |
511 | DIE_IF(read(fd, fbuf, st.st_size) < 0); | 753 | ret = fstat(fd, &st); |
754 | if (ret < 0) { | ||
755 | pr_warning("Failed to get the size of %s: %s\n", | ||
756 | fname, strerror(errno)); | ||
757 | return ret; | ||
758 | } | ||
759 | fbuf = xmalloc(st.st_size + 2); | ||
760 | ret = read(fd, fbuf, st.st_size); | ||
761 | if (ret < 0) { | ||
762 | pr_warning("Failed to read %s: %s\n", fname, strerror(errno)); | ||
763 | return ret; | ||
764 | } | ||
512 | close(fd); | 765 | close(fd); |
513 | fbuf[st.st_size] = '\n'; /* Dummy line */ | 766 | fbuf[st.st_size] = '\n'; /* Dummy line */ |
514 | fbuf[st.st_size + 1] = '\0'; | 767 | fbuf[st.st_size + 1] = '\0'; |
@@ -528,7 +781,7 @@ static int find_lazy_match_lines(struct list_head *head, | |||
528 | } | 781 | } |
529 | 782 | ||
530 | /* Find probe points from lazy pattern */ | 783 | /* Find probe points from lazy pattern */ |
531 | static void find_probe_point_lazy(Dwarf_Die *sp_die, struct probe_finder *pf) | 784 | static int find_probe_point_lazy(Dwarf_Die *sp_die, struct probe_finder *pf) |
532 | { | 785 | { |
533 | Dwarf_Lines *lines; | 786 | Dwarf_Lines *lines; |
534 | Dwarf_Line *line; | 787 | Dwarf_Line *line; |
@@ -536,37 +789,46 @@ static void find_probe_point_lazy(Dwarf_Die *sp_die, struct probe_finder *pf) | |||
536 | Dwarf_Addr addr; | 789 | Dwarf_Addr addr; |
537 | Dwarf_Die die_mem; | 790 | Dwarf_Die die_mem; |
538 | int lineno; | 791 | int lineno; |
539 | int ret; | 792 | int ret = 0; |
540 | 793 | ||
541 | if (list_empty(&pf->lcache)) { | 794 | if (list_empty(&pf->lcache)) { |
542 | /* Matching lazy line pattern */ | 795 | /* Matching lazy line pattern */ |
543 | ret = find_lazy_match_lines(&pf->lcache, pf->fname, | 796 | ret = find_lazy_match_lines(&pf->lcache, pf->fname, |
544 | pf->pp->lazy_line); | 797 | pf->pev->point.lazy_line); |
545 | if (ret <= 0) | 798 | if (ret == 0) { |
546 | die("No matched lines found in %s.", pf->fname); | 799 | pr_debug("No matched lines found in %s.\n", pf->fname); |
800 | return 0; | ||
801 | } else if (ret < 0) | ||
802 | return ret; | ||
547 | } | 803 | } |
548 | 804 | ||
549 | ret = dwarf_getsrclines(&pf->cu_die, &lines, &nlines); | 805 | if (dwarf_getsrclines(&pf->cu_die, &lines, &nlines) != 0) { |
550 | DIE_IF(ret != 0); | 806 | pr_warning("No source lines found in this CU.\n"); |
551 | for (i = 0; i < nlines; i++) { | 807 | return -ENOENT; |
808 | } | ||
809 | |||
810 | for (i = 0; i < nlines && ret >= 0; i++) { | ||
552 | line = dwarf_onesrcline(lines, i); | 811 | line = dwarf_onesrcline(lines, i); |
553 | 812 | ||
554 | dwarf_lineno(line, &lineno); | 813 | if (dwarf_lineno(line, &lineno) != 0 || |
555 | if (!line_list__has_line(&pf->lcache, lineno)) | 814 | !line_list__has_line(&pf->lcache, lineno)) |
556 | continue; | 815 | continue; |
557 | 816 | ||
558 | /* TODO: Get fileno from line, but how? */ | 817 | /* TODO: Get fileno from line, but how? */ |
559 | if (strtailcmp(dwarf_linesrc(line, NULL, NULL), pf->fname) != 0) | 818 | if (strtailcmp(dwarf_linesrc(line, NULL, NULL), pf->fname) != 0) |
560 | continue; | 819 | continue; |
561 | 820 | ||
562 | ret = dwarf_lineaddr(line, &addr); | 821 | if (dwarf_lineaddr(line, &addr) != 0) { |
563 | DIE_IF(ret != 0); | 822 | pr_debug("Failed to get the address of line %d.\n", |
823 | lineno); | ||
824 | continue; | ||
825 | } | ||
564 | if (sp_die) { | 826 | if (sp_die) { |
565 | /* Address filtering 1: does sp_die include addr? */ | 827 | /* Address filtering 1: does sp_die include addr? */ |
566 | if (!dwarf_haspc(sp_die, addr)) | 828 | if (!dwarf_haspc(sp_die, addr)) |
567 | continue; | 829 | continue; |
568 | /* Address filtering 2: No child include addr? */ | 830 | /* Address filtering 2: No child include addr? */ |
569 | if (die_get_inlinefunc(sp_die, addr, &die_mem)) | 831 | if (die_find_inlinefunc(sp_die, addr, &die_mem)) |
570 | continue; | 832 | continue; |
571 | } | 833 | } |
572 | 834 | ||
@@ -574,27 +836,44 @@ static void find_probe_point_lazy(Dwarf_Die *sp_die, struct probe_finder *pf) | |||
574 | (int)i, lineno, (unsigned long long)addr); | 836 | (int)i, lineno, (unsigned long long)addr); |
575 | pf->addr = addr; | 837 | pf->addr = addr; |
576 | 838 | ||
577 | show_probe_point(sp_die, pf); | 839 | ret = convert_probe_point(sp_die, pf); |
578 | /* Continuing, because target line might be inlined. */ | 840 | /* Continuing, because target line might be inlined. */ |
579 | } | 841 | } |
580 | /* TODO: deallocate lines, but how? */ | 842 | /* TODO: deallocate lines, but how? */ |
843 | return ret; | ||
581 | } | 844 | } |
582 | 845 | ||
846 | /* Callback parameter with return value */ | ||
847 | struct dwarf_callback_param { | ||
848 | void *data; | ||
849 | int retval; | ||
850 | }; | ||
851 | |||
583 | static int probe_point_inline_cb(Dwarf_Die *in_die, void *data) | 852 | static int probe_point_inline_cb(Dwarf_Die *in_die, void *data) |
584 | { | 853 | { |
585 | struct probe_finder *pf = (struct probe_finder *)data; | 854 | struct dwarf_callback_param *param = data; |
586 | struct probe_point *pp = pf->pp; | 855 | struct probe_finder *pf = param->data; |
856 | struct perf_probe_point *pp = &pf->pev->point; | ||
857 | Dwarf_Addr addr; | ||
587 | 858 | ||
588 | if (pp->lazy_line) | 859 | if (pp->lazy_line) |
589 | find_probe_point_lazy(in_die, pf); | 860 | param->retval = find_probe_point_lazy(in_die, pf); |
590 | else { | 861 | else { |
591 | /* Get probe address */ | 862 | /* Get probe address */ |
592 | pf->addr = die_get_entrypc(in_die); | 863 | if (dwarf_entrypc(in_die, &addr) != 0) { |
864 | pr_warning("Failed to get entry pc of %s.\n", | ||
865 | dwarf_diename(in_die)); | ||
866 | param->retval = -ENOENT; | ||
867 | return DWARF_CB_ABORT; | ||
868 | } | ||
869 | pf->addr = addr; | ||
593 | pf->addr += pp->offset; | 870 | pf->addr += pp->offset; |
594 | pr_debug("found inline addr: 0x%jx\n", | 871 | pr_debug("found inline addr: 0x%jx\n", |
595 | (uintmax_t)pf->addr); | 872 | (uintmax_t)pf->addr); |
596 | 873 | ||
597 | show_probe_point(in_die, pf); | 874 | param->retval = convert_probe_point(in_die, pf); |
875 | if (param->retval < 0) | ||
876 | return DWARF_CB_ABORT; | ||
598 | } | 877 | } |
599 | 878 | ||
600 | return DWARF_CB_OK; | 879 | return DWARF_CB_OK; |
@@ -603,59 +882,88 @@ static int probe_point_inline_cb(Dwarf_Die *in_die, void *data) | |||
603 | /* Search function from function name */ | 882 | /* Search function from function name */ |
604 | static int probe_point_search_cb(Dwarf_Die *sp_die, void *data) | 883 | static int probe_point_search_cb(Dwarf_Die *sp_die, void *data) |
605 | { | 884 | { |
606 | struct probe_finder *pf = (struct probe_finder *)data; | 885 | struct dwarf_callback_param *param = data; |
607 | struct probe_point *pp = pf->pp; | 886 | struct probe_finder *pf = param->data; |
887 | struct perf_probe_point *pp = &pf->pev->point; | ||
608 | 888 | ||
609 | /* Check tag and diename */ | 889 | /* Check tag and diename */ |
610 | if (dwarf_tag(sp_die) != DW_TAG_subprogram || | 890 | if (dwarf_tag(sp_die) != DW_TAG_subprogram || |
611 | die_compare_name(sp_die, pp->function) != 0) | 891 | die_compare_name(sp_die, pp->function) != 0) |
612 | return 0; | 892 | return DWARF_CB_OK; |
613 | 893 | ||
614 | pf->fname = dwarf_decl_file(sp_die); | 894 | pf->fname = dwarf_decl_file(sp_die); |
615 | if (pp->line) { /* Function relative line */ | 895 | if (pp->line) { /* Function relative line */ |
616 | dwarf_decl_line(sp_die, &pf->lno); | 896 | dwarf_decl_line(sp_die, &pf->lno); |
617 | pf->lno += pp->line; | 897 | pf->lno += pp->line; |
618 | find_probe_point_by_line(pf); | 898 | param->retval = find_probe_point_by_line(pf); |
619 | } else if (!dwarf_func_inline(sp_die)) { | 899 | } else if (!dwarf_func_inline(sp_die)) { |
620 | /* Real function */ | 900 | /* Real function */ |
621 | if (pp->lazy_line) | 901 | if (pp->lazy_line) |
622 | find_probe_point_lazy(sp_die, pf); | 902 | param->retval = find_probe_point_lazy(sp_die, pf); |
623 | else { | 903 | else { |
624 | pf->addr = die_get_entrypc(sp_die); | 904 | if (dwarf_entrypc(sp_die, &pf->addr) != 0) { |
905 | pr_warning("Failed to get entry pc of %s.\n", | ||
906 | dwarf_diename(sp_die)); | ||
907 | param->retval = -ENOENT; | ||
908 | return DWARF_CB_ABORT; | ||
909 | } | ||
625 | pf->addr += pp->offset; | 910 | pf->addr += pp->offset; |
626 | /* TODO: Check the address in this function */ | 911 | /* TODO: Check the address in this function */ |
627 | show_probe_point(sp_die, pf); | 912 | param->retval = convert_probe_point(sp_die, pf); |
628 | } | 913 | } |
629 | } else | 914 | } else { |
915 | struct dwarf_callback_param _param = {.data = (void *)pf, | ||
916 | .retval = 0}; | ||
630 | /* Inlined function: search instances */ | 917 | /* Inlined function: search instances */ |
631 | dwarf_func_inline_instances(sp_die, probe_point_inline_cb, pf); | 918 | dwarf_func_inline_instances(sp_die, probe_point_inline_cb, |
919 | &_param); | ||
920 | param->retval = _param.retval; | ||
921 | } | ||
632 | 922 | ||
633 | return 1; /* Exit; no same symbol in this CU. */ | 923 | return DWARF_CB_ABORT; /* Exit; no same symbol in this CU. */ |
634 | } | 924 | } |
635 | 925 | ||
636 | static void find_probe_point_by_func(struct probe_finder *pf) | 926 | static int find_probe_point_by_func(struct probe_finder *pf) |
637 | { | 927 | { |
638 | dwarf_getfuncs(&pf->cu_die, probe_point_search_cb, pf, 0); | 928 | struct dwarf_callback_param _param = {.data = (void *)pf, |
929 | .retval = 0}; | ||
930 | dwarf_getfuncs(&pf->cu_die, probe_point_search_cb, &_param, 0); | ||
931 | return _param.retval; | ||
639 | } | 932 | } |
640 | 933 | ||
641 | /* Find a probe point */ | 934 | /* Find kprobe_trace_events specified by perf_probe_event from debuginfo */ |
642 | int find_probe_point(int fd, struct probe_point *pp) | 935 | int find_kprobe_trace_events(int fd, struct perf_probe_event *pev, |
936 | struct kprobe_trace_event **tevs, int max_tevs) | ||
643 | { | 937 | { |
644 | struct probe_finder pf = {.pp = pp}; | 938 | struct probe_finder pf = {.pev = pev, .max_tevs = max_tevs}; |
939 | struct perf_probe_point *pp = &pev->point; | ||
645 | Dwarf_Off off, noff; | 940 | Dwarf_Off off, noff; |
646 | size_t cuhl; | 941 | size_t cuhl; |
647 | Dwarf_Die *diep; | 942 | Dwarf_Die *diep; |
648 | Dwarf *dbg; | 943 | Dwarf *dbg; |
944 | int ret = 0; | ||
945 | |||
946 | pf.tevs = zalloc(sizeof(struct kprobe_trace_event) * max_tevs); | ||
947 | if (pf.tevs == NULL) | ||
948 | return -ENOMEM; | ||
949 | *tevs = pf.tevs; | ||
950 | pf.ntevs = 0; | ||
649 | 951 | ||
650 | dbg = dwarf_begin(fd, DWARF_C_READ); | 952 | dbg = dwarf_begin(fd, DWARF_C_READ); |
651 | if (!dbg) | 953 | if (!dbg) { |
652 | return -ENOENT; | 954 | pr_warning("No dwarf info found in the vmlinux - " |
955 | "please rebuild with CONFIG_DEBUG_INFO=y.\n"); | ||
956 | return -EBADF; | ||
957 | } | ||
958 | |||
959 | /* Get the call frame information from this dwarf */ | ||
960 | pf.cfi = dwarf_getcfi(dbg); | ||
653 | 961 | ||
654 | pp->found = 0; | ||
655 | off = 0; | 962 | off = 0; |
656 | line_list__init(&pf.lcache); | 963 | line_list__init(&pf.lcache); |
657 | /* Loop on CUs (Compilation Unit) */ | 964 | /* Loop on CUs (Compilation Unit) */ |
658 | while (!dwarf_nextcu(dbg, off, &noff, &cuhl, NULL, NULL, NULL)) { | 965 | while (!dwarf_nextcu(dbg, off, &noff, &cuhl, NULL, NULL, NULL) && |
966 | ret >= 0) { | ||
659 | /* Get the DIE(Debugging Information Entry) of this CU */ | 967 | /* Get the DIE(Debugging Information Entry) of this CU */ |
660 | diep = dwarf_offdie(dbg, off + cuhl, &pf.cu_die); | 968 | diep = dwarf_offdie(dbg, off + cuhl, &pf.cu_die); |
661 | if (!diep) | 969 | if (!diep) |
@@ -669,12 +977,12 @@ int find_probe_point(int fd, struct probe_point *pp) | |||
669 | 977 | ||
670 | if (!pp->file || pf.fname) { | 978 | if (!pp->file || pf.fname) { |
671 | if (pp->function) | 979 | if (pp->function) |
672 | find_probe_point_by_func(&pf); | 980 | ret = find_probe_point_by_func(&pf); |
673 | else if (pp->lazy_line) | 981 | else if (pp->lazy_line) |
674 | find_probe_point_lazy(NULL, &pf); | 982 | ret = find_probe_point_lazy(NULL, &pf); |
675 | else { | 983 | else { |
676 | pf.lno = pp->line; | 984 | pf.lno = pp->line; |
677 | find_probe_point_by_line(&pf); | 985 | ret = find_probe_point_by_line(&pf); |
678 | } | 986 | } |
679 | } | 987 | } |
680 | off = noff; | 988 | off = noff; |
@@ -682,41 +990,169 @@ int find_probe_point(int fd, struct probe_point *pp) | |||
682 | line_list__free(&pf.lcache); | 990 | line_list__free(&pf.lcache); |
683 | dwarf_end(dbg); | 991 | dwarf_end(dbg); |
684 | 992 | ||
685 | return pp->found; | 993 | return (ret < 0) ? ret : pf.ntevs; |
994 | } | ||
995 | |||
996 | /* Reverse search */ | ||
997 | int find_perf_probe_point(int fd, unsigned long addr, | ||
998 | struct perf_probe_point *ppt) | ||
999 | { | ||
1000 | Dwarf_Die cudie, spdie, indie; | ||
1001 | Dwarf *dbg; | ||
1002 | Dwarf_Line *line; | ||
1003 | Dwarf_Addr laddr, eaddr; | ||
1004 | const char *tmp; | ||
1005 | int lineno, ret = 0; | ||
1006 | bool found = false; | ||
1007 | |||
1008 | dbg = dwarf_begin(fd, DWARF_C_READ); | ||
1009 | if (!dbg) | ||
1010 | return -EBADF; | ||
1011 | |||
1012 | /* Find cu die */ | ||
1013 | if (!dwarf_addrdie(dbg, (Dwarf_Addr)addr, &cudie)) { | ||
1014 | ret = -EINVAL; | ||
1015 | goto end; | ||
1016 | } | ||
1017 | |||
1018 | /* Find a corresponding line */ | ||
1019 | line = dwarf_getsrc_die(&cudie, (Dwarf_Addr)addr); | ||
1020 | if (line) { | ||
1021 | if (dwarf_lineaddr(line, &laddr) == 0 && | ||
1022 | (Dwarf_Addr)addr == laddr && | ||
1023 | dwarf_lineno(line, &lineno) == 0) { | ||
1024 | tmp = dwarf_linesrc(line, NULL, NULL); | ||
1025 | if (tmp) { | ||
1026 | ppt->line = lineno; | ||
1027 | ppt->file = strdup(tmp); | ||
1028 | if (ppt->file == NULL) { | ||
1029 | ret = -ENOMEM; | ||
1030 | goto end; | ||
1031 | } | ||
1032 | found = true; | ||
1033 | } | ||
1034 | } | ||
1035 | } | ||
1036 | |||
1037 | /* Find a corresponding function */ | ||
1038 | if (die_find_real_subprogram(&cudie, (Dwarf_Addr)addr, &spdie)) { | ||
1039 | tmp = dwarf_diename(&spdie); | ||
1040 | if (!tmp || dwarf_entrypc(&spdie, &eaddr) != 0) | ||
1041 | goto end; | ||
1042 | |||
1043 | if (ppt->line) { | ||
1044 | if (die_find_inlinefunc(&spdie, (Dwarf_Addr)addr, | ||
1045 | &indie)) { | ||
1046 | /* addr in an inline function */ | ||
1047 | tmp = dwarf_diename(&indie); | ||
1048 | if (!tmp) | ||
1049 | goto end; | ||
1050 | ret = dwarf_decl_line(&indie, &lineno); | ||
1051 | } else { | ||
1052 | if (eaddr == addr) { /* Function entry */ | ||
1053 | lineno = ppt->line; | ||
1054 | ret = 0; | ||
1055 | } else | ||
1056 | ret = dwarf_decl_line(&spdie, &lineno); | ||
1057 | } | ||
1058 | if (ret == 0) { | ||
1059 | /* Make a relative line number */ | ||
1060 | ppt->line -= lineno; | ||
1061 | goto found; | ||
1062 | } | ||
1063 | } | ||
1064 | /* We don't have a line number, let's use offset */ | ||
1065 | ppt->offset = addr - (unsigned long)eaddr; | ||
1066 | found: | ||
1067 | ppt->function = strdup(tmp); | ||
1068 | if (ppt->function == NULL) { | ||
1069 | ret = -ENOMEM; | ||
1070 | goto end; | ||
1071 | } | ||
1072 | found = true; | ||
1073 | } | ||
1074 | |||
1075 | end: | ||
1076 | dwarf_end(dbg); | ||
1077 | if (ret >= 0) | ||
1078 | ret = found ? 1 : 0; | ||
1079 | return ret; | ||
1080 | } | ||
1081 | |||
1082 | /* Add a line and store the src path */ | ||
1083 | static int line_range_add_line(const char *src, unsigned int lineno, | ||
1084 | struct line_range *lr) | ||
1085 | { | ||
1086 | /* Copy real path */ | ||
1087 | if (!lr->path) { | ||
1088 | lr->path = strdup(src); | ||
1089 | if (lr->path == NULL) | ||
1090 | return -ENOMEM; | ||
1091 | } | ||
1092 | return line_list__add_line(&lr->line_list, lineno); | ||
1093 | } | ||
1094 | |||
1095 | /* Search function declaration lines */ | ||
1096 | static int line_range_funcdecl_cb(Dwarf_Die *sp_die, void *data) | ||
1097 | { | ||
1098 | struct dwarf_callback_param *param = data; | ||
1099 | struct line_finder *lf = param->data; | ||
1100 | const char *src; | ||
1101 | int lineno; | ||
1102 | |||
1103 | src = dwarf_decl_file(sp_die); | ||
1104 | if (src && strtailcmp(src, lf->fname) != 0) | ||
1105 | return DWARF_CB_OK; | ||
1106 | |||
1107 | if (dwarf_decl_line(sp_die, &lineno) != 0 || | ||
1108 | (lf->lno_s > lineno || lf->lno_e < lineno)) | ||
1109 | return DWARF_CB_OK; | ||
1110 | |||
1111 | param->retval = line_range_add_line(src, lineno, lf->lr); | ||
1112 | if (param->retval < 0) | ||
1113 | return DWARF_CB_ABORT; | ||
1114 | return DWARF_CB_OK; | ||
1115 | } | ||
1116 | |||
1117 | static int find_line_range_func_decl_lines(struct line_finder *lf) | ||
1118 | { | ||
1119 | struct dwarf_callback_param param = {.data = (void *)lf, .retval = 0}; | ||
1120 | dwarf_getfuncs(&lf->cu_die, line_range_funcdecl_cb, ¶m, 0); | ||
1121 | return param.retval; | ||
686 | } | 1122 | } |
687 | 1123 | ||
688 | /* Find line range from its line number */ | 1124 | /* Find line range from its line number */ |
689 | static void find_line_range_by_line(Dwarf_Die *sp_die, struct line_finder *lf) | 1125 | static int find_line_range_by_line(Dwarf_Die *sp_die, struct line_finder *lf) |
690 | { | 1126 | { |
691 | Dwarf_Lines *lines; | 1127 | Dwarf_Lines *lines; |
692 | Dwarf_Line *line; | 1128 | Dwarf_Line *line; |
693 | size_t nlines, i; | 1129 | size_t nlines, i; |
694 | Dwarf_Addr addr; | 1130 | Dwarf_Addr addr; |
695 | int lineno; | 1131 | int lineno, ret = 0; |
696 | int ret; | ||
697 | const char *src; | 1132 | const char *src; |
698 | Dwarf_Die die_mem; | 1133 | Dwarf_Die die_mem; |
699 | 1134 | ||
700 | line_list__init(&lf->lr->line_list); | 1135 | line_list__init(&lf->lr->line_list); |
701 | ret = dwarf_getsrclines(&lf->cu_die, &lines, &nlines); | 1136 | if (dwarf_getsrclines(&lf->cu_die, &lines, &nlines) != 0) { |
702 | DIE_IF(ret != 0); | 1137 | pr_warning("No source lines found in this CU.\n"); |
1138 | return -ENOENT; | ||
1139 | } | ||
703 | 1140 | ||
1141 | /* Search probable lines on lines list */ | ||
704 | for (i = 0; i < nlines; i++) { | 1142 | for (i = 0; i < nlines; i++) { |
705 | line = dwarf_onesrcline(lines, i); | 1143 | line = dwarf_onesrcline(lines, i); |
706 | ret = dwarf_lineno(line, &lineno); | 1144 | if (dwarf_lineno(line, &lineno) != 0 || |
707 | DIE_IF(ret != 0); | 1145 | (lf->lno_s > lineno || lf->lno_e < lineno)) |
708 | if (lf->lno_s > lineno || lf->lno_e < lineno) | ||
709 | continue; | 1146 | continue; |
710 | 1147 | ||
711 | if (sp_die) { | 1148 | if (sp_die) { |
712 | /* Address filtering 1: does sp_die include addr? */ | 1149 | /* Address filtering 1: does sp_die include addr? */ |
713 | ret = dwarf_lineaddr(line, &addr); | 1150 | if (dwarf_lineaddr(line, &addr) != 0 || |
714 | DIE_IF(ret != 0); | 1151 | !dwarf_haspc(sp_die, addr)) |
715 | if (!dwarf_haspc(sp_die, addr)) | ||
716 | continue; | 1152 | continue; |
717 | 1153 | ||
718 | /* Address filtering 2: No child include addr? */ | 1154 | /* Address filtering 2: No child include addr? */ |
719 | if (die_get_inlinefunc(sp_die, addr, &die_mem)) | 1155 | if (die_find_inlinefunc(sp_die, addr, &die_mem)) |
720 | continue; | 1156 | continue; |
721 | } | 1157 | } |
722 | 1158 | ||
@@ -725,30 +1161,49 @@ static void find_line_range_by_line(Dwarf_Die *sp_die, struct line_finder *lf) | |||
725 | if (strtailcmp(src, lf->fname) != 0) | 1161 | if (strtailcmp(src, lf->fname) != 0) |
726 | continue; | 1162 | continue; |
727 | 1163 | ||
728 | /* Copy real path */ | 1164 | ret = line_range_add_line(src, lineno, lf->lr); |
729 | if (!lf->lr->path) | 1165 | if (ret < 0) |
730 | lf->lr->path = strdup(src); | 1166 | return ret; |
731 | line_list__add_line(&lf->lr->line_list, (unsigned int)lineno); | ||
732 | } | 1167 | } |
1168 | |||
1169 | /* | ||
1170 | * Dwarf lines doesn't include function declarations. We have to | ||
1171 | * check functions list or given function. | ||
1172 | */ | ||
1173 | if (sp_die) { | ||
1174 | src = dwarf_decl_file(sp_die); | ||
1175 | if (src && dwarf_decl_line(sp_die, &lineno) == 0 && | ||
1176 | (lf->lno_s <= lineno && lf->lno_e >= lineno)) | ||
1177 | ret = line_range_add_line(src, lineno, lf->lr); | ||
1178 | } else | ||
1179 | ret = find_line_range_func_decl_lines(lf); | ||
1180 | |||
733 | /* Update status */ | 1181 | /* Update status */ |
734 | if (!list_empty(&lf->lr->line_list)) | 1182 | if (ret >= 0) |
735 | lf->found = 1; | 1183 | if (!list_empty(&lf->lr->line_list)) |
1184 | ret = lf->found = 1; | ||
1185 | else | ||
1186 | ret = 0; /* Lines are not found */ | ||
736 | else { | 1187 | else { |
737 | free(lf->lr->path); | 1188 | free(lf->lr->path); |
738 | lf->lr->path = NULL; | 1189 | lf->lr->path = NULL; |
739 | } | 1190 | } |
1191 | return ret; | ||
740 | } | 1192 | } |
741 | 1193 | ||
742 | static int line_range_inline_cb(Dwarf_Die *in_die, void *data) | 1194 | static int line_range_inline_cb(Dwarf_Die *in_die, void *data) |
743 | { | 1195 | { |
744 | find_line_range_by_line(in_die, (struct line_finder *)data); | 1196 | struct dwarf_callback_param *param = data; |
1197 | |||
1198 | param->retval = find_line_range_by_line(in_die, param->data); | ||
745 | return DWARF_CB_ABORT; /* No need to find other instances */ | 1199 | return DWARF_CB_ABORT; /* No need to find other instances */ |
746 | } | 1200 | } |
747 | 1201 | ||
748 | /* Search function from function name */ | 1202 | /* Search function from function name */ |
749 | static int line_range_search_cb(Dwarf_Die *sp_die, void *data) | 1203 | static int line_range_search_cb(Dwarf_Die *sp_die, void *data) |
750 | { | 1204 | { |
751 | struct line_finder *lf = (struct line_finder *)data; | 1205 | struct dwarf_callback_param *param = data; |
1206 | struct line_finder *lf = param->data; | ||
752 | struct line_range *lr = lf->lr; | 1207 | struct line_range *lr = lf->lr; |
753 | 1208 | ||
754 | if (dwarf_tag(sp_die) == DW_TAG_subprogram && | 1209 | if (dwarf_tag(sp_die) == DW_TAG_subprogram && |
@@ -757,44 +1212,55 @@ static int line_range_search_cb(Dwarf_Die *sp_die, void *data) | |||
757 | dwarf_decl_line(sp_die, &lr->offset); | 1212 | dwarf_decl_line(sp_die, &lr->offset); |
758 | pr_debug("fname: %s, lineno:%d\n", lf->fname, lr->offset); | 1213 | pr_debug("fname: %s, lineno:%d\n", lf->fname, lr->offset); |
759 | lf->lno_s = lr->offset + lr->start; | 1214 | lf->lno_s = lr->offset + lr->start; |
760 | if (!lr->end) | 1215 | if (lf->lno_s < 0) /* Overflow */ |
1216 | lf->lno_s = INT_MAX; | ||
1217 | lf->lno_e = lr->offset + lr->end; | ||
1218 | if (lf->lno_e < 0) /* Overflow */ | ||
761 | lf->lno_e = INT_MAX; | 1219 | lf->lno_e = INT_MAX; |
762 | else | 1220 | pr_debug("New line range: %d to %d\n", lf->lno_s, lf->lno_e); |
763 | lf->lno_e = lr->offset + lr->end; | ||
764 | lr->start = lf->lno_s; | 1221 | lr->start = lf->lno_s; |
765 | lr->end = lf->lno_e; | 1222 | lr->end = lf->lno_e; |
766 | if (dwarf_func_inline(sp_die)) | 1223 | if (dwarf_func_inline(sp_die)) { |
1224 | struct dwarf_callback_param _param; | ||
1225 | _param.data = (void *)lf; | ||
1226 | _param.retval = 0; | ||
767 | dwarf_func_inline_instances(sp_die, | 1227 | dwarf_func_inline_instances(sp_die, |
768 | line_range_inline_cb, lf); | 1228 | line_range_inline_cb, |
769 | else | 1229 | &_param); |
770 | find_line_range_by_line(sp_die, lf); | 1230 | param->retval = _param.retval; |
771 | return 1; | 1231 | } else |
1232 | param->retval = find_line_range_by_line(sp_die, lf); | ||
1233 | return DWARF_CB_ABORT; | ||
772 | } | 1234 | } |
773 | return 0; | 1235 | return DWARF_CB_OK; |
774 | } | 1236 | } |
775 | 1237 | ||
776 | static void find_line_range_by_func(struct line_finder *lf) | 1238 | static int find_line_range_by_func(struct line_finder *lf) |
777 | { | 1239 | { |
778 | dwarf_getfuncs(&lf->cu_die, line_range_search_cb, lf, 0); | 1240 | struct dwarf_callback_param param = {.data = (void *)lf, .retval = 0}; |
1241 | dwarf_getfuncs(&lf->cu_die, line_range_search_cb, ¶m, 0); | ||
1242 | return param.retval; | ||
779 | } | 1243 | } |
780 | 1244 | ||
781 | int find_line_range(int fd, struct line_range *lr) | 1245 | int find_line_range(int fd, struct line_range *lr) |
782 | { | 1246 | { |
783 | struct line_finder lf = {.lr = lr, .found = 0}; | 1247 | struct line_finder lf = {.lr = lr, .found = 0}; |
784 | int ret; | 1248 | int ret = 0; |
785 | Dwarf_Off off = 0, noff; | 1249 | Dwarf_Off off = 0, noff; |
786 | size_t cuhl; | 1250 | size_t cuhl; |
787 | Dwarf_Die *diep; | 1251 | Dwarf_Die *diep; |
788 | Dwarf *dbg; | 1252 | Dwarf *dbg; |
789 | 1253 | ||
790 | dbg = dwarf_begin(fd, DWARF_C_READ); | 1254 | dbg = dwarf_begin(fd, DWARF_C_READ); |
791 | if (!dbg) | 1255 | if (!dbg) { |
792 | return -ENOENT; | 1256 | pr_warning("No dwarf info found in the vmlinux - " |
1257 | "please rebuild with CONFIG_DEBUG_INFO=y.\n"); | ||
1258 | return -EBADF; | ||
1259 | } | ||
793 | 1260 | ||
794 | /* Loop on CUs (Compilation Unit) */ | 1261 | /* Loop on CUs (Compilation Unit) */ |
795 | while (!lf.found) { | 1262 | while (!lf.found && ret >= 0) { |
796 | ret = dwarf_nextcu(dbg, off, &noff, &cuhl, NULL, NULL, NULL); | 1263 | if (dwarf_nextcu(dbg, off, &noff, &cuhl, NULL, NULL, NULL) != 0) |
797 | if (ret != 0) | ||
798 | break; | 1264 | break; |
799 | 1265 | ||
800 | /* Get the DIE(Debugging Information Entry) of this CU */ | 1266 | /* Get the DIE(Debugging Information Entry) of this CU */ |
@@ -810,20 +1276,18 @@ int find_line_range(int fd, struct line_range *lr) | |||
810 | 1276 | ||
811 | if (!lr->file || lf.fname) { | 1277 | if (!lr->file || lf.fname) { |
812 | if (lr->function) | 1278 | if (lr->function) |
813 | find_line_range_by_func(&lf); | 1279 | ret = find_line_range_by_func(&lf); |
814 | else { | 1280 | else { |
815 | lf.lno_s = lr->start; | 1281 | lf.lno_s = lr->start; |
816 | if (!lr->end) | 1282 | lf.lno_e = lr->end; |
817 | lf.lno_e = INT_MAX; | 1283 | ret = find_line_range_by_line(NULL, &lf); |
818 | else | ||
819 | lf.lno_e = lr->end; | ||
820 | find_line_range_by_line(NULL, &lf); | ||
821 | } | 1284 | } |
822 | } | 1285 | } |
823 | off = noff; | 1286 | off = noff; |
824 | } | 1287 | } |
825 | pr_debug("path: %lx\n", (unsigned long)lr->path); | 1288 | pr_debug("path: %lx\n", (unsigned long)lr->path); |
826 | dwarf_end(dbg); | 1289 | dwarf_end(dbg); |
827 | return lf.found; | 1290 | |
1291 | return (ret < 0) ? ret : lf.found; | ||
828 | } | 1292 | } |
829 | 1293 | ||
diff --git a/tools/perf/util/probe-finder.h b/tools/perf/util/probe-finder.h index 21f7354397b4..66f1980e3855 100644 --- a/tools/perf/util/probe-finder.h +++ b/tools/perf/util/probe-finder.h | |||
@@ -3,6 +3,7 @@ | |||
3 | 3 | ||
4 | #include <stdbool.h> | 4 | #include <stdbool.h> |
5 | #include "util.h" | 5 | #include "util.h" |
6 | #include "probe-event.h" | ||
6 | 7 | ||
7 | #define MAX_PATH_LEN 256 | 8 | #define MAX_PATH_LEN 256 |
8 | #define MAX_PROBE_BUFFER 1024 | 9 | #define MAX_PROBE_BUFFER 1024 |
@@ -14,67 +15,39 @@ static inline int is_c_varname(const char *name) | |||
14 | return isalpha(name[0]) || name[0] == '_'; | 15 | return isalpha(name[0]) || name[0] == '_'; |
15 | } | 16 | } |
16 | 17 | ||
17 | struct probe_point { | 18 | #ifdef DWARF_SUPPORT |
18 | char *event; /* Event name */ | 19 | /* Find kprobe_trace_events specified by perf_probe_event from debuginfo */ |
19 | char *group; /* Event group */ | 20 | extern int find_kprobe_trace_events(int fd, struct perf_probe_event *pev, |
21 | struct kprobe_trace_event **tevs, | ||
22 | int max_tevs); | ||
20 | 23 | ||
21 | /* Inputs */ | 24 | /* Find a perf_probe_point from debuginfo */ |
22 | char *file; /* File name */ | 25 | extern int find_perf_probe_point(int fd, unsigned long addr, |
23 | int line; /* Line number */ | 26 | struct perf_probe_point *ppt); |
24 | char *lazy_line; /* Lazy line pattern */ | ||
25 | 27 | ||
26 | char *function; /* Function name */ | ||
27 | int offset; /* Offset bytes */ | ||
28 | |||
29 | int nr_args; /* Number of arguments */ | ||
30 | char **args; /* Arguments */ | ||
31 | |||
32 | int retprobe; /* Return probe */ | ||
33 | |||
34 | /* Output */ | ||
35 | int found; /* Number of found probe points */ | ||
36 | char *probes[MAX_PROBES]; /* Output buffers (will be allocated)*/ | ||
37 | }; | ||
38 | |||
39 | /* Line number container */ | ||
40 | struct line_node { | ||
41 | struct list_head list; | ||
42 | unsigned int line; | ||
43 | }; | ||
44 | |||
45 | /* Line range */ | ||
46 | struct line_range { | ||
47 | char *file; /* File name */ | ||
48 | char *function; /* Function name */ | ||
49 | unsigned int start; /* Start line number */ | ||
50 | unsigned int end; /* End line number */ | ||
51 | int offset; /* Start line offset */ | ||
52 | char *path; /* Real path name */ | ||
53 | struct list_head line_list; /* Visible lines */ | ||
54 | }; | ||
55 | |||
56 | #ifndef NO_DWARF_SUPPORT | ||
57 | extern int find_probe_point(int fd, struct probe_point *pp); | ||
58 | extern int find_line_range(int fd, struct line_range *lr); | 28 | extern int find_line_range(int fd, struct line_range *lr); |
59 | 29 | ||
60 | #include <dwarf.h> | 30 | #include <dwarf.h> |
61 | #include <libdw.h> | 31 | #include <libdw.h> |
62 | 32 | ||
63 | struct probe_finder { | 33 | struct probe_finder { |
64 | struct probe_point *pp; /* Target probe point */ | 34 | struct perf_probe_event *pev; /* Target probe event */ |
35 | struct kprobe_trace_event *tevs; /* Result trace events */ | ||
36 | int ntevs; /* Number of trace events */ | ||
37 | int max_tevs; /* Max number of trace events */ | ||
65 | 38 | ||
66 | /* For function searching */ | 39 | /* For function searching */ |
67 | Dwarf_Addr addr; /* Address */ | ||
68 | const char *fname; /* File name */ | ||
69 | int lno; /* Line number */ | 40 | int lno; /* Line number */ |
41 | Dwarf_Addr addr; /* Address */ | ||
42 | const char *fname; /* Real file name */ | ||
70 | Dwarf_Die cu_die; /* Current CU */ | 43 | Dwarf_Die cu_die; /* Current CU */ |
44 | struct list_head lcache; /* Line cache for lazy match */ | ||
71 | 45 | ||
72 | /* For variable searching */ | 46 | /* For variable searching */ |
47 | Dwarf_CFI *cfi; /* Call Frame Information */ | ||
73 | Dwarf_Op *fb_ops; /* Frame base attribute */ | 48 | Dwarf_Op *fb_ops; /* Frame base attribute */ |
74 | const char *var; /* Current variable name */ | 49 | struct perf_probe_arg *pvar; /* Current target variable */ |
75 | char *buf; /* Current output buffer */ | 50 | struct kprobe_trace_arg *tvar; /* Current result variable */ |
76 | int len; /* Length of output buffer */ | ||
77 | struct list_head lcache; /* Line cache for lazy match */ | ||
78 | }; | 51 | }; |
79 | 52 | ||
80 | struct line_finder { | 53 | struct line_finder { |
@@ -87,6 +60,6 @@ struct line_finder { | |||
87 | int found; | 60 | int found; |
88 | }; | 61 | }; |
89 | 62 | ||
90 | #endif /* NO_DWARF_SUPPORT */ | 63 | #endif /* DWARF_SUPPORT */ |
91 | 64 | ||
92 | #endif /*_PROBE_FINDER_H */ | 65 | #endif /*_PROBE_FINDER_H */ |
diff --git a/tools/perf/util/pstack.c b/tools/perf/util/pstack.c new file mode 100644 index 000000000000..13d36faf64eb --- /dev/null +++ b/tools/perf/util/pstack.c | |||
@@ -0,0 +1,75 @@ | |||
1 | /* | ||
2 | * Simple pointer stack | ||
3 | * | ||
4 | * (c) 2010 Arnaldo Carvalho de Melo <acme@redhat.com> | ||
5 | */ | ||
6 | |||
7 | #include "util.h" | ||
8 | #include "pstack.h" | ||
9 | #include <linux/kernel.h> | ||
10 | #include <stdlib.h> | ||
11 | |||
12 | struct pstack { | ||
13 | unsigned short top; | ||
14 | unsigned short max_nr_entries; | ||
15 | void *entries[0]; | ||
16 | }; | ||
17 | |||
18 | struct pstack *pstack__new(unsigned short max_nr_entries) | ||
19 | { | ||
20 | struct pstack *self = zalloc((sizeof(*self) + | ||
21 | max_nr_entries * sizeof(void *))); | ||
22 | if (self != NULL) | ||
23 | self->max_nr_entries = max_nr_entries; | ||
24 | return self; | ||
25 | } | ||
26 | |||
27 | void pstack__delete(struct pstack *self) | ||
28 | { | ||
29 | free(self); | ||
30 | } | ||
31 | |||
32 | bool pstack__empty(const struct pstack *self) | ||
33 | { | ||
34 | return self->top == 0; | ||
35 | } | ||
36 | |||
37 | void pstack__remove(struct pstack *self, void *key) | ||
38 | { | ||
39 | unsigned short i = self->top, last_index = self->top - 1; | ||
40 | |||
41 | while (i-- != 0) { | ||
42 | if (self->entries[i] == key) { | ||
43 | if (i < last_index) | ||
44 | memmove(self->entries + i, | ||
45 | self->entries + i + 1, | ||
46 | (last_index - i) * sizeof(void *)); | ||
47 | --self->top; | ||
48 | return; | ||
49 | } | ||
50 | } | ||
51 | pr_err("%s: %p not on the pstack!\n", __func__, key); | ||
52 | } | ||
53 | |||
54 | void pstack__push(struct pstack *self, void *key) | ||
55 | { | ||
56 | if (self->top == self->max_nr_entries) { | ||
57 | pr_err("%s: top=%d, overflow!\n", __func__, self->top); | ||
58 | return; | ||
59 | } | ||
60 | self->entries[self->top++] = key; | ||
61 | } | ||
62 | |||
63 | void *pstack__pop(struct pstack *self) | ||
64 | { | ||
65 | void *ret; | ||
66 | |||
67 | if (self->top == 0) { | ||
68 | pr_err("%s: underflow!\n", __func__); | ||
69 | return NULL; | ||
70 | } | ||
71 | |||
72 | ret = self->entries[--self->top]; | ||
73 | self->entries[self->top] = NULL; | ||
74 | return ret; | ||
75 | } | ||
diff --git a/tools/perf/util/pstack.h b/tools/perf/util/pstack.h new file mode 100644 index 000000000000..5ad07023504b --- /dev/null +++ b/tools/perf/util/pstack.h | |||
@@ -0,0 +1,12 @@ | |||
1 | #ifndef _PERF_PSTACK_ | ||
2 | #define _PERF_PSTACK_ | ||
3 | |||
4 | struct pstack; | ||
5 | struct pstack *pstack__new(unsigned short max_nr_entries); | ||
6 | void pstack__delete(struct pstack *self); | ||
7 | bool pstack__empty(const struct pstack *self); | ||
8 | void pstack__remove(struct pstack *self, void *key); | ||
9 | void pstack__push(struct pstack *self, void *key); | ||
10 | void *pstack__pop(struct pstack *self); | ||
11 | |||
12 | #endif /* _PERF_PSTACK_ */ | ||
diff --git a/tools/perf/util/scripting-engines/trace-event-perl.c b/tools/perf/util/scripting-engines/trace-event-perl.c index 5376378e0cfc..b059dc50cc2d 100644 --- a/tools/perf/util/scripting-engines/trace-event-perl.c +++ b/tools/perf/util/scripting-engines/trace-event-perl.c | |||
@@ -371,7 +371,6 @@ static int perl_start_script(const char *script, int argc, const char **argv) | |||
371 | run_start_sub(); | 371 | run_start_sub(); |
372 | 372 | ||
373 | free(command_line); | 373 | free(command_line); |
374 | fprintf(stderr, "perf trace started with Perl script %s\n\n", script); | ||
375 | return 0; | 374 | return 0; |
376 | error: | 375 | error: |
377 | perl_free(my_perl); | 376 | perl_free(my_perl); |
@@ -394,8 +393,6 @@ static int perl_stop_script(void) | |||
394 | perl_destruct(my_perl); | 393 | perl_destruct(my_perl); |
395 | perl_free(my_perl); | 394 | perl_free(my_perl); |
396 | 395 | ||
397 | fprintf(stderr, "\nperf trace Perl script stopped\n"); | ||
398 | |||
399 | return 0; | 396 | return 0; |
400 | } | 397 | } |
401 | 398 | ||
diff --git a/tools/perf/util/scripting-engines/trace-event-python.c b/tools/perf/util/scripting-engines/trace-event-python.c index 6a72f14c5986..81f39cab3aaa 100644 --- a/tools/perf/util/scripting-engines/trace-event-python.c +++ b/tools/perf/util/scripting-engines/trace-event-python.c | |||
@@ -374,8 +374,6 @@ static int python_start_script(const char *script, int argc, const char **argv) | |||
374 | } | 374 | } |
375 | 375 | ||
376 | free(command_line); | 376 | free(command_line); |
377 | fprintf(stderr, "perf trace started with Python script %s\n\n", | ||
378 | script); | ||
379 | 377 | ||
380 | return err; | 378 | return err; |
381 | error: | 379 | error: |
@@ -407,8 +405,6 @@ out: | |||
407 | Py_XDECREF(main_module); | 405 | Py_XDECREF(main_module); |
408 | Py_Finalize(); | 406 | Py_Finalize(); |
409 | 407 | ||
410 | fprintf(stderr, "\nperf trace Python script stopped\n"); | ||
411 | |||
412 | return err; | 408 | return err; |
413 | } | 409 | } |
414 | 410 | ||
diff --git a/tools/perf/util/session.c b/tools/perf/util/session.c index eed1cb889008..25bfca4f10f0 100644 --- a/tools/perf/util/session.c +++ b/tools/perf/util/session.c | |||
@@ -14,6 +14,16 @@ static int perf_session__open(struct perf_session *self, bool force) | |||
14 | { | 14 | { |
15 | struct stat input_stat; | 15 | struct stat input_stat; |
16 | 16 | ||
17 | if (!strcmp(self->filename, "-")) { | ||
18 | self->fd_pipe = true; | ||
19 | self->fd = STDIN_FILENO; | ||
20 | |||
21 | if (perf_header__read(self, self->fd) < 0) | ||
22 | pr_err("incompatible file format"); | ||
23 | |||
24 | return 0; | ||
25 | } | ||
26 | |||
17 | self->fd = open(self->filename, O_RDONLY); | 27 | self->fd = open(self->filename, O_RDONLY); |
18 | if (self->fd < 0) { | 28 | if (self->fd < 0) { |
19 | pr_err("failed to open file: %s", self->filename); | 29 | pr_err("failed to open file: %s", self->filename); |
@@ -38,7 +48,7 @@ static int perf_session__open(struct perf_session *self, bool force) | |||
38 | goto out_close; | 48 | goto out_close; |
39 | } | 49 | } |
40 | 50 | ||
41 | if (perf_header__read(&self->header, self->fd) < 0) { | 51 | if (perf_header__read(self, self->fd) < 0) { |
42 | pr_err("incompatible file format"); | 52 | pr_err("incompatible file format"); |
43 | goto out_close; | 53 | goto out_close; |
44 | } | 54 | } |
@@ -52,12 +62,21 @@ out_close: | |||
52 | return -1; | 62 | return -1; |
53 | } | 63 | } |
54 | 64 | ||
55 | static inline int perf_session__create_kernel_maps(struct perf_session *self) | 65 | void perf_session__update_sample_type(struct perf_session *self) |
66 | { | ||
67 | self->sample_type = perf_header__sample_type(&self->header); | ||
68 | } | ||
69 | |||
70 | int perf_session__create_kernel_maps(struct perf_session *self) | ||
56 | { | 71 | { |
57 | return map_groups__create_kernel_maps(&self->kmaps, self->vmlinux_maps); | 72 | int ret = machine__create_kernel_maps(&self->host_machine); |
73 | |||
74 | if (ret >= 0) | ||
75 | ret = machines__create_guest_kernel_maps(&self->machines); | ||
76 | return ret; | ||
58 | } | 77 | } |
59 | 78 | ||
60 | struct perf_session *perf_session__new(const char *filename, int mode, bool force) | 79 | struct perf_session *perf_session__new(const char *filename, int mode, bool force, bool repipe) |
61 | { | 80 | { |
62 | size_t len = filename ? strlen(filename) + 1 : 0; | 81 | size_t len = filename ? strlen(filename) + 1 : 0; |
63 | struct perf_session *self = zalloc(sizeof(*self) + len); | 82 | struct perf_session *self = zalloc(sizeof(*self) + len); |
@@ -70,13 +89,15 @@ struct perf_session *perf_session__new(const char *filename, int mode, bool forc | |||
70 | 89 | ||
71 | memcpy(self->filename, filename, len); | 90 | memcpy(self->filename, filename, len); |
72 | self->threads = RB_ROOT; | 91 | self->threads = RB_ROOT; |
73 | self->stats_by_id = RB_ROOT; | 92 | self->hists_tree = RB_ROOT; |
74 | self->last_match = NULL; | 93 | self->last_match = NULL; |
75 | self->mmap_window = 32; | 94 | self->mmap_window = 32; |
76 | self->cwd = NULL; | 95 | self->cwd = NULL; |
77 | self->cwdlen = 0; | 96 | self->cwdlen = 0; |
78 | self->unknown_events = 0; | 97 | self->machines = RB_ROOT; |
79 | map_groups__init(&self->kmaps); | 98 | self->repipe = repipe; |
99 | INIT_LIST_HEAD(&self->ordered_samples.samples_head); | ||
100 | machine__init(&self->host_machine, "", HOST_KERNEL_ID); | ||
80 | 101 | ||
81 | if (mode == O_RDONLY) { | 102 | if (mode == O_RDONLY) { |
82 | if (perf_session__open(self, force) < 0) | 103 | if (perf_session__open(self, force) < 0) |
@@ -90,7 +111,7 @@ struct perf_session *perf_session__new(const char *filename, int mode, bool forc | |||
90 | goto out_delete; | 111 | goto out_delete; |
91 | } | 112 | } |
92 | 113 | ||
93 | self->sample_type = perf_header__sample_type(&self->header); | 114 | perf_session__update_sample_type(self); |
94 | out: | 115 | out: |
95 | return self; | 116 | return self; |
96 | out_free: | 117 | out_free: |
@@ -117,22 +138,17 @@ static bool symbol__match_parent_regex(struct symbol *sym) | |||
117 | return 0; | 138 | return 0; |
118 | } | 139 | } |
119 | 140 | ||
120 | struct symbol **perf_session__resolve_callchain(struct perf_session *self, | 141 | struct map_symbol *perf_session__resolve_callchain(struct perf_session *self, |
121 | struct thread *thread, | 142 | struct thread *thread, |
122 | struct ip_callchain *chain, | 143 | struct ip_callchain *chain, |
123 | struct symbol **parent) | 144 | struct symbol **parent) |
124 | { | 145 | { |
125 | u8 cpumode = PERF_RECORD_MISC_USER; | 146 | u8 cpumode = PERF_RECORD_MISC_USER; |
126 | struct symbol **syms = NULL; | ||
127 | unsigned int i; | 147 | unsigned int i; |
148 | struct map_symbol *syms = calloc(chain->nr, sizeof(*syms)); | ||
128 | 149 | ||
129 | if (symbol_conf.use_callchain) { | 150 | if (!syms) |
130 | syms = calloc(chain->nr, sizeof(*syms)); | 151 | return NULL; |
131 | if (!syms) { | ||
132 | fprintf(stderr, "Can't allocate memory for symbols\n"); | ||
133 | exit(-1); | ||
134 | } | ||
135 | } | ||
136 | 152 | ||
137 | for (i = 0; i < chain->nr; i++) { | 153 | for (i = 0; i < chain->nr; i++) { |
138 | u64 ip = chain->ips[i]; | 154 | u64 ip = chain->ips[i]; |
@@ -152,15 +168,17 @@ struct symbol **perf_session__resolve_callchain(struct perf_session *self, | |||
152 | continue; | 168 | continue; |
153 | } | 169 | } |
154 | 170 | ||
171 | al.filtered = false; | ||
155 | thread__find_addr_location(thread, self, cpumode, | 172 | thread__find_addr_location(thread, self, cpumode, |
156 | MAP__FUNCTION, ip, &al, NULL); | 173 | MAP__FUNCTION, thread->pid, ip, &al, NULL); |
157 | if (al.sym != NULL) { | 174 | if (al.sym != NULL) { |
158 | if (sort__has_parent && !*parent && | 175 | if (sort__has_parent && !*parent && |
159 | symbol__match_parent_regex(al.sym)) | 176 | symbol__match_parent_regex(al.sym)) |
160 | *parent = al.sym; | 177 | *parent = al.sym; |
161 | if (!symbol_conf.use_callchain) | 178 | if (!symbol_conf.use_callchain) |
162 | break; | 179 | break; |
163 | syms[i] = al.sym; | 180 | syms[i].map = al.map; |
181 | syms[i].sym = al.sym; | ||
164 | } | 182 | } |
165 | } | 183 | } |
166 | 184 | ||
@@ -174,6 +192,18 @@ static int process_event_stub(event_t *event __used, | |||
174 | return 0; | 192 | return 0; |
175 | } | 193 | } |
176 | 194 | ||
195 | static int process_finished_round_stub(event_t *event __used, | ||
196 | struct perf_session *session __used, | ||
197 | struct perf_event_ops *ops __used) | ||
198 | { | ||
199 | dump_printf(": unhandled!\n"); | ||
200 | return 0; | ||
201 | } | ||
202 | |||
203 | static int process_finished_round(event_t *event, | ||
204 | struct perf_session *session, | ||
205 | struct perf_event_ops *ops); | ||
206 | |||
177 | static void perf_event_ops__fill_defaults(struct perf_event_ops *handler) | 207 | static void perf_event_ops__fill_defaults(struct perf_event_ops *handler) |
178 | { | 208 | { |
179 | if (handler->sample == NULL) | 209 | if (handler->sample == NULL) |
@@ -194,29 +224,20 @@ static void perf_event_ops__fill_defaults(struct perf_event_ops *handler) | |||
194 | handler->throttle = process_event_stub; | 224 | handler->throttle = process_event_stub; |
195 | if (handler->unthrottle == NULL) | 225 | if (handler->unthrottle == NULL) |
196 | handler->unthrottle = process_event_stub; | 226 | handler->unthrottle = process_event_stub; |
197 | } | 227 | if (handler->attr == NULL) |
198 | 228 | handler->attr = process_event_stub; | |
199 | static const char *event__name[] = { | 229 | if (handler->event_type == NULL) |
200 | [0] = "TOTAL", | 230 | handler->event_type = process_event_stub; |
201 | [PERF_RECORD_MMAP] = "MMAP", | 231 | if (handler->tracing_data == NULL) |
202 | [PERF_RECORD_LOST] = "LOST", | 232 | handler->tracing_data = process_event_stub; |
203 | [PERF_RECORD_COMM] = "COMM", | 233 | if (handler->build_id == NULL) |
204 | [PERF_RECORD_EXIT] = "EXIT", | 234 | handler->build_id = process_event_stub; |
205 | [PERF_RECORD_THROTTLE] = "THROTTLE", | 235 | if (handler->finished_round == NULL) { |
206 | [PERF_RECORD_UNTHROTTLE] = "UNTHROTTLE", | 236 | if (handler->ordered_samples) |
207 | [PERF_RECORD_FORK] = "FORK", | 237 | handler->finished_round = process_finished_round; |
208 | [PERF_RECORD_READ] = "READ", | 238 | else |
209 | [PERF_RECORD_SAMPLE] = "SAMPLE", | 239 | handler->finished_round = process_finished_round_stub; |
210 | }; | 240 | } |
211 | |||
212 | unsigned long event__total[PERF_RECORD_MAX]; | ||
213 | |||
214 | void event__print_totals(void) | ||
215 | { | ||
216 | int i; | ||
217 | for (i = 0; i < PERF_RECORD_MAX; ++i) | ||
218 | pr_info("%10s events: %10ld\n", | ||
219 | event__name[i], event__total[i]); | ||
220 | } | 241 | } |
221 | 242 | ||
222 | void mem_bswap_64(void *src, int byte_size) | 243 | void mem_bswap_64(void *src, int byte_size) |
@@ -270,6 +291,37 @@ static void event__read_swap(event_t *self) | |||
270 | self->read.id = bswap_64(self->read.id); | 291 | self->read.id = bswap_64(self->read.id); |
271 | } | 292 | } |
272 | 293 | ||
294 | static void event__attr_swap(event_t *self) | ||
295 | { | ||
296 | size_t size; | ||
297 | |||
298 | self->attr.attr.type = bswap_32(self->attr.attr.type); | ||
299 | self->attr.attr.size = bswap_32(self->attr.attr.size); | ||
300 | self->attr.attr.config = bswap_64(self->attr.attr.config); | ||
301 | self->attr.attr.sample_period = bswap_64(self->attr.attr.sample_period); | ||
302 | self->attr.attr.sample_type = bswap_64(self->attr.attr.sample_type); | ||
303 | self->attr.attr.read_format = bswap_64(self->attr.attr.read_format); | ||
304 | self->attr.attr.wakeup_events = bswap_32(self->attr.attr.wakeup_events); | ||
305 | self->attr.attr.bp_type = bswap_32(self->attr.attr.bp_type); | ||
306 | self->attr.attr.bp_addr = bswap_64(self->attr.attr.bp_addr); | ||
307 | self->attr.attr.bp_len = bswap_64(self->attr.attr.bp_len); | ||
308 | |||
309 | size = self->header.size; | ||
310 | size -= (void *)&self->attr.id - (void *)self; | ||
311 | mem_bswap_64(self->attr.id, size); | ||
312 | } | ||
313 | |||
314 | static void event__event_type_swap(event_t *self) | ||
315 | { | ||
316 | self->event_type.event_type.event_id = | ||
317 | bswap_64(self->event_type.event_type.event_id); | ||
318 | } | ||
319 | |||
320 | static void event__tracing_data_swap(event_t *self) | ||
321 | { | ||
322 | self->tracing_data.size = bswap_32(self->tracing_data.size); | ||
323 | } | ||
324 | |||
273 | typedef void (*event__swap_op)(event_t *self); | 325 | typedef void (*event__swap_op)(event_t *self); |
274 | 326 | ||
275 | static event__swap_op event__swap_ops[] = { | 327 | static event__swap_op event__swap_ops[] = { |
@@ -280,9 +332,212 @@ static event__swap_op event__swap_ops[] = { | |||
280 | [PERF_RECORD_LOST] = event__all64_swap, | 332 | [PERF_RECORD_LOST] = event__all64_swap, |
281 | [PERF_RECORD_READ] = event__read_swap, | 333 | [PERF_RECORD_READ] = event__read_swap, |
282 | [PERF_RECORD_SAMPLE] = event__all64_swap, | 334 | [PERF_RECORD_SAMPLE] = event__all64_swap, |
283 | [PERF_RECORD_MAX] = NULL, | 335 | [PERF_RECORD_HEADER_ATTR] = event__attr_swap, |
336 | [PERF_RECORD_HEADER_EVENT_TYPE] = event__event_type_swap, | ||
337 | [PERF_RECORD_HEADER_TRACING_DATA] = event__tracing_data_swap, | ||
338 | [PERF_RECORD_HEADER_BUILD_ID] = NULL, | ||
339 | [PERF_RECORD_HEADER_MAX] = NULL, | ||
284 | }; | 340 | }; |
285 | 341 | ||
342 | struct sample_queue { | ||
343 | u64 timestamp; | ||
344 | struct sample_event *event; | ||
345 | struct list_head list; | ||
346 | }; | ||
347 | |||
348 | static void flush_sample_queue(struct perf_session *s, | ||
349 | struct perf_event_ops *ops) | ||
350 | { | ||
351 | struct list_head *head = &s->ordered_samples.samples_head; | ||
352 | u64 limit = s->ordered_samples.next_flush; | ||
353 | struct sample_queue *tmp, *iter; | ||
354 | |||
355 | if (!ops->ordered_samples || !limit) | ||
356 | return; | ||
357 | |||
358 | list_for_each_entry_safe(iter, tmp, head, list) { | ||
359 | if (iter->timestamp > limit) | ||
360 | return; | ||
361 | |||
362 | if (iter == s->ordered_samples.last_inserted) | ||
363 | s->ordered_samples.last_inserted = NULL; | ||
364 | |||
365 | ops->sample((event_t *)iter->event, s); | ||
366 | |||
367 | s->ordered_samples.last_flush = iter->timestamp; | ||
368 | list_del(&iter->list); | ||
369 | free(iter->event); | ||
370 | free(iter); | ||
371 | } | ||
372 | } | ||
373 | |||
374 | /* | ||
375 | * When perf record finishes a pass on every buffers, it records this pseudo | ||
376 | * event. | ||
377 | * We record the max timestamp t found in the pass n. | ||
378 | * Assuming these timestamps are monotonic across cpus, we know that if | ||
379 | * a buffer still has events with timestamps below t, they will be all | ||
380 | * available and then read in the pass n + 1. | ||
381 | * Hence when we start to read the pass n + 2, we can safely flush every | ||
382 | * events with timestamps below t. | ||
383 | * | ||
384 | * ============ PASS n ================= | ||
385 | * CPU 0 | CPU 1 | ||
386 | * | | ||
387 | * cnt1 timestamps | cnt2 timestamps | ||
388 | * 1 | 2 | ||
389 | * 2 | 3 | ||
390 | * - | 4 <--- max recorded | ||
391 | * | ||
392 | * ============ PASS n + 1 ============== | ||
393 | * CPU 0 | CPU 1 | ||
394 | * | | ||
395 | * cnt1 timestamps | cnt2 timestamps | ||
396 | * 3 | 5 | ||
397 | * 4 | 6 | ||
398 | * 5 | 7 <---- max recorded | ||
399 | * | ||
400 | * Flush every events below timestamp 4 | ||
401 | * | ||
402 | * ============ PASS n + 2 ============== | ||
403 | * CPU 0 | CPU 1 | ||
404 | * | | ||
405 | * cnt1 timestamps | cnt2 timestamps | ||
406 | * 6 | 8 | ||
407 | * 7 | 9 | ||
408 | * - | 10 | ||
409 | * | ||
410 | * Flush every events below timestamp 7 | ||
411 | * etc... | ||
412 | */ | ||
413 | static int process_finished_round(event_t *event __used, | ||
414 | struct perf_session *session, | ||
415 | struct perf_event_ops *ops) | ||
416 | { | ||
417 | flush_sample_queue(session, ops); | ||
418 | session->ordered_samples.next_flush = session->ordered_samples.max_timestamp; | ||
419 | |||
420 | return 0; | ||
421 | } | ||
422 | |||
423 | static void __queue_sample_end(struct sample_queue *new, struct list_head *head) | ||
424 | { | ||
425 | struct sample_queue *iter; | ||
426 | |||
427 | list_for_each_entry_reverse(iter, head, list) { | ||
428 | if (iter->timestamp < new->timestamp) { | ||
429 | list_add(&new->list, &iter->list); | ||
430 | return; | ||
431 | } | ||
432 | } | ||
433 | |||
434 | list_add(&new->list, head); | ||
435 | } | ||
436 | |||
437 | static void __queue_sample_before(struct sample_queue *new, | ||
438 | struct sample_queue *iter, | ||
439 | struct list_head *head) | ||
440 | { | ||
441 | list_for_each_entry_continue_reverse(iter, head, list) { | ||
442 | if (iter->timestamp < new->timestamp) { | ||
443 | list_add(&new->list, &iter->list); | ||
444 | return; | ||
445 | } | ||
446 | } | ||
447 | |||
448 | list_add(&new->list, head); | ||
449 | } | ||
450 | |||
451 | static void __queue_sample_after(struct sample_queue *new, | ||
452 | struct sample_queue *iter, | ||
453 | struct list_head *head) | ||
454 | { | ||
455 | list_for_each_entry_continue(iter, head, list) { | ||
456 | if (iter->timestamp > new->timestamp) { | ||
457 | list_add_tail(&new->list, &iter->list); | ||
458 | return; | ||
459 | } | ||
460 | } | ||
461 | list_add_tail(&new->list, head); | ||
462 | } | ||
463 | |||
464 | /* The queue is ordered by time */ | ||
465 | static void __queue_sample_event(struct sample_queue *new, | ||
466 | struct perf_session *s) | ||
467 | { | ||
468 | struct sample_queue *last_inserted = s->ordered_samples.last_inserted; | ||
469 | struct list_head *head = &s->ordered_samples.samples_head; | ||
470 | |||
471 | |||
472 | if (!last_inserted) { | ||
473 | __queue_sample_end(new, head); | ||
474 | return; | ||
475 | } | ||
476 | |||
477 | /* | ||
478 | * Most of the time the current event has a timestamp | ||
479 | * very close to the last event inserted, unless we just switched | ||
480 | * to another event buffer. Having a sorting based on a list and | ||
481 | * on the last inserted event that is close to the current one is | ||
482 | * probably more efficient than an rbtree based sorting. | ||
483 | */ | ||
484 | if (last_inserted->timestamp >= new->timestamp) | ||
485 | __queue_sample_before(new, last_inserted, head); | ||
486 | else | ||
487 | __queue_sample_after(new, last_inserted, head); | ||
488 | } | ||
489 | |||
490 | static int queue_sample_event(event_t *event, struct sample_data *data, | ||
491 | struct perf_session *s) | ||
492 | { | ||
493 | u64 timestamp = data->time; | ||
494 | struct sample_queue *new; | ||
495 | |||
496 | |||
497 | if (timestamp < s->ordered_samples.last_flush) { | ||
498 | printf("Warning: Timestamp below last timeslice flush\n"); | ||
499 | return -EINVAL; | ||
500 | } | ||
501 | |||
502 | new = malloc(sizeof(*new)); | ||
503 | if (!new) | ||
504 | return -ENOMEM; | ||
505 | |||
506 | new->timestamp = timestamp; | ||
507 | |||
508 | new->event = malloc(event->header.size); | ||
509 | if (!new->event) { | ||
510 | free(new); | ||
511 | return -ENOMEM; | ||
512 | } | ||
513 | |||
514 | memcpy(new->event, event, event->header.size); | ||
515 | |||
516 | __queue_sample_event(new, s); | ||
517 | s->ordered_samples.last_inserted = new; | ||
518 | |||
519 | if (new->timestamp > s->ordered_samples.max_timestamp) | ||
520 | s->ordered_samples.max_timestamp = new->timestamp; | ||
521 | |||
522 | return 0; | ||
523 | } | ||
524 | |||
525 | static int perf_session__process_sample(event_t *event, struct perf_session *s, | ||
526 | struct perf_event_ops *ops) | ||
527 | { | ||
528 | struct sample_data data; | ||
529 | |||
530 | if (!ops->ordered_samples) | ||
531 | return ops->sample(event, s); | ||
532 | |||
533 | bzero(&data, sizeof(struct sample_data)); | ||
534 | event__parse_sample(event, s->sample_type, &data); | ||
535 | |||
536 | queue_sample_event(event, &data, s); | ||
537 | |||
538 | return 0; | ||
539 | } | ||
540 | |||
286 | static int perf_session__process_event(struct perf_session *self, | 541 | static int perf_session__process_event(struct perf_session *self, |
287 | event_t *event, | 542 | event_t *event, |
288 | struct perf_event_ops *ops, | 543 | struct perf_event_ops *ops, |
@@ -290,12 +545,11 @@ static int perf_session__process_event(struct perf_session *self, | |||
290 | { | 545 | { |
291 | trace_event(event); | 546 | trace_event(event); |
292 | 547 | ||
293 | if (event->header.type < PERF_RECORD_MAX) { | 548 | if (event->header.type < PERF_RECORD_HEADER_MAX) { |
294 | dump_printf("%#Lx [%#x]: PERF_RECORD_%s", | 549 | dump_printf("%#Lx [%#x]: PERF_RECORD_%s", |
295 | offset + head, event->header.size, | 550 | offset + head, event->header.size, |
296 | event__name[event->header.type]); | 551 | event__name[event->header.type]); |
297 | ++event__total[0]; | 552 | hists__inc_nr_events(&self->hists, event->header.type); |
298 | ++event__total[event->header.type]; | ||
299 | } | 553 | } |
300 | 554 | ||
301 | if (self->header.needs_swap && event__swap_ops[event->header.type]) | 555 | if (self->header.needs_swap && event__swap_ops[event->header.type]) |
@@ -303,7 +557,7 @@ static int perf_session__process_event(struct perf_session *self, | |||
303 | 557 | ||
304 | switch (event->header.type) { | 558 | switch (event->header.type) { |
305 | case PERF_RECORD_SAMPLE: | 559 | case PERF_RECORD_SAMPLE: |
306 | return ops->sample(event, self); | 560 | return perf_session__process_sample(event, self, ops); |
307 | case PERF_RECORD_MMAP: | 561 | case PERF_RECORD_MMAP: |
308 | return ops->mmap(event, self); | 562 | return ops->mmap(event, self); |
309 | case PERF_RECORD_COMM: | 563 | case PERF_RECORD_COMM: |
@@ -320,8 +574,20 @@ static int perf_session__process_event(struct perf_session *self, | |||
320 | return ops->throttle(event, self); | 574 | return ops->throttle(event, self); |
321 | case PERF_RECORD_UNTHROTTLE: | 575 | case PERF_RECORD_UNTHROTTLE: |
322 | return ops->unthrottle(event, self); | 576 | return ops->unthrottle(event, self); |
577 | case PERF_RECORD_HEADER_ATTR: | ||
578 | return ops->attr(event, self); | ||
579 | case PERF_RECORD_HEADER_EVENT_TYPE: | ||
580 | return ops->event_type(event, self); | ||
581 | case PERF_RECORD_HEADER_TRACING_DATA: | ||
582 | /* setup for reading amidst mmap */ | ||
583 | lseek(self->fd, offset + head, SEEK_SET); | ||
584 | return ops->tracing_data(event, self); | ||
585 | case PERF_RECORD_HEADER_BUILD_ID: | ||
586 | return ops->build_id(event, self); | ||
587 | case PERF_RECORD_FINISHED_ROUND: | ||
588 | return ops->finished_round(event, self, ops); | ||
323 | default: | 589 | default: |
324 | self->unknown_events++; | 590 | ++self->hists.stats.nr_unknown_events; |
325 | return -1; | 591 | return -1; |
326 | } | 592 | } |
327 | } | 593 | } |
@@ -333,56 +599,114 @@ void perf_event_header__bswap(struct perf_event_header *self) | |||
333 | self->size = bswap_16(self->size); | 599 | self->size = bswap_16(self->size); |
334 | } | 600 | } |
335 | 601 | ||
336 | int perf_header__read_build_ids(struct perf_header *self, | 602 | static struct thread *perf_session__register_idle_thread(struct perf_session *self) |
337 | int input, u64 offset, u64 size) | ||
338 | { | 603 | { |
339 | struct build_id_event bev; | 604 | struct thread *thread = perf_session__findnew(self, 0); |
340 | char filename[PATH_MAX]; | ||
341 | u64 limit = offset + size; | ||
342 | int err = -1; | ||
343 | |||
344 | while (offset < limit) { | ||
345 | struct dso *dso; | ||
346 | ssize_t len; | ||
347 | struct list_head *head = &dsos__user; | ||
348 | 605 | ||
349 | if (read(input, &bev, sizeof(bev)) != sizeof(bev)) | 606 | if (thread == NULL || thread__set_comm(thread, "swapper")) { |
350 | goto out; | 607 | pr_err("problem inserting idle task.\n"); |
608 | thread = NULL; | ||
609 | } | ||
351 | 610 | ||
352 | if (self->needs_swap) | 611 | return thread; |
353 | perf_event_header__bswap(&bev.header); | 612 | } |
354 | 613 | ||
355 | len = bev.header.size - sizeof(bev); | 614 | int do_read(int fd, void *buf, size_t size) |
356 | if (read(input, filename, len) != len) | 615 | { |
357 | goto out; | 616 | void *buf_start = buf; |
358 | 617 | ||
359 | if (bev.header.misc & PERF_RECORD_MISC_KERNEL) | 618 | while (size) { |
360 | head = &dsos__kernel; | 619 | int ret = read(fd, buf, size); |
361 | 620 | ||
362 | dso = __dsos__findnew(head, filename); | 621 | if (ret <= 0) |
363 | if (dso != NULL) { | 622 | return ret; |
364 | dso__set_build_id(dso, &bev.build_id); | ||
365 | if (head == &dsos__kernel && filename[0] == '[') | ||
366 | dso->kernel = 1; | ||
367 | } | ||
368 | 623 | ||
369 | offset += bev.header.size; | 624 | size -= ret; |
625 | buf += ret; | ||
370 | } | 626 | } |
371 | err = 0; | 627 | |
372 | out: | 628 | return buf - buf_start; |
373 | return err; | ||
374 | } | 629 | } |
375 | 630 | ||
376 | static struct thread *perf_session__register_idle_thread(struct perf_session *self) | 631 | #define session_done() (*(volatile int *)(&session_done)) |
632 | volatile int session_done; | ||
633 | |||
634 | static int __perf_session__process_pipe_events(struct perf_session *self, | ||
635 | struct perf_event_ops *ops) | ||
377 | { | 636 | { |
378 | struct thread *thread = perf_session__findnew(self, 0); | 637 | event_t event; |
638 | uint32_t size; | ||
639 | int skip = 0; | ||
640 | u64 head; | ||
641 | int err; | ||
642 | void *p; | ||
379 | 643 | ||
380 | if (thread == NULL || thread__set_comm(thread, "swapper")) { | 644 | perf_event_ops__fill_defaults(ops); |
381 | pr_err("problem inserting idle task.\n"); | 645 | |
382 | thread = NULL; | 646 | head = 0; |
647 | more: | ||
648 | err = do_read(self->fd, &event, sizeof(struct perf_event_header)); | ||
649 | if (err <= 0) { | ||
650 | if (err == 0) | ||
651 | goto done; | ||
652 | |||
653 | pr_err("failed to read event header\n"); | ||
654 | goto out_err; | ||
383 | } | 655 | } |
384 | 656 | ||
385 | return thread; | 657 | if (self->header.needs_swap) |
658 | perf_event_header__bswap(&event.header); | ||
659 | |||
660 | size = event.header.size; | ||
661 | if (size == 0) | ||
662 | size = 8; | ||
663 | |||
664 | p = &event; | ||
665 | p += sizeof(struct perf_event_header); | ||
666 | |||
667 | if (size - sizeof(struct perf_event_header)) { | ||
668 | err = do_read(self->fd, p, | ||
669 | size - sizeof(struct perf_event_header)); | ||
670 | if (err <= 0) { | ||
671 | if (err == 0) { | ||
672 | pr_err("unexpected end of event stream\n"); | ||
673 | goto done; | ||
674 | } | ||
675 | |||
676 | pr_err("failed to read event data\n"); | ||
677 | goto out_err; | ||
678 | } | ||
679 | } | ||
680 | |||
681 | if (size == 0 || | ||
682 | (skip = perf_session__process_event(self, &event, ops, | ||
683 | 0, head)) < 0) { | ||
684 | dump_printf("%#Lx [%#x]: skipping unknown header type: %d\n", | ||
685 | head, event.header.size, event.header.type); | ||
686 | /* | ||
687 | * assume we lost track of the stream, check alignment, and | ||
688 | * increment a single u64 in the hope to catch on again 'soon'. | ||
689 | */ | ||
690 | if (unlikely(head & 7)) | ||
691 | head &= ~7ULL; | ||
692 | |||
693 | size = 8; | ||
694 | } | ||
695 | |||
696 | head += size; | ||
697 | |||
698 | dump_printf("\n%#Lx [%#x]: event: %d\n", | ||
699 | head, event.header.size, event.header.type); | ||
700 | |||
701 | if (skip > 0) | ||
702 | head += skip; | ||
703 | |||
704 | if (!session_done()) | ||
705 | goto more; | ||
706 | done: | ||
707 | err = 0; | ||
708 | out_err: | ||
709 | return err; | ||
386 | } | 710 | } |
387 | 711 | ||
388 | int __perf_session__process_events(struct perf_session *self, | 712 | int __perf_session__process_events(struct perf_session *self, |
@@ -396,6 +720,10 @@ int __perf_session__process_events(struct perf_session *self, | |||
396 | event_t *event; | 720 | event_t *event; |
397 | uint32_t size; | 721 | uint32_t size; |
398 | char *buf; | 722 | char *buf; |
723 | struct ui_progress *progress = ui_progress__new("Processing events...", | ||
724 | self->size); | ||
725 | if (progress == NULL) | ||
726 | return -1; | ||
399 | 727 | ||
400 | perf_event_ops__fill_defaults(ops); | 728 | perf_event_ops__fill_defaults(ops); |
401 | 729 | ||
@@ -424,6 +752,7 @@ remap: | |||
424 | 752 | ||
425 | more: | 753 | more: |
426 | event = (event_t *)(buf + head); | 754 | event = (event_t *)(buf + head); |
755 | ui_progress__update(progress, offset); | ||
427 | 756 | ||
428 | if (self->header.needs_swap) | 757 | if (self->header.needs_swap) |
429 | perf_event_header__bswap(&event->header); | 758 | perf_event_header__bswap(&event->header); |
@@ -473,7 +802,11 @@ more: | |||
473 | goto more; | 802 | goto more; |
474 | done: | 803 | done: |
475 | err = 0; | 804 | err = 0; |
805 | /* do the final flush for ordered samples */ | ||
806 | self->ordered_samples.next_flush = ULLONG_MAX; | ||
807 | flush_sample_queue(self, ops); | ||
476 | out_err: | 808 | out_err: |
809 | ui_progress__delete(progress); | ||
477 | return err; | 810 | return err; |
478 | } | 811 | } |
479 | 812 | ||
@@ -502,9 +835,13 @@ out_getcwd_err: | |||
502 | self->cwdlen = strlen(self->cwd); | 835 | self->cwdlen = strlen(self->cwd); |
503 | } | 836 | } |
504 | 837 | ||
505 | err = __perf_session__process_events(self, self->header.data_offset, | 838 | if (!self->fd_pipe) |
506 | self->header.data_size, | 839 | err = __perf_session__process_events(self, |
507 | self->size, ops); | 840 | self->header.data_offset, |
841 | self->header.data_size, | ||
842 | self->size, ops); | ||
843 | else | ||
844 | err = __perf_session__process_pipe_events(self, ops); | ||
508 | out_err: | 845 | out_err: |
509 | return err; | 846 | return err; |
510 | } | 847 | } |
@@ -519,56 +856,41 @@ bool perf_session__has_traces(struct perf_session *self, const char *msg) | |||
519 | return true; | 856 | return true; |
520 | } | 857 | } |
521 | 858 | ||
522 | int perf_session__set_kallsyms_ref_reloc_sym(struct perf_session *self, | 859 | int perf_session__set_kallsyms_ref_reloc_sym(struct map **maps, |
523 | const char *symbol_name, | 860 | const char *symbol_name, |
524 | u64 addr) | 861 | u64 addr) |
525 | { | 862 | { |
526 | char *bracket; | 863 | char *bracket; |
527 | enum map_type i; | 864 | enum map_type i; |
865 | struct ref_reloc_sym *ref; | ||
528 | 866 | ||
529 | self->ref_reloc_sym.name = strdup(symbol_name); | 867 | ref = zalloc(sizeof(struct ref_reloc_sym)); |
530 | if (self->ref_reloc_sym.name == NULL) | 868 | if (ref == NULL) |
531 | return -ENOMEM; | 869 | return -ENOMEM; |
532 | 870 | ||
533 | bracket = strchr(self->ref_reloc_sym.name, ']'); | 871 | ref->name = strdup(symbol_name); |
872 | if (ref->name == NULL) { | ||
873 | free(ref); | ||
874 | return -ENOMEM; | ||
875 | } | ||
876 | |||
877 | bracket = strchr(ref->name, ']'); | ||
534 | if (bracket) | 878 | if (bracket) |
535 | *bracket = '\0'; | 879 | *bracket = '\0'; |
536 | 880 | ||
537 | self->ref_reloc_sym.addr = addr; | 881 | ref->addr = addr; |
538 | 882 | ||
539 | for (i = 0; i < MAP__NR_TYPES; ++i) { | 883 | for (i = 0; i < MAP__NR_TYPES; ++i) { |
540 | struct kmap *kmap = map__kmap(self->vmlinux_maps[i]); | 884 | struct kmap *kmap = map__kmap(maps[i]); |
541 | kmap->ref_reloc_sym = &self->ref_reloc_sym; | 885 | kmap->ref_reloc_sym = ref; |
542 | } | 886 | } |
543 | 887 | ||
544 | return 0; | 888 | return 0; |
545 | } | 889 | } |
546 | 890 | ||
547 | static u64 map__reloc_map_ip(struct map *map, u64 ip) | 891 | size_t perf_session__fprintf_dsos(struct perf_session *self, FILE *fp) |
548 | { | ||
549 | return ip + (s64)map->pgoff; | ||
550 | } | ||
551 | |||
552 | static u64 map__reloc_unmap_ip(struct map *map, u64 ip) | ||
553 | { | ||
554 | return ip - (s64)map->pgoff; | ||
555 | } | ||
556 | |||
557 | void map__reloc_vmlinux(struct map *self) | ||
558 | { | 892 | { |
559 | struct kmap *kmap = map__kmap(self); | 893 | return __dsos__fprintf(&self->host_machine.kernel_dsos, fp) + |
560 | s64 reloc; | 894 | __dsos__fprintf(&self->host_machine.user_dsos, fp) + |
561 | 895 | machines__fprintf_dsos(&self->machines, fp); | |
562 | if (!kmap->ref_reloc_sym || !kmap->ref_reloc_sym->unrelocated_addr) | ||
563 | return; | ||
564 | |||
565 | reloc = (kmap->ref_reloc_sym->unrelocated_addr - | ||
566 | kmap->ref_reloc_sym->addr); | ||
567 | |||
568 | if (!reloc) | ||
569 | return; | ||
570 | |||
571 | self->map_ip = map__reloc_map_ip; | ||
572 | self->unmap_ip = map__reloc_unmap_ip; | ||
573 | self->pgoff = reloc; | ||
574 | } | 896 | } |
diff --git a/tools/perf/util/session.h b/tools/perf/util/session.h index 5c33417eebb3..e7fce486ebe2 100644 --- a/tools/perf/util/session.h +++ b/tools/perf/util/session.h | |||
@@ -1,6 +1,7 @@ | |||
1 | #ifndef __PERF_SESSION_H | 1 | #ifndef __PERF_SESSION_H |
2 | #define __PERF_SESSION_H | 2 | #define __PERF_SESSION_H |
3 | 3 | ||
4 | #include "hist.h" | ||
4 | #include "event.h" | 5 | #include "event.h" |
5 | #include "header.h" | 6 | #include "header.h" |
6 | #include "symbol.h" | 7 | #include "symbol.h" |
@@ -8,45 +9,69 @@ | |||
8 | #include <linux/rbtree.h> | 9 | #include <linux/rbtree.h> |
9 | #include "../../../include/linux/perf_event.h" | 10 | #include "../../../include/linux/perf_event.h" |
10 | 11 | ||
12 | struct sample_queue; | ||
11 | struct ip_callchain; | 13 | struct ip_callchain; |
12 | struct thread; | 14 | struct thread; |
13 | 15 | ||
16 | struct ordered_samples { | ||
17 | u64 last_flush; | ||
18 | u64 next_flush; | ||
19 | u64 max_timestamp; | ||
20 | struct list_head samples_head; | ||
21 | struct sample_queue *last_inserted; | ||
22 | }; | ||
23 | |||
14 | struct perf_session { | 24 | struct perf_session { |
15 | struct perf_header header; | 25 | struct perf_header header; |
16 | unsigned long size; | 26 | unsigned long size; |
17 | unsigned long mmap_window; | 27 | unsigned long mmap_window; |
18 | struct map_groups kmaps; | ||
19 | struct rb_root threads; | 28 | struct rb_root threads; |
20 | struct thread *last_match; | 29 | struct thread *last_match; |
21 | struct map *vmlinux_maps[MAP__NR_TYPES]; | 30 | struct machine host_machine; |
22 | struct events_stats events_stats; | 31 | struct rb_root machines; |
23 | struct rb_root stats_by_id; | 32 | struct rb_root hists_tree; |
24 | unsigned long event_total[PERF_RECORD_MAX]; | 33 | /* |
25 | unsigned long unknown_events; | 34 | * FIXME: should point to the first entry in hists_tree and |
26 | struct rb_root hists; | 35 | * be a hists instance. Right now its only 'report' |
36 | * that is using ->hists_tree while all the rest use | ||
37 | * ->hists. | ||
38 | */ | ||
39 | struct hists hists; | ||
27 | u64 sample_type; | 40 | u64 sample_type; |
28 | struct ref_reloc_sym ref_reloc_sym; | ||
29 | int fd; | 41 | int fd; |
42 | bool fd_pipe; | ||
43 | bool repipe; | ||
30 | int cwdlen; | 44 | int cwdlen; |
31 | char *cwd; | 45 | char *cwd; |
46 | struct ordered_samples ordered_samples; | ||
32 | char filename[0]; | 47 | char filename[0]; |
33 | }; | 48 | }; |
34 | 49 | ||
50 | struct perf_event_ops; | ||
51 | |||
35 | typedef int (*event_op)(event_t *self, struct perf_session *session); | 52 | typedef int (*event_op)(event_t *self, struct perf_session *session); |
53 | typedef int (*event_op2)(event_t *self, struct perf_session *session, | ||
54 | struct perf_event_ops *ops); | ||
36 | 55 | ||
37 | struct perf_event_ops { | 56 | struct perf_event_ops { |
38 | event_op sample, | 57 | event_op sample, |
39 | mmap, | 58 | mmap, |
40 | comm, | 59 | comm, |
41 | fork, | 60 | fork, |
42 | exit, | 61 | exit, |
43 | lost, | 62 | lost, |
44 | read, | 63 | read, |
45 | throttle, | 64 | throttle, |
46 | unthrottle; | 65 | unthrottle, |
66 | attr, | ||
67 | event_type, | ||
68 | tracing_data, | ||
69 | build_id; | ||
70 | event_op2 finished_round; | ||
71 | bool ordered_samples; | ||
47 | }; | 72 | }; |
48 | 73 | ||
49 | struct perf_session *perf_session__new(const char *filename, int mode, bool force); | 74 | struct perf_session *perf_session__new(const char *filename, int mode, bool force, bool repipe); |
50 | void perf_session__delete(struct perf_session *self); | 75 | void perf_session__delete(struct perf_session *self); |
51 | 76 | ||
52 | void perf_event_header__bswap(struct perf_event_header *self); | 77 | void perf_event_header__bswap(struct perf_event_header *self); |
@@ -57,33 +82,66 @@ int __perf_session__process_events(struct perf_session *self, | |||
57 | int perf_session__process_events(struct perf_session *self, | 82 | int perf_session__process_events(struct perf_session *self, |
58 | struct perf_event_ops *event_ops); | 83 | struct perf_event_ops *event_ops); |
59 | 84 | ||
60 | struct symbol **perf_session__resolve_callchain(struct perf_session *self, | 85 | struct map_symbol *perf_session__resolve_callchain(struct perf_session *self, |
61 | struct thread *thread, | 86 | struct thread *thread, |
62 | struct ip_callchain *chain, | 87 | struct ip_callchain *chain, |
63 | struct symbol **parent); | 88 | struct symbol **parent); |
64 | 89 | ||
65 | bool perf_session__has_traces(struct perf_session *self, const char *msg); | 90 | bool perf_session__has_traces(struct perf_session *self, const char *msg); |
66 | 91 | ||
67 | int perf_header__read_build_ids(struct perf_header *self, int input, | 92 | int perf_session__set_kallsyms_ref_reloc_sym(struct map **maps, |
68 | u64 offset, u64 file_size); | ||
69 | |||
70 | int perf_session__set_kallsyms_ref_reloc_sym(struct perf_session *self, | ||
71 | const char *symbol_name, | 93 | const char *symbol_name, |
72 | u64 addr); | 94 | u64 addr); |
73 | 95 | ||
74 | void mem_bswap_64(void *src, int byte_size); | 96 | void mem_bswap_64(void *src, int byte_size); |
75 | 97 | ||
76 | static inline int __perf_session__create_kernel_maps(struct perf_session *self, | 98 | int perf_session__create_kernel_maps(struct perf_session *self); |
77 | struct dso *kernel) | 99 | |
100 | int do_read(int fd, void *buf, size_t size); | ||
101 | void perf_session__update_sample_type(struct perf_session *self); | ||
102 | |||
103 | static inline | ||
104 | struct machine *perf_session__find_host_machine(struct perf_session *self) | ||
105 | { | ||
106 | return &self->host_machine; | ||
107 | } | ||
108 | |||
109 | static inline | ||
110 | struct machine *perf_session__find_machine(struct perf_session *self, pid_t pid) | ||
111 | { | ||
112 | if (pid == HOST_KERNEL_ID) | ||
113 | return &self->host_machine; | ||
114 | return machines__find(&self->machines, pid); | ||
115 | } | ||
116 | |||
117 | static inline | ||
118 | struct machine *perf_session__findnew_machine(struct perf_session *self, pid_t pid) | ||
119 | { | ||
120 | if (pid == HOST_KERNEL_ID) | ||
121 | return &self->host_machine; | ||
122 | return machines__findnew(&self->machines, pid); | ||
123 | } | ||
124 | |||
125 | static inline | ||
126 | void perf_session__process_machines(struct perf_session *self, | ||
127 | machine__process_t process) | ||
128 | { | ||
129 | process(&self->host_machine, self); | ||
130 | return machines__process(&self->machines, process, self); | ||
131 | } | ||
132 | |||
133 | size_t perf_session__fprintf_dsos(struct perf_session *self, FILE *fp); | ||
134 | |||
135 | static inline | ||
136 | size_t perf_session__fprintf_dsos_buildid(struct perf_session *self, FILE *fp, | ||
137 | bool with_hits) | ||
78 | { | 138 | { |
79 | return __map_groups__create_kernel_maps(&self->kmaps, | 139 | return machines__fprintf_dsos_buildid(&self->machines, fp, with_hits); |
80 | self->vmlinux_maps, kernel); | ||
81 | } | 140 | } |
82 | 141 | ||
83 | static inline struct map * | 142 | static inline |
84 | perf_session__new_module_map(struct perf_session *self, | 143 | size_t perf_session__fprintf_nr_events(struct perf_session *self, FILE *fp) |
85 | u64 start, const char *filename) | ||
86 | { | 144 | { |
87 | return map_groups__new_module(&self->kmaps, start, filename); | 145 | return hists__fprintf_nr_events(&self->hists, fp); |
88 | } | 146 | } |
89 | #endif /* __PERF_SESSION_H */ | 147 | #endif /* __PERF_SESSION_H */ |
diff --git a/tools/perf/util/sort.c b/tools/perf/util/sort.c index cb0f327de9e8..2316cb5a4116 100644 --- a/tools/perf/util/sort.c +++ b/tools/perf/util/sort.c | |||
@@ -1,10 +1,10 @@ | |||
1 | #include "sort.h" | 1 | #include "sort.h" |
2 | 2 | ||
3 | regex_t parent_regex; | 3 | regex_t parent_regex; |
4 | char default_parent_pattern[] = "^sys_|^do_page_fault"; | 4 | const char default_parent_pattern[] = "^sys_|^do_page_fault"; |
5 | char *parent_pattern = default_parent_pattern; | 5 | const char *parent_pattern = default_parent_pattern; |
6 | char default_sort_order[] = "comm,dso,symbol"; | 6 | const char default_sort_order[] = "comm,dso,symbol"; |
7 | char *sort_order = default_sort_order; | 7 | const char *sort_order = default_sort_order; |
8 | int sort__need_collapse = 0; | 8 | int sort__need_collapse = 0; |
9 | int sort__has_parent = 0; | 9 | int sort__has_parent = 0; |
10 | 10 | ||
@@ -18,39 +18,50 @@ char * field_sep; | |||
18 | 18 | ||
19 | LIST_HEAD(hist_entry__sort_list); | 19 | LIST_HEAD(hist_entry__sort_list); |
20 | 20 | ||
21 | static int hist_entry__thread_snprintf(struct hist_entry *self, char *bf, | ||
22 | size_t size, unsigned int width); | ||
23 | static int hist_entry__comm_snprintf(struct hist_entry *self, char *bf, | ||
24 | size_t size, unsigned int width); | ||
25 | static int hist_entry__dso_snprintf(struct hist_entry *self, char *bf, | ||
26 | size_t size, unsigned int width); | ||
27 | static int hist_entry__sym_snprintf(struct hist_entry *self, char *bf, | ||
28 | size_t size, unsigned int width); | ||
29 | static int hist_entry__parent_snprintf(struct hist_entry *self, char *bf, | ||
30 | size_t size, unsigned int width); | ||
31 | |||
21 | struct sort_entry sort_thread = { | 32 | struct sort_entry sort_thread = { |
22 | .header = "Command: Pid", | 33 | .se_header = "Command: Pid", |
23 | .cmp = sort__thread_cmp, | 34 | .se_cmp = sort__thread_cmp, |
24 | .print = sort__thread_print, | 35 | .se_snprintf = hist_entry__thread_snprintf, |
25 | .width = &threads__col_width, | 36 | .se_width = &threads__col_width, |
26 | }; | 37 | }; |
27 | 38 | ||
28 | struct sort_entry sort_comm = { | 39 | struct sort_entry sort_comm = { |
29 | .header = "Command", | 40 | .se_header = "Command", |
30 | .cmp = sort__comm_cmp, | 41 | .se_cmp = sort__comm_cmp, |
31 | .collapse = sort__comm_collapse, | 42 | .se_collapse = sort__comm_collapse, |
32 | .print = sort__comm_print, | 43 | .se_snprintf = hist_entry__comm_snprintf, |
33 | .width = &comms__col_width, | 44 | .se_width = &comms__col_width, |
34 | }; | 45 | }; |
35 | 46 | ||
36 | struct sort_entry sort_dso = { | 47 | struct sort_entry sort_dso = { |
37 | .header = "Shared Object", | 48 | .se_header = "Shared Object", |
38 | .cmp = sort__dso_cmp, | 49 | .se_cmp = sort__dso_cmp, |
39 | .print = sort__dso_print, | 50 | .se_snprintf = hist_entry__dso_snprintf, |
40 | .width = &dsos__col_width, | 51 | .se_width = &dsos__col_width, |
41 | }; | 52 | }; |
42 | 53 | ||
43 | struct sort_entry sort_sym = { | 54 | struct sort_entry sort_sym = { |
44 | .header = "Symbol", | 55 | .se_header = "Symbol", |
45 | .cmp = sort__sym_cmp, | 56 | .se_cmp = sort__sym_cmp, |
46 | .print = sort__sym_print, | 57 | .se_snprintf = hist_entry__sym_snprintf, |
47 | }; | 58 | }; |
48 | 59 | ||
49 | struct sort_entry sort_parent = { | 60 | struct sort_entry sort_parent = { |
50 | .header = "Parent symbol", | 61 | .se_header = "Parent symbol", |
51 | .cmp = sort__parent_cmp, | 62 | .se_cmp = sort__parent_cmp, |
52 | .print = sort__parent_print, | 63 | .se_snprintf = hist_entry__parent_snprintf, |
53 | .width = &parent_symbol__col_width, | 64 | .se_width = &parent_symbol__col_width, |
54 | }; | 65 | }; |
55 | 66 | ||
56 | struct sort_dimension { | 67 | struct sort_dimension { |
@@ -85,45 +96,38 @@ sort__thread_cmp(struct hist_entry *left, struct hist_entry *right) | |||
85 | return right->thread->pid - left->thread->pid; | 96 | return right->thread->pid - left->thread->pid; |
86 | } | 97 | } |
87 | 98 | ||
88 | int repsep_fprintf(FILE *fp, const char *fmt, ...) | 99 | static int repsep_snprintf(char *bf, size_t size, const char *fmt, ...) |
89 | { | 100 | { |
90 | int n; | 101 | int n; |
91 | va_list ap; | 102 | va_list ap; |
92 | 103 | ||
93 | va_start(ap, fmt); | 104 | va_start(ap, fmt); |
94 | if (!field_sep) | 105 | n = vsnprintf(bf, size, fmt, ap); |
95 | n = vfprintf(fp, fmt, ap); | 106 | if (field_sep && n > 0) { |
96 | else { | 107 | char *sep = bf; |
97 | char *bf = NULL; | 108 | |
98 | n = vasprintf(&bf, fmt, ap); | 109 | while (1) { |
99 | if (n > 0) { | 110 | sep = strchr(sep, *field_sep); |
100 | char *sep = bf; | 111 | if (sep == NULL) |
101 | 112 | break; | |
102 | while (1) { | 113 | *sep = '.'; |
103 | sep = strchr(sep, *field_sep); | ||
104 | if (sep == NULL) | ||
105 | break; | ||
106 | *sep = '.'; | ||
107 | } | ||
108 | } | 114 | } |
109 | fputs(bf, fp); | ||
110 | free(bf); | ||
111 | } | 115 | } |
112 | va_end(ap); | 116 | va_end(ap); |
113 | return n; | 117 | return n; |
114 | } | 118 | } |
115 | 119 | ||
116 | size_t | 120 | static int hist_entry__thread_snprintf(struct hist_entry *self, char *bf, |
117 | sort__thread_print(FILE *fp, struct hist_entry *self, unsigned int width) | 121 | size_t size, unsigned int width) |
118 | { | 122 | { |
119 | return repsep_fprintf(fp, "%*s:%5d", width - 6, | 123 | return repsep_snprintf(bf, size, "%*s:%5d", width, |
120 | self->thread->comm ?: "", self->thread->pid); | 124 | self->thread->comm ?: "", self->thread->pid); |
121 | } | 125 | } |
122 | 126 | ||
123 | size_t | 127 | static int hist_entry__comm_snprintf(struct hist_entry *self, char *bf, |
124 | sort__comm_print(FILE *fp, struct hist_entry *self, unsigned int width) | 128 | size_t size, unsigned int width) |
125 | { | 129 | { |
126 | return repsep_fprintf(fp, "%*s", width, self->thread->comm); | 130 | return repsep_snprintf(bf, size, "%*s", width, self->thread->comm); |
127 | } | 131 | } |
128 | 132 | ||
129 | /* --sort dso */ | 133 | /* --sort dso */ |
@@ -131,8 +135,8 @@ sort__comm_print(FILE *fp, struct hist_entry *self, unsigned int width) | |||
131 | int64_t | 135 | int64_t |
132 | sort__dso_cmp(struct hist_entry *left, struct hist_entry *right) | 136 | sort__dso_cmp(struct hist_entry *left, struct hist_entry *right) |
133 | { | 137 | { |
134 | struct dso *dso_l = left->map ? left->map->dso : NULL; | 138 | struct dso *dso_l = left->ms.map ? left->ms.map->dso : NULL; |
135 | struct dso *dso_r = right->map ? right->map->dso : NULL; | 139 | struct dso *dso_r = right->ms.map ? right->ms.map->dso : NULL; |
136 | const char *dso_name_l, *dso_name_r; | 140 | const char *dso_name_l, *dso_name_r; |
137 | 141 | ||
138 | if (!dso_l || !dso_r) | 142 | if (!dso_l || !dso_r) |
@@ -149,16 +153,16 @@ sort__dso_cmp(struct hist_entry *left, struct hist_entry *right) | |||
149 | return strcmp(dso_name_l, dso_name_r); | 153 | return strcmp(dso_name_l, dso_name_r); |
150 | } | 154 | } |
151 | 155 | ||
152 | size_t | 156 | static int hist_entry__dso_snprintf(struct hist_entry *self, char *bf, |
153 | sort__dso_print(FILE *fp, struct hist_entry *self, unsigned int width) | 157 | size_t size, unsigned int width) |
154 | { | 158 | { |
155 | if (self->map && self->map->dso) { | 159 | if (self->ms.map && self->ms.map->dso) { |
156 | const char *dso_name = !verbose ? self->map->dso->short_name : | 160 | const char *dso_name = !verbose ? self->ms.map->dso->short_name : |
157 | self->map->dso->long_name; | 161 | self->ms.map->dso->long_name; |
158 | return repsep_fprintf(fp, "%-*s", width, dso_name); | 162 | return repsep_snprintf(bf, size, "%-*s", width, dso_name); |
159 | } | 163 | } |
160 | 164 | ||
161 | return repsep_fprintf(fp, "%*llx", width, (u64)self->ip); | 165 | return repsep_snprintf(bf, size, "%*Lx", width, self->ip); |
162 | } | 166 | } |
163 | 167 | ||
164 | /* --sort symbol */ | 168 | /* --sort symbol */ |
@@ -168,31 +172,31 @@ sort__sym_cmp(struct hist_entry *left, struct hist_entry *right) | |||
168 | { | 172 | { |
169 | u64 ip_l, ip_r; | 173 | u64 ip_l, ip_r; |
170 | 174 | ||
171 | if (left->sym == right->sym) | 175 | if (left->ms.sym == right->ms.sym) |
172 | return 0; | 176 | return 0; |
173 | 177 | ||
174 | ip_l = left->sym ? left->sym->start : left->ip; | 178 | ip_l = left->ms.sym ? left->ms.sym->start : left->ip; |
175 | ip_r = right->sym ? right->sym->start : right->ip; | 179 | ip_r = right->ms.sym ? right->ms.sym->start : right->ip; |
176 | 180 | ||
177 | return (int64_t)(ip_r - ip_l); | 181 | return (int64_t)(ip_r - ip_l); |
178 | } | 182 | } |
179 | 183 | ||
180 | 184 | static int hist_entry__sym_snprintf(struct hist_entry *self, char *bf, | |
181 | size_t | 185 | size_t size, unsigned int width __used) |
182 | sort__sym_print(FILE *fp, struct hist_entry *self, unsigned int width __used) | ||
183 | { | 186 | { |
184 | size_t ret = 0; | 187 | size_t ret = 0; |
185 | 188 | ||
186 | if (verbose) { | 189 | if (verbose) { |
187 | char o = self->map ? dso__symtab_origin(self->map->dso) : '!'; | 190 | char o = self->ms.map ? dso__symtab_origin(self->ms.map->dso) : '!'; |
188 | ret += repsep_fprintf(fp, "%#018llx %c ", (u64)self->ip, o); | 191 | ret += repsep_snprintf(bf, size, "%#018llx %c ", self->ip, o); |
189 | } | 192 | } |
190 | 193 | ||
191 | ret += repsep_fprintf(fp, "[%c] ", self->level); | 194 | ret += repsep_snprintf(bf + ret, size - ret, "[%c] ", self->level); |
192 | if (self->sym) | 195 | if (self->ms.sym) |
193 | ret += repsep_fprintf(fp, "%s", self->sym->name); | 196 | ret += repsep_snprintf(bf + ret, size - ret, "%s", |
197 | self->ms.sym->name); | ||
194 | else | 198 | else |
195 | ret += repsep_fprintf(fp, "%#016llx", (u64)self->ip); | 199 | ret += repsep_snprintf(bf + ret, size - ret, "%#016llx", self->ip); |
196 | 200 | ||
197 | return ret; | 201 | return ret; |
198 | } | 202 | } |
@@ -231,10 +235,10 @@ sort__parent_cmp(struct hist_entry *left, struct hist_entry *right) | |||
231 | return strcmp(sym_l->name, sym_r->name); | 235 | return strcmp(sym_l->name, sym_r->name); |
232 | } | 236 | } |
233 | 237 | ||
234 | size_t | 238 | static int hist_entry__parent_snprintf(struct hist_entry *self, char *bf, |
235 | sort__parent_print(FILE *fp, struct hist_entry *self, unsigned int width) | 239 | size_t size, unsigned int width) |
236 | { | 240 | { |
237 | return repsep_fprintf(fp, "%-*s", width, | 241 | return repsep_snprintf(bf, size, "%-*s", width, |
238 | self->parent ? self->parent->name : "[other]"); | 242 | self->parent ? self->parent->name : "[other]"); |
239 | } | 243 | } |
240 | 244 | ||
@@ -251,7 +255,7 @@ int sort_dimension__add(const char *tok) | |||
251 | if (strncasecmp(tok, sd->name, strlen(tok))) | 255 | if (strncasecmp(tok, sd->name, strlen(tok))) |
252 | continue; | 256 | continue; |
253 | 257 | ||
254 | if (sd->entry->collapse) | 258 | if (sd->entry->se_collapse) |
255 | sort__need_collapse = 1; | 259 | sort__need_collapse = 1; |
256 | 260 | ||
257 | if (sd->entry == &sort_parent) { | 261 | if (sd->entry == &sort_parent) { |
@@ -260,9 +264,8 @@ int sort_dimension__add(const char *tok) | |||
260 | char err[BUFSIZ]; | 264 | char err[BUFSIZ]; |
261 | 265 | ||
262 | regerror(ret, &parent_regex, err, sizeof(err)); | 266 | regerror(ret, &parent_regex, err, sizeof(err)); |
263 | fprintf(stderr, "Invalid regex: %s\n%s", | 267 | pr_err("Invalid regex: %s\n%s", parent_pattern, err); |
264 | parent_pattern, err); | 268 | return -EINVAL; |
265 | exit(-1); | ||
266 | } | 269 | } |
267 | sort__has_parent = 1; | 270 | sort__has_parent = 1; |
268 | } | 271 | } |
diff --git a/tools/perf/util/sort.h b/tools/perf/util/sort.h index 753f9ea99fb0..0d61c4082f43 100644 --- a/tools/perf/util/sort.h +++ b/tools/perf/util/sort.h | |||
@@ -25,10 +25,10 @@ | |||
25 | #include "sort.h" | 25 | #include "sort.h" |
26 | 26 | ||
27 | extern regex_t parent_regex; | 27 | extern regex_t parent_regex; |
28 | extern char *sort_order; | 28 | extern const char *sort_order; |
29 | extern char default_parent_pattern[]; | 29 | extern const char default_parent_pattern[]; |
30 | extern char *parent_pattern; | 30 | extern const char *parent_pattern; |
31 | extern char default_sort_order[]; | 31 | extern const char default_sort_order[]; |
32 | extern int sort__need_collapse; | 32 | extern int sort__need_collapse; |
33 | extern int sort__has_parent; | 33 | extern int sort__has_parent; |
34 | extern char *field_sep; | 34 | extern char *field_sep; |
@@ -43,19 +43,24 @@ extern enum sort_type sort__first_dimension; | |||
43 | 43 | ||
44 | struct hist_entry { | 44 | struct hist_entry { |
45 | struct rb_node rb_node; | 45 | struct rb_node rb_node; |
46 | u64 count; | 46 | u64 period; |
47 | u64 period_sys; | ||
48 | u64 period_us; | ||
49 | u64 period_guest_sys; | ||
50 | u64 period_guest_us; | ||
51 | struct map_symbol ms; | ||
47 | struct thread *thread; | 52 | struct thread *thread; |
48 | struct map *map; | ||
49 | struct symbol *sym; | ||
50 | u64 ip; | 53 | u64 ip; |
54 | u32 nr_events; | ||
51 | char level; | 55 | char level; |
52 | struct symbol *parent; | 56 | u8 filtered; |
53 | struct callchain_node callchain; | 57 | struct symbol *parent; |
54 | union { | 58 | union { |
55 | unsigned long position; | 59 | unsigned long position; |
56 | struct hist_entry *pair; | 60 | struct hist_entry *pair; |
57 | struct rb_root sorted_chain; | 61 | struct rb_root sorted_chain; |
58 | }; | 62 | }; |
63 | struct callchain_node callchain[0]; | ||
59 | }; | 64 | }; |
60 | 65 | ||
61 | enum sort_type { | 66 | enum sort_type { |
@@ -73,12 +78,13 @@ enum sort_type { | |||
73 | struct sort_entry { | 78 | struct sort_entry { |
74 | struct list_head list; | 79 | struct list_head list; |
75 | 80 | ||
76 | const char *header; | 81 | const char *se_header; |
77 | 82 | ||
78 | int64_t (*cmp)(struct hist_entry *, struct hist_entry *); | 83 | int64_t (*se_cmp)(struct hist_entry *, struct hist_entry *); |
79 | int64_t (*collapse)(struct hist_entry *, struct hist_entry *); | 84 | int64_t (*se_collapse)(struct hist_entry *, struct hist_entry *); |
80 | size_t (*print)(FILE *fp, struct hist_entry *, unsigned int width); | 85 | int (*se_snprintf)(struct hist_entry *self, char *bf, size_t size, |
81 | unsigned int *width; | 86 | unsigned int width); |
87 | unsigned int *se_width; | ||
82 | bool elide; | 88 | bool elide; |
83 | }; | 89 | }; |
84 | 90 | ||
@@ -87,7 +93,6 @@ extern struct list_head hist_entry__sort_list; | |||
87 | 93 | ||
88 | void setup_sorting(const char * const usagestr[], const struct option *opts); | 94 | void setup_sorting(const char * const usagestr[], const struct option *opts); |
89 | 95 | ||
90 | extern int repsep_fprintf(FILE *fp, const char *fmt, ...); | ||
91 | extern size_t sort__thread_print(FILE *, struct hist_entry *, unsigned int); | 96 | extern size_t sort__thread_print(FILE *, struct hist_entry *, unsigned int); |
92 | extern size_t sort__comm_print(FILE *, struct hist_entry *, unsigned int); | 97 | extern size_t sort__comm_print(FILE *, struct hist_entry *, unsigned int); |
93 | extern size_t sort__dso_print(FILE *, struct hist_entry *, unsigned int); | 98 | extern size_t sort__dso_print(FILE *, struct hist_entry *, unsigned int); |
diff --git a/tools/perf/util/string.c b/tools/perf/util/string.c index a175949ed216..0409fc7c0058 100644 --- a/tools/perf/util/string.c +++ b/tools/perf/util/string.c | |||
@@ -1,48 +1,5 @@ | |||
1 | #include "string.h" | ||
2 | #include "util.h" | 1 | #include "util.h" |
3 | 2 | #include "string.h" | |
4 | static int hex(char ch) | ||
5 | { | ||
6 | if ((ch >= '0') && (ch <= '9')) | ||
7 | return ch - '0'; | ||
8 | if ((ch >= 'a') && (ch <= 'f')) | ||
9 | return ch - 'a' + 10; | ||
10 | if ((ch >= 'A') && (ch <= 'F')) | ||
11 | return ch - 'A' + 10; | ||
12 | return -1; | ||
13 | } | ||
14 | |||
15 | /* | ||
16 | * While we find nice hex chars, build a long_val. | ||
17 | * Return number of chars processed. | ||
18 | */ | ||
19 | int hex2u64(const char *ptr, u64 *long_val) | ||
20 | { | ||
21 | const char *p = ptr; | ||
22 | *long_val = 0; | ||
23 | |||
24 | while (*p) { | ||
25 | const int hex_val = hex(*p); | ||
26 | |||
27 | if (hex_val < 0) | ||
28 | break; | ||
29 | |||
30 | *long_val = (*long_val << 4) | hex_val; | ||
31 | p++; | ||
32 | } | ||
33 | |||
34 | return p - ptr; | ||
35 | } | ||
36 | |||
37 | char *strxfrchar(char *s, char from, char to) | ||
38 | { | ||
39 | char *p = s; | ||
40 | |||
41 | while ((p = strchr(p, from)) != NULL) | ||
42 | *p++ = to; | ||
43 | |||
44 | return s; | ||
45 | } | ||
46 | 3 | ||
47 | #define K 1024LL | 4 | #define K 1024LL |
48 | /* | 5 | /* |
diff --git a/tools/perf/util/string.h b/tools/perf/util/string.h deleted file mode 100644 index 542e44de3719..000000000000 --- a/tools/perf/util/string.h +++ /dev/null | |||
@@ -1,18 +0,0 @@ | |||
1 | #ifndef __PERF_STRING_H_ | ||
2 | #define __PERF_STRING_H_ | ||
3 | |||
4 | #include <stdbool.h> | ||
5 | #include "types.h" | ||
6 | |||
7 | int hex2u64(const char *ptr, u64 *val); | ||
8 | char *strxfrchar(char *s, char from, char to); | ||
9 | s64 perf_atoll(const char *str); | ||
10 | char **argv_split(const char *str, int *argcp); | ||
11 | void argv_free(char **argv); | ||
12 | bool strglobmatch(const char *str, const char *pat); | ||
13 | bool strlazymatch(const char *str, const char *pat); | ||
14 | |||
15 | #define _STR(x) #x | ||
16 | #define STR(x) _STR(x) | ||
17 | |||
18 | #endif /* __PERF_STRING_H */ | ||
diff --git a/tools/perf/util/symbol.c b/tools/perf/util/symbol.c index c458c4a371d1..a06131f6259a 100644 --- a/tools/perf/util/symbol.c +++ b/tools/perf/util/symbol.c | |||
@@ -1,13 +1,19 @@ | |||
1 | #include "util.h" | 1 | #define _GNU_SOURCE |
2 | #include "../perf.h" | 2 | #include <ctype.h> |
3 | #include "sort.h" | 3 | #include <dirent.h> |
4 | #include "string.h" | 4 | #include <errno.h> |
5 | #include <libgen.h> | ||
6 | #include <stdlib.h> | ||
7 | #include <stdio.h> | ||
8 | #include <string.h> | ||
9 | #include <sys/types.h> | ||
10 | #include <sys/stat.h> | ||
11 | #include <sys/param.h> | ||
12 | #include <fcntl.h> | ||
13 | #include <unistd.h> | ||
5 | #include "symbol.h" | 14 | #include "symbol.h" |
6 | #include "thread.h" | 15 | #include "strlist.h" |
7 | 16 | ||
8 | #include "debug.h" | ||
9 | |||
10 | #include <asm/bug.h> | ||
11 | #include <libelf.h> | 17 | #include <libelf.h> |
12 | #include <gelf.h> | 18 | #include <gelf.h> |
13 | #include <elf.h> | 19 | #include <elf.h> |
@@ -18,22 +24,12 @@ | |||
18 | #define NT_GNU_BUILD_ID 3 | 24 | #define NT_GNU_BUILD_ID 3 |
19 | #endif | 25 | #endif |
20 | 26 | ||
21 | enum dso_origin { | ||
22 | DSO__ORIG_KERNEL = 0, | ||
23 | DSO__ORIG_JAVA_JIT, | ||
24 | DSO__ORIG_BUILD_ID_CACHE, | ||
25 | DSO__ORIG_FEDORA, | ||
26 | DSO__ORIG_UBUNTU, | ||
27 | DSO__ORIG_BUILDID, | ||
28 | DSO__ORIG_DSO, | ||
29 | DSO__ORIG_KMODULE, | ||
30 | DSO__ORIG_NOT_FOUND, | ||
31 | }; | ||
32 | |||
33 | static void dsos__add(struct list_head *head, struct dso *dso); | 27 | static void dsos__add(struct list_head *head, struct dso *dso); |
34 | static struct map *map__new2(u64 start, struct dso *dso, enum map_type type); | 28 | static struct map *map__new2(u64 start, struct dso *dso, enum map_type type); |
35 | static int dso__load_kernel_sym(struct dso *self, struct map *map, | 29 | static int dso__load_kernel_sym(struct dso *self, struct map *map, |
36 | symbol_filter_t filter); | 30 | symbol_filter_t filter); |
31 | static int dso__load_guest_kernel_sym(struct dso *self, struct map *map, | ||
32 | symbol_filter_t filter); | ||
37 | static int vmlinux_path__nr_entries; | 33 | static int vmlinux_path__nr_entries; |
38 | static char **vmlinux_path; | 34 | static char **vmlinux_path; |
39 | 35 | ||
@@ -126,16 +122,17 @@ static void map_groups__fixup_end(struct map_groups *self) | |||
126 | static struct symbol *symbol__new(u64 start, u64 len, const char *name) | 122 | static struct symbol *symbol__new(u64 start, u64 len, const char *name) |
127 | { | 123 | { |
128 | size_t namelen = strlen(name) + 1; | 124 | size_t namelen = strlen(name) + 1; |
129 | struct symbol *self = zalloc(symbol_conf.priv_size + | 125 | struct symbol *self = calloc(1, (symbol_conf.priv_size + |
130 | sizeof(*self) + namelen); | 126 | sizeof(*self) + namelen)); |
131 | if (self == NULL) | 127 | if (self == NULL) |
132 | return NULL; | 128 | return NULL; |
133 | 129 | ||
134 | if (symbol_conf.priv_size) | 130 | if (symbol_conf.priv_size) |
135 | self = ((void *)self) + symbol_conf.priv_size; | 131 | self = ((void *)self) + symbol_conf.priv_size; |
136 | 132 | ||
137 | self->start = start; | 133 | self->start = start; |
138 | self->end = len ? start + len - 1 : start; | 134 | self->end = len ? start + len - 1 : start; |
135 | self->namelen = namelen - 1; | ||
139 | 136 | ||
140 | pr_debug4("%s: %s %#Lx-%#Lx\n", __func__, name, start, self->end); | 137 | pr_debug4("%s: %s %#Lx-%#Lx\n", __func__, name, start, self->end); |
141 | 138 | ||
@@ -178,7 +175,7 @@ static void dso__set_basename(struct dso *self) | |||
178 | 175 | ||
179 | struct dso *dso__new(const char *name) | 176 | struct dso *dso__new(const char *name) |
180 | { | 177 | { |
181 | struct dso *self = zalloc(sizeof(*self) + strlen(name) + 1); | 178 | struct dso *self = calloc(1, sizeof(*self) + strlen(name) + 1); |
182 | 179 | ||
183 | if (self != NULL) { | 180 | if (self != NULL) { |
184 | int i; | 181 | int i; |
@@ -192,6 +189,8 @@ struct dso *dso__new(const char *name) | |||
192 | self->loaded = 0; | 189 | self->loaded = 0; |
193 | self->sorted_by_name = 0; | 190 | self->sorted_by_name = 0; |
194 | self->has_build_id = 0; | 191 | self->has_build_id = 0; |
192 | self->kernel = DSO_TYPE_USER; | ||
193 | INIT_LIST_HEAD(&self->node); | ||
195 | } | 194 | } |
196 | 195 | ||
197 | return self; | 196 | return self; |
@@ -408,12 +407,9 @@ int kallsyms__parse(const char *filename, void *arg, | |||
408 | char *symbol_name; | 407 | char *symbol_name; |
409 | 408 | ||
410 | line_len = getline(&line, &n, file); | 409 | line_len = getline(&line, &n, file); |
411 | if (line_len < 0) | 410 | if (line_len < 0 || !line) |
412 | break; | 411 | break; |
413 | 412 | ||
414 | if (!line) | ||
415 | goto out_failure; | ||
416 | |||
417 | line[--line_len] = '\0'; /* \n */ | 413 | line[--line_len] = '\0'; /* \n */ |
418 | 414 | ||
419 | len = hex2u64(line, &start); | 415 | len = hex2u64(line, &start); |
@@ -465,6 +461,7 @@ static int map__process_kallsym_symbol(void *arg, const char *name, | |||
465 | * map__split_kallsyms, when we have split the maps per module | 461 | * map__split_kallsyms, when we have split the maps per module |
466 | */ | 462 | */ |
467 | symbols__insert(root, sym); | 463 | symbols__insert(root, sym); |
464 | |||
468 | return 0; | 465 | return 0; |
469 | } | 466 | } |
470 | 467 | ||
@@ -489,6 +486,7 @@ static int dso__split_kallsyms(struct dso *self, struct map *map, | |||
489 | symbol_filter_t filter) | 486 | symbol_filter_t filter) |
490 | { | 487 | { |
491 | struct map_groups *kmaps = map__kmap(map)->kmaps; | 488 | struct map_groups *kmaps = map__kmap(map)->kmaps; |
489 | struct machine *machine = kmaps->machine; | ||
492 | struct map *curr_map = map; | 490 | struct map *curr_map = map; |
493 | struct symbol *pos; | 491 | struct symbol *pos; |
494 | int count = 0; | 492 | int count = 0; |
@@ -510,15 +508,33 @@ static int dso__split_kallsyms(struct dso *self, struct map *map, | |||
510 | *module++ = '\0'; | 508 | *module++ = '\0'; |
511 | 509 | ||
512 | if (strcmp(curr_map->dso->short_name, module)) { | 510 | if (strcmp(curr_map->dso->short_name, module)) { |
513 | curr_map = map_groups__find_by_name(kmaps, map->type, module); | 511 | if (curr_map != map && |
512 | self->kernel == DSO_TYPE_GUEST_KERNEL && | ||
513 | machine__is_default_guest(machine)) { | ||
514 | /* | ||
515 | * We assume all symbols of a module are | ||
516 | * continuous in * kallsyms, so curr_map | ||
517 | * points to a module and all its | ||
518 | * symbols are in its kmap. Mark it as | ||
519 | * loaded. | ||
520 | */ | ||
521 | dso__set_loaded(curr_map->dso, | ||
522 | curr_map->type); | ||
523 | } | ||
524 | |||
525 | curr_map = map_groups__find_by_name(kmaps, | ||
526 | map->type, module); | ||
514 | if (curr_map == NULL) { | 527 | if (curr_map == NULL) { |
515 | pr_debug("/proc/{kallsyms,modules} " | 528 | pr_debug("%s/proc/{kallsyms,modules} " |
516 | "inconsistency while looking " | 529 | "inconsistency while looking " |
517 | "for \"%s\" module!\n", module); | 530 | "for \"%s\" module!\n", |
518 | return -1; | 531 | machine->root_dir, module); |
532 | curr_map = map; | ||
533 | goto discard_symbol; | ||
519 | } | 534 | } |
520 | 535 | ||
521 | if (curr_map->dso->loaded) | 536 | if (curr_map->dso->loaded && |
537 | !machine__is_default_guest(machine)) | ||
522 | goto discard_symbol; | 538 | goto discard_symbol; |
523 | } | 539 | } |
524 | /* | 540 | /* |
@@ -531,13 +547,21 @@ static int dso__split_kallsyms(struct dso *self, struct map *map, | |||
531 | char dso_name[PATH_MAX]; | 547 | char dso_name[PATH_MAX]; |
532 | struct dso *dso; | 548 | struct dso *dso; |
533 | 549 | ||
534 | snprintf(dso_name, sizeof(dso_name), "[kernel].%d", | 550 | if (self->kernel == DSO_TYPE_GUEST_KERNEL) |
535 | kernel_range++); | 551 | snprintf(dso_name, sizeof(dso_name), |
552 | "[guest.kernel].%d", | ||
553 | kernel_range++); | ||
554 | else | ||
555 | snprintf(dso_name, sizeof(dso_name), | ||
556 | "[kernel].%d", | ||
557 | kernel_range++); | ||
536 | 558 | ||
537 | dso = dso__new(dso_name); | 559 | dso = dso__new(dso_name); |
538 | if (dso == NULL) | 560 | if (dso == NULL) |
539 | return -1; | 561 | return -1; |
540 | 562 | ||
563 | dso->kernel = self->kernel; | ||
564 | |||
541 | curr_map = map__new2(pos->start, dso, map->type); | 565 | curr_map = map__new2(pos->start, dso, map->type); |
542 | if (curr_map == NULL) { | 566 | if (curr_map == NULL) { |
543 | dso__delete(dso); | 567 | dso__delete(dso); |
@@ -561,6 +585,12 @@ discard_symbol: rb_erase(&pos->rb_node, root); | |||
561 | } | 585 | } |
562 | } | 586 | } |
563 | 587 | ||
588 | if (curr_map != map && | ||
589 | self->kernel == DSO_TYPE_GUEST_KERNEL && | ||
590 | machine__is_default_guest(kmaps->machine)) { | ||
591 | dso__set_loaded(curr_map->dso, curr_map->type); | ||
592 | } | ||
593 | |||
564 | return count; | 594 | return count; |
565 | } | 595 | } |
566 | 596 | ||
@@ -571,7 +601,10 @@ int dso__load_kallsyms(struct dso *self, const char *filename, | |||
571 | return -1; | 601 | return -1; |
572 | 602 | ||
573 | symbols__fixup_end(&self->symbols[map->type]); | 603 | symbols__fixup_end(&self->symbols[map->type]); |
574 | self->origin = DSO__ORIG_KERNEL; | 604 | if (self->kernel == DSO_TYPE_GUEST_KERNEL) |
605 | self->origin = DSO__ORIG_GUEST_KERNEL; | ||
606 | else | ||
607 | self->origin = DSO__ORIG_KERNEL; | ||
575 | 608 | ||
576 | return dso__split_kallsyms(self, map, filter); | 609 | return dso__split_kallsyms(self, map, filter); |
577 | } | 610 | } |
@@ -870,8 +903,8 @@ out_close: | |||
870 | if (err == 0) | 903 | if (err == 0) |
871 | return nr; | 904 | return nr; |
872 | out: | 905 | out: |
873 | pr_warning("%s: problems reading %s PLT info.\n", | 906 | pr_debug("%s: problems reading %s PLT info.\n", |
874 | __func__, self->long_name); | 907 | __func__, self->long_name); |
875 | return 0; | 908 | return 0; |
876 | } | 909 | } |
877 | 910 | ||
@@ -958,7 +991,7 @@ static int dso__load_sym(struct dso *self, struct map *map, const char *name, | |||
958 | nr_syms = shdr.sh_size / shdr.sh_entsize; | 991 | nr_syms = shdr.sh_size / shdr.sh_entsize; |
959 | 992 | ||
960 | memset(&sym, 0, sizeof(sym)); | 993 | memset(&sym, 0, sizeof(sym)); |
961 | if (!self->kernel) { | 994 | if (self->kernel == DSO_TYPE_USER) { |
962 | self->adjust_symbols = (ehdr.e_type == ET_EXEC || | 995 | self->adjust_symbols = (ehdr.e_type == ET_EXEC || |
963 | elf_section_by_name(elf, &ehdr, &shdr, | 996 | elf_section_by_name(elf, &ehdr, &shdr, |
964 | ".gnu.prelink_undo", | 997 | ".gnu.prelink_undo", |
@@ -990,7 +1023,7 @@ static int dso__load_sym(struct dso *self, struct map *map, const char *name, | |||
990 | 1023 | ||
991 | section_name = elf_sec__name(&shdr, secstrs); | 1024 | section_name = elf_sec__name(&shdr, secstrs); |
992 | 1025 | ||
993 | if (self->kernel || kmodule) { | 1026 | if (self->kernel != DSO_TYPE_USER || kmodule) { |
994 | char dso_name[PATH_MAX]; | 1027 | char dso_name[PATH_MAX]; |
995 | 1028 | ||
996 | if (strcmp(section_name, | 1029 | if (strcmp(section_name, |
@@ -1017,6 +1050,7 @@ static int dso__load_sym(struct dso *self, struct map *map, const char *name, | |||
1017 | curr_dso = dso__new(dso_name); | 1050 | curr_dso = dso__new(dso_name); |
1018 | if (curr_dso == NULL) | 1051 | if (curr_dso == NULL) |
1019 | goto out_elf_end; | 1052 | goto out_elf_end; |
1053 | curr_dso->kernel = self->kernel; | ||
1020 | curr_map = map__new2(start, curr_dso, | 1054 | curr_map = map__new2(start, curr_dso, |
1021 | map->type); | 1055 | map->type); |
1022 | if (curr_map == NULL) { | 1056 | if (curr_map == NULL) { |
@@ -1025,9 +1059,9 @@ static int dso__load_sym(struct dso *self, struct map *map, const char *name, | |||
1025 | } | 1059 | } |
1026 | curr_map->map_ip = identity__map_ip; | 1060 | curr_map->map_ip = identity__map_ip; |
1027 | curr_map->unmap_ip = identity__map_ip; | 1061 | curr_map->unmap_ip = identity__map_ip; |
1028 | curr_dso->origin = DSO__ORIG_KERNEL; | 1062 | curr_dso->origin = self->origin; |
1029 | map_groups__insert(kmap->kmaps, curr_map); | 1063 | map_groups__insert(kmap->kmaps, curr_map); |
1030 | dsos__add(&dsos__kernel, curr_dso); | 1064 | dsos__add(&self->node, curr_dso); |
1031 | dso__set_loaded(curr_dso, map->type); | 1065 | dso__set_loaded(curr_dso, map->type); |
1032 | } else | 1066 | } else |
1033 | curr_dso = curr_map->dso; | 1067 | curr_dso = curr_map->dso; |
@@ -1089,7 +1123,7 @@ static bool dso__build_id_equal(const struct dso *self, u8 *build_id) | |||
1089 | return memcmp(self->build_id, build_id, sizeof(self->build_id)) == 0; | 1123 | return memcmp(self->build_id, build_id, sizeof(self->build_id)) == 0; |
1090 | } | 1124 | } |
1091 | 1125 | ||
1092 | static bool __dsos__read_build_ids(struct list_head *head, bool with_hits) | 1126 | bool __dsos__read_build_ids(struct list_head *head, bool with_hits) |
1093 | { | 1127 | { |
1094 | bool have_build_id = false; | 1128 | bool have_build_id = false; |
1095 | struct dso *pos; | 1129 | struct dso *pos; |
@@ -1107,13 +1141,6 @@ static bool __dsos__read_build_ids(struct list_head *head, bool with_hits) | |||
1107 | return have_build_id; | 1141 | return have_build_id; |
1108 | } | 1142 | } |
1109 | 1143 | ||
1110 | bool dsos__read_build_ids(bool with_hits) | ||
1111 | { | ||
1112 | bool kbuildids = __dsos__read_build_ids(&dsos__kernel, with_hits), | ||
1113 | ubuildids = __dsos__read_build_ids(&dsos__user, with_hits); | ||
1114 | return kbuildids || ubuildids; | ||
1115 | } | ||
1116 | |||
1117 | /* | 1144 | /* |
1118 | * Align offset to 4 bytes as needed for note name and descriptor data. | 1145 | * Align offset to 4 bytes as needed for note name and descriptor data. |
1119 | */ | 1146 | */ |
@@ -1248,6 +1275,8 @@ char dso__symtab_origin(const struct dso *self) | |||
1248 | [DSO__ORIG_BUILDID] = 'b', | 1275 | [DSO__ORIG_BUILDID] = 'b', |
1249 | [DSO__ORIG_DSO] = 'd', | 1276 | [DSO__ORIG_DSO] = 'd', |
1250 | [DSO__ORIG_KMODULE] = 'K', | 1277 | [DSO__ORIG_KMODULE] = 'K', |
1278 | [DSO__ORIG_GUEST_KERNEL] = 'g', | ||
1279 | [DSO__ORIG_GUEST_KMODULE] = 'G', | ||
1251 | }; | 1280 | }; |
1252 | 1281 | ||
1253 | if (self == NULL || self->origin == DSO__ORIG_NOT_FOUND) | 1282 | if (self == NULL || self->origin == DSO__ORIG_NOT_FOUND) |
@@ -1263,11 +1292,20 @@ int dso__load(struct dso *self, struct map *map, symbol_filter_t filter) | |||
1263 | char build_id_hex[BUILD_ID_SIZE * 2 + 1]; | 1292 | char build_id_hex[BUILD_ID_SIZE * 2 + 1]; |
1264 | int ret = -1; | 1293 | int ret = -1; |
1265 | int fd; | 1294 | int fd; |
1295 | struct machine *machine; | ||
1296 | const char *root_dir; | ||
1266 | 1297 | ||
1267 | dso__set_loaded(self, map->type); | 1298 | dso__set_loaded(self, map->type); |
1268 | 1299 | ||
1269 | if (self->kernel) | 1300 | if (self->kernel == DSO_TYPE_KERNEL) |
1270 | return dso__load_kernel_sym(self, map, filter); | 1301 | return dso__load_kernel_sym(self, map, filter); |
1302 | else if (self->kernel == DSO_TYPE_GUEST_KERNEL) | ||
1303 | return dso__load_guest_kernel_sym(self, map, filter); | ||
1304 | |||
1305 | if (map->groups && map->groups->machine) | ||
1306 | machine = map->groups->machine; | ||
1307 | else | ||
1308 | machine = NULL; | ||
1271 | 1309 | ||
1272 | name = malloc(size); | 1310 | name = malloc(size); |
1273 | if (!name) | 1311 | if (!name) |
@@ -1321,6 +1359,13 @@ more: | |||
1321 | case DSO__ORIG_DSO: | 1359 | case DSO__ORIG_DSO: |
1322 | snprintf(name, size, "%s", self->long_name); | 1360 | snprintf(name, size, "%s", self->long_name); |
1323 | break; | 1361 | break; |
1362 | case DSO__ORIG_GUEST_KMODULE: | ||
1363 | if (map->groups && map->groups->machine) | ||
1364 | root_dir = map->groups->machine->root_dir; | ||
1365 | else | ||
1366 | root_dir = ""; | ||
1367 | snprintf(name, size, "%s%s", root_dir, self->long_name); | ||
1368 | break; | ||
1324 | 1369 | ||
1325 | default: | 1370 | default: |
1326 | goto out; | 1371 | goto out; |
@@ -1374,7 +1419,8 @@ struct map *map_groups__find_by_name(struct map_groups *self, | |||
1374 | return NULL; | 1419 | return NULL; |
1375 | } | 1420 | } |
1376 | 1421 | ||
1377 | static int dso__kernel_module_get_build_id(struct dso *self) | 1422 | static int dso__kernel_module_get_build_id(struct dso *self, |
1423 | const char *root_dir) | ||
1378 | { | 1424 | { |
1379 | char filename[PATH_MAX]; | 1425 | char filename[PATH_MAX]; |
1380 | /* | 1426 | /* |
@@ -1384,8 +1430,8 @@ static int dso__kernel_module_get_build_id(struct dso *self) | |||
1384 | const char *name = self->short_name + 1; | 1430 | const char *name = self->short_name + 1; |
1385 | 1431 | ||
1386 | snprintf(filename, sizeof(filename), | 1432 | snprintf(filename, sizeof(filename), |
1387 | "/sys/module/%.*s/notes/.note.gnu.build-id", | 1433 | "%s/sys/module/%.*s/notes/.note.gnu.build-id", |
1388 | (int)strlen(name - 1), name); | 1434 | root_dir, (int)strlen(name) - 1, name); |
1389 | 1435 | ||
1390 | if (sysfs__read_build_id(filename, self->build_id, | 1436 | if (sysfs__read_build_id(filename, self->build_id, |
1391 | sizeof(self->build_id)) == 0) | 1437 | sizeof(self->build_id)) == 0) |
@@ -1394,26 +1440,33 @@ static int dso__kernel_module_get_build_id(struct dso *self) | |||
1394 | return 0; | 1440 | return 0; |
1395 | } | 1441 | } |
1396 | 1442 | ||
1397 | static int map_groups__set_modules_path_dir(struct map_groups *self, char *dirname) | 1443 | static int map_groups__set_modules_path_dir(struct map_groups *self, |
1444 | const char *dir_name) | ||
1398 | { | 1445 | { |
1399 | struct dirent *dent; | 1446 | struct dirent *dent; |
1400 | DIR *dir = opendir(dirname); | 1447 | DIR *dir = opendir(dir_name); |
1401 | 1448 | ||
1402 | if (!dir) { | 1449 | if (!dir) { |
1403 | pr_debug("%s: cannot open %s dir\n", __func__, dirname); | 1450 | pr_debug("%s: cannot open %s dir\n", __func__, dir_name); |
1404 | return -1; | 1451 | return -1; |
1405 | } | 1452 | } |
1406 | 1453 | ||
1407 | while ((dent = readdir(dir)) != NULL) { | 1454 | while ((dent = readdir(dir)) != NULL) { |
1408 | char path[PATH_MAX]; | 1455 | char path[PATH_MAX]; |
1456 | struct stat st; | ||
1409 | 1457 | ||
1410 | if (dent->d_type == DT_DIR) { | 1458 | /*sshfs might return bad dent->d_type, so we have to stat*/ |
1459 | sprintf(path, "%s/%s", dir_name, dent->d_name); | ||
1460 | if (stat(path, &st)) | ||
1461 | continue; | ||
1462 | |||
1463 | if (S_ISDIR(st.st_mode)) { | ||
1411 | if (!strcmp(dent->d_name, ".") || | 1464 | if (!strcmp(dent->d_name, ".") || |
1412 | !strcmp(dent->d_name, "..")) | 1465 | !strcmp(dent->d_name, "..")) |
1413 | continue; | 1466 | continue; |
1414 | 1467 | ||
1415 | snprintf(path, sizeof(path), "%s/%s", | 1468 | snprintf(path, sizeof(path), "%s/%s", |
1416 | dirname, dent->d_name); | 1469 | dir_name, dent->d_name); |
1417 | if (map_groups__set_modules_path_dir(self, path) < 0) | 1470 | if (map_groups__set_modules_path_dir(self, path) < 0) |
1418 | goto failure; | 1471 | goto failure; |
1419 | } else { | 1472 | } else { |
@@ -1433,13 +1486,13 @@ static int map_groups__set_modules_path_dir(struct map_groups *self, char *dirna | |||
1433 | continue; | 1486 | continue; |
1434 | 1487 | ||
1435 | snprintf(path, sizeof(path), "%s/%s", | 1488 | snprintf(path, sizeof(path), "%s/%s", |
1436 | dirname, dent->d_name); | 1489 | dir_name, dent->d_name); |
1437 | 1490 | ||
1438 | long_name = strdup(path); | 1491 | long_name = strdup(path); |
1439 | if (long_name == NULL) | 1492 | if (long_name == NULL) |
1440 | goto failure; | 1493 | goto failure; |
1441 | dso__set_long_name(map->dso, long_name); | 1494 | dso__set_long_name(map->dso, long_name); |
1442 | dso__kernel_module_get_build_id(map->dso); | 1495 | dso__kernel_module_get_build_id(map->dso, ""); |
1443 | } | 1496 | } |
1444 | } | 1497 | } |
1445 | 1498 | ||
@@ -1449,18 +1502,47 @@ failure: | |||
1449 | return -1; | 1502 | return -1; |
1450 | } | 1503 | } |
1451 | 1504 | ||
1452 | static int map_groups__set_modules_path(struct map_groups *self) | 1505 | static char *get_kernel_version(const char *root_dir) |
1453 | { | 1506 | { |
1454 | struct utsname uts; | 1507 | char version[PATH_MAX]; |
1508 | FILE *file; | ||
1509 | char *name, *tmp; | ||
1510 | const char *prefix = "Linux version "; | ||
1511 | |||
1512 | sprintf(version, "%s/proc/version", root_dir); | ||
1513 | file = fopen(version, "r"); | ||
1514 | if (!file) | ||
1515 | return NULL; | ||
1516 | |||
1517 | version[0] = '\0'; | ||
1518 | tmp = fgets(version, sizeof(version), file); | ||
1519 | fclose(file); | ||
1520 | |||
1521 | name = strstr(version, prefix); | ||
1522 | if (!name) | ||
1523 | return NULL; | ||
1524 | name += strlen(prefix); | ||
1525 | tmp = strchr(name, ' '); | ||
1526 | if (tmp) | ||
1527 | *tmp = '\0'; | ||
1528 | |||
1529 | return strdup(name); | ||
1530 | } | ||
1531 | |||
1532 | static int machine__set_modules_path(struct machine *self) | ||
1533 | { | ||
1534 | char *version; | ||
1455 | char modules_path[PATH_MAX]; | 1535 | char modules_path[PATH_MAX]; |
1456 | 1536 | ||
1457 | if (uname(&uts) < 0) | 1537 | version = get_kernel_version(self->root_dir); |
1538 | if (!version) | ||
1458 | return -1; | 1539 | return -1; |
1459 | 1540 | ||
1460 | snprintf(modules_path, sizeof(modules_path), "/lib/modules/%s/kernel", | 1541 | snprintf(modules_path, sizeof(modules_path), "%s/lib/modules/%s/kernel", |
1461 | uts.release); | 1542 | self->root_dir, version); |
1543 | free(version); | ||
1462 | 1544 | ||
1463 | return map_groups__set_modules_path_dir(self, modules_path); | 1545 | return map_groups__set_modules_path_dir(&self->kmaps, modules_path); |
1464 | } | 1546 | } |
1465 | 1547 | ||
1466 | /* | 1548 | /* |
@@ -1470,8 +1552,8 @@ static int map_groups__set_modules_path(struct map_groups *self) | |||
1470 | */ | 1552 | */ |
1471 | static struct map *map__new2(u64 start, struct dso *dso, enum map_type type) | 1553 | static struct map *map__new2(u64 start, struct dso *dso, enum map_type type) |
1472 | { | 1554 | { |
1473 | struct map *self = zalloc(sizeof(*self) + | 1555 | struct map *self = calloc(1, (sizeof(*self) + |
1474 | (dso->kernel ? sizeof(struct kmap) : 0)); | 1556 | (dso->kernel ? sizeof(struct kmap) : 0))); |
1475 | if (self != NULL) { | 1557 | if (self != NULL) { |
1476 | /* | 1558 | /* |
1477 | * ->end will be filled after we load all the symbols | 1559 | * ->end will be filled after we load all the symbols |
@@ -1482,11 +1564,11 @@ static struct map *map__new2(u64 start, struct dso *dso, enum map_type type) | |||
1482 | return self; | 1564 | return self; |
1483 | } | 1565 | } |
1484 | 1566 | ||
1485 | struct map *map_groups__new_module(struct map_groups *self, u64 start, | 1567 | struct map *machine__new_module(struct machine *self, u64 start, |
1486 | const char *filename) | 1568 | const char *filename) |
1487 | { | 1569 | { |
1488 | struct map *map; | 1570 | struct map *map; |
1489 | struct dso *dso = __dsos__findnew(&dsos__kernel, filename); | 1571 | struct dso *dso = __dsos__findnew(&self->kernel_dsos, filename); |
1490 | 1572 | ||
1491 | if (dso == NULL) | 1573 | if (dso == NULL) |
1492 | return NULL; | 1574 | return NULL; |
@@ -1495,18 +1577,31 @@ struct map *map_groups__new_module(struct map_groups *self, u64 start, | |||
1495 | if (map == NULL) | 1577 | if (map == NULL) |
1496 | return NULL; | 1578 | return NULL; |
1497 | 1579 | ||
1498 | dso->origin = DSO__ORIG_KMODULE; | 1580 | if (machine__is_host(self)) |
1499 | map_groups__insert(self, map); | 1581 | dso->origin = DSO__ORIG_KMODULE; |
1582 | else | ||
1583 | dso->origin = DSO__ORIG_GUEST_KMODULE; | ||
1584 | map_groups__insert(&self->kmaps, map); | ||
1500 | return map; | 1585 | return map; |
1501 | } | 1586 | } |
1502 | 1587 | ||
1503 | static int map_groups__create_modules(struct map_groups *self) | 1588 | static int machine__create_modules(struct machine *self) |
1504 | { | 1589 | { |
1505 | char *line = NULL; | 1590 | char *line = NULL; |
1506 | size_t n; | 1591 | size_t n; |
1507 | FILE *file = fopen("/proc/modules", "r"); | 1592 | FILE *file; |
1508 | struct map *map; | 1593 | struct map *map; |
1594 | const char *modules; | ||
1595 | char path[PATH_MAX]; | ||
1596 | |||
1597 | if (machine__is_default_guest(self)) | ||
1598 | modules = symbol_conf.default_guest_modules; | ||
1599 | else { | ||
1600 | sprintf(path, "%s/proc/modules", self->root_dir); | ||
1601 | modules = path; | ||
1602 | } | ||
1509 | 1603 | ||
1604 | file = fopen(modules, "r"); | ||
1510 | if (file == NULL) | 1605 | if (file == NULL) |
1511 | return -1; | 1606 | return -1; |
1512 | 1607 | ||
@@ -1538,16 +1633,16 @@ static int map_groups__create_modules(struct map_groups *self) | |||
1538 | *sep = '\0'; | 1633 | *sep = '\0'; |
1539 | 1634 | ||
1540 | snprintf(name, sizeof(name), "[%s]", line); | 1635 | snprintf(name, sizeof(name), "[%s]", line); |
1541 | map = map_groups__new_module(self, start, name); | 1636 | map = machine__new_module(self, start, name); |
1542 | if (map == NULL) | 1637 | if (map == NULL) |
1543 | goto out_delete_line; | 1638 | goto out_delete_line; |
1544 | dso__kernel_module_get_build_id(map->dso); | 1639 | dso__kernel_module_get_build_id(map->dso, self->root_dir); |
1545 | } | 1640 | } |
1546 | 1641 | ||
1547 | free(line); | 1642 | free(line); |
1548 | fclose(file); | 1643 | fclose(file); |
1549 | 1644 | ||
1550 | return map_groups__set_modules_path(self); | 1645 | return machine__set_modules_path(self); |
1551 | 1646 | ||
1552 | out_delete_line: | 1647 | out_delete_line: |
1553 | free(line); | 1648 | free(line); |
@@ -1714,8 +1809,56 @@ out_fixup: | |||
1714 | return err; | 1809 | return err; |
1715 | } | 1810 | } |
1716 | 1811 | ||
1717 | LIST_HEAD(dsos__user); | 1812 | static int dso__load_guest_kernel_sym(struct dso *self, struct map *map, |
1718 | LIST_HEAD(dsos__kernel); | 1813 | symbol_filter_t filter) |
1814 | { | ||
1815 | int err; | ||
1816 | const char *kallsyms_filename = NULL; | ||
1817 | struct machine *machine; | ||
1818 | char path[PATH_MAX]; | ||
1819 | |||
1820 | if (!map->groups) { | ||
1821 | pr_debug("Guest kernel map hasn't the point to groups\n"); | ||
1822 | return -1; | ||
1823 | } | ||
1824 | machine = map->groups->machine; | ||
1825 | |||
1826 | if (machine__is_default_guest(machine)) { | ||
1827 | /* | ||
1828 | * if the user specified a vmlinux filename, use it and only | ||
1829 | * it, reporting errors to the user if it cannot be used. | ||
1830 | * Or use file guest_kallsyms inputted by user on commandline | ||
1831 | */ | ||
1832 | if (symbol_conf.default_guest_vmlinux_name != NULL) { | ||
1833 | err = dso__load_vmlinux(self, map, | ||
1834 | symbol_conf.default_guest_vmlinux_name, filter); | ||
1835 | goto out_try_fixup; | ||
1836 | } | ||
1837 | |||
1838 | kallsyms_filename = symbol_conf.default_guest_kallsyms; | ||
1839 | if (!kallsyms_filename) | ||
1840 | return -1; | ||
1841 | } else { | ||
1842 | sprintf(path, "%s/proc/kallsyms", machine->root_dir); | ||
1843 | kallsyms_filename = path; | ||
1844 | } | ||
1845 | |||
1846 | err = dso__load_kallsyms(self, kallsyms_filename, map, filter); | ||
1847 | if (err > 0) | ||
1848 | pr_debug("Using %s for symbols\n", kallsyms_filename); | ||
1849 | |||
1850 | out_try_fixup: | ||
1851 | if (err > 0) { | ||
1852 | if (kallsyms_filename != NULL) { | ||
1853 | machine__mmap_name(machine, path, sizeof(path)); | ||
1854 | dso__set_long_name(self, strdup(path)); | ||
1855 | } | ||
1856 | map__fixup_start(map); | ||
1857 | map__fixup_end(map); | ||
1858 | } | ||
1859 | |||
1860 | return err; | ||
1861 | } | ||
1719 | 1862 | ||
1720 | static void dsos__add(struct list_head *head, struct dso *dso) | 1863 | static void dsos__add(struct list_head *head, struct dso *dso) |
1721 | { | 1864 | { |
@@ -1747,21 +1890,32 @@ struct dso *__dsos__findnew(struct list_head *head, const char *name) | |||
1747 | return dso; | 1890 | return dso; |
1748 | } | 1891 | } |
1749 | 1892 | ||
1750 | static void __dsos__fprintf(struct list_head *head, FILE *fp) | 1893 | size_t __dsos__fprintf(struct list_head *head, FILE *fp) |
1751 | { | 1894 | { |
1752 | struct dso *pos; | 1895 | struct dso *pos; |
1896 | size_t ret = 0; | ||
1753 | 1897 | ||
1754 | list_for_each_entry(pos, head, node) { | 1898 | list_for_each_entry(pos, head, node) { |
1755 | int i; | 1899 | int i; |
1756 | for (i = 0; i < MAP__NR_TYPES; ++i) | 1900 | for (i = 0; i < MAP__NR_TYPES; ++i) |
1757 | dso__fprintf(pos, i, fp); | 1901 | ret += dso__fprintf(pos, i, fp); |
1758 | } | 1902 | } |
1903 | |||
1904 | return ret; | ||
1759 | } | 1905 | } |
1760 | 1906 | ||
1761 | void dsos__fprintf(FILE *fp) | 1907 | size_t machines__fprintf_dsos(struct rb_root *self, FILE *fp) |
1762 | { | 1908 | { |
1763 | __dsos__fprintf(&dsos__kernel, fp); | 1909 | struct rb_node *nd; |
1764 | __dsos__fprintf(&dsos__user, fp); | 1910 | size_t ret = 0; |
1911 | |||
1912 | for (nd = rb_first(self); nd; nd = rb_next(nd)) { | ||
1913 | struct machine *pos = rb_entry(nd, struct machine, rb_node); | ||
1914 | ret += __dsos__fprintf(&pos->kernel_dsos, fp); | ||
1915 | ret += __dsos__fprintf(&pos->user_dsos, fp); | ||
1916 | } | ||
1917 | |||
1918 | return ret; | ||
1765 | } | 1919 | } |
1766 | 1920 | ||
1767 | static size_t __dsos__fprintf_buildid(struct list_head *head, FILE *fp, | 1921 | static size_t __dsos__fprintf_buildid(struct list_head *head, FILE *fp, |
@@ -1779,10 +1933,17 @@ static size_t __dsos__fprintf_buildid(struct list_head *head, FILE *fp, | |||
1779 | return ret; | 1933 | return ret; |
1780 | } | 1934 | } |
1781 | 1935 | ||
1782 | size_t dsos__fprintf_buildid(FILE *fp, bool with_hits) | 1936 | size_t machines__fprintf_dsos_buildid(struct rb_root *self, FILE *fp, bool with_hits) |
1783 | { | 1937 | { |
1784 | return (__dsos__fprintf_buildid(&dsos__kernel, fp, with_hits) + | 1938 | struct rb_node *nd; |
1785 | __dsos__fprintf_buildid(&dsos__user, fp, with_hits)); | 1939 | size_t ret = 0; |
1940 | |||
1941 | for (nd = rb_first(self); nd; nd = rb_next(nd)) { | ||
1942 | struct machine *pos = rb_entry(nd, struct machine, rb_node); | ||
1943 | ret += __dsos__fprintf_buildid(&pos->kernel_dsos, fp, with_hits); | ||
1944 | ret += __dsos__fprintf_buildid(&pos->user_dsos, fp, with_hits); | ||
1945 | } | ||
1946 | return ret; | ||
1786 | } | 1947 | } |
1787 | 1948 | ||
1788 | struct dso *dso__new_kernel(const char *name) | 1949 | struct dso *dso__new_kernel(const char *name) |
@@ -1791,55 +1952,98 @@ struct dso *dso__new_kernel(const char *name) | |||
1791 | 1952 | ||
1792 | if (self != NULL) { | 1953 | if (self != NULL) { |
1793 | dso__set_short_name(self, "[kernel]"); | 1954 | dso__set_short_name(self, "[kernel]"); |
1794 | self->kernel = 1; | 1955 | self->kernel = DSO_TYPE_KERNEL; |
1795 | } | 1956 | } |
1796 | 1957 | ||
1797 | return self; | 1958 | return self; |
1798 | } | 1959 | } |
1799 | 1960 | ||
1800 | void dso__read_running_kernel_build_id(struct dso *self) | 1961 | static struct dso *dso__new_guest_kernel(struct machine *machine, |
1962 | const char *name) | ||
1801 | { | 1963 | { |
1802 | if (sysfs__read_build_id("/sys/kernel/notes", self->build_id, | 1964 | char bf[PATH_MAX]; |
1965 | struct dso *self = dso__new(name ?: machine__mmap_name(machine, bf, sizeof(bf))); | ||
1966 | |||
1967 | if (self != NULL) { | ||
1968 | dso__set_short_name(self, "[guest.kernel]"); | ||
1969 | self->kernel = DSO_TYPE_GUEST_KERNEL; | ||
1970 | } | ||
1971 | |||
1972 | return self; | ||
1973 | } | ||
1974 | |||
1975 | void dso__read_running_kernel_build_id(struct dso *self, struct machine *machine) | ||
1976 | { | ||
1977 | char path[PATH_MAX]; | ||
1978 | |||
1979 | if (machine__is_default_guest(machine)) | ||
1980 | return; | ||
1981 | sprintf(path, "%s/sys/kernel/notes", machine->root_dir); | ||
1982 | if (sysfs__read_build_id(path, self->build_id, | ||
1803 | sizeof(self->build_id)) == 0) | 1983 | sizeof(self->build_id)) == 0) |
1804 | self->has_build_id = true; | 1984 | self->has_build_id = true; |
1805 | } | 1985 | } |
1806 | 1986 | ||
1807 | static struct dso *dsos__create_kernel(const char *vmlinux) | 1987 | static struct dso *machine__create_kernel(struct machine *self) |
1808 | { | 1988 | { |
1809 | struct dso *kernel = dso__new_kernel(vmlinux); | 1989 | const char *vmlinux_name = NULL; |
1990 | struct dso *kernel; | ||
1810 | 1991 | ||
1811 | if (kernel != NULL) { | 1992 | if (machine__is_host(self)) { |
1812 | dso__read_running_kernel_build_id(kernel); | 1993 | vmlinux_name = symbol_conf.vmlinux_name; |
1813 | dsos__add(&dsos__kernel, kernel); | 1994 | kernel = dso__new_kernel(vmlinux_name); |
1995 | } else { | ||
1996 | if (machine__is_default_guest(self)) | ||
1997 | vmlinux_name = symbol_conf.default_guest_vmlinux_name; | ||
1998 | kernel = dso__new_guest_kernel(self, vmlinux_name); | ||
1814 | } | 1999 | } |
1815 | 2000 | ||
2001 | if (kernel != NULL) { | ||
2002 | dso__read_running_kernel_build_id(kernel, self); | ||
2003 | dsos__add(&self->kernel_dsos, kernel); | ||
2004 | } | ||
1816 | return kernel; | 2005 | return kernel; |
1817 | } | 2006 | } |
1818 | 2007 | ||
1819 | int __map_groups__create_kernel_maps(struct map_groups *self, | 2008 | int __machine__create_kernel_maps(struct machine *self, struct dso *kernel) |
1820 | struct map *vmlinux_maps[MAP__NR_TYPES], | ||
1821 | struct dso *kernel) | ||
1822 | { | 2009 | { |
1823 | enum map_type type; | 2010 | enum map_type type; |
1824 | 2011 | ||
1825 | for (type = 0; type < MAP__NR_TYPES; ++type) { | 2012 | for (type = 0; type < MAP__NR_TYPES; ++type) { |
1826 | struct kmap *kmap; | 2013 | struct kmap *kmap; |
1827 | 2014 | ||
1828 | vmlinux_maps[type] = map__new2(0, kernel, type); | 2015 | self->vmlinux_maps[type] = map__new2(0, kernel, type); |
1829 | if (vmlinux_maps[type] == NULL) | 2016 | if (self->vmlinux_maps[type] == NULL) |
1830 | return -1; | 2017 | return -1; |
1831 | 2018 | ||
1832 | vmlinux_maps[type]->map_ip = | 2019 | self->vmlinux_maps[type]->map_ip = |
1833 | vmlinux_maps[type]->unmap_ip = identity__map_ip; | 2020 | self->vmlinux_maps[type]->unmap_ip = identity__map_ip; |
1834 | 2021 | ||
1835 | kmap = map__kmap(vmlinux_maps[type]); | 2022 | kmap = map__kmap(self->vmlinux_maps[type]); |
1836 | kmap->kmaps = self; | 2023 | kmap->kmaps = &self->kmaps; |
1837 | map_groups__insert(self, vmlinux_maps[type]); | 2024 | map_groups__insert(&self->kmaps, self->vmlinux_maps[type]); |
1838 | } | 2025 | } |
1839 | 2026 | ||
1840 | return 0; | 2027 | return 0; |
1841 | } | 2028 | } |
1842 | 2029 | ||
2030 | int machine__create_kernel_maps(struct machine *self) | ||
2031 | { | ||
2032 | struct dso *kernel = machine__create_kernel(self); | ||
2033 | |||
2034 | if (kernel == NULL || | ||
2035 | __machine__create_kernel_maps(self, kernel) < 0) | ||
2036 | return -1; | ||
2037 | |||
2038 | if (symbol_conf.use_modules && machine__create_modules(self) < 0) | ||
2039 | pr_debug("Problems creating module maps, continuing anyway...\n"); | ||
2040 | /* | ||
2041 | * Now that we have all the maps created, just set the ->end of them: | ||
2042 | */ | ||
2043 | map_groups__fixup_end(&self->kmaps); | ||
2044 | return 0; | ||
2045 | } | ||
2046 | |||
1843 | static void vmlinux_path__exit(void) | 2047 | static void vmlinux_path__exit(void) |
1844 | { | 2048 | { |
1845 | while (--vmlinux_path__nr_entries >= 0) { | 2049 | while (--vmlinux_path__nr_entries >= 0) { |
@@ -1895,6 +2099,17 @@ out_fail: | |||
1895 | return -1; | 2099 | return -1; |
1896 | } | 2100 | } |
1897 | 2101 | ||
2102 | size_t vmlinux_path__fprintf(FILE *fp) | ||
2103 | { | ||
2104 | int i; | ||
2105 | size_t printed = 0; | ||
2106 | |||
2107 | for (i = 0; i < vmlinux_path__nr_entries; ++i) | ||
2108 | printed += fprintf(fp, "[%d] %s\n", i, vmlinux_path[i]); | ||
2109 | |||
2110 | return printed; | ||
2111 | } | ||
2112 | |||
1898 | static int setup_list(struct strlist **list, const char *list_str, | 2113 | static int setup_list(struct strlist **list, const char *list_str, |
1899 | const char *list_name) | 2114 | const char *list_name) |
1900 | { | 2115 | { |
@@ -1945,22 +2160,129 @@ out_free_comm_list: | |||
1945 | return -1; | 2160 | return -1; |
1946 | } | 2161 | } |
1947 | 2162 | ||
1948 | int map_groups__create_kernel_maps(struct map_groups *self, | 2163 | int machines__create_kernel_maps(struct rb_root *self, pid_t pid) |
1949 | struct map *vmlinux_maps[MAP__NR_TYPES]) | ||
1950 | { | 2164 | { |
1951 | struct dso *kernel = dsos__create_kernel(symbol_conf.vmlinux_name); | 2165 | struct machine *machine = machines__findnew(self, pid); |
1952 | 2166 | ||
1953 | if (kernel == NULL) | 2167 | if (machine == NULL) |
1954 | return -1; | 2168 | return -1; |
1955 | 2169 | ||
1956 | if (__map_groups__create_kernel_maps(self, vmlinux_maps, kernel) < 0) | 2170 | return machine__create_kernel_maps(machine); |
1957 | return -1; | 2171 | } |
1958 | 2172 | ||
1959 | if (symbol_conf.use_modules && map_groups__create_modules(self) < 0) | 2173 | static int hex(char ch) |
1960 | pr_debug("Problems creating module maps, continuing anyway...\n"); | 2174 | { |
1961 | /* | 2175 | if ((ch >= '0') && (ch <= '9')) |
1962 | * Now that we have all the maps created, just set the ->end of them: | 2176 | return ch - '0'; |
1963 | */ | 2177 | if ((ch >= 'a') && (ch <= 'f')) |
1964 | map_groups__fixup_end(self); | 2178 | return ch - 'a' + 10; |
1965 | return 0; | 2179 | if ((ch >= 'A') && (ch <= 'F')) |
2180 | return ch - 'A' + 10; | ||
2181 | return -1; | ||
2182 | } | ||
2183 | |||
2184 | /* | ||
2185 | * While we find nice hex chars, build a long_val. | ||
2186 | * Return number of chars processed. | ||
2187 | */ | ||
2188 | int hex2u64(const char *ptr, u64 *long_val) | ||
2189 | { | ||
2190 | const char *p = ptr; | ||
2191 | *long_val = 0; | ||
2192 | |||
2193 | while (*p) { | ||
2194 | const int hex_val = hex(*p); | ||
2195 | |||
2196 | if (hex_val < 0) | ||
2197 | break; | ||
2198 | |||
2199 | *long_val = (*long_val << 4) | hex_val; | ||
2200 | p++; | ||
2201 | } | ||
2202 | |||
2203 | return p - ptr; | ||
2204 | } | ||
2205 | |||
2206 | char *strxfrchar(char *s, char from, char to) | ||
2207 | { | ||
2208 | char *p = s; | ||
2209 | |||
2210 | while ((p = strchr(p, from)) != NULL) | ||
2211 | *p++ = to; | ||
2212 | |||
2213 | return s; | ||
2214 | } | ||
2215 | |||
2216 | int machines__create_guest_kernel_maps(struct rb_root *self) | ||
2217 | { | ||
2218 | int ret = 0; | ||
2219 | struct dirent **namelist = NULL; | ||
2220 | int i, items = 0; | ||
2221 | char path[PATH_MAX]; | ||
2222 | pid_t pid; | ||
2223 | |||
2224 | if (symbol_conf.default_guest_vmlinux_name || | ||
2225 | symbol_conf.default_guest_modules || | ||
2226 | symbol_conf.default_guest_kallsyms) { | ||
2227 | machines__create_kernel_maps(self, DEFAULT_GUEST_KERNEL_ID); | ||
2228 | } | ||
2229 | |||
2230 | if (symbol_conf.guestmount) { | ||
2231 | items = scandir(symbol_conf.guestmount, &namelist, NULL, NULL); | ||
2232 | if (items <= 0) | ||
2233 | return -ENOENT; | ||
2234 | for (i = 0; i < items; i++) { | ||
2235 | if (!isdigit(namelist[i]->d_name[0])) { | ||
2236 | /* Filter out . and .. */ | ||
2237 | continue; | ||
2238 | } | ||
2239 | pid = atoi(namelist[i]->d_name); | ||
2240 | sprintf(path, "%s/%s/proc/kallsyms", | ||
2241 | symbol_conf.guestmount, | ||
2242 | namelist[i]->d_name); | ||
2243 | ret = access(path, R_OK); | ||
2244 | if (ret) { | ||
2245 | pr_debug("Can't access file %s\n", path); | ||
2246 | goto failure; | ||
2247 | } | ||
2248 | machines__create_kernel_maps(self, pid); | ||
2249 | } | ||
2250 | failure: | ||
2251 | free(namelist); | ||
2252 | } | ||
2253 | |||
2254 | return ret; | ||
2255 | } | ||
2256 | |||
2257 | int machine__load_kallsyms(struct machine *self, const char *filename, | ||
2258 | enum map_type type, symbol_filter_t filter) | ||
2259 | { | ||
2260 | struct map *map = self->vmlinux_maps[type]; | ||
2261 | int ret = dso__load_kallsyms(map->dso, filename, map, filter); | ||
2262 | |||
2263 | if (ret > 0) { | ||
2264 | dso__set_loaded(map->dso, type); | ||
2265 | /* | ||
2266 | * Since /proc/kallsyms will have multiple sessions for the | ||
2267 | * kernel, with modules between them, fixup the end of all | ||
2268 | * sections. | ||
2269 | */ | ||
2270 | __map_groups__fixup_end(&self->kmaps, type); | ||
2271 | } | ||
2272 | |||
2273 | return ret; | ||
2274 | } | ||
2275 | |||
2276 | int machine__load_vmlinux_path(struct machine *self, enum map_type type, | ||
2277 | symbol_filter_t filter) | ||
2278 | { | ||
2279 | struct map *map = self->vmlinux_maps[type]; | ||
2280 | int ret = dso__load_vmlinux_path(map->dso, map, filter); | ||
2281 | |||
2282 | if (ret > 0) { | ||
2283 | dso__set_loaded(map->dso, type); | ||
2284 | map__reloc_vmlinux(map); | ||
2285 | } | ||
2286 | |||
2287 | return ret; | ||
1966 | } | 2288 | } |
diff --git a/tools/perf/util/symbol.h b/tools/perf/util/symbol.h index f30a37428919..032469e41876 100644 --- a/tools/perf/util/symbol.h +++ b/tools/perf/util/symbol.h | |||
@@ -3,10 +3,11 @@ | |||
3 | 3 | ||
4 | #include <linux/types.h> | 4 | #include <linux/types.h> |
5 | #include <stdbool.h> | 5 | #include <stdbool.h> |
6 | #include "types.h" | 6 | #include <stdint.h> |
7 | #include "map.h" | ||
7 | #include <linux/list.h> | 8 | #include <linux/list.h> |
8 | #include <linux/rbtree.h> | 9 | #include <linux/rbtree.h> |
9 | #include "event.h" | 10 | #include <stdio.h> |
10 | 11 | ||
11 | #define DEBUG_CACHE_DIR ".debug" | 12 | #define DEBUG_CACHE_DIR ".debug" |
12 | 13 | ||
@@ -29,6 +30,9 @@ static inline char *bfd_demangle(void __used *v, const char __used *c, | |||
29 | #endif | 30 | #endif |
30 | #endif | 31 | #endif |
31 | 32 | ||
33 | int hex2u64(const char *ptr, u64 *val); | ||
34 | char *strxfrchar(char *s, char from, char to); | ||
35 | |||
32 | /* | 36 | /* |
33 | * libelf 0.8.x and earlier do not support ELF_C_READ_MMAP; | 37 | * libelf 0.8.x and earlier do not support ELF_C_READ_MMAP; |
34 | * for newer versions we can use mmap to reduce memory usage: | 38 | * for newer versions we can use mmap to reduce memory usage: |
@@ -44,10 +48,13 @@ static inline char *bfd_demangle(void __used *v, const char __used *c, | |||
44 | #define DMGL_ANSI (1 << 1) /* Include const, volatile, etc */ | 48 | #define DMGL_ANSI (1 << 1) /* Include const, volatile, etc */ |
45 | #endif | 49 | #endif |
46 | 50 | ||
51 | #define BUILD_ID_SIZE 20 | ||
52 | |||
47 | struct symbol { | 53 | struct symbol { |
48 | struct rb_node rb_node; | 54 | struct rb_node rb_node; |
49 | u64 start; | 55 | u64 start; |
50 | u64 end; | 56 | u64 end; |
57 | u16 namelen; | ||
51 | char name[0]; | 58 | char name[0]; |
52 | }; | 59 | }; |
53 | 60 | ||
@@ -63,10 +70,15 @@ struct symbol_conf { | |||
63 | show_nr_samples, | 70 | show_nr_samples, |
64 | use_callchain, | 71 | use_callchain, |
65 | exclude_other, | 72 | exclude_other, |
66 | full_paths; | 73 | full_paths, |
74 | show_cpu_utilization; | ||
67 | const char *vmlinux_name, | 75 | const char *vmlinux_name, |
68 | *field_sep; | 76 | *field_sep; |
69 | char *dso_list_str, | 77 | const char *default_guest_vmlinux_name, |
78 | *default_guest_kallsyms, | ||
79 | *default_guest_modules; | ||
80 | const char *guestmount; | ||
81 | const char *dso_list_str, | ||
70 | *comm_list_str, | 82 | *comm_list_str, |
71 | *sym_list_str, | 83 | *sym_list_str, |
72 | *col_width_list_str; | 84 | *col_width_list_str; |
@@ -88,6 +100,11 @@ struct ref_reloc_sym { | |||
88 | u64 unrelocated_addr; | 100 | u64 unrelocated_addr; |
89 | }; | 101 | }; |
90 | 102 | ||
103 | struct map_symbol { | ||
104 | struct map *map; | ||
105 | struct symbol *sym; | ||
106 | }; | ||
107 | |||
91 | struct addr_location { | 108 | struct addr_location { |
92 | struct thread *thread; | 109 | struct thread *thread; |
93 | struct map *map; | 110 | struct map *map; |
@@ -95,6 +112,13 @@ struct addr_location { | |||
95 | u64 addr; | 112 | u64 addr; |
96 | char level; | 113 | char level; |
97 | bool filtered; | 114 | bool filtered; |
115 | unsigned int cpumode; | ||
116 | }; | ||
117 | |||
118 | enum dso_kernel_type { | ||
119 | DSO_TYPE_USER = 0, | ||
120 | DSO_TYPE_KERNEL, | ||
121 | DSO_TYPE_GUEST_KERNEL | ||
98 | }; | 122 | }; |
99 | 123 | ||
100 | struct dso { | 124 | struct dso { |
@@ -104,8 +128,9 @@ struct dso { | |||
104 | u8 adjust_symbols:1; | 128 | u8 adjust_symbols:1; |
105 | u8 slen_calculated:1; | 129 | u8 slen_calculated:1; |
106 | u8 has_build_id:1; | 130 | u8 has_build_id:1; |
107 | u8 kernel:1; | 131 | enum dso_kernel_type kernel; |
108 | u8 hit:1; | 132 | u8 hit:1; |
133 | u8 annotate_warned:1; | ||
109 | unsigned char origin; | 134 | unsigned char origin; |
110 | u8 sorted_by_name; | 135 | u8 sorted_by_name; |
111 | u8 loaded; | 136 | u8 loaded; |
@@ -131,42 +156,65 @@ static inline void dso__set_loaded(struct dso *self, enum map_type type) | |||
131 | 156 | ||
132 | void dso__sort_by_name(struct dso *self, enum map_type type); | 157 | void dso__sort_by_name(struct dso *self, enum map_type type); |
133 | 158 | ||
134 | extern struct list_head dsos__user, dsos__kernel; | ||
135 | |||
136 | struct dso *__dsos__findnew(struct list_head *head, const char *name); | 159 | struct dso *__dsos__findnew(struct list_head *head, const char *name); |
137 | 160 | ||
138 | static inline struct dso *dsos__findnew(const char *name) | ||
139 | { | ||
140 | return __dsos__findnew(&dsos__user, name); | ||
141 | } | ||
142 | |||
143 | int dso__load(struct dso *self, struct map *map, symbol_filter_t filter); | 161 | int dso__load(struct dso *self, struct map *map, symbol_filter_t filter); |
144 | int dso__load_vmlinux_path(struct dso *self, struct map *map, | 162 | int dso__load_vmlinux_path(struct dso *self, struct map *map, |
145 | symbol_filter_t filter); | 163 | symbol_filter_t filter); |
146 | int dso__load_kallsyms(struct dso *self, const char *filename, struct map *map, | 164 | int dso__load_kallsyms(struct dso *self, const char *filename, struct map *map, |
147 | symbol_filter_t filter); | 165 | symbol_filter_t filter); |
148 | void dsos__fprintf(FILE *fp); | 166 | int machine__load_kallsyms(struct machine *self, const char *filename, |
149 | size_t dsos__fprintf_buildid(FILE *fp, bool with_hits); | 167 | enum map_type type, symbol_filter_t filter); |
168 | int machine__load_vmlinux_path(struct machine *self, enum map_type type, | ||
169 | symbol_filter_t filter); | ||
170 | |||
171 | size_t __dsos__fprintf(struct list_head *head, FILE *fp); | ||
172 | |||
173 | size_t machines__fprintf_dsos(struct rb_root *self, FILE *fp); | ||
174 | size_t machines__fprintf_dsos_buildid(struct rb_root *self, FILE *fp, bool with_hits); | ||
150 | 175 | ||
151 | size_t dso__fprintf_buildid(struct dso *self, FILE *fp); | 176 | size_t dso__fprintf_buildid(struct dso *self, FILE *fp); |
152 | size_t dso__fprintf(struct dso *self, enum map_type type, FILE *fp); | 177 | size_t dso__fprintf(struct dso *self, enum map_type type, FILE *fp); |
178 | |||
179 | enum dso_origin { | ||
180 | DSO__ORIG_KERNEL = 0, | ||
181 | DSO__ORIG_GUEST_KERNEL, | ||
182 | DSO__ORIG_JAVA_JIT, | ||
183 | DSO__ORIG_BUILD_ID_CACHE, | ||
184 | DSO__ORIG_FEDORA, | ||
185 | DSO__ORIG_UBUNTU, | ||
186 | DSO__ORIG_BUILDID, | ||
187 | DSO__ORIG_DSO, | ||
188 | DSO__ORIG_GUEST_KMODULE, | ||
189 | DSO__ORIG_KMODULE, | ||
190 | DSO__ORIG_NOT_FOUND, | ||
191 | }; | ||
192 | |||
153 | char dso__symtab_origin(const struct dso *self); | 193 | char dso__symtab_origin(const struct dso *self); |
154 | void dso__set_long_name(struct dso *self, char *name); | 194 | void dso__set_long_name(struct dso *self, char *name); |
155 | void dso__set_build_id(struct dso *self, void *build_id); | 195 | void dso__set_build_id(struct dso *self, void *build_id); |
156 | void dso__read_running_kernel_build_id(struct dso *self); | 196 | void dso__read_running_kernel_build_id(struct dso *self, struct machine *machine); |
157 | struct symbol *dso__find_symbol(struct dso *self, enum map_type type, u64 addr); | 197 | struct symbol *dso__find_symbol(struct dso *self, enum map_type type, u64 addr); |
158 | struct symbol *dso__find_symbol_by_name(struct dso *self, enum map_type type, | 198 | struct symbol *dso__find_symbol_by_name(struct dso *self, enum map_type type, |
159 | const char *name); | 199 | const char *name); |
160 | 200 | ||
161 | int filename__read_build_id(const char *filename, void *bf, size_t size); | 201 | int filename__read_build_id(const char *filename, void *bf, size_t size); |
162 | int sysfs__read_build_id(const char *filename, void *bf, size_t size); | 202 | int sysfs__read_build_id(const char *filename, void *bf, size_t size); |
163 | bool dsos__read_build_ids(bool with_hits); | 203 | bool __dsos__read_build_ids(struct list_head *head, bool with_hits); |
164 | int build_id__sprintf(const u8 *self, int len, char *bf); | 204 | int build_id__sprintf(const u8 *self, int len, char *bf); |
165 | int kallsyms__parse(const char *filename, void *arg, | 205 | int kallsyms__parse(const char *filename, void *arg, |
166 | int (*process_symbol)(void *arg, const char *name, | 206 | int (*process_symbol)(void *arg, const char *name, |
167 | char type, u64 start)); | 207 | char type, u64 start)); |
168 | 208 | ||
209 | int __machine__create_kernel_maps(struct machine *self, struct dso *kernel); | ||
210 | int machine__create_kernel_maps(struct machine *self); | ||
211 | |||
212 | int machines__create_kernel_maps(struct rb_root *self, pid_t pid); | ||
213 | int machines__create_guest_kernel_maps(struct rb_root *self); | ||
214 | |||
169 | int symbol__init(void); | 215 | int symbol__init(void); |
170 | bool symbol_type__is_a(char symbol_type, enum map_type map_type); | 216 | bool symbol_type__is_a(char symbol_type, enum map_type map_type); |
171 | 217 | ||
218 | size_t vmlinux_path__fprintf(FILE *fp); | ||
219 | |||
172 | #endif /* __PERF_SYMBOL */ | 220 | #endif /* __PERF_SYMBOL */ |
diff --git a/tools/perf/util/thread.c b/tools/perf/util/thread.c index fa968312ee7d..1f7ecd47f499 100644 --- a/tools/perf/util/thread.c +++ b/tools/perf/util/thread.c | |||
@@ -7,13 +7,35 @@ | |||
7 | #include "util.h" | 7 | #include "util.h" |
8 | #include "debug.h" | 8 | #include "debug.h" |
9 | 9 | ||
10 | void map_groups__init(struct map_groups *self) | 10 | int find_all_tid(int pid, pid_t ** all_tid) |
11 | { | 11 | { |
12 | char name[256]; | ||
13 | int items; | ||
14 | struct dirent **namelist = NULL; | ||
15 | int ret = 0; | ||
12 | int i; | 16 | int i; |
13 | for (i = 0; i < MAP__NR_TYPES; ++i) { | 17 | |
14 | self->maps[i] = RB_ROOT; | 18 | sprintf(name, "/proc/%d/task", pid); |
15 | INIT_LIST_HEAD(&self->removed_maps[i]); | 19 | items = scandir(name, &namelist, NULL, NULL); |
20 | if (items <= 0) | ||
21 | return -ENOENT; | ||
22 | *all_tid = malloc(sizeof(pid_t) * items); | ||
23 | if (!*all_tid) { | ||
24 | ret = -ENOMEM; | ||
25 | goto failure; | ||
16 | } | 26 | } |
27 | |||
28 | for (i = 0; i < items; i++) | ||
29 | (*all_tid)[i] = atoi(namelist[i]->d_name); | ||
30 | |||
31 | ret = items; | ||
32 | |||
33 | failure: | ||
34 | for (i=0; i<items; i++) | ||
35 | free(namelist[i]); | ||
36 | free(namelist); | ||
37 | |||
38 | return ret; | ||
17 | } | 39 | } |
18 | 40 | ||
19 | static struct thread *thread__new(pid_t pid) | 41 | static struct thread *thread__new(pid_t pid) |
@@ -31,28 +53,6 @@ static struct thread *thread__new(pid_t pid) | |||
31 | return self; | 53 | return self; |
32 | } | 54 | } |
33 | 55 | ||
34 | static void map_groups__flush(struct map_groups *self) | ||
35 | { | ||
36 | int type; | ||
37 | |||
38 | for (type = 0; type < MAP__NR_TYPES; type++) { | ||
39 | struct rb_root *root = &self->maps[type]; | ||
40 | struct rb_node *next = rb_first(root); | ||
41 | |||
42 | while (next) { | ||
43 | struct map *pos = rb_entry(next, struct map, rb_node); | ||
44 | next = rb_next(&pos->rb_node); | ||
45 | rb_erase(&pos->rb_node, root); | ||
46 | /* | ||
47 | * We may have references to this map, for | ||
48 | * instance in some hist_entry instances, so | ||
49 | * just move them to a separate list. | ||
50 | */ | ||
51 | list_add_tail(&pos->node, &self->removed_maps[pos->type]); | ||
52 | } | ||
53 | } | ||
54 | } | ||
55 | |||
56 | int thread__set_comm(struct thread *self, const char *comm) | 56 | int thread__set_comm(struct thread *self, const char *comm) |
57 | { | 57 | { |
58 | int err; | 58 | int err; |
@@ -79,69 +79,10 @@ int thread__comm_len(struct thread *self) | |||
79 | return self->comm_len; | 79 | return self->comm_len; |
80 | } | 80 | } |
81 | 81 | ||
82 | size_t __map_groups__fprintf_maps(struct map_groups *self, | ||
83 | enum map_type type, FILE *fp) | ||
84 | { | ||
85 | size_t printed = fprintf(fp, "%s:\n", map_type__name[type]); | ||
86 | struct rb_node *nd; | ||
87 | |||
88 | for (nd = rb_first(&self->maps[type]); nd; nd = rb_next(nd)) { | ||
89 | struct map *pos = rb_entry(nd, struct map, rb_node); | ||
90 | printed += fprintf(fp, "Map:"); | ||
91 | printed += map__fprintf(pos, fp); | ||
92 | if (verbose > 2) { | ||
93 | printed += dso__fprintf(pos->dso, type, fp); | ||
94 | printed += fprintf(fp, "--\n"); | ||
95 | } | ||
96 | } | ||
97 | |||
98 | return printed; | ||
99 | } | ||
100 | |||
101 | size_t map_groups__fprintf_maps(struct map_groups *self, FILE *fp) | ||
102 | { | ||
103 | size_t printed = 0, i; | ||
104 | for (i = 0; i < MAP__NR_TYPES; ++i) | ||
105 | printed += __map_groups__fprintf_maps(self, i, fp); | ||
106 | return printed; | ||
107 | } | ||
108 | |||
109 | static size_t __map_groups__fprintf_removed_maps(struct map_groups *self, | ||
110 | enum map_type type, FILE *fp) | ||
111 | { | ||
112 | struct map *pos; | ||
113 | size_t printed = 0; | ||
114 | |||
115 | list_for_each_entry(pos, &self->removed_maps[type], node) { | ||
116 | printed += fprintf(fp, "Map:"); | ||
117 | printed += map__fprintf(pos, fp); | ||
118 | if (verbose > 1) { | ||
119 | printed += dso__fprintf(pos->dso, type, fp); | ||
120 | printed += fprintf(fp, "--\n"); | ||
121 | } | ||
122 | } | ||
123 | return printed; | ||
124 | } | ||
125 | |||
126 | static size_t map_groups__fprintf_removed_maps(struct map_groups *self, FILE *fp) | ||
127 | { | ||
128 | size_t printed = 0, i; | ||
129 | for (i = 0; i < MAP__NR_TYPES; ++i) | ||
130 | printed += __map_groups__fprintf_removed_maps(self, i, fp); | ||
131 | return printed; | ||
132 | } | ||
133 | |||
134 | static size_t map_groups__fprintf(struct map_groups *self, FILE *fp) | ||
135 | { | ||
136 | size_t printed = map_groups__fprintf_maps(self, fp); | ||
137 | printed += fprintf(fp, "Removed maps:\n"); | ||
138 | return printed + map_groups__fprintf_removed_maps(self, fp); | ||
139 | } | ||
140 | |||
141 | static size_t thread__fprintf(struct thread *self, FILE *fp) | 82 | static size_t thread__fprintf(struct thread *self, FILE *fp) |
142 | { | 83 | { |
143 | return fprintf(fp, "Thread %d %s\n", self->pid, self->comm) + | 84 | return fprintf(fp, "Thread %d %s\n", self->pid, self->comm) + |
144 | map_groups__fprintf(&self->mg, fp); | 85 | map_groups__fprintf(&self->mg, verbose, fp); |
145 | } | 86 | } |
146 | 87 | ||
147 | struct thread *perf_session__findnew(struct perf_session *self, pid_t pid) | 88 | struct thread *perf_session__findnew(struct perf_session *self, pid_t pid) |
@@ -183,127 +124,12 @@ struct thread *perf_session__findnew(struct perf_session *self, pid_t pid) | |||
183 | return th; | 124 | return th; |
184 | } | 125 | } |
185 | 126 | ||
186 | static int map_groups__fixup_overlappings(struct map_groups *self, | ||
187 | struct map *map) | ||
188 | { | ||
189 | struct rb_root *root = &self->maps[map->type]; | ||
190 | struct rb_node *next = rb_first(root); | ||
191 | |||
192 | while (next) { | ||
193 | struct map *pos = rb_entry(next, struct map, rb_node); | ||
194 | next = rb_next(&pos->rb_node); | ||
195 | |||
196 | if (!map__overlap(pos, map)) | ||
197 | continue; | ||
198 | |||
199 | if (verbose >= 2) { | ||
200 | fputs("overlapping maps:\n", stderr); | ||
201 | map__fprintf(map, stderr); | ||
202 | map__fprintf(pos, stderr); | ||
203 | } | ||
204 | |||
205 | rb_erase(&pos->rb_node, root); | ||
206 | /* | ||
207 | * We may have references to this map, for instance in some | ||
208 | * hist_entry instances, so just move them to a separate | ||
209 | * list. | ||
210 | */ | ||
211 | list_add_tail(&pos->node, &self->removed_maps[map->type]); | ||
212 | /* | ||
213 | * Now check if we need to create new maps for areas not | ||
214 | * overlapped by the new map: | ||
215 | */ | ||
216 | if (map->start > pos->start) { | ||
217 | struct map *before = map__clone(pos); | ||
218 | |||
219 | if (before == NULL) | ||
220 | return -ENOMEM; | ||
221 | |||
222 | before->end = map->start - 1; | ||
223 | map_groups__insert(self, before); | ||
224 | if (verbose >= 2) | ||
225 | map__fprintf(before, stderr); | ||
226 | } | ||
227 | |||
228 | if (map->end < pos->end) { | ||
229 | struct map *after = map__clone(pos); | ||
230 | |||
231 | if (after == NULL) | ||
232 | return -ENOMEM; | ||
233 | |||
234 | after->start = map->end + 1; | ||
235 | map_groups__insert(self, after); | ||
236 | if (verbose >= 2) | ||
237 | map__fprintf(after, stderr); | ||
238 | } | ||
239 | } | ||
240 | |||
241 | return 0; | ||
242 | } | ||
243 | |||
244 | void maps__insert(struct rb_root *maps, struct map *map) | ||
245 | { | ||
246 | struct rb_node **p = &maps->rb_node; | ||
247 | struct rb_node *parent = NULL; | ||
248 | const u64 ip = map->start; | ||
249 | struct map *m; | ||
250 | |||
251 | while (*p != NULL) { | ||
252 | parent = *p; | ||
253 | m = rb_entry(parent, struct map, rb_node); | ||
254 | if (ip < m->start) | ||
255 | p = &(*p)->rb_left; | ||
256 | else | ||
257 | p = &(*p)->rb_right; | ||
258 | } | ||
259 | |||
260 | rb_link_node(&map->rb_node, parent, p); | ||
261 | rb_insert_color(&map->rb_node, maps); | ||
262 | } | ||
263 | |||
264 | struct map *maps__find(struct rb_root *maps, u64 ip) | ||
265 | { | ||
266 | struct rb_node **p = &maps->rb_node; | ||
267 | struct rb_node *parent = NULL; | ||
268 | struct map *m; | ||
269 | |||
270 | while (*p != NULL) { | ||
271 | parent = *p; | ||
272 | m = rb_entry(parent, struct map, rb_node); | ||
273 | if (ip < m->start) | ||
274 | p = &(*p)->rb_left; | ||
275 | else if (ip > m->end) | ||
276 | p = &(*p)->rb_right; | ||
277 | else | ||
278 | return m; | ||
279 | } | ||
280 | |||
281 | return NULL; | ||
282 | } | ||
283 | |||
284 | void thread__insert_map(struct thread *self, struct map *map) | 127 | void thread__insert_map(struct thread *self, struct map *map) |
285 | { | 128 | { |
286 | map_groups__fixup_overlappings(&self->mg, map); | 129 | map_groups__fixup_overlappings(&self->mg, map, verbose, stderr); |
287 | map_groups__insert(&self->mg, map); | 130 | map_groups__insert(&self->mg, map); |
288 | } | 131 | } |
289 | 132 | ||
290 | /* | ||
291 | * XXX This should not really _copy_ te maps, but refcount them. | ||
292 | */ | ||
293 | static int map_groups__clone(struct map_groups *self, | ||
294 | struct map_groups *parent, enum map_type type) | ||
295 | { | ||
296 | struct rb_node *nd; | ||
297 | for (nd = rb_first(&parent->maps[type]); nd; nd = rb_next(nd)) { | ||
298 | struct map *map = rb_entry(nd, struct map, rb_node); | ||
299 | struct map *new = map__clone(map); | ||
300 | if (new == NULL) | ||
301 | return -ENOMEM; | ||
302 | map_groups__insert(self, new); | ||
303 | } | ||
304 | return 0; | ||
305 | } | ||
306 | |||
307 | int thread__fork(struct thread *self, struct thread *parent) | 133 | int thread__fork(struct thread *self, struct thread *parent) |
308 | { | 134 | { |
309 | int i; | 135 | int i; |
@@ -336,15 +162,3 @@ size_t perf_session__fprintf(struct perf_session *self, FILE *fp) | |||
336 | 162 | ||
337 | return ret; | 163 | return ret; |
338 | } | 164 | } |
339 | |||
340 | struct symbol *map_groups__find_symbol(struct map_groups *self, | ||
341 | enum map_type type, u64 addr, | ||
342 | symbol_filter_t filter) | ||
343 | { | ||
344 | struct map *map = map_groups__find(self, type, addr); | ||
345 | |||
346 | if (map != NULL) | ||
347 | return map__find_symbol(map, map->map_ip(map, addr), filter); | ||
348 | |||
349 | return NULL; | ||
350 | } | ||
diff --git a/tools/perf/util/thread.h b/tools/perf/util/thread.h index dcf70303e58e..1dfd9ff8bdcd 100644 --- a/tools/perf/util/thread.h +++ b/tools/perf/util/thread.h | |||
@@ -5,14 +5,6 @@ | |||
5 | #include <unistd.h> | 5 | #include <unistd.h> |
6 | #include "symbol.h" | 6 | #include "symbol.h" |
7 | 7 | ||
8 | struct map_groups { | ||
9 | struct rb_root maps[MAP__NR_TYPES]; | ||
10 | struct list_head removed_maps[MAP__NR_TYPES]; | ||
11 | }; | ||
12 | |||
13 | size_t __map_groups__fprintf_maps(struct map_groups *self, | ||
14 | enum map_type type, FILE *fp); | ||
15 | |||
16 | struct thread { | 8 | struct thread { |
17 | struct rb_node rb_node; | 9 | struct rb_node rb_node; |
18 | struct map_groups mg; | 10 | struct map_groups mg; |
@@ -23,29 +15,16 @@ struct thread { | |||
23 | int comm_len; | 15 | int comm_len; |
24 | }; | 16 | }; |
25 | 17 | ||
26 | void map_groups__init(struct map_groups *self); | 18 | struct perf_session; |
19 | |||
20 | int find_all_tid(int pid, pid_t ** all_tid); | ||
27 | int thread__set_comm(struct thread *self, const char *comm); | 21 | int thread__set_comm(struct thread *self, const char *comm); |
28 | int thread__comm_len(struct thread *self); | 22 | int thread__comm_len(struct thread *self); |
29 | struct thread *perf_session__findnew(struct perf_session *self, pid_t pid); | 23 | struct thread *perf_session__findnew(struct perf_session *self, pid_t pid); |
30 | void thread__insert_map(struct thread *self, struct map *map); | 24 | void thread__insert_map(struct thread *self, struct map *map); |
31 | int thread__fork(struct thread *self, struct thread *parent); | 25 | int thread__fork(struct thread *self, struct thread *parent); |
32 | size_t map_groups__fprintf_maps(struct map_groups *self, FILE *fp); | ||
33 | size_t perf_session__fprintf(struct perf_session *self, FILE *fp); | 26 | size_t perf_session__fprintf(struct perf_session *self, FILE *fp); |
34 | 27 | ||
35 | void maps__insert(struct rb_root *maps, struct map *map); | ||
36 | struct map *maps__find(struct rb_root *maps, u64 addr); | ||
37 | |||
38 | static inline void map_groups__insert(struct map_groups *self, struct map *map) | ||
39 | { | ||
40 | maps__insert(&self->maps[map->type], map); | ||
41 | } | ||
42 | |||
43 | static inline struct map *map_groups__find(struct map_groups *self, | ||
44 | enum map_type type, u64 addr) | ||
45 | { | ||
46 | return maps__find(&self->maps[type], addr); | ||
47 | } | ||
48 | |||
49 | static inline struct map *thread__find_map(struct thread *self, | 28 | static inline struct map *thread__find_map(struct thread *self, |
50 | enum map_type type, u64 addr) | 29 | enum map_type type, u64 addr) |
51 | { | 30 | { |
@@ -54,34 +33,12 @@ static inline struct map *thread__find_map(struct thread *self, | |||
54 | 33 | ||
55 | void thread__find_addr_map(struct thread *self, | 34 | void thread__find_addr_map(struct thread *self, |
56 | struct perf_session *session, u8 cpumode, | 35 | struct perf_session *session, u8 cpumode, |
57 | enum map_type type, u64 addr, | 36 | enum map_type type, pid_t pid, u64 addr, |
58 | struct addr_location *al); | 37 | struct addr_location *al); |
59 | 38 | ||
60 | void thread__find_addr_location(struct thread *self, | 39 | void thread__find_addr_location(struct thread *self, |
61 | struct perf_session *session, u8 cpumode, | 40 | struct perf_session *session, u8 cpumode, |
62 | enum map_type type, u64 addr, | 41 | enum map_type type, pid_t pid, u64 addr, |
63 | struct addr_location *al, | 42 | struct addr_location *al, |
64 | symbol_filter_t filter); | 43 | symbol_filter_t filter); |
65 | struct symbol *map_groups__find_symbol(struct map_groups *self, | ||
66 | enum map_type type, u64 addr, | ||
67 | symbol_filter_t filter); | ||
68 | |||
69 | static inline struct symbol *map_groups__find_function(struct map_groups *self, | ||
70 | u64 addr, | ||
71 | symbol_filter_t filter) | ||
72 | { | ||
73 | return map_groups__find_symbol(self, MAP__FUNCTION, addr, filter); | ||
74 | } | ||
75 | |||
76 | struct map *map_groups__find_by_name(struct map_groups *self, | ||
77 | enum map_type type, const char *name); | ||
78 | |||
79 | int __map_groups__create_kernel_maps(struct map_groups *self, | ||
80 | struct map *vmlinux_maps[MAP__NR_TYPES], | ||
81 | struct dso *kernel); | ||
82 | int map_groups__create_kernel_maps(struct map_groups *self, | ||
83 | struct map *vmlinux_maps[MAP__NR_TYPES]); | ||
84 | |||
85 | struct map *map_groups__new_module(struct map_groups *self, u64 start, | ||
86 | const char *filename); | ||
87 | #endif /* __PERF_THREAD_H */ | 44 | #endif /* __PERF_THREAD_H */ |
diff --git a/tools/perf/util/trace-event-info.c b/tools/perf/util/trace-event-info.c index 5ea8973ad331..b1572601286c 100644 --- a/tools/perf/util/trace-event-info.c +++ b/tools/perf/util/trace-event-info.c | |||
@@ -154,10 +154,17 @@ static void put_tracing_file(char *file) | |||
154 | free(file); | 154 | free(file); |
155 | } | 155 | } |
156 | 156 | ||
157 | static ssize_t calc_data_size; | ||
158 | |||
157 | static ssize_t write_or_die(const void *buf, size_t len) | 159 | static ssize_t write_or_die(const void *buf, size_t len) |
158 | { | 160 | { |
159 | int ret; | 161 | int ret; |
160 | 162 | ||
163 | if (calc_data_size) { | ||
164 | calc_data_size += len; | ||
165 | return len; | ||
166 | } | ||
167 | |||
161 | ret = write(output_fd, buf, len); | 168 | ret = write(output_fd, buf, len); |
162 | if (ret < 0) | 169 | if (ret < 0) |
163 | die("writing to '%s'", output_file); | 170 | die("writing to '%s'", output_file); |
@@ -480,6 +487,17 @@ get_tracepoints_path(struct perf_event_attr *pattrs, int nb_events) | |||
480 | return nr_tracepoints > 0 ? path.next : NULL; | 487 | return nr_tracepoints > 0 ? path.next : NULL; |
481 | } | 488 | } |
482 | 489 | ||
490 | bool have_tracepoints(struct perf_event_attr *pattrs, int nb_events) | ||
491 | { | ||
492 | int i; | ||
493 | |||
494 | for (i = 0; i < nb_events; i++) | ||
495 | if (pattrs[i].type == PERF_TYPE_TRACEPOINT) | ||
496 | return true; | ||
497 | |||
498 | return false; | ||
499 | } | ||
500 | |||
483 | int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events) | 501 | int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events) |
484 | { | 502 | { |
485 | char buf[BUFSIZ]; | 503 | char buf[BUFSIZ]; |
@@ -526,3 +544,20 @@ int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events) | |||
526 | 544 | ||
527 | return 0; | 545 | return 0; |
528 | } | 546 | } |
547 | |||
548 | ssize_t read_tracing_data_size(int fd, struct perf_event_attr *pattrs, | ||
549 | int nb_events) | ||
550 | { | ||
551 | ssize_t size; | ||
552 | int err = 0; | ||
553 | |||
554 | calc_data_size = 1; | ||
555 | err = read_tracing_data(fd, pattrs, nb_events); | ||
556 | size = calc_data_size - 1; | ||
557 | calc_data_size = 0; | ||
558 | |||
559 | if (err < 0) | ||
560 | return err; | ||
561 | |||
562 | return size; | ||
563 | } | ||
diff --git a/tools/perf/util/trace-event-parse.c b/tools/perf/util/trace-event-parse.c index 613c9cc90570..73a02223c629 100644 --- a/tools/perf/util/trace-event-parse.c +++ b/tools/perf/util/trace-event-parse.c | |||
@@ -37,10 +37,12 @@ int header_page_ts_offset; | |||
37 | int header_page_ts_size; | 37 | int header_page_ts_size; |
38 | int header_page_size_offset; | 38 | int header_page_size_offset; |
39 | int header_page_size_size; | 39 | int header_page_size_size; |
40 | int header_page_overwrite_offset; | ||
41 | int header_page_overwrite_size; | ||
40 | int header_page_data_offset; | 42 | int header_page_data_offset; |
41 | int header_page_data_size; | 43 | int header_page_data_size; |
42 | 44 | ||
43 | int latency_format; | 45 | bool latency_format; |
44 | 46 | ||
45 | static char *input_buf; | 47 | static char *input_buf; |
46 | static unsigned long long input_buf_ptr; | 48 | static unsigned long long input_buf_ptr; |
@@ -628,23 +630,32 @@ static int test_type(enum event_type type, enum event_type expect) | |||
628 | return 0; | 630 | return 0; |
629 | } | 631 | } |
630 | 632 | ||
631 | static int test_type_token(enum event_type type, char *token, | 633 | static int __test_type_token(enum event_type type, char *token, |
632 | enum event_type expect, const char *expect_tok) | 634 | enum event_type expect, const char *expect_tok, |
635 | bool warn) | ||
633 | { | 636 | { |
634 | if (type != expect) { | 637 | if (type != expect) { |
635 | warning("Error: expected type %d but read %d", | 638 | if (warn) |
636 | expect, type); | 639 | warning("Error: expected type %d but read %d", |
640 | expect, type); | ||
637 | return -1; | 641 | return -1; |
638 | } | 642 | } |
639 | 643 | ||
640 | if (strcmp(token, expect_tok) != 0) { | 644 | if (strcmp(token, expect_tok) != 0) { |
641 | warning("Error: expected '%s' but read '%s'", | 645 | if (warn) |
642 | expect_tok, token); | 646 | warning("Error: expected '%s' but read '%s'", |
647 | expect_tok, token); | ||
643 | return -1; | 648 | return -1; |
644 | } | 649 | } |
645 | return 0; | 650 | return 0; |
646 | } | 651 | } |
647 | 652 | ||
653 | static int test_type_token(enum event_type type, char *token, | ||
654 | enum event_type expect, const char *expect_tok) | ||
655 | { | ||
656 | return __test_type_token(type, token, expect, expect_tok, true); | ||
657 | } | ||
658 | |||
648 | static int __read_expect_type(enum event_type expect, char **tok, int newline_ok) | 659 | static int __read_expect_type(enum event_type expect, char **tok, int newline_ok) |
649 | { | 660 | { |
650 | enum event_type type; | 661 | enum event_type type; |
@@ -661,7 +672,8 @@ static int read_expect_type(enum event_type expect, char **tok) | |||
661 | return __read_expect_type(expect, tok, 1); | 672 | return __read_expect_type(expect, tok, 1); |
662 | } | 673 | } |
663 | 674 | ||
664 | static int __read_expected(enum event_type expect, const char *str, int newline_ok) | 675 | static int __read_expected(enum event_type expect, const char *str, |
676 | int newline_ok, bool warn) | ||
665 | { | 677 | { |
666 | enum event_type type; | 678 | enum event_type type; |
667 | char *token; | 679 | char *token; |
@@ -672,7 +684,7 @@ static int __read_expected(enum event_type expect, const char *str, int newline_ | |||
672 | else | 684 | else |
673 | type = read_token_item(&token); | 685 | type = read_token_item(&token); |
674 | 686 | ||
675 | ret = test_type_token(type, token, expect, str); | 687 | ret = __test_type_token(type, token, expect, str, warn); |
676 | 688 | ||
677 | free_token(token); | 689 | free_token(token); |
678 | 690 | ||
@@ -681,12 +693,12 @@ static int __read_expected(enum event_type expect, const char *str, int newline_ | |||
681 | 693 | ||
682 | static int read_expected(enum event_type expect, const char *str) | 694 | static int read_expected(enum event_type expect, const char *str) |
683 | { | 695 | { |
684 | return __read_expected(expect, str, 1); | 696 | return __read_expected(expect, str, 1, true); |
685 | } | 697 | } |
686 | 698 | ||
687 | static int read_expected_item(enum event_type expect, const char *str) | 699 | static int read_expected_item(enum event_type expect, const char *str) |
688 | { | 700 | { |
689 | return __read_expected(expect, str, 0); | 701 | return __read_expected(expect, str, 0, true); |
690 | } | 702 | } |
691 | 703 | ||
692 | static char *event_read_name(void) | 704 | static char *event_read_name(void) |
@@ -744,7 +756,7 @@ static int field_is_string(struct format_field *field) | |||
744 | 756 | ||
745 | static int field_is_dynamic(struct format_field *field) | 757 | static int field_is_dynamic(struct format_field *field) |
746 | { | 758 | { |
747 | if (!strcmp(field->type, "__data_loc")) | 759 | if (!strncmp(field->type, "__data_loc", 10)) |
748 | return 1; | 760 | return 1; |
749 | 761 | ||
750 | return 0; | 762 | return 0; |
@@ -3087,88 +3099,6 @@ static void print_args(struct print_arg *args) | |||
3087 | } | 3099 | } |
3088 | } | 3100 | } |
3089 | 3101 | ||
3090 | static void parse_header_field(const char *field, | ||
3091 | int *offset, int *size) | ||
3092 | { | ||
3093 | char *token; | ||
3094 | int type; | ||
3095 | |||
3096 | if (read_expected(EVENT_ITEM, "field") < 0) | ||
3097 | return; | ||
3098 | if (read_expected(EVENT_OP, ":") < 0) | ||
3099 | return; | ||
3100 | |||
3101 | /* type */ | ||
3102 | if (read_expect_type(EVENT_ITEM, &token) < 0) | ||
3103 | goto fail; | ||
3104 | free_token(token); | ||
3105 | |||
3106 | if (read_expected(EVENT_ITEM, field) < 0) | ||
3107 | return; | ||
3108 | if (read_expected(EVENT_OP, ";") < 0) | ||
3109 | return; | ||
3110 | if (read_expected(EVENT_ITEM, "offset") < 0) | ||
3111 | return; | ||
3112 | if (read_expected(EVENT_OP, ":") < 0) | ||
3113 | return; | ||
3114 | if (read_expect_type(EVENT_ITEM, &token) < 0) | ||
3115 | goto fail; | ||
3116 | *offset = atoi(token); | ||
3117 | free_token(token); | ||
3118 | if (read_expected(EVENT_OP, ";") < 0) | ||
3119 | return; | ||
3120 | if (read_expected(EVENT_ITEM, "size") < 0) | ||
3121 | return; | ||
3122 | if (read_expected(EVENT_OP, ":") < 0) | ||
3123 | return; | ||
3124 | if (read_expect_type(EVENT_ITEM, &token) < 0) | ||
3125 | goto fail; | ||
3126 | *size = atoi(token); | ||
3127 | free_token(token); | ||
3128 | if (read_expected(EVENT_OP, ";") < 0) | ||
3129 | return; | ||
3130 | type = read_token(&token); | ||
3131 | if (type != EVENT_NEWLINE) { | ||
3132 | /* newer versions of the kernel have a "signed" type */ | ||
3133 | if (type != EVENT_ITEM) | ||
3134 | goto fail; | ||
3135 | |||
3136 | if (strcmp(token, "signed") != 0) | ||
3137 | goto fail; | ||
3138 | |||
3139 | free_token(token); | ||
3140 | |||
3141 | if (read_expected(EVENT_OP, ":") < 0) | ||
3142 | return; | ||
3143 | |||
3144 | if (read_expect_type(EVENT_ITEM, &token)) | ||
3145 | goto fail; | ||
3146 | |||
3147 | free_token(token); | ||
3148 | if (read_expected(EVENT_OP, ";") < 0) | ||
3149 | return; | ||
3150 | |||
3151 | if (read_expect_type(EVENT_NEWLINE, &token)) | ||
3152 | goto fail; | ||
3153 | } | ||
3154 | fail: | ||
3155 | free_token(token); | ||
3156 | } | ||
3157 | |||
3158 | int parse_header_page(char *buf, unsigned long size) | ||
3159 | { | ||
3160 | init_input_buf(buf, size); | ||
3161 | |||
3162 | parse_header_field("timestamp", &header_page_ts_offset, | ||
3163 | &header_page_ts_size); | ||
3164 | parse_header_field("commit", &header_page_size_offset, | ||
3165 | &header_page_size_size); | ||
3166 | parse_header_field("data", &header_page_data_offset, | ||
3167 | &header_page_data_size); | ||
3168 | |||
3169 | return 0; | ||
3170 | } | ||
3171 | |||
3172 | int parse_ftrace_file(char *buf, unsigned long size) | 3102 | int parse_ftrace_file(char *buf, unsigned long size) |
3173 | { | 3103 | { |
3174 | struct format_field *field; | 3104 | struct format_field *field; |
diff --git a/tools/perf/util/trace-event-read.c b/tools/perf/util/trace-event-read.c index 7cd1193918c7..cb54cd002f49 100644 --- a/tools/perf/util/trace-event-read.c +++ b/tools/perf/util/trace-event-read.c | |||
@@ -50,14 +50,51 @@ static int long_size; | |||
50 | 50 | ||
51 | static unsigned long page_size; | 51 | static unsigned long page_size; |
52 | 52 | ||
53 | static ssize_t calc_data_size; | ||
54 | static bool repipe; | ||
55 | |||
56 | /* If it fails, the next read will report it */ | ||
57 | static void skip(int size) | ||
58 | { | ||
59 | lseek(input_fd, size, SEEK_CUR); | ||
60 | } | ||
61 | |||
62 | static int do_read(int fd, void *buf, int size) | ||
63 | { | ||
64 | int rsize = size; | ||
65 | |||
66 | while (size) { | ||
67 | int ret = read(fd, buf, size); | ||
68 | |||
69 | if (ret <= 0) | ||
70 | return -1; | ||
71 | |||
72 | if (repipe) { | ||
73 | int retw = write(STDOUT_FILENO, buf, ret); | ||
74 | |||
75 | if (retw <= 0 || retw != ret) | ||
76 | die("repiping input file"); | ||
77 | } | ||
78 | |||
79 | size -= ret; | ||
80 | buf += ret; | ||
81 | } | ||
82 | |||
83 | return rsize; | ||
84 | } | ||
85 | |||
53 | static int read_or_die(void *data, int size) | 86 | static int read_or_die(void *data, int size) |
54 | { | 87 | { |
55 | int r; | 88 | int r; |
56 | 89 | ||
57 | r = read(input_fd, data, size); | 90 | r = do_read(input_fd, data, size); |
58 | if (r != size) | 91 | if (r <= 0) |
59 | die("reading input file (size expected=%d received=%d)", | 92 | die("reading input file (size expected=%d received=%d)", |
60 | size, r); | 93 | size, r); |
94 | |||
95 | if (calc_data_size) | ||
96 | calc_data_size += r; | ||
97 | |||
61 | return r; | 98 | return r; |
62 | } | 99 | } |
63 | 100 | ||
@@ -82,57 +119,36 @@ static char *read_string(void) | |||
82 | char buf[BUFSIZ]; | 119 | char buf[BUFSIZ]; |
83 | char *str = NULL; | 120 | char *str = NULL; |
84 | int size = 0; | 121 | int size = 0; |
85 | int i; | ||
86 | off_t r; | 122 | off_t r; |
123 | char c; | ||
87 | 124 | ||
88 | for (;;) { | 125 | for (;;) { |
89 | r = read(input_fd, buf, BUFSIZ); | 126 | r = read(input_fd, &c, 1); |
90 | if (r < 0) | 127 | if (r < 0) |
91 | die("reading input file"); | 128 | die("reading input file"); |
92 | 129 | ||
93 | if (!r) | 130 | if (!r) |
94 | die("no data"); | 131 | die("no data"); |
95 | 132 | ||
96 | for (i = 0; i < r; i++) { | 133 | if (repipe) { |
97 | if (!buf[i]) | 134 | int retw = write(STDOUT_FILENO, &c, 1); |
98 | break; | ||
99 | } | ||
100 | if (i < r) | ||
101 | break; | ||
102 | 135 | ||
103 | if (str) { | 136 | if (retw <= 0 || retw != r) |
104 | size += BUFSIZ; | 137 | die("repiping input file string"); |
105 | str = realloc(str, size); | ||
106 | if (!str) | ||
107 | die("malloc of size %d", size); | ||
108 | memcpy(str + (size - BUFSIZ), buf, BUFSIZ); | ||
109 | } else { | ||
110 | size = BUFSIZ; | ||
111 | str = malloc_or_die(size); | ||
112 | memcpy(str, buf, size); | ||
113 | } | 138 | } |
114 | } | ||
115 | 139 | ||
116 | /* trailing \0: */ | 140 | buf[size++] = c; |
117 | i++; | 141 | |
118 | 142 | if (!c) | |
119 | /* move the file descriptor to the end of the string */ | 143 | break; |
120 | r = lseek(input_fd, -(r - i), SEEK_CUR); | ||
121 | if (r == (off_t)-1) | ||
122 | die("lseek"); | ||
123 | |||
124 | if (str) { | ||
125 | size += i; | ||
126 | str = realloc(str, size); | ||
127 | if (!str) | ||
128 | die("malloc of size %d", size); | ||
129 | memcpy(str + (size - i), buf, i); | ||
130 | } else { | ||
131 | size = i; | ||
132 | str = malloc_or_die(i); | ||
133 | memcpy(str, buf, i); | ||
134 | } | 144 | } |
135 | 145 | ||
146 | if (calc_data_size) | ||
147 | calc_data_size += size; | ||
148 | |||
149 | str = malloc_or_die(size); | ||
150 | memcpy(str, buf, size); | ||
151 | |||
136 | return str; | 152 | return str; |
137 | } | 153 | } |
138 | 154 | ||
@@ -174,7 +190,6 @@ static void read_ftrace_printk(void) | |||
174 | static void read_header_files(void) | 190 | static void read_header_files(void) |
175 | { | 191 | { |
176 | unsigned long long size; | 192 | unsigned long long size; |
177 | char *header_page; | ||
178 | char *header_event; | 193 | char *header_event; |
179 | char buf[BUFSIZ]; | 194 | char buf[BUFSIZ]; |
180 | 195 | ||
@@ -184,10 +199,7 @@ static void read_header_files(void) | |||
184 | die("did not read header page"); | 199 | die("did not read header page"); |
185 | 200 | ||
186 | size = read8(); | 201 | size = read8(); |
187 | header_page = malloc_or_die(size); | 202 | skip(size); |
188 | read_or_die(header_page, size); | ||
189 | parse_header_page(header_page, size); | ||
190 | free(header_page); | ||
191 | 203 | ||
192 | /* | 204 | /* |
193 | * The size field in the page is of type long, | 205 | * The size field in the page is of type long, |
@@ -459,7 +471,7 @@ struct record *trace_read_data(int cpu) | |||
459 | return data; | 471 | return data; |
460 | } | 472 | } |
461 | 473 | ||
462 | void trace_report(int fd) | 474 | ssize_t trace_report(int fd, bool __repipe) |
463 | { | 475 | { |
464 | char buf[BUFSIZ]; | 476 | char buf[BUFSIZ]; |
465 | char test[] = { 23, 8, 68 }; | 477 | char test[] = { 23, 8, 68 }; |
@@ -467,6 +479,10 @@ void trace_report(int fd) | |||
467 | int show_version = 0; | 479 | int show_version = 0; |
468 | int show_funcs = 0; | 480 | int show_funcs = 0; |
469 | int show_printk = 0; | 481 | int show_printk = 0; |
482 | ssize_t size; | ||
483 | |||
484 | calc_data_size = 1; | ||
485 | repipe = __repipe; | ||
470 | 486 | ||
471 | input_fd = fd; | 487 | input_fd = fd; |
472 | 488 | ||
@@ -499,14 +515,18 @@ void trace_report(int fd) | |||
499 | read_proc_kallsyms(); | 515 | read_proc_kallsyms(); |
500 | read_ftrace_printk(); | 516 | read_ftrace_printk(); |
501 | 517 | ||
518 | size = calc_data_size - 1; | ||
519 | calc_data_size = 0; | ||
520 | repipe = false; | ||
521 | |||
502 | if (show_funcs) { | 522 | if (show_funcs) { |
503 | print_funcs(); | 523 | print_funcs(); |
504 | return; | 524 | return size; |
505 | } | 525 | } |
506 | if (show_printk) { | 526 | if (show_printk) { |
507 | print_printk(); | 527 | print_printk(); |
508 | return; | 528 | return size; |
509 | } | 529 | } |
510 | 530 | ||
511 | return; | 531 | return size; |
512 | } | 532 | } |
diff --git a/tools/perf/util/trace-event.h b/tools/perf/util/trace-event.h index c3269b937db4..406d452956db 100644 --- a/tools/perf/util/trace-event.h +++ b/tools/perf/util/trace-event.h | |||
@@ -1,6 +1,7 @@ | |||
1 | #ifndef __PERF_TRACE_EVENTS_H | 1 | #ifndef __PERF_TRACE_EVENTS_H |
2 | #define __PERF_TRACE_EVENTS_H | 2 | #define __PERF_TRACE_EVENTS_H |
3 | 3 | ||
4 | #include <stdbool.h> | ||
4 | #include "parse-events.h" | 5 | #include "parse-events.h" |
5 | 6 | ||
6 | #define __unused __attribute__((unused)) | 7 | #define __unused __attribute__((unused)) |
@@ -162,7 +163,7 @@ struct record *trace_read_data(int cpu); | |||
162 | 163 | ||
163 | void parse_set_info(int nr_cpus, int long_sz); | 164 | void parse_set_info(int nr_cpus, int long_sz); |
164 | 165 | ||
165 | void trace_report(int fd); | 166 | ssize_t trace_report(int fd, bool repipe); |
166 | 167 | ||
167 | void *malloc_or_die(unsigned int size); | 168 | void *malloc_or_die(unsigned int size); |
168 | 169 | ||
@@ -241,9 +242,8 @@ extern int header_page_size_size; | |||
241 | extern int header_page_data_offset; | 242 | extern int header_page_data_offset; |
242 | extern int header_page_data_size; | 243 | extern int header_page_data_size; |
243 | 244 | ||
244 | extern int latency_format; | 245 | extern bool latency_format; |
245 | 246 | ||
246 | int parse_header_page(char *buf, unsigned long size); | ||
247 | int trace_parse_common_type(void *data); | 247 | int trace_parse_common_type(void *data); |
248 | int trace_parse_common_pid(void *data); | 248 | int trace_parse_common_pid(void *data); |
249 | int parse_common_pc(void *data); | 249 | int parse_common_pc(void *data); |
@@ -258,6 +258,8 @@ void *raw_field_ptr(struct event *event, const char *name, void *data); | |||
258 | unsigned long long eval_flag(const char *flag); | 258 | unsigned long long eval_flag(const char *flag); |
259 | 259 | ||
260 | int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events); | 260 | int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events); |
261 | ssize_t read_tracing_data_size(int fd, struct perf_event_attr *pattrs, | ||
262 | int nb_events); | ||
261 | 263 | ||
262 | /* taken from kernel/trace/trace.h */ | 264 | /* taken from kernel/trace/trace.h */ |
263 | enum trace_flag_type { | 265 | enum trace_flag_type { |
diff --git a/tools/perf/util/util.c b/tools/perf/util/util.c index f9b890fde681..214265674ddd 100644 --- a/tools/perf/util/util.c +++ b/tools/perf/util/util.c | |||
@@ -92,3 +92,25 @@ out_close_from: | |||
92 | out: | 92 | out: |
93 | return err; | 93 | return err; |
94 | } | 94 | } |
95 | |||
96 | unsigned long convert_unit(unsigned long value, char *unit) | ||
97 | { | ||
98 | *unit = ' '; | ||
99 | |||
100 | if (value > 1000) { | ||
101 | value /= 1000; | ||
102 | *unit = 'K'; | ||
103 | } | ||
104 | |||
105 | if (value > 1000) { | ||
106 | value /= 1000; | ||
107 | *unit = 'M'; | ||
108 | } | ||
109 | |||
110 | if (value > 1000) { | ||
111 | value /= 1000; | ||
112 | *unit = 'G'; | ||
113 | } | ||
114 | |||
115 | return value; | ||
116 | } | ||
diff --git a/tools/perf/util/util.h b/tools/perf/util/util.h index 0f5b2a6f1080..0795bf304b19 100644 --- a/tools/perf/util/util.h +++ b/tools/perf/util/util.h | |||
@@ -42,12 +42,14 @@ | |||
42 | #define _ALL_SOURCE 1 | 42 | #define _ALL_SOURCE 1 |
43 | #define _GNU_SOURCE 1 | 43 | #define _GNU_SOURCE 1 |
44 | #define _BSD_SOURCE 1 | 44 | #define _BSD_SOURCE 1 |
45 | #define HAS_BOOL | ||
45 | 46 | ||
46 | #include <unistd.h> | 47 | #include <unistd.h> |
47 | #include <stdio.h> | 48 | #include <stdio.h> |
48 | #include <sys/stat.h> | 49 | #include <sys/stat.h> |
49 | #include <sys/statfs.h> | 50 | #include <sys/statfs.h> |
50 | #include <fcntl.h> | 51 | #include <fcntl.h> |
52 | #include <stdbool.h> | ||
51 | #include <stddef.h> | 53 | #include <stddef.h> |
52 | #include <stdlib.h> | 54 | #include <stdlib.h> |
53 | #include <stdarg.h> | 55 | #include <stdarg.h> |
@@ -78,6 +80,7 @@ | |||
78 | #include <pwd.h> | 80 | #include <pwd.h> |
79 | #include <inttypes.h> | 81 | #include <inttypes.h> |
80 | #include "../../../include/linux/magic.h" | 82 | #include "../../../include/linux/magic.h" |
83 | #include "types.h" | ||
81 | 84 | ||
82 | 85 | ||
83 | #ifndef NO_ICONV | 86 | #ifndef NO_ICONV |
@@ -295,6 +298,13 @@ extern void *xmemdupz(const void *data, size_t len); | |||
295 | extern char *xstrndup(const char *str, size_t len); | 298 | extern char *xstrndup(const char *str, size_t len); |
296 | extern void *xrealloc(void *ptr, size_t size) __attribute__((weak)); | 299 | extern void *xrealloc(void *ptr, size_t size) __attribute__((weak)); |
297 | 300 | ||
301 | static inline void *xzalloc(size_t size) | ||
302 | { | ||
303 | void *buf = xmalloc(size); | ||
304 | |||
305 | return memset(buf, 0, size); | ||
306 | } | ||
307 | |||
298 | static inline void *zalloc(size_t size) | 308 | static inline void *zalloc(size_t size) |
299 | { | 309 | { |
300 | return calloc(1, size); | 310 | return calloc(1, size); |
@@ -309,6 +319,7 @@ static inline int has_extension(const char *filename, const char *ext) | |||
309 | { | 319 | { |
310 | size_t len = strlen(filename); | 320 | size_t len = strlen(filename); |
311 | size_t extlen = strlen(ext); | 321 | size_t extlen = strlen(ext); |
322 | |||
312 | return len > extlen && !memcmp(filename + len - extlen, ext, extlen); | 323 | return len > extlen && !memcmp(filename + len - extlen, ext, extlen); |
313 | } | 324 | } |
314 | 325 | ||
@@ -322,6 +333,7 @@ static inline int has_extension(const char *filename, const char *ext) | |||
322 | #undef isalnum | 333 | #undef isalnum |
323 | #undef tolower | 334 | #undef tolower |
324 | #undef toupper | 335 | #undef toupper |
336 | |||
325 | extern unsigned char sane_ctype[256]; | 337 | extern unsigned char sane_ctype[256]; |
326 | #define GIT_SPACE 0x01 | 338 | #define GIT_SPACE 0x01 |
327 | #define GIT_DIGIT 0x02 | 339 | #define GIT_DIGIT 0x02 |
@@ -406,4 +418,14 @@ void git_qsort(void *base, size_t nmemb, size_t size, | |||
406 | int mkdir_p(char *path, mode_t mode); | 418 | int mkdir_p(char *path, mode_t mode); |
407 | int copyfile(const char *from, const char *to); | 419 | int copyfile(const char *from, const char *to); |
408 | 420 | ||
421 | s64 perf_atoll(const char *str); | ||
422 | char **argv_split(const char *str, int *argcp); | ||
423 | void argv_free(char **argv); | ||
424 | bool strglobmatch(const char *str, const char *pat); | ||
425 | bool strlazymatch(const char *str, const char *pat); | ||
426 | unsigned long convert_unit(unsigned long value, char *unit); | ||
427 | |||
428 | #define _STR(x) #x | ||
429 | #define STR(x) _STR(x) | ||
430 | |||
409 | #endif | 431 | #endif |