diff options
Diffstat (limited to 'tools')
131 files changed, 10095 insertions, 3463 deletions
diff --git a/tools/perf/Documentation/perf-annotate.txt b/tools/perf/Documentation/perf-annotate.txt index c9dcade06831..5164a655c39f 100644 --- a/tools/perf/Documentation/perf-annotate.txt +++ b/tools/perf/Documentation/perf-annotate.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-annotate(1) | 1 | perf-annotate(1) |
2 | ============== | 2 | ================ |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
diff --git a/tools/perf/Documentation/perf-bench.txt b/tools/perf/Documentation/perf-bench.txt index ae525ac5a2ce..a3dbadb26ef5 100644 --- a/tools/perf/Documentation/perf-bench.txt +++ b/tools/perf/Documentation/perf-bench.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-bench(1) | 1 | perf-bench(1) |
2 | ============ | 2 | ============= |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
@@ -19,12 +19,12 @@ COMMON OPTIONS | |||
19 | -f:: | 19 | -f:: |
20 | --format=:: | 20 | --format=:: |
21 | Specify format style. | 21 | Specify format style. |
22 | Current available format styles are, | 22 | Current available format styles are: |
23 | 23 | ||
24 | 'default':: | 24 | 'default':: |
25 | Default style. This is mainly for human reading. | 25 | Default style. This is mainly for human reading. |
26 | --------------------- | 26 | --------------------- |
27 | % perf bench sched pipe # with no style specify | 27 | % perf bench sched pipe # with no style specified |
28 | (executing 1000000 pipe operations between two tasks) | 28 | (executing 1000000 pipe operations between two tasks) |
29 | Total time:5.855 sec | 29 | Total time:5.855 sec |
30 | 5.855061 usecs/op | 30 | 5.855061 usecs/op |
@@ -79,7 +79,7 @@ options (20 sender and receiver processes per group) | |||
79 | 79 | ||
80 | Total time:0.308 sec | 80 | Total time:0.308 sec |
81 | 81 | ||
82 | % perf bench sched messaging -t -g 20 # be multi-thread,with 20 groups | 82 | % perf bench sched messaging -t -g 20 # be multi-thread, with 20 groups |
83 | (20 sender and receiver threads per group) | 83 | (20 sender and receiver threads per group) |
84 | (20 groups == 800 threads run) | 84 | (20 groups == 800 threads run) |
85 | 85 | ||
diff --git a/tools/perf/Documentation/perf-buildid-cache.txt b/tools/perf/Documentation/perf-buildid-cache.txt index 88bc3b519746..5d1a9500277f 100644 --- a/tools/perf/Documentation/perf-buildid-cache.txt +++ b/tools/perf/Documentation/perf-buildid-cache.txt | |||
@@ -8,7 +8,7 @@ perf-buildid-cache - Manage build-id cache. | |||
8 | SYNOPSIS | 8 | SYNOPSIS |
9 | -------- | 9 | -------- |
10 | [verse] | 10 | [verse] |
11 | 'perf buildid-list <options>' | 11 | 'perf buildid-cache <options>' |
12 | 12 | ||
13 | DESCRIPTION | 13 | DESCRIPTION |
14 | ----------- | 14 | ----------- |
@@ -30,4 +30,4 @@ OPTIONS | |||
30 | 30 | ||
31 | SEE ALSO | 31 | SEE ALSO |
32 | -------- | 32 | -------- |
33 | linkperf:perf-record[1], linkperf:perf-report[1] | 33 | linkperf:perf-record[1], linkperf:perf-report[1], linkperf:perf-buildid-list[1] |
diff --git a/tools/perf/Documentation/perf-diff.txt b/tools/perf/Documentation/perf-diff.txt index 8974e208cba6..20d97d84ea1c 100644 --- a/tools/perf/Documentation/perf-diff.txt +++ b/tools/perf/Documentation/perf-diff.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-diff(1) | 1 | perf-diff(1) |
2 | ============== | 2 | ============ |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
diff --git a/tools/perf/Documentation/perf-inject.txt b/tools/perf/Documentation/perf-inject.txt new file mode 100644 index 000000000000..025630d43cd2 --- /dev/null +++ b/tools/perf/Documentation/perf-inject.txt | |||
@@ -0,0 +1,35 @@ | |||
1 | perf-inject(1) | ||
2 | ============== | ||
3 | |||
4 | NAME | ||
5 | ---- | ||
6 | perf-inject - Filter to augment the events stream with additional information | ||
7 | |||
8 | SYNOPSIS | ||
9 | -------- | ||
10 | [verse] | ||
11 | 'perf inject <options>' | ||
12 | |||
13 | DESCRIPTION | ||
14 | ----------- | ||
15 | perf-inject reads a perf-record event stream and repipes it to stdout. At any | ||
16 | point the processing code can inject other events into the event stream - in | ||
17 | this case build-ids (-b option) are read and injected as needed into the event | ||
18 | stream. | ||
19 | |||
20 | Build-ids are just the first user of perf-inject - potentially anything that | ||
21 | needs userspace processing to augment the events stream with additional | ||
22 | information could make use of this facility. | ||
23 | |||
24 | OPTIONS | ||
25 | ------- | ||
26 | -b:: | ||
27 | --build-ids=:: | ||
28 | Inject build-ids into the output stream | ||
29 | -v:: | ||
30 | --verbose:: | ||
31 | Be more verbose. | ||
32 | |||
33 | SEE ALSO | ||
34 | -------- | ||
35 | linkperf:perf-record[1], linkperf:perf-report[1], linkperf:perf-archive[1] | ||
diff --git a/tools/perf/Documentation/perf-kmem.txt b/tools/perf/Documentation/perf-kmem.txt index eac4d852e7cd..a52fcde894c7 100644 --- a/tools/perf/Documentation/perf-kmem.txt +++ b/tools/perf/Documentation/perf-kmem.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-kmem(1) | 1 | perf-kmem(1) |
2 | ============== | 2 | ============ |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
diff --git a/tools/perf/Documentation/perf-kvm.txt b/tools/perf/Documentation/perf-kvm.txt new file mode 100644 index 000000000000..d004e19fe6d6 --- /dev/null +++ b/tools/perf/Documentation/perf-kvm.txt | |||
@@ -0,0 +1,68 @@ | |||
1 | perf-kvm(1) | ||
2 | =========== | ||
3 | |||
4 | NAME | ||
5 | ---- | ||
6 | perf-kvm - Tool to trace/measure kvm guest os | ||
7 | |||
8 | SYNOPSIS | ||
9 | -------- | ||
10 | [verse] | ||
11 | 'perf kvm' [--host] [--guest] [--guestmount=<path> | ||
12 | [--guestkallsyms=<path> --guestmodules=<path> | --guestvmlinux=<path>]] | ||
13 | {top|record|report|diff|buildid-list} | ||
14 | 'perf kvm' [--host] [--guest] [--guestkallsyms=<path> --guestmodules=<path> | ||
15 | | --guestvmlinux=<path>] {top|record|report|diff|buildid-list} | ||
16 | |||
17 | DESCRIPTION | ||
18 | ----------- | ||
19 | There are a couple of variants of perf kvm: | ||
20 | |||
21 | 'perf kvm [options] top <command>' to generate and display | ||
22 | a performance counter profile of guest os in realtime | ||
23 | of an arbitrary workload. | ||
24 | |||
25 | 'perf kvm record <command>' to record the performance counter profile | ||
26 | of an arbitrary workload and save it into a perf data file. If both | ||
27 | --host and --guest are input, the perf data file name is perf.data.kvm. | ||
28 | If there is no --host but --guest, the file name is perf.data.guest. | ||
29 | If there is no --guest but --host, the file name is perf.data.host. | ||
30 | |||
31 | 'perf kvm report' to display the performance counter profile information | ||
32 | recorded via perf kvm record. | ||
33 | |||
34 | 'perf kvm diff' to display the performance difference between two perf.data | ||
35 | files captured via perf record. | ||
36 | |||
37 | 'perf kvm buildid-list' to display the buildids found in a perf data file, | ||
38 | so that other tools can be used to fetch packages with matching symbol tables | ||
39 | for use by perf report. | ||
40 | |||
41 | OPTIONS | ||
42 | ------- | ||
43 | --host=:: | ||
44 | Collect host side performance profile. | ||
45 | --guest=:: | ||
46 | Collect guest side performance profile. | ||
47 | --guestmount=<path>:: | ||
48 | Guest os root file system mount directory. Users mount guest os | ||
49 | root directories under <path> by a specific filesystem access method, | ||
50 | typically, sshfs. For example, start 2 guest os. One's pid is 8888 | ||
51 | and the other's is 9999. | ||
52 | #mkdir ~/guestmount; cd ~/guestmount | ||
53 | #sshfs -o allow_other,direct_io -p 5551 localhost:/ 8888/ | ||
54 | #sshfs -o allow_other,direct_io -p 5552 localhost:/ 9999/ | ||
55 | #perf kvm --host --guest --guestmount=~/guestmount top | ||
56 | --guestkallsyms=<path>:: | ||
57 | Guest os /proc/kallsyms file copy. 'perf kvm' reads it to get guest | ||
58 | kernel symbols. Users copy it out from guest os. | ||
59 | --guestmodules=<path>:: | ||
60 | Guest os /proc/modules file copy. 'perf kvm' reads it to get guest | ||
61 | kernel module information. Users copy it out from guest os. | ||
62 | --guestvmlinux=<path>:: | ||
63 | Guest os kernel vmlinux. | ||
64 | |||
65 | SEE ALSO | ||
66 | -------- | ||
67 | linkperf:perf-top[1], linkperf:perf-record[1], linkperf:perf-report[1], | ||
68 | linkperf:perf-diff[1], linkperf:perf-buildid-list[1] | ||
diff --git a/tools/perf/Documentation/perf-list.txt b/tools/perf/Documentation/perf-list.txt index 8290b9422668..43e3dd284b90 100644 --- a/tools/perf/Documentation/perf-list.txt +++ b/tools/perf/Documentation/perf-list.txt | |||
@@ -15,6 +15,35 @@ DESCRIPTION | |||
15 | This command displays the symbolic event types which can be selected in the | 15 | This command displays the symbolic event types which can be selected in the |
16 | various perf commands with the -e option. | 16 | various perf commands with the -e option. |
17 | 17 | ||
18 | RAW HARDWARE EVENT DESCRIPTOR | ||
19 | ----------------------------- | ||
20 | Even when an event is not available in a symbolic form within perf right now, | ||
21 | it can be encoded in a per processor specific way. | ||
22 | |||
23 | For instance, for x86 CPUs NNN represents the raw register encoding with the | ||
24 | layout of IA32_PERFEVTSELx MSRs (see [Intel® 64 and IA-32 Architectures Software Developer's Manual Volume 3B: System Programming Guide] Figure 30-1 Layout | ||
25 | of IA32_PERFEVTSELx MSRs) or AMD's PerfEvtSeln (see [AMD64 Architecture Programmer’s Manual Volume 2: System Programming], Page 344, | ||
26 | Figure 13-7 Performance Event-Select Register (PerfEvtSeln)). | ||
27 | |||
28 | Example: | ||
29 | |||
30 | If the Intel docs for a QM720 Core i7 describe an event as: | ||
31 | |||
32 | Event Umask Event Mask | ||
33 | Num. Value Mnemonic Description Comment | ||
34 | |||
35 | A8H 01H LSD.UOPS Counts the number of micro-ops Use cmask=1 and | ||
36 | delivered by loop stream detector invert to count | ||
37 | cycles | ||
38 | |||
39 | raw encoding of 0x1A8 can be used: | ||
40 | |||
41 | perf stat -e r1a8 -a sleep 1 | ||
42 | perf record -e r1a8 ... | ||
43 | |||
44 | You should refer to the processor specific documentation for getting these | ||
45 | details. Some of them are referenced in the SEE ALSO section below. | ||
46 | |||
18 | OPTIONS | 47 | OPTIONS |
19 | ------- | 48 | ------- |
20 | None | 49 | None |
@@ -22,4 +51,6 @@ None | |||
22 | SEE ALSO | 51 | SEE ALSO |
23 | -------- | 52 | -------- |
24 | linkperf:perf-stat[1], linkperf:perf-top[1], | 53 | linkperf:perf-stat[1], linkperf:perf-top[1], |
25 | linkperf:perf-record[1] | 54 | linkperf:perf-record[1], |
55 | http://www.intel.com/Assets/PDF/manual/253669.pdf[Intel® 64 and IA-32 Architectures Software Developer's Manual Volume 3B: System Programming Guide], | ||
56 | http://support.amd.com/us/Processor_TechDocs/24593.pdf[AMD64 Architecture Programmer’s Manual Volume 2: System Programming] | ||
diff --git a/tools/perf/Documentation/perf-probe.txt b/tools/perf/Documentation/perf-probe.txt index 34202b1be0bb..94a258c96a44 100644 --- a/tools/perf/Documentation/perf-probe.txt +++ b/tools/perf/Documentation/perf-probe.txt | |||
@@ -57,6 +57,14 @@ OPTIONS | |||
57 | --force:: | 57 | --force:: |
58 | Forcibly add events with existing name. | 58 | Forcibly add events with existing name. |
59 | 59 | ||
60 | -n:: | ||
61 | --dry-run:: | ||
62 | Dry run. With this option, --add and --del do not execute the actual | ||
63 | adding and removal operations. | ||
64 | |||
65 | --max-probes:: | ||
66 | Set the maximum number of probe points for an event. Default is 128. | ||
67 | |||
60 | PROBE SYNTAX | 68 | PROBE SYNTAX |
61 | ------------ | 69 | ------------ |
62 | Probe points are defined by following syntax. | 70 | Probe points are defined by following syntax. |
@@ -74,13 +82,22 @@ Probe points are defined by following syntax. | |||
74 | 'EVENT' specifies the name of new event, if omitted, it will be set the name of the probed function. Currently, event group name is set as 'probe'. | 82 | 'EVENT' specifies the name of new event, if omitted, it will be set the name of the probed function. Currently, event group name is set as 'probe'. |
75 | 'FUNC' specifies a probed function name, and it may have one of the following options; '+OFFS' is the offset from function entry address in bytes, ':RLN' is the relative-line number from function entry line, and '%return' means that it probes function return. And ';PTN' means lazy matching pattern (see LAZY MATCHING). Note that ';PTN' must be the end of the probe point definition. In addition, '@SRC' specifies a source file which has that function. | 83 | 'FUNC' specifies a probed function name, and it may have one of the following options; '+OFFS' is the offset from function entry address in bytes, ':RLN' is the relative-line number from function entry line, and '%return' means that it probes function return. And ';PTN' means lazy matching pattern (see LAZY MATCHING). Note that ';PTN' must be the end of the probe point definition. In addition, '@SRC' specifies a source file which has that function. |
76 | It is also possible to specify a probe point by the source line number or lazy matching by using 'SRC:ALN' or 'SRC;PTN' syntax, where 'SRC' is the source file path, ':ALN' is the line number and ';PTN' is the lazy matching pattern. | 84 | It is also possible to specify a probe point by the source line number or lazy matching by using 'SRC:ALN' or 'SRC;PTN' syntax, where 'SRC' is the source file path, ':ALN' is the line number and ';PTN' is the lazy matching pattern. |
77 | 'ARG' specifies the arguments of this probe point. You can use the name of local variable, or kprobe-tracer argument format (e.g. $retval, %ax, etc). | 85 | 'ARG' specifies the arguments of this probe point, (see PROBE ARGUMENT). |
86 | |||
87 | PROBE ARGUMENT | ||
88 | -------------- | ||
89 | Each probe argument follows the syntax below. | ||
90 | |||
91 | [NAME=]LOCALVAR|$retval|%REG|@SYMBOL[:TYPE] | ||
92 | |||
93 | 'NAME' specifies the name of this argument (optional). You can use the name of local variable, local data structure member (e.g. var->field, var.field2), or kprobe-tracer argument format (e.g. $retval, %ax, etc). Note that the name of this argument will be set as the last member name if you specify a local data structure member (e.g. field2 for 'var->field1.field2'.) | ||
94 | 'TYPE' casts the type of this argument (optional). If omitted, perf probe automatically sets the type based on debuginfo. | ||
78 | 95 | ||
79 | LINE SYNTAX | 96 | LINE SYNTAX |
80 | ----------- | 97 | ----------- |
81 | Line range is descripted by following syntax. | 98 | Line range is descripted by following syntax. |
82 | 99 | ||
83 | "FUNC[:RLN[+NUM|:RLN2]]|SRC:ALN[+NUM|:ALN2]" | 100 | "FUNC[:RLN[+NUM|-RLN2]]|SRC:ALN[+NUM|-ALN2]" |
84 | 101 | ||
85 | FUNC specifies the function name of showing lines. 'RLN' is the start line | 102 | FUNC specifies the function name of showing lines. 'RLN' is the start line |
86 | number from function entry line, and 'RLN2' is the end line number. As same as | 103 | number from function entry line, and 'RLN2' is the end line number. As same as |
diff --git a/tools/perf/Documentation/perf-record.txt b/tools/perf/Documentation/perf-record.txt index fc46c0b40f6e..34e255fc3e2f 100644 --- a/tools/perf/Documentation/perf-record.txt +++ b/tools/perf/Documentation/perf-record.txt | |||
@@ -58,7 +58,7 @@ OPTIONS | |||
58 | 58 | ||
59 | -f:: | 59 | -f:: |
60 | --force:: | 60 | --force:: |
61 | Overwrite existing data file. | 61 | Overwrite existing data file. (deprecated) |
62 | 62 | ||
63 | -c:: | 63 | -c:: |
64 | --count=:: | 64 | --count=:: |
@@ -69,8 +69,8 @@ OPTIONS | |||
69 | Output file name. | 69 | Output file name. |
70 | 70 | ||
71 | -i:: | 71 | -i:: |
72 | --inherit:: | 72 | --no-inherit:: |
73 | Child tasks inherit counters. | 73 | Child tasks do not inherit counters. |
74 | -F:: | 74 | -F:: |
75 | --freq=:: | 75 | --freq=:: |
76 | Profile at this frequency. | 76 | Profile at this frequency. |
@@ -101,7 +101,7 @@ OPTIONS | |||
101 | 101 | ||
102 | -R:: | 102 | -R:: |
103 | --raw-samples:: | 103 | --raw-samples:: |
104 | Collect raw sample records from all opened counters (typically for tracepoint counters). | 104 | Collect raw sample records from all opened counters (default for tracepoint counters). |
105 | 105 | ||
106 | SEE ALSO | 106 | SEE ALSO |
107 | -------- | 107 | -------- |
diff --git a/tools/perf/Documentation/perf-sched.txt b/tools/perf/Documentation/perf-sched.txt index 1ce79198997b..8417644a6166 100644 --- a/tools/perf/Documentation/perf-sched.txt +++ b/tools/perf/Documentation/perf-sched.txt | |||
@@ -12,7 +12,7 @@ SYNOPSIS | |||
12 | 12 | ||
13 | DESCRIPTION | 13 | DESCRIPTION |
14 | ----------- | 14 | ----------- |
15 | There's four variants of perf sched: | 15 | There are four variants of perf sched: |
16 | 16 | ||
17 | 'perf sched record <command>' to record the scheduling events | 17 | 'perf sched record <command>' to record the scheduling events |
18 | of an arbitrary workload. | 18 | of an arbitrary workload. |
@@ -27,7 +27,7 @@ There's four variants of perf sched: | |||
27 | via perf sched record. (this is done by starting up mockup threads | 27 | via perf sched record. (this is done by starting up mockup threads |
28 | that mimic the workload based on the events in the trace. These | 28 | that mimic the workload based on the events in the trace. These |
29 | threads can then replay the timings (CPU runtime and sleep patterns) | 29 | threads can then replay the timings (CPU runtime and sleep patterns) |
30 | of the workload as it occured when it was recorded - and can repeat | 30 | of the workload as it occurred when it was recorded - and can repeat |
31 | it a number of times, measuring its performance.) | 31 | it a number of times, measuring its performance.) |
32 | 32 | ||
33 | OPTIONS | 33 | OPTIONS |
diff --git a/tools/perf/Documentation/perf-stat.txt b/tools/perf/Documentation/perf-stat.txt index 484080dd5b6f..2cab8e8c33d0 100644 --- a/tools/perf/Documentation/perf-stat.txt +++ b/tools/perf/Documentation/perf-stat.txt | |||
@@ -31,8 +31,8 @@ OPTIONS | |||
31 | hexadecimal event descriptor. | 31 | hexadecimal event descriptor. |
32 | 32 | ||
33 | -i:: | 33 | -i:: |
34 | --inherit:: | 34 | --no-inherit:: |
35 | child tasks inherit counters | 35 | child tasks do not inherit counters |
36 | -p:: | 36 | -p:: |
37 | --pid=<pid>:: | 37 | --pid=<pid>:: |
38 | stat events on existing pid | 38 | stat events on existing pid |
diff --git a/tools/perf/Documentation/perf-test.txt b/tools/perf/Documentation/perf-test.txt new file mode 100644 index 000000000000..1c4b5f5b7f71 --- /dev/null +++ b/tools/perf/Documentation/perf-test.txt | |||
@@ -0,0 +1,22 @@ | |||
1 | perf-test(1) | ||
2 | ============ | ||
3 | |||
4 | NAME | ||
5 | ---- | ||
6 | perf-test - Runs sanity tests. | ||
7 | |||
8 | SYNOPSIS | ||
9 | -------- | ||
10 | [verse] | ||
11 | 'perf test <options>' | ||
12 | |||
13 | DESCRIPTION | ||
14 | ----------- | ||
15 | This command does assorted sanity tests, initially thru linked routines but | ||
16 | also will look for a directory with more tests in the form of scripts. | ||
17 | |||
18 | OPTIONS | ||
19 | ------- | ||
20 | -v:: | ||
21 | --verbose:: | ||
22 | Be more verbose. | ||
diff --git a/tools/perf/Documentation/perf-trace-perl.txt b/tools/perf/Documentation/perf-trace-perl.txt index d729cee8d987..ee6525ee6d69 100644 --- a/tools/perf/Documentation/perf-trace-perl.txt +++ b/tools/perf/Documentation/perf-trace-perl.txt | |||
@@ -49,12 +49,10 @@ available as calls back into the perf executable (see below). | |||
49 | As an example, the following perf record command can be used to record | 49 | As an example, the following perf record command can be used to record |
50 | all sched_wakeup events in the system: | 50 | all sched_wakeup events in the system: |
51 | 51 | ||
52 | # perf record -c 1 -f -a -M -R -e sched:sched_wakeup | 52 | # perf record -a -e sched:sched_wakeup |
53 | 53 | ||
54 | Traces meant to be processed using a script should be recorded with | 54 | Traces meant to be processed using a script should be recorded with |
55 | the above options: -c 1 says to sample every event, -a to enable | 55 | the above option: -a to enable system-wide collection. |
56 | system-wide collection, -M to multiplex the output, and -R to collect | ||
57 | raw samples. | ||
58 | 56 | ||
59 | The format file for the sched_wakep event defines the following fields | 57 | The format file for the sched_wakep event defines the following fields |
60 | (see /sys/kernel/debug/tracing/events/sched/sched_wakeup/format): | 58 | (see /sys/kernel/debug/tracing/events/sched/sched_wakeup/format): |
diff --git a/tools/perf/Documentation/perf-trace-python.txt b/tools/perf/Documentation/perf-trace-python.txt index a241aca77184..693be804dd3d 100644 --- a/tools/perf/Documentation/perf-trace-python.txt +++ b/tools/perf/Documentation/perf-trace-python.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-trace-python(1) | 1 | perf-trace-python(1) |
2 | ================== | 2 | ==================== |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
@@ -93,7 +93,7 @@ don't care how it exited, so we'll use 'perf record' to record only | |||
93 | the sys_enter events: | 93 | the sys_enter events: |
94 | 94 | ||
95 | ---- | 95 | ---- |
96 | # perf record -c 1 -f -a -M -R -e raw_syscalls:sys_enter | 96 | # perf record -a -e raw_syscalls:sys_enter |
97 | 97 | ||
98 | ^C[ perf record: Woken up 1 times to write data ] | 98 | ^C[ perf record: Woken up 1 times to write data ] |
99 | [ perf record: Captured and wrote 56.545 MB perf.data (~2470503 samples) ] | 99 | [ perf record: Captured and wrote 56.545 MB perf.data (~2470503 samples) ] |
@@ -182,7 +182,7 @@ mean either that the record step recorded event types that it wasn't | |||
182 | really interested in, or the script was run against a trace file that | 182 | really interested in, or the script was run against a trace file that |
183 | doesn't correspond to the script. | 183 | doesn't correspond to the script. |
184 | 184 | ||
185 | The script generated by -g option option simply prints a line for each | 185 | The script generated by -g option simply prints a line for each |
186 | event found in the trace stream i.e. it basically just dumps the event | 186 | event found in the trace stream i.e. it basically just dumps the event |
187 | and its parameter values to stdout. The print_header() function is | 187 | and its parameter values to stdout. The print_header() function is |
188 | simply a utility function used for that purpose. Let's rename the | 188 | simply a utility function used for that purpose. Let's rename the |
@@ -359,7 +359,7 @@ your script: | |||
359 | # cat kernel-source/tools/perf/scripts/python/bin/syscall-counts-record | 359 | # cat kernel-source/tools/perf/scripts/python/bin/syscall-counts-record |
360 | 360 | ||
361 | #!/bin/bash | 361 | #!/bin/bash |
362 | perf record -c 1 -f -a -M -R -e raw_syscalls:sys_enter | 362 | perf record -a -e raw_syscalls:sys_enter |
363 | ---- | 363 | ---- |
364 | 364 | ||
365 | The 'report' script is also a shell script with the same base name as | 365 | The 'report' script is also a shell script with the same base name as |
@@ -449,12 +449,10 @@ available as calls back into the perf executable (see below). | |||
449 | As an example, the following perf record command can be used to record | 449 | As an example, the following perf record command can be used to record |
450 | all sched_wakeup events in the system: | 450 | all sched_wakeup events in the system: |
451 | 451 | ||
452 | # perf record -c 1 -f -a -M -R -e sched:sched_wakeup | 452 | # perf record -a -e sched:sched_wakeup |
453 | 453 | ||
454 | Traces meant to be processed using a script should be recorded with | 454 | Traces meant to be processed using a script should be recorded with |
455 | the above options: -c 1 says to sample every event, -a to enable | 455 | the above option: -a to enable system-wide collection. |
456 | system-wide collection, -M to multiplex the output, and -R to collect | ||
457 | raw samples. | ||
458 | 456 | ||
459 | The format file for the sched_wakep event defines the following fields | 457 | The format file for the sched_wakep event defines the following fields |
460 | (see /sys/kernel/debug/tracing/events/sched/sched_wakeup/format): | 458 | (see /sys/kernel/debug/tracing/events/sched/sched_wakeup/format): |
@@ -584,7 +582,7 @@ files: | |||
584 | flag_str(event_name, field_name, field_value) - returns the string represention corresponding to field_value for the flag field field_name of event event_name | 582 | flag_str(event_name, field_name, field_value) - returns the string represention corresponding to field_value for the flag field field_name of event event_name |
585 | symbol_str(event_name, field_name, field_value) - returns the string represention corresponding to field_value for the symbolic field field_name of event event_name | 583 | symbol_str(event_name, field_name, field_value) - returns the string represention corresponding to field_value for the symbolic field field_name of event event_name |
586 | 584 | ||
587 | The *autodict* function returns a special special kind of Python | 585 | The *autodict* function returns a special kind of Python |
588 | dictionary that implements Perl's 'autovivifying' hashes in Python | 586 | dictionary that implements Perl's 'autovivifying' hashes in Python |
589 | i.e. with autovivifying hashes, you can assign nested hash values | 587 | i.e. with autovivifying hashes, you can assign nested hash values |
590 | without having to go to the trouble of creating intermediate levels if | 588 | without having to go to the trouble of creating intermediate levels if |
diff --git a/tools/perf/Documentation/perf-trace.txt b/tools/perf/Documentation/perf-trace.txt index 8879299cd9df..122ec9dc4853 100644 --- a/tools/perf/Documentation/perf-trace.txt +++ b/tools/perf/Documentation/perf-trace.txt | |||
@@ -1,5 +1,5 @@ | |||
1 | perf-trace(1) | 1 | perf-trace(1) |
2 | ============== | 2 | ============= |
3 | 3 | ||
4 | NAME | 4 | NAME |
5 | ---- | 5 | ---- |
diff --git a/tools/perf/Makefile b/tools/perf/Makefile index bc0f670a8338..a9281cca4114 100644 --- a/tools/perf/Makefile +++ b/tools/perf/Makefile | |||
@@ -1,3 +1,7 @@ | |||
1 | ifeq ("$(origin O)", "command line") | ||
2 | OUTPUT := $(O)/ | ||
3 | endif | ||
4 | |||
1 | # The default target of this Makefile is... | 5 | # The default target of this Makefile is... |
2 | all:: | 6 | all:: |
3 | 7 | ||
@@ -150,10 +154,17 @@ all:: | |||
150 | # Define LDFLAGS=-static to build a static binary. | 154 | # Define LDFLAGS=-static to build a static binary. |
151 | # | 155 | # |
152 | # Define EXTRA_CFLAGS=-m64 or EXTRA_CFLAGS=-m32 as appropriate for cross-builds. | 156 | # Define EXTRA_CFLAGS=-m64 or EXTRA_CFLAGS=-m32 as appropriate for cross-builds. |
157 | # | ||
158 | # Define NO_DWARF if you do not want debug-info analysis feature at all. | ||
153 | 159 | ||
154 | PERF-VERSION-FILE: .FORCE-PERF-VERSION-FILE | 160 | $(shell sh -c 'mkdir -p $(OUTPUT)scripts/python/Perf-Trace-Util/' 2> /dev/null) |
155 | @$(SHELL_PATH) util/PERF-VERSION-GEN | 161 | $(shell sh -c 'mkdir -p $(OUTPUT)scripts/perl/Perf-Trace-Util/' 2> /dev/null) |
156 | -include PERF-VERSION-FILE | 162 | $(shell sh -c 'mkdir -p $(OUTPUT)util/scripting-engines/' 2> /dev/null) |
163 | $(shell sh -c 'mkdir $(OUTPUT)bench' 2> /dev/null) | ||
164 | |||
165 | $(OUTPUT)PERF-VERSION-FILE: .FORCE-PERF-VERSION-FILE | ||
166 | @$(SHELL_PATH) util/PERF-VERSION-GEN $(OUTPUT) | ||
167 | -include $(OUTPUT)PERF-VERSION-FILE | ||
157 | 168 | ||
158 | uname_S := $(shell sh -c 'uname -s 2>/dev/null || echo not') | 169 | uname_S := $(shell sh -c 'uname -s 2>/dev/null || echo not') |
159 | uname_M := $(shell sh -c 'uname -m 2>/dev/null || echo not') | 170 | uname_M := $(shell sh -c 'uname -m 2>/dev/null || echo not') |
@@ -162,6 +173,22 @@ uname_R := $(shell sh -c 'uname -r 2>/dev/null || echo not') | |||
162 | uname_P := $(shell sh -c 'uname -p 2>/dev/null || echo not') | 173 | uname_P := $(shell sh -c 'uname -p 2>/dev/null || echo not') |
163 | uname_V := $(shell sh -c 'uname -v 2>/dev/null || echo not') | 174 | uname_V := $(shell sh -c 'uname -v 2>/dev/null || echo not') |
164 | 175 | ||
176 | ARCH ?= $(shell echo $(uname_M) | sed -e s/i.86/i386/ -e s/sun4u/sparc64/ \ | ||
177 | -e s/arm.*/arm/ -e s/sa110/arm/ \ | ||
178 | -e s/s390x/s390/ -e s/parisc64/parisc/ \ | ||
179 | -e s/ppc.*/powerpc/ -e s/mips.*/mips/ \ | ||
180 | -e s/sh[234].*/sh/ ) | ||
181 | |||
182 | # Additional ARCH settings for x86 | ||
183 | ifeq ($(ARCH),i386) | ||
184 | ARCH := x86 | ||
185 | endif | ||
186 | ifeq ($(ARCH),x86_64) | ||
187 | ARCH := x86 | ||
188 | endif | ||
189 | |||
190 | $(shell sh -c 'mkdir -p $(OUTPUT)arch/$(ARCH)/util/' 2> /dev/null) | ||
191 | |||
165 | # CFLAGS and LDFLAGS are for the users to override from the command line. | 192 | # CFLAGS and LDFLAGS are for the users to override from the command line. |
166 | 193 | ||
167 | # | 194 | # |
@@ -274,7 +301,7 @@ endif | |||
274 | # Those must not be GNU-specific; they are shared with perl/ which may | 301 | # Those must not be GNU-specific; they are shared with perl/ which may |
275 | # be built by a different compiler. (Note that this is an artifact now | 302 | # be built by a different compiler. (Note that this is an artifact now |
276 | # but it still might be nice to keep that distinction.) | 303 | # but it still might be nice to keep that distinction.) |
277 | BASIC_CFLAGS = -Iutil/include | 304 | BASIC_CFLAGS = -Iutil/include -Iarch/$(ARCH)/include |
278 | BASIC_LDFLAGS = | 305 | BASIC_LDFLAGS = |
279 | 306 | ||
280 | # Guard against environment variables | 307 | # Guard against environment variables |
@@ -308,7 +335,7 @@ PROGRAMS += $(EXTRA_PROGRAMS) | |||
308 | # | 335 | # |
309 | # Single 'perf' binary right now: | 336 | # Single 'perf' binary right now: |
310 | # | 337 | # |
311 | PROGRAMS += perf | 338 | PROGRAMS += $(OUTPUT)perf |
312 | 339 | ||
313 | # List built-in command $C whose implementation cmd_$C() is not in | 340 | # List built-in command $C whose implementation cmd_$C() is not in |
314 | # builtin-$C.o but is linked in as part of some other command. | 341 | # builtin-$C.o but is linked in as part of some other command. |
@@ -318,7 +345,7 @@ PROGRAMS += perf | |||
318 | ALL_PROGRAMS = $(PROGRAMS) $(SCRIPTS) | 345 | ALL_PROGRAMS = $(PROGRAMS) $(SCRIPTS) |
319 | 346 | ||
320 | # what 'all' will build but not install in perfexecdir | 347 | # what 'all' will build but not install in perfexecdir |
321 | OTHER_PROGRAMS = perf$X | 348 | OTHER_PROGRAMS = $(OUTPUT)perf$X |
322 | 349 | ||
323 | # Set paths to tools early so that they can be used for version tests. | 350 | # Set paths to tools early so that they can be used for version tests. |
324 | ifndef SHELL_PATH | 351 | ifndef SHELL_PATH |
@@ -330,7 +357,7 @@ endif | |||
330 | 357 | ||
331 | export PERL_PATH | 358 | export PERL_PATH |
332 | 359 | ||
333 | LIB_FILE=libperf.a | 360 | LIB_FILE=$(OUTPUT)libperf.a |
334 | 361 | ||
335 | LIB_H += ../../include/linux/perf_event.h | 362 | LIB_H += ../../include/linux/perf_event.h |
336 | LIB_H += ../../include/linux/rbtree.h | 363 | LIB_H += ../../include/linux/rbtree.h |
@@ -350,12 +377,13 @@ LIB_H += util/include/linux/rbtree.h | |||
350 | LIB_H += util/include/linux/string.h | 377 | LIB_H += util/include/linux/string.h |
351 | LIB_H += util/include/linux/types.h | 378 | LIB_H += util/include/linux/types.h |
352 | LIB_H += util/include/asm/asm-offsets.h | 379 | LIB_H += util/include/asm/asm-offsets.h |
353 | LIB_H += util/include/asm/bitops.h | ||
354 | LIB_H += util/include/asm/bug.h | 380 | LIB_H += util/include/asm/bug.h |
355 | LIB_H += util/include/asm/byteorder.h | 381 | LIB_H += util/include/asm/byteorder.h |
382 | LIB_H += util/include/asm/hweight.h | ||
356 | LIB_H += util/include/asm/swab.h | 383 | LIB_H += util/include/asm/swab.h |
357 | LIB_H += util/include/asm/system.h | 384 | LIB_H += util/include/asm/system.h |
358 | LIB_H += util/include/asm/uaccess.h | 385 | LIB_H += util/include/asm/uaccess.h |
386 | LIB_H += util/include/dwarf-regs.h | ||
359 | LIB_H += perf.h | 387 | LIB_H += perf.h |
360 | LIB_H += util/cache.h | 388 | LIB_H += util/cache.h |
361 | LIB_H += util/callchain.h | 389 | LIB_H += util/callchain.h |
@@ -375,7 +403,6 @@ LIB_H += util/header.h | |||
375 | LIB_H += util/help.h | 403 | LIB_H += util/help.h |
376 | LIB_H += util/session.h | 404 | LIB_H += util/session.h |
377 | LIB_H += util/strbuf.h | 405 | LIB_H += util/strbuf.h |
378 | LIB_H += util/string.h | ||
379 | LIB_H += util/strlist.h | 406 | LIB_H += util/strlist.h |
380 | LIB_H += util/svghelper.h | 407 | LIB_H += util/svghelper.h |
381 | LIB_H += util/run-command.h | 408 | LIB_H += util/run-command.h |
@@ -389,79 +416,83 @@ LIB_H += util/thread.h | |||
389 | LIB_H += util/trace-event.h | 416 | LIB_H += util/trace-event.h |
390 | LIB_H += util/probe-finder.h | 417 | LIB_H += util/probe-finder.h |
391 | LIB_H += util/probe-event.h | 418 | LIB_H += util/probe-event.h |
419 | LIB_H += util/pstack.h | ||
392 | LIB_H += util/cpumap.h | 420 | LIB_H += util/cpumap.h |
393 | 421 | ||
394 | LIB_OBJS += util/abspath.o | 422 | LIB_OBJS += $(OUTPUT)util/abspath.o |
395 | LIB_OBJS += util/alias.o | 423 | LIB_OBJS += $(OUTPUT)util/alias.o |
396 | LIB_OBJS += util/build-id.o | 424 | LIB_OBJS += $(OUTPUT)util/build-id.o |
397 | LIB_OBJS += util/config.o | 425 | LIB_OBJS += $(OUTPUT)util/config.o |
398 | LIB_OBJS += util/ctype.o | 426 | LIB_OBJS += $(OUTPUT)util/ctype.o |
399 | LIB_OBJS += util/debugfs.o | 427 | LIB_OBJS += $(OUTPUT)util/debugfs.o |
400 | LIB_OBJS += util/environment.o | 428 | LIB_OBJS += $(OUTPUT)util/environment.o |
401 | LIB_OBJS += util/event.o | 429 | LIB_OBJS += $(OUTPUT)util/event.o |
402 | LIB_OBJS += util/exec_cmd.o | 430 | LIB_OBJS += $(OUTPUT)util/exec_cmd.o |
403 | LIB_OBJS += util/help.o | 431 | LIB_OBJS += $(OUTPUT)util/help.o |
404 | LIB_OBJS += util/levenshtein.o | 432 | LIB_OBJS += $(OUTPUT)util/levenshtein.o |
405 | LIB_OBJS += util/parse-options.o | 433 | LIB_OBJS += $(OUTPUT)util/parse-options.o |
406 | LIB_OBJS += util/parse-events.o | 434 | LIB_OBJS += $(OUTPUT)util/parse-events.o |
407 | LIB_OBJS += util/path.o | 435 | LIB_OBJS += $(OUTPUT)util/path.o |
408 | LIB_OBJS += util/rbtree.o | 436 | LIB_OBJS += $(OUTPUT)util/rbtree.o |
409 | LIB_OBJS += util/bitmap.o | 437 | LIB_OBJS += $(OUTPUT)util/bitmap.o |
410 | LIB_OBJS += util/hweight.o | 438 | LIB_OBJS += $(OUTPUT)util/hweight.o |
411 | LIB_OBJS += util/find_next_bit.o | 439 | LIB_OBJS += $(OUTPUT)util/run-command.o |
412 | LIB_OBJS += util/run-command.o | 440 | LIB_OBJS += $(OUTPUT)util/quote.o |
413 | LIB_OBJS += util/quote.o | 441 | LIB_OBJS += $(OUTPUT)util/strbuf.o |
414 | LIB_OBJS += util/strbuf.o | 442 | LIB_OBJS += $(OUTPUT)util/string.o |
415 | LIB_OBJS += util/string.o | 443 | LIB_OBJS += $(OUTPUT)util/strlist.o |
416 | LIB_OBJS += util/strlist.o | 444 | LIB_OBJS += $(OUTPUT)util/usage.o |
417 | LIB_OBJS += util/usage.o | 445 | LIB_OBJS += $(OUTPUT)util/wrapper.o |
418 | LIB_OBJS += util/wrapper.o | 446 | LIB_OBJS += $(OUTPUT)util/sigchain.o |
419 | LIB_OBJS += util/sigchain.o | 447 | LIB_OBJS += $(OUTPUT)util/symbol.o |
420 | LIB_OBJS += util/symbol.o | 448 | LIB_OBJS += $(OUTPUT)util/color.o |
421 | LIB_OBJS += util/color.o | 449 | LIB_OBJS += $(OUTPUT)util/pager.o |
422 | LIB_OBJS += util/pager.o | 450 | LIB_OBJS += $(OUTPUT)util/header.o |
423 | LIB_OBJS += util/header.o | 451 | LIB_OBJS += $(OUTPUT)util/callchain.o |
424 | LIB_OBJS += util/callchain.o | 452 | LIB_OBJS += $(OUTPUT)util/values.o |
425 | LIB_OBJS += util/values.o | 453 | LIB_OBJS += $(OUTPUT)util/debug.o |
426 | LIB_OBJS += util/debug.o | 454 | LIB_OBJS += $(OUTPUT)util/map.o |
427 | LIB_OBJS += util/map.o | 455 | LIB_OBJS += $(OUTPUT)util/pstack.o |
428 | LIB_OBJS += util/session.o | 456 | LIB_OBJS += $(OUTPUT)util/session.o |
429 | LIB_OBJS += util/thread.o | 457 | LIB_OBJS += $(OUTPUT)util/thread.o |
430 | LIB_OBJS += util/trace-event-parse.o | 458 | LIB_OBJS += $(OUTPUT)util/trace-event-parse.o |
431 | LIB_OBJS += util/trace-event-read.o | 459 | LIB_OBJS += $(OUTPUT)util/trace-event-read.o |
432 | LIB_OBJS += util/trace-event-info.o | 460 | LIB_OBJS += $(OUTPUT)util/trace-event-info.o |
433 | LIB_OBJS += util/trace-event-scripting.o | 461 | LIB_OBJS += $(OUTPUT)util/trace-event-scripting.o |
434 | LIB_OBJS += util/svghelper.o | 462 | LIB_OBJS += $(OUTPUT)util/svghelper.o |
435 | LIB_OBJS += util/sort.o | 463 | LIB_OBJS += $(OUTPUT)util/sort.o |
436 | LIB_OBJS += util/hist.o | 464 | LIB_OBJS += $(OUTPUT)util/hist.o |
437 | LIB_OBJS += util/probe-event.o | 465 | LIB_OBJS += $(OUTPUT)util/probe-event.o |
438 | LIB_OBJS += util/util.o | 466 | LIB_OBJS += $(OUTPUT)util/util.o |
439 | LIB_OBJS += util/cpumap.o | 467 | LIB_OBJS += $(OUTPUT)util/cpumap.o |
440 | 468 | ||
441 | BUILTIN_OBJS += builtin-annotate.o | 469 | BUILTIN_OBJS += $(OUTPUT)builtin-annotate.o |
442 | 470 | ||
443 | BUILTIN_OBJS += builtin-bench.o | 471 | BUILTIN_OBJS += $(OUTPUT)builtin-bench.o |
444 | 472 | ||
445 | # Benchmark modules | 473 | # Benchmark modules |
446 | BUILTIN_OBJS += bench/sched-messaging.o | 474 | BUILTIN_OBJS += $(OUTPUT)bench/sched-messaging.o |
447 | BUILTIN_OBJS += bench/sched-pipe.o | 475 | BUILTIN_OBJS += $(OUTPUT)bench/sched-pipe.o |
448 | BUILTIN_OBJS += bench/mem-memcpy.o | 476 | BUILTIN_OBJS += $(OUTPUT)bench/mem-memcpy.o |
449 | 477 | ||
450 | BUILTIN_OBJS += builtin-diff.o | 478 | BUILTIN_OBJS += $(OUTPUT)builtin-diff.o |
451 | BUILTIN_OBJS += builtin-help.o | 479 | BUILTIN_OBJS += $(OUTPUT)builtin-help.o |
452 | BUILTIN_OBJS += builtin-sched.o | 480 | BUILTIN_OBJS += $(OUTPUT)builtin-sched.o |
453 | BUILTIN_OBJS += builtin-buildid-list.o | 481 | BUILTIN_OBJS += $(OUTPUT)builtin-buildid-list.o |
454 | BUILTIN_OBJS += builtin-buildid-cache.o | 482 | BUILTIN_OBJS += $(OUTPUT)builtin-buildid-cache.o |
455 | BUILTIN_OBJS += builtin-list.o | 483 | BUILTIN_OBJS += $(OUTPUT)builtin-list.o |
456 | BUILTIN_OBJS += builtin-record.o | 484 | BUILTIN_OBJS += $(OUTPUT)builtin-record.o |
457 | BUILTIN_OBJS += builtin-report.o | 485 | BUILTIN_OBJS += $(OUTPUT)builtin-report.o |
458 | BUILTIN_OBJS += builtin-stat.o | 486 | BUILTIN_OBJS += $(OUTPUT)builtin-stat.o |
459 | BUILTIN_OBJS += builtin-timechart.o | 487 | BUILTIN_OBJS += $(OUTPUT)builtin-timechart.o |
460 | BUILTIN_OBJS += builtin-top.o | 488 | BUILTIN_OBJS += $(OUTPUT)builtin-top.o |
461 | BUILTIN_OBJS += builtin-trace.o | 489 | BUILTIN_OBJS += $(OUTPUT)builtin-trace.o |
462 | BUILTIN_OBJS += builtin-probe.o | 490 | BUILTIN_OBJS += $(OUTPUT)builtin-probe.o |
463 | BUILTIN_OBJS += builtin-kmem.o | 491 | BUILTIN_OBJS += $(OUTPUT)builtin-kmem.o |
464 | BUILTIN_OBJS += builtin-lock.o | 492 | BUILTIN_OBJS += $(OUTPUT)builtin-lock.o |
493 | BUILTIN_OBJS += $(OUTPUT)builtin-kvm.o | ||
494 | BUILTIN_OBJS += $(OUTPUT)builtin-test.o | ||
495 | BUILTIN_OBJS += $(OUTPUT)builtin-inject.o | ||
465 | 496 | ||
466 | PERFLIBS = $(LIB_FILE) | 497 | PERFLIBS = $(LIB_FILE) |
467 | 498 | ||
@@ -476,6 +507,15 @@ PERFLIBS = $(LIB_FILE) | |||
476 | -include config.mak.autogen | 507 | -include config.mak.autogen |
477 | -include config.mak | 508 | -include config.mak |
478 | 509 | ||
510 | ifndef NO_DWARF | ||
511 | ifneq ($(shell sh -c "(echo '\#include <dwarf.h>'; echo '\#include <libdw.h>'; echo '\#include <version.h>'; echo '\#ifndef _ELFUTILS_PREREQ'; echo '\#error'; echo '\#endif'; echo 'int main(void) { Dwarf *dbg; dbg = dwarf_begin(0, DWARF_C_READ); return (long)dbg; }') | $(CC) -x c - $(ALL_CFLAGS) -I/usr/include/elfutils -ldw -lelf -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) | ||
512 | msg := $(warning No libdw.h found or old libdw.h found or elfutils is older than 0.138, disables dwarf support. Please install new elfutils-devel/libdw-dev); | ||
513 | NO_DWARF := 1 | ||
514 | endif # Dwarf support | ||
515 | endif # NO_DWARF | ||
516 | |||
517 | -include arch/$(ARCH)/Makefile | ||
518 | |||
479 | ifeq ($(uname_S),Darwin) | 519 | ifeq ($(uname_S),Darwin) |
480 | ifndef NO_FINK | 520 | ifndef NO_FINK |
481 | ifeq ($(shell test -d /sw/lib && echo y),y) | 521 | ifeq ($(shell test -d /sw/lib && echo y),y) |
@@ -492,6 +532,10 @@ ifeq ($(uname_S),Darwin) | |||
492 | PTHREAD_LIBS = | 532 | PTHREAD_LIBS = |
493 | endif | 533 | endif |
494 | 534 | ||
535 | ifneq ($(OUTPUT),) | ||
536 | BASIC_CFLAGS += -I$(OUTPUT) | ||
537 | endif | ||
538 | |||
495 | ifeq ($(shell sh -c "(echo '\#include <libelf.h>'; echo 'int main(void) { Elf * elf = elf_begin(0, ELF_C_READ, 0); return (long)elf; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) | 539 | ifeq ($(shell sh -c "(echo '\#include <libelf.h>'; echo 'int main(void) { Elf * elf = elf_begin(0, ELF_C_READ, 0); return (long)elf; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) |
496 | ifneq ($(shell sh -c "(echo '\#include <gnu/libc-version.h>'; echo 'int main(void) { const char * version = gnu_get_libc_version(); return (long)version; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) | 540 | ifneq ($(shell sh -c "(echo '\#include <gnu/libc-version.h>'; echo 'int main(void) { const char * version = gnu_get_libc_version(); return (long)version; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) |
497 | msg := $(error No gnu/libc-version.h found, please install glibc-dev[el]/glibc-static); | 541 | msg := $(error No gnu/libc-version.h found, please install glibc-dev[el]/glibc-static); |
@@ -504,13 +548,24 @@ else | |||
504 | msg := $(error No libelf.h/libelf found, please install libelf-dev/elfutils-libelf-devel and glibc-dev[el]); | 548 | msg := $(error No libelf.h/libelf found, please install libelf-dev/elfutils-libelf-devel and glibc-dev[el]); |
505 | endif | 549 | endif |
506 | 550 | ||
507 | ifneq ($(shell sh -c "(echo '\#include <dwarf.h>'; echo '\#include <libdw.h>'; echo 'int main(void) { Dwarf *dbg; dbg = dwarf_begin(0, DWARF_C_READ); return (long)dbg; }') | $(CC) -x c - $(ALL_CFLAGS) -I/usr/include/elfutils -ldw -lelf -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) | 551 | ifndef NO_DWARF |
508 | msg := $(warning No libdw.h found or old libdw.h found, disables dwarf support. Please install elfutils-devel/elfutils-dev); | 552 | ifeq ($(origin PERF_HAVE_DWARF_REGS), undefined) |
509 | BASIC_CFLAGS += -DNO_DWARF_SUPPORT | 553 | msg := $(warning DWARF register mappings have not been defined for architecture $(ARCH), DWARF support disabled); |
510 | else | 554 | else |
511 | BASIC_CFLAGS += -I/usr/include/elfutils | 555 | BASIC_CFLAGS += -I/usr/include/elfutils -DDWARF_SUPPORT |
512 | EXTLIBS += -lelf -ldw | 556 | EXTLIBS += -lelf -ldw |
513 | LIB_OBJS += util/probe-finder.o | 557 | LIB_OBJS += $(OUTPUT)util/probe-finder.o |
558 | endif # PERF_HAVE_DWARF_REGS | ||
559 | endif # NO_DWARF | ||
560 | |||
561 | ifneq ($(shell sh -c "(echo '\#include <newt.h>'; echo 'int main(void) { newtInit(); newtCls(); return newtFinished(); }') | $(CC) -x c - $(ALL_CFLAGS) -D_LARGEFILE64_SOURCE -D_FILE_OFFSET_BITS=64 -lnewt -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) | ||
562 | msg := $(warning newt not found, disables TUI support. Please install newt-devel or libnewt-dev); | ||
563 | BASIC_CFLAGS += -DNO_NEWT_SUPPORT | ||
564 | else | ||
565 | # Fedora has /usr/include/slang/slang.h, but ubuntu /usr/include/slang.h | ||
566 | BASIC_CFLAGS += -I/usr/include/slang | ||
567 | EXTLIBS += -lnewt | ||
568 | LIB_OBJS += $(OUTPUT)util/newt.o | ||
514 | endif | 569 | endif |
515 | 570 | ||
516 | ifndef NO_LIBPERL | 571 | ifndef NO_LIBPERL |
@@ -522,8 +577,8 @@ ifneq ($(shell sh -c "(echo '\#include <EXTERN.h>'; echo '\#include <perl.h>'; e | |||
522 | BASIC_CFLAGS += -DNO_LIBPERL | 577 | BASIC_CFLAGS += -DNO_LIBPERL |
523 | else | 578 | else |
524 | ALL_LDFLAGS += $(PERL_EMBED_LDOPTS) | 579 | ALL_LDFLAGS += $(PERL_EMBED_LDOPTS) |
525 | LIB_OBJS += util/scripting-engines/trace-event-perl.o | 580 | LIB_OBJS += $(OUTPUT)util/scripting-engines/trace-event-perl.o |
526 | LIB_OBJS += scripts/perl/Perf-Trace-Util/Context.o | 581 | LIB_OBJS += $(OUTPUT)scripts/perl/Perf-Trace-Util/Context.o |
527 | endif | 582 | endif |
528 | 583 | ||
529 | ifndef NO_LIBPYTHON | 584 | ifndef NO_LIBPYTHON |
@@ -531,16 +586,19 @@ PYTHON_EMBED_LDOPTS = `python-config --ldflags 2>/dev/null` | |||
531 | PYTHON_EMBED_CCOPTS = `python-config --cflags 2>/dev/null` | 586 | PYTHON_EMBED_CCOPTS = `python-config --cflags 2>/dev/null` |
532 | endif | 587 | endif |
533 | 588 | ||
534 | ifneq ($(shell sh -c "(echo '\#include <Python.h>'; echo 'int main(void) { Py_Initialize(); return 0; }') | $(CC) -x c - $(PYTHON_EMBED_CCOPTS) -o /dev/null $(PYTHON_EMBED_LDOPTS) > /dev/null 2>&1 && echo y"), y) | 589 | ifneq ($(shell sh -c "(echo '\#include <Python.h>'; echo 'int main(void) { Py_Initialize(); return 0; }') | $(CC) -x c - $(PYTHON_EMBED_CCOPTS) -o $(BITBUCKET) $(PYTHON_EMBED_LDOPTS) > /dev/null 2>&1 && echo y"), y) |
535 | BASIC_CFLAGS += -DNO_LIBPYTHON | 590 | BASIC_CFLAGS += -DNO_LIBPYTHON |
536 | else | 591 | else |
537 | ALL_LDFLAGS += $(PYTHON_EMBED_LDOPTS) | 592 | ALL_LDFLAGS += $(PYTHON_EMBED_LDOPTS) |
538 | LIB_OBJS += util/scripting-engines/trace-event-python.o | 593 | LIB_OBJS += $(OUTPUT)util/scripting-engines/trace-event-python.o |
539 | LIB_OBJS += scripts/python/Perf-Trace-Util/Context.o | 594 | LIB_OBJS += $(OUTPUT)scripts/python/Perf-Trace-Util/Context.o |
540 | endif | 595 | endif |
541 | 596 | ||
542 | ifdef NO_DEMANGLE | 597 | ifdef NO_DEMANGLE |
543 | BASIC_CFLAGS += -DNO_DEMANGLE | 598 | BASIC_CFLAGS += -DNO_DEMANGLE |
599 | else ifdef HAVE_CPLUS_DEMANGLE | ||
600 | EXTLIBS += -liberty | ||
601 | BASIC_CFLAGS += -DHAVE_CPLUS_DEMANGLE | ||
544 | else | 602 | else |
545 | has_bfd := $(shell sh -c "(echo '\#include <bfd.h>'; echo 'int main(void) { bfd_demangle(0, 0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -lbfd "$(QUIET_STDERR)" && echo y") | 603 | has_bfd := $(shell sh -c "(echo '\#include <bfd.h>'; echo 'int main(void) { bfd_demangle(0, 0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -lbfd "$(QUIET_STDERR)" && echo y") |
546 | 604 | ||
@@ -607,53 +665,53 @@ ifdef NO_C99_FORMAT | |||
607 | endif | 665 | endif |
608 | ifdef SNPRINTF_RETURNS_BOGUS | 666 | ifdef SNPRINTF_RETURNS_BOGUS |
609 | COMPAT_CFLAGS += -DSNPRINTF_RETURNS_BOGUS | 667 | COMPAT_CFLAGS += -DSNPRINTF_RETURNS_BOGUS |
610 | COMPAT_OBJS += compat/snprintf.o | 668 | COMPAT_OBJS += $(OUTPUT)compat/snprintf.o |
611 | endif | 669 | endif |
612 | ifdef FREAD_READS_DIRECTORIES | 670 | ifdef FREAD_READS_DIRECTORIES |
613 | COMPAT_CFLAGS += -DFREAD_READS_DIRECTORIES | 671 | COMPAT_CFLAGS += -DFREAD_READS_DIRECTORIES |
614 | COMPAT_OBJS += compat/fopen.o | 672 | COMPAT_OBJS += $(OUTPUT)compat/fopen.o |
615 | endif | 673 | endif |
616 | ifdef NO_SYMLINK_HEAD | 674 | ifdef NO_SYMLINK_HEAD |
617 | BASIC_CFLAGS += -DNO_SYMLINK_HEAD | 675 | BASIC_CFLAGS += -DNO_SYMLINK_HEAD |
618 | endif | 676 | endif |
619 | ifdef NO_STRCASESTR | 677 | ifdef NO_STRCASESTR |
620 | COMPAT_CFLAGS += -DNO_STRCASESTR | 678 | COMPAT_CFLAGS += -DNO_STRCASESTR |
621 | COMPAT_OBJS += compat/strcasestr.o | 679 | COMPAT_OBJS += $(OUTPUT)compat/strcasestr.o |
622 | endif | 680 | endif |
623 | ifdef NO_STRTOUMAX | 681 | ifdef NO_STRTOUMAX |
624 | COMPAT_CFLAGS += -DNO_STRTOUMAX | 682 | COMPAT_CFLAGS += -DNO_STRTOUMAX |
625 | COMPAT_OBJS += compat/strtoumax.o | 683 | COMPAT_OBJS += $(OUTPUT)compat/strtoumax.o |
626 | endif | 684 | endif |
627 | ifdef NO_STRTOULL | 685 | ifdef NO_STRTOULL |
628 | COMPAT_CFLAGS += -DNO_STRTOULL | 686 | COMPAT_CFLAGS += -DNO_STRTOULL |
629 | endif | 687 | endif |
630 | ifdef NO_SETENV | 688 | ifdef NO_SETENV |
631 | COMPAT_CFLAGS += -DNO_SETENV | 689 | COMPAT_CFLAGS += -DNO_SETENV |
632 | COMPAT_OBJS += compat/setenv.o | 690 | COMPAT_OBJS += $(OUTPUT)compat/setenv.o |
633 | endif | 691 | endif |
634 | ifdef NO_MKDTEMP | 692 | ifdef NO_MKDTEMP |
635 | COMPAT_CFLAGS += -DNO_MKDTEMP | 693 | COMPAT_CFLAGS += -DNO_MKDTEMP |
636 | COMPAT_OBJS += compat/mkdtemp.o | 694 | COMPAT_OBJS += $(OUTPUT)compat/mkdtemp.o |
637 | endif | 695 | endif |
638 | ifdef NO_UNSETENV | 696 | ifdef NO_UNSETENV |
639 | COMPAT_CFLAGS += -DNO_UNSETENV | 697 | COMPAT_CFLAGS += -DNO_UNSETENV |
640 | COMPAT_OBJS += compat/unsetenv.o | 698 | COMPAT_OBJS += $(OUTPUT)compat/unsetenv.o |
641 | endif | 699 | endif |
642 | ifdef NO_SYS_SELECT_H | 700 | ifdef NO_SYS_SELECT_H |
643 | BASIC_CFLAGS += -DNO_SYS_SELECT_H | 701 | BASIC_CFLAGS += -DNO_SYS_SELECT_H |
644 | endif | 702 | endif |
645 | ifdef NO_MMAP | 703 | ifdef NO_MMAP |
646 | COMPAT_CFLAGS += -DNO_MMAP | 704 | COMPAT_CFLAGS += -DNO_MMAP |
647 | COMPAT_OBJS += compat/mmap.o | 705 | COMPAT_OBJS += $(OUTPUT)compat/mmap.o |
648 | else | 706 | else |
649 | ifdef USE_WIN32_MMAP | 707 | ifdef USE_WIN32_MMAP |
650 | COMPAT_CFLAGS += -DUSE_WIN32_MMAP | 708 | COMPAT_CFLAGS += -DUSE_WIN32_MMAP |
651 | COMPAT_OBJS += compat/win32mmap.o | 709 | COMPAT_OBJS += $(OUTPUT)compat/win32mmap.o |
652 | endif | 710 | endif |
653 | endif | 711 | endif |
654 | ifdef NO_PREAD | 712 | ifdef NO_PREAD |
655 | COMPAT_CFLAGS += -DNO_PREAD | 713 | COMPAT_CFLAGS += -DNO_PREAD |
656 | COMPAT_OBJS += compat/pread.o | 714 | COMPAT_OBJS += $(OUTPUT)compat/pread.o |
657 | endif | 715 | endif |
658 | ifdef NO_FAST_WORKING_DIRECTORY | 716 | ifdef NO_FAST_WORKING_DIRECTORY |
659 | BASIC_CFLAGS += -DNO_FAST_WORKING_DIRECTORY | 717 | BASIC_CFLAGS += -DNO_FAST_WORKING_DIRECTORY |
@@ -675,10 +733,10 @@ else | |||
675 | endif | 733 | endif |
676 | endif | 734 | endif |
677 | ifdef NO_INET_NTOP | 735 | ifdef NO_INET_NTOP |
678 | LIB_OBJS += compat/inet_ntop.o | 736 | LIB_OBJS += $(OUTPUT)compat/inet_ntop.o |
679 | endif | 737 | endif |
680 | ifdef NO_INET_PTON | 738 | ifdef NO_INET_PTON |
681 | LIB_OBJS += compat/inet_pton.o | 739 | LIB_OBJS += $(OUTPUT)compat/inet_pton.o |
682 | endif | 740 | endif |
683 | 741 | ||
684 | ifdef NO_ICONV | 742 | ifdef NO_ICONV |
@@ -695,15 +753,15 @@ endif | |||
695 | 753 | ||
696 | ifdef PPC_SHA1 | 754 | ifdef PPC_SHA1 |
697 | SHA1_HEADER = "ppc/sha1.h" | 755 | SHA1_HEADER = "ppc/sha1.h" |
698 | LIB_OBJS += ppc/sha1.o ppc/sha1ppc.o | 756 | LIB_OBJS += $(OUTPUT)ppc/sha1.o ppc/sha1ppc.o |
699 | else | 757 | else |
700 | ifdef ARM_SHA1 | 758 | ifdef ARM_SHA1 |
701 | SHA1_HEADER = "arm/sha1.h" | 759 | SHA1_HEADER = "arm/sha1.h" |
702 | LIB_OBJS += arm/sha1.o arm/sha1_arm.o | 760 | LIB_OBJS += $(OUTPUT)arm/sha1.o $(OUTPUT)arm/sha1_arm.o |
703 | else | 761 | else |
704 | ifdef MOZILLA_SHA1 | 762 | ifdef MOZILLA_SHA1 |
705 | SHA1_HEADER = "mozilla-sha1/sha1.h" | 763 | SHA1_HEADER = "mozilla-sha1/sha1.h" |
706 | LIB_OBJS += mozilla-sha1/sha1.o | 764 | LIB_OBJS += $(OUTPUT)mozilla-sha1/sha1.o |
707 | else | 765 | else |
708 | SHA1_HEADER = <openssl/sha.h> | 766 | SHA1_HEADER = <openssl/sha.h> |
709 | EXTLIBS += $(LIB_4_CRYPTO) | 767 | EXTLIBS += $(LIB_4_CRYPTO) |
@@ -715,15 +773,15 @@ ifdef NO_PERL_MAKEMAKER | |||
715 | endif | 773 | endif |
716 | ifdef NO_HSTRERROR | 774 | ifdef NO_HSTRERROR |
717 | COMPAT_CFLAGS += -DNO_HSTRERROR | 775 | COMPAT_CFLAGS += -DNO_HSTRERROR |
718 | COMPAT_OBJS += compat/hstrerror.o | 776 | COMPAT_OBJS += $(OUTPUT)compat/hstrerror.o |
719 | endif | 777 | endif |
720 | ifdef NO_MEMMEM | 778 | ifdef NO_MEMMEM |
721 | COMPAT_CFLAGS += -DNO_MEMMEM | 779 | COMPAT_CFLAGS += -DNO_MEMMEM |
722 | COMPAT_OBJS += compat/memmem.o | 780 | COMPAT_OBJS += $(OUTPUT)compat/memmem.o |
723 | endif | 781 | endif |
724 | ifdef INTERNAL_QSORT | 782 | ifdef INTERNAL_QSORT |
725 | COMPAT_CFLAGS += -DINTERNAL_QSORT | 783 | COMPAT_CFLAGS += -DINTERNAL_QSORT |
726 | COMPAT_OBJS += compat/qsort.o | 784 | COMPAT_OBJS += $(OUTPUT)compat/qsort.o |
727 | endif | 785 | endif |
728 | ifdef RUNTIME_PREFIX | 786 | ifdef RUNTIME_PREFIX |
729 | COMPAT_CFLAGS += -DRUNTIME_PREFIX | 787 | COMPAT_CFLAGS += -DRUNTIME_PREFIX |
@@ -803,7 +861,7 @@ export TAR INSTALL DESTDIR SHELL_PATH | |||
803 | 861 | ||
804 | SHELL = $(SHELL_PATH) | 862 | SHELL = $(SHELL_PATH) |
805 | 863 | ||
806 | all:: .perf.dev.null shell_compatibility_test $(ALL_PROGRAMS) $(BUILT_INS) $(OTHER_PROGRAMS) PERF-BUILD-OPTIONS | 864 | all:: .perf.dev.null shell_compatibility_test $(ALL_PROGRAMS) $(BUILT_INS) $(OTHER_PROGRAMS) $(OUTPUT)PERF-BUILD-OPTIONS |
807 | ifneq (,$X) | 865 | ifneq (,$X) |
808 | $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) perf$X)), test '$p' -ef '$p$X' || $(RM) '$p';) | 866 | $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) perf$X)), test '$p' -ef '$p$X' || $(RM) '$p';) |
809 | endif | 867 | endif |
@@ -815,39 +873,39 @@ please_set_SHELL_PATH_to_a_more_modern_shell: | |||
815 | 873 | ||
816 | shell_compatibility_test: please_set_SHELL_PATH_to_a_more_modern_shell | 874 | shell_compatibility_test: please_set_SHELL_PATH_to_a_more_modern_shell |
817 | 875 | ||
818 | strip: $(PROGRAMS) perf$X | 876 | strip: $(PROGRAMS) $(OUTPUT)perf$X |
819 | $(STRIP) $(STRIP_OPTS) $(PROGRAMS) perf$X | 877 | $(STRIP) $(STRIP_OPTS) $(PROGRAMS) $(OUTPUT)perf$X |
820 | 878 | ||
821 | perf.o: perf.c common-cmds.h PERF-CFLAGS | 879 | $(OUTPUT)perf.o: perf.c $(OUTPUT)common-cmds.h $(OUTPUT)PERF-CFLAGS |
822 | $(QUIET_CC)$(CC) -DPERF_VERSION='"$(PERF_VERSION)"' \ | 880 | $(QUIET_CC)$(CC) -DPERF_VERSION='"$(PERF_VERSION)"' \ |
823 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ | 881 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ |
824 | $(ALL_CFLAGS) -c $(filter %.c,$^) | 882 | $(ALL_CFLAGS) -c $(filter %.c,$^) -o $@ |
825 | 883 | ||
826 | perf$X: perf.o $(BUILTIN_OBJS) $(PERFLIBS) | 884 | $(OUTPUT)perf$X: $(OUTPUT)perf.o $(BUILTIN_OBJS) $(PERFLIBS) |
827 | $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ perf.o \ | 885 | $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ $(OUTPUT)perf.o \ |
828 | $(BUILTIN_OBJS) $(ALL_LDFLAGS) $(LIBS) | 886 | $(BUILTIN_OBJS) $(ALL_LDFLAGS) $(LIBS) |
829 | 887 | ||
830 | builtin-help.o: builtin-help.c common-cmds.h PERF-CFLAGS | 888 | $(OUTPUT)builtin-help.o: builtin-help.c $(OUTPUT)common-cmds.h $(OUTPUT)PERF-CFLAGS |
831 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) \ | 889 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) \ |
832 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ | 890 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ |
833 | '-DPERF_MAN_PATH="$(mandir_SQ)"' \ | 891 | '-DPERF_MAN_PATH="$(mandir_SQ)"' \ |
834 | '-DPERF_INFO_PATH="$(infodir_SQ)"' $< | 892 | '-DPERF_INFO_PATH="$(infodir_SQ)"' $< |
835 | 893 | ||
836 | builtin-timechart.o: builtin-timechart.c common-cmds.h PERF-CFLAGS | 894 | $(OUTPUT)builtin-timechart.o: builtin-timechart.c $(OUTPUT)common-cmds.h $(OUTPUT)PERF-CFLAGS |
837 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) \ | 895 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) \ |
838 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ | 896 | '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ |
839 | '-DPERF_MAN_PATH="$(mandir_SQ)"' \ | 897 | '-DPERF_MAN_PATH="$(mandir_SQ)"' \ |
840 | '-DPERF_INFO_PATH="$(infodir_SQ)"' $< | 898 | '-DPERF_INFO_PATH="$(infodir_SQ)"' $< |
841 | 899 | ||
842 | $(BUILT_INS): perf$X | 900 | $(BUILT_INS): $(OUTPUT)perf$X |
843 | $(QUIET_BUILT_IN)$(RM) $@ && \ | 901 | $(QUIET_BUILT_IN)$(RM) $@ && \ |
844 | ln perf$X $@ 2>/dev/null || \ | 902 | ln perf$X $@ 2>/dev/null || \ |
845 | ln -s perf$X $@ 2>/dev/null || \ | 903 | ln -s perf$X $@ 2>/dev/null || \ |
846 | cp perf$X $@ | 904 | cp perf$X $@ |
847 | 905 | ||
848 | common-cmds.h: util/generate-cmdlist.sh command-list.txt | 906 | $(OUTPUT)common-cmds.h: util/generate-cmdlist.sh command-list.txt |
849 | 907 | ||
850 | common-cmds.h: $(wildcard Documentation/perf-*.txt) | 908 | $(OUTPUT)common-cmds.h: $(wildcard Documentation/perf-*.txt) |
851 | $(QUIET_GEN). util/generate-cmdlist.sh > $@+ && mv $@+ $@ | 909 | $(QUIET_GEN). util/generate-cmdlist.sh > $@+ && mv $@+ $@ |
852 | 910 | ||
853 | $(patsubst %.sh,%,$(SCRIPT_SH)) : % : %.sh | 911 | $(patsubst %.sh,%,$(SCRIPT_SH)) : % : %.sh |
@@ -859,7 +917,7 @@ $(patsubst %.sh,%,$(SCRIPT_SH)) : % : %.sh | |||
859 | -e 's/@@NO_CURL@@/$(NO_CURL)/g' \ | 917 | -e 's/@@NO_CURL@@/$(NO_CURL)/g' \ |
860 | $@.sh >$@+ && \ | 918 | $@.sh >$@+ && \ |
861 | chmod +x $@+ && \ | 919 | chmod +x $@+ && \ |
862 | mv $@+ $@ | 920 | mv $@+ $(OUTPUT)$@ |
863 | 921 | ||
864 | configure: configure.ac | 922 | configure: configure.ac |
865 | $(QUIET_GEN)$(RM) $@ $<+ && \ | 923 | $(QUIET_GEN)$(RM) $@ $<+ && \ |
@@ -869,60 +927,50 @@ configure: configure.ac | |||
869 | $(RM) $<+ | 927 | $(RM) $<+ |
870 | 928 | ||
871 | # These can record PERF_VERSION | 929 | # These can record PERF_VERSION |
872 | perf.o perf.spec \ | 930 | $(OUTPUT)perf.o perf.spec \ |
873 | $(patsubst %.sh,%,$(SCRIPT_SH)) \ | 931 | $(patsubst %.sh,%,$(SCRIPT_SH)) \ |
874 | $(patsubst %.perl,%,$(SCRIPT_PERL)) \ | 932 | $(patsubst %.perl,%,$(SCRIPT_PERL)) \ |
875 | : PERF-VERSION-FILE | 933 | : $(OUTPUT)PERF-VERSION-FILE |
876 | 934 | ||
877 | %.o: %.c PERF-CFLAGS | 935 | $(OUTPUT)%.o: %.c $(OUTPUT)PERF-CFLAGS |
878 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) $< | 936 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $< |
879 | %.s: %.c PERF-CFLAGS | 937 | $(OUTPUT)%.s: %.c $(OUTPUT)PERF-CFLAGS |
880 | $(QUIET_CC)$(CC) -S $(ALL_CFLAGS) $< | 938 | $(QUIET_CC)$(CC) -S $(ALL_CFLAGS) $< |
881 | %.o: %.S | 939 | $(OUTPUT)%.o: %.S |
882 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) $< | 940 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $< |
883 | 941 | ||
884 | util/exec_cmd.o: util/exec_cmd.c PERF-CFLAGS | 942 | $(OUTPUT)util/exec_cmd.o: util/exec_cmd.c $(OUTPUT)PERF-CFLAGS |
885 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) \ | 943 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) \ |
886 | '-DPERF_EXEC_PATH="$(perfexecdir_SQ)"' \ | 944 | '-DPERF_EXEC_PATH="$(perfexecdir_SQ)"' \ |
887 | '-DBINDIR="$(bindir_relative_SQ)"' \ | 945 | '-DBINDIR="$(bindir_relative_SQ)"' \ |
888 | '-DPREFIX="$(prefix_SQ)"' \ | 946 | '-DPREFIX="$(prefix_SQ)"' \ |
889 | $< | 947 | $< |
890 | 948 | ||
891 | builtin-init-db.o: builtin-init-db.c PERF-CFLAGS | 949 | $(OUTPUT)builtin-init-db.o: builtin-init-db.c $(OUTPUT)PERF-CFLAGS |
892 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) -DDEFAULT_PERF_TEMPLATE_DIR='"$(template_dir_SQ)"' $< | 950 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DDEFAULT_PERF_TEMPLATE_DIR='"$(template_dir_SQ)"' $< |
893 | |||
894 | util/config.o: util/config.c PERF-CFLAGS | ||
895 | $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< | ||
896 | |||
897 | util/rbtree.o: ../../lib/rbtree.c PERF-CFLAGS | ||
898 | $(QUIET_CC)$(CC) -o util/rbtree.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< | ||
899 | |||
900 | # some perf warning policies can't fit to lib/bitmap.c, eg: it warns about variable shadowing | ||
901 | # from <string.h> that comes from kernel headers wrapping. | ||
902 | KBITMAP_FLAGS=`echo $(ALL_CFLAGS) | sed s/-Wshadow// | sed s/-Wswitch-default// | sed s/-Wextra//` | ||
903 | 951 | ||
904 | util/bitmap.o: ../../lib/bitmap.c PERF-CFLAGS | 952 | $(OUTPUT)util/config.o: util/config.c $(OUTPUT)PERF-CFLAGS |
905 | $(QUIET_CC)$(CC) -o util/bitmap.o -c $(KBITMAP_FLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< | 953 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< |
906 | 954 | ||
907 | util/hweight.o: ../../lib/hweight.c PERF-CFLAGS | 955 | $(OUTPUT)util/newt.o: util/newt.c $(OUTPUT)PERF-CFLAGS |
908 | $(QUIET_CC)$(CC) -o util/hweight.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< | 956 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DENABLE_SLFUTURE_CONST $< |
909 | 957 | ||
910 | util/find_next_bit.o: ../../lib/find_next_bit.c PERF-CFLAGS | 958 | $(OUTPUT)util/rbtree.o: ../../lib/rbtree.c $(OUTPUT)PERF-CFLAGS |
911 | $(QUIET_CC)$(CC) -o util/find_next_bit.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< | 959 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< |
912 | 960 | ||
913 | util/scripting-engines/trace-event-perl.o: util/scripting-engines/trace-event-perl.c PERF-CFLAGS | 961 | $(OUTPUT)util/scripting-engines/trace-event-perl.o: util/scripting-engines/trace-event-perl.c $(OUTPUT)PERF-CFLAGS |
914 | $(QUIET_CC)$(CC) -o util/scripting-engines/trace-event-perl.o -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-shadow $< | 962 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-shadow $< |
915 | 963 | ||
916 | scripts/perl/Perf-Trace-Util/Context.o: scripts/perl/Perf-Trace-Util/Context.c PERF-CFLAGS | 964 | $(OUTPUT)scripts/perl/Perf-Trace-Util/Context.o: scripts/perl/Perf-Trace-Util/Context.c $(OUTPUT)PERF-CFLAGS |
917 | $(QUIET_CC)$(CC) -o scripts/perl/Perf-Trace-Util/Context.o -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs $< | 965 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs $< |
918 | 966 | ||
919 | util/scripting-engines/trace-event-python.o: util/scripting-engines/trace-event-python.c PERF-CFLAGS | 967 | $(OUTPUT)util/scripting-engines/trace-event-python.o: util/scripting-engines/trace-event-python.c $(OUTPUT)PERF-CFLAGS |
920 | $(QUIET_CC)$(CC) -o util/scripting-engines/trace-event-python.o -c $(ALL_CFLAGS) $(PYTHON_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-shadow $< | 968 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PYTHON_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-shadow $< |
921 | 969 | ||
922 | scripts/python/Perf-Trace-Util/Context.o: scripts/python/Perf-Trace-Util/Context.c PERF-CFLAGS | 970 | $(OUTPUT)scripts/python/Perf-Trace-Util/Context.o: scripts/python/Perf-Trace-Util/Context.c $(OUTPUT)PERF-CFLAGS |
923 | $(QUIET_CC)$(CC) -o scripts/python/Perf-Trace-Util/Context.o -c $(ALL_CFLAGS) $(PYTHON_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs $< | 971 | $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PYTHON_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs $< |
924 | 972 | ||
925 | perf-%$X: %.o $(PERFLIBS) | 973 | $(OUTPUT)perf-%$X: %.o $(PERFLIBS) |
926 | $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ $(ALL_LDFLAGS) $(filter %.o,$^) $(LIBS) | 974 | $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ $(ALL_LDFLAGS) $(filter %.o,$^) $(LIBS) |
927 | 975 | ||
928 | $(LIB_OBJS) $(BUILTIN_OBJS): $(LIB_H) | 976 | $(LIB_OBJS) $(BUILTIN_OBJS): $(LIB_H) |
@@ -963,17 +1011,17 @@ cscope: | |||
963 | TRACK_CFLAGS = $(subst ','\'',$(ALL_CFLAGS)):\ | 1011 | TRACK_CFLAGS = $(subst ','\'',$(ALL_CFLAGS)):\ |
964 | $(bindir_SQ):$(perfexecdir_SQ):$(template_dir_SQ):$(prefix_SQ) | 1012 | $(bindir_SQ):$(perfexecdir_SQ):$(template_dir_SQ):$(prefix_SQ) |
965 | 1013 | ||
966 | PERF-CFLAGS: .FORCE-PERF-CFLAGS | 1014 | $(OUTPUT)PERF-CFLAGS: .FORCE-PERF-CFLAGS |
967 | @FLAGS='$(TRACK_CFLAGS)'; \ | 1015 | @FLAGS='$(TRACK_CFLAGS)'; \ |
968 | if test x"$$FLAGS" != x"`cat PERF-CFLAGS 2>/dev/null`" ; then \ | 1016 | if test x"$$FLAGS" != x"`cat $(OUTPUT)PERF-CFLAGS 2>/dev/null`" ; then \ |
969 | echo 1>&2 " * new build flags or prefix"; \ | 1017 | echo 1>&2 " * new build flags or prefix"; \ |
970 | echo "$$FLAGS" >PERF-CFLAGS; \ | 1018 | echo "$$FLAGS" >$(OUTPUT)PERF-CFLAGS; \ |
971 | fi | 1019 | fi |
972 | 1020 | ||
973 | # We need to apply sq twice, once to protect from the shell | 1021 | # We need to apply sq twice, once to protect from the shell |
974 | # that runs PERF-BUILD-OPTIONS, and then again to protect it | 1022 | # that runs $(OUTPUT)PERF-BUILD-OPTIONS, and then again to protect it |
975 | # and the first level quoting from the shell that runs "echo". | 1023 | # and the first level quoting from the shell that runs "echo". |
976 | PERF-BUILD-OPTIONS: .FORCE-PERF-BUILD-OPTIONS | 1024 | $(OUTPUT)PERF-BUILD-OPTIONS: .FORCE-PERF-BUILD-OPTIONS |
977 | @echo SHELL_PATH=\''$(subst ','\'',$(SHELL_PATH_SQ))'\' >$@ | 1025 | @echo SHELL_PATH=\''$(subst ','\'',$(SHELL_PATH_SQ))'\' >$@ |
978 | @echo TAR=\''$(subst ','\'',$(subst ','\'',$(TAR)))'\' >>$@ | 1026 | @echo TAR=\''$(subst ','\'',$(subst ','\'',$(TAR)))'\' >>$@ |
979 | @echo NO_CURL=\''$(subst ','\'',$(subst ','\'',$(NO_CURL)))'\' >>$@ | 1027 | @echo NO_CURL=\''$(subst ','\'',$(subst ','\'',$(NO_CURL)))'\' >>$@ |
@@ -994,7 +1042,7 @@ all:: $(TEST_PROGRAMS) | |||
994 | 1042 | ||
995 | export NO_SVN_TESTS | 1043 | export NO_SVN_TESTS |
996 | 1044 | ||
997 | check: common-cmds.h | 1045 | check: $(OUTPUT)common-cmds.h |
998 | if sparse; \ | 1046 | if sparse; \ |
999 | then \ | 1047 | then \ |
1000 | for i in *.c */*.c; \ | 1048 | for i in *.c */*.c; \ |
@@ -1028,10 +1076,10 @@ export perfexec_instdir | |||
1028 | 1076 | ||
1029 | install: all | 1077 | install: all |
1030 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(bindir_SQ)' | 1078 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(bindir_SQ)' |
1031 | $(INSTALL) perf$X '$(DESTDIR_SQ)$(bindir_SQ)' | 1079 | $(INSTALL) $(OUTPUT)perf$X '$(DESTDIR_SQ)$(bindir_SQ)' |
1032 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace' | 1080 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace' |
1033 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin' | 1081 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin' |
1034 | $(INSTALL) perf-archive -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' | 1082 | $(INSTALL) $(OUTPUT)perf-archive -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' |
1035 | $(INSTALL) scripts/perl/Perf-Trace-Util/lib/Perf/Trace/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace' | 1083 | $(INSTALL) scripts/perl/Perf-Trace-Util/lib/Perf/Trace/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace' |
1036 | $(INSTALL) scripts/perl/*.pl -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl' | 1084 | $(INSTALL) scripts/perl/*.pl -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl' |
1037 | $(INSTALL) scripts/perl/bin/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin' | 1085 | $(INSTALL) scripts/perl/bin/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin' |
@@ -1045,7 +1093,7 @@ ifdef BUILT_INS | |||
1045 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' | 1093 | $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' |
1046 | $(INSTALL) $(BUILT_INS) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' | 1094 | $(INSTALL) $(BUILT_INS) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' |
1047 | ifneq (,$X) | 1095 | ifneq (,$X) |
1048 | $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) perf$X)), $(RM) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/$p';) | 1096 | $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) $(OUTPUT)perf$X)), $(RM) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/$p';) |
1049 | endif | 1097 | endif |
1050 | endif | 1098 | endif |
1051 | 1099 | ||
@@ -1129,14 +1177,14 @@ clean: | |||
1129 | $(RM) *.o */*.o */*/*.o */*/*/*.o $(LIB_FILE) | 1177 | $(RM) *.o */*.o */*/*.o */*/*/*.o $(LIB_FILE) |
1130 | $(RM) $(ALL_PROGRAMS) $(BUILT_INS) perf$X | 1178 | $(RM) $(ALL_PROGRAMS) $(BUILT_INS) perf$X |
1131 | $(RM) $(TEST_PROGRAMS) | 1179 | $(RM) $(TEST_PROGRAMS) |
1132 | $(RM) *.spec *.pyc *.pyo */*.pyc */*.pyo common-cmds.h TAGS tags cscope* | 1180 | $(RM) *.spec *.pyc *.pyo */*.pyc */*.pyo $(OUTPUT)common-cmds.h TAGS tags cscope* |
1133 | $(RM) -r autom4te.cache | 1181 | $(RM) -r autom4te.cache |
1134 | $(RM) config.log config.mak.autogen config.mak.append config.status config.cache | 1182 | $(RM) config.log config.mak.autogen config.mak.append config.status config.cache |
1135 | $(RM) -r $(PERF_TARNAME) .doc-tmp-dir | 1183 | $(RM) -r $(PERF_TARNAME) .doc-tmp-dir |
1136 | $(RM) $(PERF_TARNAME).tar.gz perf-core_$(PERF_VERSION)-*.tar.gz | 1184 | $(RM) $(PERF_TARNAME).tar.gz perf-core_$(PERF_VERSION)-*.tar.gz |
1137 | $(RM) $(htmldocs).tar.gz $(manpages).tar.gz | 1185 | $(RM) $(htmldocs).tar.gz $(manpages).tar.gz |
1138 | $(MAKE) -C Documentation/ clean | 1186 | $(MAKE) -C Documentation/ clean |
1139 | $(RM) PERF-VERSION-FILE PERF-CFLAGS PERF-BUILD-OPTIONS | 1187 | $(RM) $(OUTPUT)PERF-VERSION-FILE $(OUTPUT)PERF-CFLAGS $(OUTPUT)PERF-BUILD-OPTIONS |
1140 | 1188 | ||
1141 | .PHONY: all install clean strip | 1189 | .PHONY: all install clean strip |
1142 | .PHONY: shell_compatibility_test please_set_SHELL_PATH_to_a_more_modern_shell | 1190 | .PHONY: shell_compatibility_test please_set_SHELL_PATH_to_a_more_modern_shell |
diff --git a/tools/perf/arch/powerpc/Makefile b/tools/perf/arch/powerpc/Makefile new file mode 100644 index 000000000000..15130b50dfe3 --- /dev/null +++ b/tools/perf/arch/powerpc/Makefile | |||
@@ -0,0 +1,4 @@ | |||
1 | ifndef NO_DWARF | ||
2 | PERF_HAVE_DWARF_REGS := 1 | ||
3 | LIB_OBJS += $(OUTPUT)arch/$(ARCH)/util/dwarf-regs.o | ||
4 | endif | ||
diff --git a/tools/perf/arch/powerpc/util/dwarf-regs.c b/tools/perf/arch/powerpc/util/dwarf-regs.c new file mode 100644 index 000000000000..48ae0c5e3f73 --- /dev/null +++ b/tools/perf/arch/powerpc/util/dwarf-regs.c | |||
@@ -0,0 +1,88 @@ | |||
1 | /* | ||
2 | * Mapping of DWARF debug register numbers into register names. | ||
3 | * | ||
4 | * Copyright (C) 2010 Ian Munsie, IBM Corporation. | ||
5 | * | ||
6 | * This program is free software; you can redistribute it and/or | ||
7 | * modify it under the terms of the GNU General Public License | ||
8 | * as published by the Free Software Foundation; either version | ||
9 | * 2 of the License, or (at your option) any later version. | ||
10 | */ | ||
11 | |||
12 | #include <libio.h> | ||
13 | #include <dwarf-regs.h> | ||
14 | |||
15 | |||
/* One row of the lookup table: a register name and its DWARF number. */
struct pt_regs_dwarfnum {
	const char *name;
	unsigned int dwarfnum;
};

/*
 * Table row builders.  Initializers are positional and follow the field
 * order of struct pt_regs_dwarfnum: { name, dwarfnum }.
 */
#define REG_DWARFNUM_NAME(r, num)	{ r, num }
/* General purpose register: the name is "%gpr" followed by the number. */
#define GPR_DWARFNUM_NAME(num)		{ "%gpr" #num, num }
/* Sentinel row: a NULL name terminates the table walk. */
#define REG_DWARFNUM_END		{ NULL, 0 }

/*
 * Reference:
 * http://refspecs.linuxfoundation.org/ELF/ppc64/PPC-elf64abi-1.9.html
 */
static const struct pt_regs_dwarfnum regdwarfnum_table[] = {
	/* General purpose registers 0..31 */
	GPR_DWARFNUM_NAME(0),
	GPR_DWARFNUM_NAME(1),
	GPR_DWARFNUM_NAME(2),
	GPR_DWARFNUM_NAME(3),
	GPR_DWARFNUM_NAME(4),
	GPR_DWARFNUM_NAME(5),
	GPR_DWARFNUM_NAME(6),
	GPR_DWARFNUM_NAME(7),
	GPR_DWARFNUM_NAME(8),
	GPR_DWARFNUM_NAME(9),
	GPR_DWARFNUM_NAME(10),
	GPR_DWARFNUM_NAME(11),
	GPR_DWARFNUM_NAME(12),
	GPR_DWARFNUM_NAME(13),
	GPR_DWARFNUM_NAME(14),
	GPR_DWARFNUM_NAME(15),
	GPR_DWARFNUM_NAME(16),
	GPR_DWARFNUM_NAME(17),
	GPR_DWARFNUM_NAME(18),
	GPR_DWARFNUM_NAME(19),
	GPR_DWARFNUM_NAME(20),
	GPR_DWARFNUM_NAME(21),
	GPR_DWARFNUM_NAME(22),
	GPR_DWARFNUM_NAME(23),
	GPR_DWARFNUM_NAME(24),
	GPR_DWARFNUM_NAME(25),
	GPR_DWARFNUM_NAME(26),
	GPR_DWARFNUM_NAME(27),
	GPR_DWARFNUM_NAME(28),
	GPR_DWARFNUM_NAME(29),
	GPR_DWARFNUM_NAME(30),
	GPR_DWARFNUM_NAME(31),
	/* Other named registers */
	REG_DWARFNUM_NAME("%msr",   66),
	REG_DWARFNUM_NAME("%ctr",   109),
	REG_DWARFNUM_NAME("%link",  108),
	REG_DWARFNUM_NAME("%xer",   101),
	REG_DWARFNUM_NAME("%dar",   119),
	REG_DWARFNUM_NAME("%dsisr", 118),
	REG_DWARFNUM_END,
};

/**
 * get_arch_regstr() - look up a register name from its DWARF register number
 * @n: the DWARF register number
 *
 * Walks regdwarfnum_table from the start until the NULL-named sentinel row
 * and returns the name of the first row whose DWARF number equals @n.
 * Returns NULL if no row matches.
 */
const char *get_arch_regstr(unsigned int n)
{
	const struct pt_regs_dwarfnum *entry = regdwarfnum_table;

	while (entry->name != NULL) {
		if (entry->dwarfnum == n)
			return entry->name;
		entry++;
	}

	return NULL;
}
diff --git a/tools/perf/arch/x86/Makefile b/tools/perf/arch/x86/Makefile new file mode 100644 index 000000000000..15130b50dfe3 --- /dev/null +++ b/tools/perf/arch/x86/Makefile | |||
@@ -0,0 +1,4 @@ | |||
1 | ifndef NO_DWARF | ||
2 | PERF_HAVE_DWARF_REGS := 1 | ||
3 | LIB_OBJS += $(OUTPUT)arch/$(ARCH)/util/dwarf-regs.o | ||
4 | endif | ||
diff --git a/tools/perf/arch/x86/util/dwarf-regs.c b/tools/perf/arch/x86/util/dwarf-regs.c new file mode 100644 index 000000000000..a794d3081928 --- /dev/null +++ b/tools/perf/arch/x86/util/dwarf-regs.c | |||
@@ -0,0 +1,75 @@ | |||
1 | /* | ||
2 | * dwarf-regs.c : Mapping of DWARF debug register numbers into register names. | ||
3 | * Extracted from probe-finder.c | ||
4 | * | ||
5 | * Written by Masami Hiramatsu <mhiramat@redhat.com> | ||
6 | * | ||
7 | * This program is free software; you can redistribute it and/or modify | ||
8 | * it under the terms of the GNU General Public License as published by | ||
9 | * the Free Software Foundation; either version 2 of the License, or | ||
10 | * (at your option) any later version. | ||
11 | * | ||
12 | * This program is distributed in the hope that it will be useful, | ||
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
15 | * GNU General Public License for more details. | ||
16 | * | ||
17 | * You should have received a copy of the GNU General Public License | ||
18 | * along with this program; if not, write to the Free Software | ||
19 | * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. | ||
20 | * | ||
21 | */ | ||
22 | |||
23 | #include <libio.h> | ||
24 | #include <dwarf-regs.h> | ||
25 | |||
26 | /* | ||
27 | * Generic dwarf analysis helpers | ||
28 | */ | ||
29 | |||
/*
 * Register name tables.  get_arch_regstr() indexes the selected table
 * directly with the DWARF register number, so the position of each name
 * in its table is significant.
 */

/* 32-bit x86 */
#define X86_32_MAX_REGS 8
const char *x86_32_regs_table[X86_32_MAX_REGS] = {
	"%ax",
	"%cx",
	"%dx",
	"%bx",
	"$stack",	/* Stack address instead of %sp */
	"%bp",
	"%si",
	"%di",
};

/* 64-bit x86 */
#define X86_64_MAX_REGS 16
const char *x86_64_regs_table[X86_64_MAX_REGS] = {
	"%ax",
	"%dx",
	"%cx",
	"%bx",
	"%si",
	"%di",
	"%bp",
	"%sp",
	"%r8",
	"%r9",
	"%r10",
	"%r11",
	"%r12",
	"%r13",
	"%r14",
	"%r15",
};

/*
 * The table is chosen at compile time from the build target.
 * TODO: switching by dwarf address size
 */
#ifdef __x86_64__
#define ARCH_MAX_REGS X86_64_MAX_REGS
#define arch_regs_table x86_64_regs_table
#else
#define ARCH_MAX_REGS X86_32_MAX_REGS
#define arch_regs_table x86_32_regs_table
#endif

/*
 * Return architecture dependent register string (for kprobe-tracer).
 *
 * @n is the DWARF register number and is used as an index into
 * arch_regs_table.  Returns the register name, or NULL when @n is outside
 * the table.
 *
 * The table holds ARCH_MAX_REGS entries, so valid indexes are
 * 0 .. ARCH_MAX_REGS - 1.  The comparison must be strict: accepting
 * n == ARCH_MAX_REGS would read one element past the end of the array.
 */
const char *get_arch_regstr(unsigned int n)
{
	return (n < ARCH_MAX_REGS) ? arch_regs_table[n] : NULL;
}
diff --git a/tools/perf/bench/mem-memcpy.c b/tools/perf/bench/mem-memcpy.c index 89773178e894..38dae7465142 100644 --- a/tools/perf/bench/mem-memcpy.c +++ b/tools/perf/bench/mem-memcpy.c | |||
@@ -10,7 +10,6 @@ | |||
10 | #include "../perf.h" | 10 | #include "../perf.h" |
11 | #include "../util/util.h" | 11 | #include "../util/util.h" |
12 | #include "../util/parse-options.h" | 12 | #include "../util/parse-options.h" |
13 | #include "../util/string.h" | ||
14 | #include "../util/header.h" | 13 | #include "../util/header.h" |
15 | #include "bench.h" | 14 | #include "bench.h" |
16 | 15 | ||
@@ -24,7 +23,7 @@ | |||
24 | 23 | ||
25 | static const char *length_str = "1MB"; | 24 | static const char *length_str = "1MB"; |
26 | static const char *routine = "default"; | 25 | static const char *routine = "default"; |
27 | static int use_clock = 0; | 26 | static bool use_clock = false; |
28 | static int clock_fd; | 27 | static int clock_fd; |
29 | 28 | ||
30 | static const struct option options[] = { | 29 | static const struct option options[] = { |
diff --git a/tools/perf/bench/sched-messaging.c b/tools/perf/bench/sched-messaging.c index 81cee78181fa..da1b2e9f01ff 100644 --- a/tools/perf/bench/sched-messaging.c +++ b/tools/perf/bench/sched-messaging.c | |||
@@ -31,9 +31,9 @@ | |||
31 | 31 | ||
32 | #define DATASIZE 100 | 32 | #define DATASIZE 100 |
33 | 33 | ||
34 | static int use_pipes = 0; | 34 | static bool use_pipes = false; |
35 | static unsigned int loops = 100; | 35 | static unsigned int loops = 100; |
36 | static unsigned int thread_mode = 0; | 36 | static bool thread_mode = false; |
37 | static unsigned int num_groups = 10; | 37 | static unsigned int num_groups = 10; |
38 | 38 | ||
39 | struct sender_context { | 39 | struct sender_context { |
diff --git a/tools/perf/bench/sched-pipe.c b/tools/perf/bench/sched-pipe.c index 4f77c7c27640..d9ab3ce446ac 100644 --- a/tools/perf/bench/sched-pipe.c +++ b/tools/perf/bench/sched-pipe.c | |||
@@ -93,7 +93,7 @@ int bench_sched_pipe(int argc, const char **argv, | |||
93 | 93 | ||
94 | switch (bench_format) { | 94 | switch (bench_format) { |
95 | case BENCH_FORMAT_DEFAULT: | 95 | case BENCH_FORMAT_DEFAULT: |
96 | printf("# Extecuted %d pipe operations between two tasks\n\n", | 96 | printf("# Executed %d pipe operations between two tasks\n\n", |
97 | loops); | 97 | loops); |
98 | 98 | ||
99 | result_usec = diff.tv_sec * 1000000; | 99 | result_usec = diff.tv_sec * 1000000; |
diff --git a/tools/perf/builtin-annotate.c b/tools/perf/builtin-annotate.c index 6ad7148451c5..77bcc9b130f5 100644 --- a/tools/perf/builtin-annotate.c +++ b/tools/perf/builtin-annotate.c | |||
@@ -14,7 +14,6 @@ | |||
14 | #include "util/cache.h" | 14 | #include "util/cache.h" |
15 | #include <linux/rbtree.h> | 15 | #include <linux/rbtree.h> |
16 | #include "util/symbol.h" | 16 | #include "util/symbol.h" |
17 | #include "util/string.h" | ||
18 | 17 | ||
19 | #include "perf.h" | 18 | #include "perf.h" |
20 | #include "util/debug.h" | 19 | #include "util/debug.h" |
@@ -29,80 +28,16 @@ | |||
29 | 28 | ||
30 | static char const *input_name = "perf.data"; | 29 | static char const *input_name = "perf.data"; |
31 | 30 | ||
32 | static int force; | 31 | static bool force; |
33 | 32 | ||
34 | static int full_paths; | 33 | static bool full_paths; |
35 | 34 | ||
36 | static int print_line; | 35 | static bool print_line; |
37 | |||
38 | struct sym_hist { | ||
39 | u64 sum; | ||
40 | u64 ip[0]; | ||
41 | }; | ||
42 | |||
43 | struct sym_ext { | ||
44 | struct rb_node node; | ||
45 | double percent; | ||
46 | char *path; | ||
47 | }; | ||
48 | |||
49 | struct sym_priv { | ||
50 | struct sym_hist *hist; | ||
51 | struct sym_ext *ext; | ||
52 | }; | ||
53 | 36 | ||
54 | static const char *sym_hist_filter; | 37 | static const char *sym_hist_filter; |
55 | 38 | ||
56 | static int sym__alloc_hist(struct symbol *self) | 39 | static int hists__add_entry(struct hists *self, struct addr_location *al) |
57 | { | ||
58 | struct sym_priv *priv = symbol__priv(self); | ||
59 | const int size = (sizeof(*priv->hist) + | ||
60 | (self->end - self->start) * sizeof(u64)); | ||
61 | |||
62 | priv->hist = zalloc(size); | ||
63 | return priv->hist == NULL ? -1 : 0; | ||
64 | } | ||
65 | |||
66 | /* | ||
67 | * collect histogram counts | ||
68 | */ | ||
69 | static int annotate__hist_hit(struct hist_entry *he, u64 ip) | ||
70 | { | ||
71 | unsigned int sym_size, offset; | ||
72 | struct symbol *sym = he->sym; | ||
73 | struct sym_priv *priv; | ||
74 | struct sym_hist *h; | ||
75 | |||
76 | he->count++; | ||
77 | |||
78 | if (!sym || !he->map) | ||
79 | return 0; | ||
80 | |||
81 | priv = symbol__priv(sym); | ||
82 | if (priv->hist == NULL && sym__alloc_hist(sym) < 0) | ||
83 | return -ENOMEM; | ||
84 | |||
85 | sym_size = sym->end - sym->start; | ||
86 | offset = ip - sym->start; | ||
87 | |||
88 | pr_debug3("%s: ip=%#Lx\n", __func__, he->map->unmap_ip(he->map, ip)); | ||
89 | |||
90 | if (offset >= sym_size) | ||
91 | return 0; | ||
92 | |||
93 | h = priv->hist; | ||
94 | h->sum++; | ||
95 | h->ip[offset]++; | ||
96 | |||
97 | pr_debug3("%#Lx %s: count++ [ip: %#Lx, %#Lx] => %Ld\n", he->sym->start, | ||
98 | he->sym->name, ip, ip - he->sym->start, h->ip[offset]); | ||
99 | return 0; | ||
100 | } | ||
101 | |||
102 | static int perf_session__add_hist_entry(struct perf_session *self, | ||
103 | struct addr_location *al, u64 count) | ||
104 | { | 40 | { |
105 | bool hit; | ||
106 | struct hist_entry *he; | 41 | struct hist_entry *he; |
107 | 42 | ||
108 | if (sym_hist_filter != NULL && | 43 | if (sym_hist_filter != NULL && |
@@ -116,11 +51,11 @@ static int perf_session__add_hist_entry(struct perf_session *self, | |||
116 | return 0; | 51 | return 0; |
117 | } | 52 | } |
118 | 53 | ||
119 | he = __perf_session__add_hist_entry(&self->hists, al, NULL, count, &hit); | 54 | he = __hists__add_entry(self, al, NULL, 1); |
120 | if (he == NULL) | 55 | if (he == NULL) |
121 | return -ENOMEM; | 56 | return -ENOMEM; |
122 | 57 | ||
123 | return annotate__hist_hit(he, al->addr); | 58 | return hist_entry__inc_addr_samples(he, al->addr); |
124 | } | 59 | } |
125 | 60 | ||
126 | static int process_sample_event(event_t *event, struct perf_session *session) | 61 | static int process_sample_event(event_t *event, struct perf_session *session) |
@@ -136,7 +71,7 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
136 | return -1; | 71 | return -1; |
137 | } | 72 | } |
138 | 73 | ||
139 | if (!al.filtered && perf_session__add_hist_entry(session, &al, 1)) { | 74 | if (!al.filtered && hists__add_entry(&session->hists, &al)) { |
140 | pr_warning("problem incrementing symbol count, " | 75 | pr_warning("problem incrementing symbol count, " |
141 | "skipping event\n"); | 76 | "skipping event\n"); |
142 | return -1; | 77 | return -1; |
@@ -145,106 +80,11 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
145 | return 0; | 80 | return 0; |
146 | } | 81 | } |
147 | 82 | ||
148 | struct objdump_line { | ||
149 | struct list_head node; | ||
150 | s64 offset; | ||
151 | char *line; | ||
152 | }; | ||
153 | |||
154 | static struct objdump_line *objdump_line__new(s64 offset, char *line) | ||
155 | { | ||
156 | struct objdump_line *self = malloc(sizeof(*self)); | ||
157 | |||
158 | if (self != NULL) { | ||
159 | self->offset = offset; | ||
160 | self->line = line; | ||
161 | } | ||
162 | |||
163 | return self; | ||
164 | } | ||
165 | |||
166 | static void objdump_line__free(struct objdump_line *self) | ||
167 | { | ||
168 | free(self->line); | ||
169 | free(self); | ||
170 | } | ||
171 | |||
172 | static void objdump__add_line(struct list_head *head, struct objdump_line *line) | ||
173 | { | ||
174 | list_add_tail(&line->node, head); | ||
175 | } | ||
176 | |||
177 | static struct objdump_line *objdump__get_next_ip_line(struct list_head *head, | ||
178 | struct objdump_line *pos) | ||
179 | { | ||
180 | list_for_each_entry_continue(pos, head, node) | ||
181 | if (pos->offset >= 0) | ||
182 | return pos; | ||
183 | |||
184 | return NULL; | ||
185 | } | ||
186 | |||
187 | static int parse_line(FILE *file, struct hist_entry *he, | ||
188 | struct list_head *head) | ||
189 | { | ||
190 | struct symbol *sym = he->sym; | ||
191 | struct objdump_line *objdump_line; | ||
192 | char *line = NULL, *tmp, *tmp2; | ||
193 | size_t line_len; | ||
194 | s64 line_ip, offset = -1; | ||
195 | char *c; | ||
196 | |||
197 | if (getline(&line, &line_len, file) < 0) | ||
198 | return -1; | ||
199 | |||
200 | if (!line) | ||
201 | return -1; | ||
202 | |||
203 | c = strchr(line, '\n'); | ||
204 | if (c) | ||
205 | *c = 0; | ||
206 | |||
207 | line_ip = -1; | ||
208 | |||
209 | /* | ||
210 | * Strip leading spaces: | ||
211 | */ | ||
212 | tmp = line; | ||
213 | while (*tmp) { | ||
214 | if (*tmp != ' ') | ||
215 | break; | ||
216 | tmp++; | ||
217 | } | ||
218 | |||
219 | if (*tmp) { | ||
220 | /* | ||
221 | * Parse hexa addresses followed by ':' | ||
222 | */ | ||
223 | line_ip = strtoull(tmp, &tmp2, 16); | ||
224 | if (*tmp2 != ':') | ||
225 | line_ip = -1; | ||
226 | } | ||
227 | |||
228 | if (line_ip != -1) { | ||
229 | u64 start = map__rip_2objdump(he->map, sym->start); | ||
230 | offset = line_ip - start; | ||
231 | } | ||
232 | |||
233 | objdump_line = objdump_line__new(offset, line); | ||
234 | if (objdump_line == NULL) { | ||
235 | free(line); | ||
236 | return -1; | ||
237 | } | ||
238 | objdump__add_line(head, objdump_line); | ||
239 | |||
240 | return 0; | ||
241 | } | ||
242 | |||
243 | static int objdump_line__print(struct objdump_line *self, | 83 | static int objdump_line__print(struct objdump_line *self, |
244 | struct list_head *head, | 84 | struct list_head *head, |
245 | struct hist_entry *he, u64 len) | 85 | struct hist_entry *he, u64 len) |
246 | { | 86 | { |
247 | struct symbol *sym = he->sym; | 87 | struct symbol *sym = he->ms.sym; |
248 | static const char *prev_line; | 88 | static const char *prev_line; |
249 | static const char *prev_color; | 89 | static const char *prev_color; |
250 | 90 | ||
@@ -327,7 +167,7 @@ static void insert_source_line(struct sym_ext *sym_ext) | |||
327 | 167 | ||
328 | static void free_source_line(struct hist_entry *he, int len) | 168 | static void free_source_line(struct hist_entry *he, int len) |
329 | { | 169 | { |
330 | struct sym_priv *priv = symbol__priv(he->sym); | 170 | struct sym_priv *priv = symbol__priv(he->ms.sym); |
331 | struct sym_ext *sym_ext = priv->ext; | 171 | struct sym_ext *sym_ext = priv->ext; |
332 | int i; | 172 | int i; |
333 | 173 | ||
@@ -346,7 +186,7 @@ static void free_source_line(struct hist_entry *he, int len) | |||
346 | static void | 186 | static void |
347 | get_source_line(struct hist_entry *he, int len, const char *filename) | 187 | get_source_line(struct hist_entry *he, int len, const char *filename) |
348 | { | 188 | { |
349 | struct symbol *sym = he->sym; | 189 | struct symbol *sym = he->ms.sym; |
350 | u64 start; | 190 | u64 start; |
351 | int i; | 191 | int i; |
352 | char cmd[PATH_MAX * 2]; | 192 | char cmd[PATH_MAX * 2]; |
@@ -361,7 +201,7 @@ get_source_line(struct hist_entry *he, int len, const char *filename) | |||
361 | if (!priv->ext) | 201 | if (!priv->ext) |
362 | return; | 202 | return; |
363 | 203 | ||
364 | start = he->map->unmap_ip(he->map, sym->start); | 204 | start = he->ms.map->unmap_ip(he->ms.map, sym->start); |
365 | 205 | ||
366 | for (i = 0; i < len; i++) { | 206 | for (i = 0; i < len; i++) { |
367 | char *path = NULL; | 207 | char *path = NULL; |
@@ -425,7 +265,7 @@ static void print_summary(const char *filename) | |||
425 | 265 | ||
426 | static void hist_entry__print_hits(struct hist_entry *self) | 266 | static void hist_entry__print_hits(struct hist_entry *self) |
427 | { | 267 | { |
428 | struct symbol *sym = self->sym; | 268 | struct symbol *sym = self->ms.sym; |
429 | struct sym_priv *priv = symbol__priv(sym); | 269 | struct sym_priv *priv = symbol__priv(sym); |
430 | struct sym_hist *h = priv->hist; | 270 | struct sym_hist *h = priv->hist; |
431 | u64 len = sym->end - sym->start, offset; | 271 | u64 len = sym->end - sym->start, offset; |
@@ -439,23 +279,17 @@ static void hist_entry__print_hits(struct hist_entry *self) | |||
439 | 279 | ||
440 | static void annotate_sym(struct hist_entry *he) | 280 | static void annotate_sym(struct hist_entry *he) |
441 | { | 281 | { |
442 | struct map *map = he->map; | 282 | struct map *map = he->ms.map; |
443 | struct dso *dso = map->dso; | 283 | struct dso *dso = map->dso; |
444 | struct symbol *sym = he->sym; | 284 | struct symbol *sym = he->ms.sym; |
445 | const char *filename = dso->long_name, *d_filename; | 285 | const char *filename = dso->long_name, *d_filename; |
446 | u64 len; | 286 | u64 len; |
447 | char command[PATH_MAX*2]; | ||
448 | FILE *file; | ||
449 | LIST_HEAD(head); | 287 | LIST_HEAD(head); |
450 | struct objdump_line *pos, *n; | 288 | struct objdump_line *pos, *n; |
451 | 289 | ||
452 | if (!filename) | 290 | if (hist_entry__annotate(he, &head) < 0) |
453 | return; | 291 | return; |
454 | 292 | ||
455 | pr_debug("%s: filename=%s, sym=%s, start=%#Lx, end=%#Lx\n", __func__, | ||
456 | filename, sym->name, map->unmap_ip(map, sym->start), | ||
457 | map->unmap_ip(map, sym->end)); | ||
458 | |||
459 | if (full_paths) | 293 | if (full_paths) |
460 | d_filename = filename; | 294 | d_filename = filename; |
461 | else | 295 | else |
@@ -472,29 +306,6 @@ static void annotate_sym(struct hist_entry *he) | |||
472 | printf(" Percent | Source code & Disassembly of %s\n", d_filename); | 306 | printf(" Percent | Source code & Disassembly of %s\n", d_filename); |
473 | printf("------------------------------------------------\n"); | 307 | printf("------------------------------------------------\n"); |
474 | 308 | ||
475 | if (verbose >= 2) | ||
476 | printf("annotating [%p] %30s : [%p] %30s\n", | ||
477 | dso, dso->long_name, sym, sym->name); | ||
478 | |||
479 | sprintf(command, "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s", | ||
480 | map__rip_2objdump(map, sym->start), | ||
481 | map__rip_2objdump(map, sym->end), | ||
482 | filename, filename); | ||
483 | |||
484 | if (verbose >= 3) | ||
485 | printf("doing: %s\n", command); | ||
486 | |||
487 | file = popen(command, "r"); | ||
488 | if (!file) | ||
489 | return; | ||
490 | |||
491 | while (!feof(file)) { | ||
492 | if (parse_line(file, he, &head) < 0) | ||
493 | break; | ||
494 | } | ||
495 | |||
496 | pclose(file); | ||
497 | |||
498 | if (verbose) | 309 | if (verbose) |
499 | hist_entry__print_hits(he); | 310 | hist_entry__print_hits(he); |
500 | 311 | ||
@@ -508,25 +319,25 @@ static void annotate_sym(struct hist_entry *he) | |||
508 | free_source_line(he, len); | 319 | free_source_line(he, len); |
509 | } | 320 | } |
510 | 321 | ||
511 | static void perf_session__find_annotations(struct perf_session *self) | 322 | static void hists__find_annotations(struct hists *self) |
512 | { | 323 | { |
513 | struct rb_node *nd; | 324 | struct rb_node *nd; |
514 | 325 | ||
515 | for (nd = rb_first(&self->hists); nd; nd = rb_next(nd)) { | 326 | for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) { |
516 | struct hist_entry *he = rb_entry(nd, struct hist_entry, rb_node); | 327 | struct hist_entry *he = rb_entry(nd, struct hist_entry, rb_node); |
517 | struct sym_priv *priv; | 328 | struct sym_priv *priv; |
518 | 329 | ||
519 | if (he->sym == NULL) | 330 | if (he->ms.sym == NULL) |
520 | continue; | 331 | continue; |
521 | 332 | ||
522 | priv = symbol__priv(he->sym); | 333 | priv = symbol__priv(he->ms.sym); |
523 | if (priv->hist == NULL) | 334 | if (priv->hist == NULL) |
524 | continue; | 335 | continue; |
525 | 336 | ||
526 | annotate_sym(he); | 337 | annotate_sym(he); |
527 | /* | 338 | /* |
528 | * Since we have a hist_entry per IP for the same symbol, free | 339 | * Since we have a hist_entry per IP for the same symbol, free |
529 | * he->sym->hist to signal we already processed this symbol. | 340 | * he->ms.sym->hist to signal we already processed this symbol. |
530 | */ | 341 | */ |
531 | free(priv->hist); | 342 | free(priv->hist); |
532 | priv->hist = NULL; | 343 | priv->hist = NULL; |
@@ -545,7 +356,7 @@ static int __cmd_annotate(void) | |||
545 | int ret; | 356 | int ret; |
546 | struct perf_session *session; | 357 | struct perf_session *session; |
547 | 358 | ||
548 | session = perf_session__new(input_name, O_RDONLY, force); | 359 | session = perf_session__new(input_name, O_RDONLY, force, false); |
549 | if (session == NULL) | 360 | if (session == NULL) |
550 | return -ENOMEM; | 361 | return -ENOMEM; |
551 | 362 | ||
@@ -554,7 +365,7 @@ static int __cmd_annotate(void) | |||
554 | goto out_delete; | 365 | goto out_delete; |
555 | 366 | ||
556 | if (dump_trace) { | 367 | if (dump_trace) { |
557 | event__print_totals(); | 368 | perf_session__fprintf_nr_events(session, stdout); |
558 | goto out_delete; | 369 | goto out_delete; |
559 | } | 370 | } |
560 | 371 | ||
@@ -562,11 +373,11 @@ static int __cmd_annotate(void) | |||
562 | perf_session__fprintf(session, stdout); | 373 | perf_session__fprintf(session, stdout); |
563 | 374 | ||
564 | if (verbose > 2) | 375 | if (verbose > 2) |
565 | dsos__fprintf(stdout); | 376 | perf_session__fprintf_dsos(session, stdout); |
566 | 377 | ||
567 | perf_session__collapse_resort(&session->hists); | 378 | hists__collapse_resort(&session->hists); |
568 | perf_session__output_resort(&session->hists, session->event_total[0]); | 379 | hists__output_resort(&session->hists); |
569 | perf_session__find_annotations(session); | 380 | hists__find_annotations(&session->hists); |
570 | out_delete: | 381 | out_delete: |
571 | perf_session__delete(session); | 382 | perf_session__delete(session); |
572 | 383 | ||
@@ -581,10 +392,12 @@ static const char * const annotate_usage[] = { | |||
581 | static const struct option options[] = { | 392 | static const struct option options[] = { |
582 | OPT_STRING('i', "input", &input_name, "file", | 393 | OPT_STRING('i', "input", &input_name, "file", |
583 | "input file name"), | 394 | "input file name"), |
395 | OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]", | ||
396 | "only consider symbols in these dsos"), | ||
584 | OPT_STRING('s', "symbol", &sym_hist_filter, "symbol", | 397 | OPT_STRING('s', "symbol", &sym_hist_filter, "symbol", |
585 | "symbol to annotate"), | 398 | "symbol to annotate"), |
586 | OPT_BOOLEAN('f', "force", &force, "don't complain, do it"), | 399 | OPT_BOOLEAN('f', "force", &force, "don't complain, do it"), |
587 | OPT_BOOLEAN('v', "verbose", &verbose, | 400 | OPT_INCR('v', "verbose", &verbose, |
588 | "be more verbose (show symbol address, etc)"), | 401 | "be more verbose (show symbol address, etc)"), |
589 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, | 402 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, |
590 | "dump raw trace in ASCII"), | 403 | "dump raw trace in ASCII"), |
diff --git a/tools/perf/builtin-buildid-cache.c b/tools/perf/builtin-buildid-cache.c index 30a05f552c96..f8e3d1852029 100644 --- a/tools/perf/builtin-buildid-cache.c +++ b/tools/perf/builtin-buildid-cache.c | |||
@@ -27,7 +27,7 @@ static const struct option buildid_cache_options[] = { | |||
27 | "file list", "file(s) to add"), | 27 | "file list", "file(s) to add"), |
28 | OPT_STRING('r', "remove", &remove_name_list_str, "file list", | 28 | OPT_STRING('r', "remove", &remove_name_list_str, "file list", |
29 | "file(s) to remove"), | 29 | "file(s) to remove"), |
30 | OPT_BOOLEAN('v', "verbose", &verbose, "be more verbose"), | 30 | OPT_INCR('v', "verbose", &verbose, "be more verbose"), |
31 | OPT_END() | 31 | OPT_END() |
32 | }; | 32 | }; |
33 | 33 | ||
diff --git a/tools/perf/builtin-buildid-list.c b/tools/perf/builtin-buildid-list.c index d0675c02f81e..44a47e13bd67 100644 --- a/tools/perf/builtin-buildid-list.c +++ b/tools/perf/builtin-buildid-list.c | |||
@@ -16,7 +16,7 @@ | |||
16 | #include "util/symbol.h" | 16 | #include "util/symbol.h" |
17 | 17 | ||
18 | static char const *input_name = "perf.data"; | 18 | static char const *input_name = "perf.data"; |
19 | static int force; | 19 | static bool force; |
20 | static bool with_hits; | 20 | static bool with_hits; |
21 | 21 | ||
22 | static const char * const buildid_list_usage[] = { | 22 | static const char * const buildid_list_usage[] = { |
@@ -29,7 +29,7 @@ static const struct option options[] = { | |||
29 | OPT_STRING('i', "input", &input_name, "file", | 29 | OPT_STRING('i', "input", &input_name, "file", |
30 | "input file name"), | 30 | "input file name"), |
31 | OPT_BOOLEAN('f', "force", &force, "don't complain, do it"), | 31 | OPT_BOOLEAN('f', "force", &force, "don't complain, do it"), |
32 | OPT_BOOLEAN('v', "verbose", &verbose, | 32 | OPT_INCR('v', "verbose", &verbose, |
33 | "be more verbose"), | 33 | "be more verbose"), |
34 | OPT_END() | 34 | OPT_END() |
35 | }; | 35 | }; |
@@ -39,14 +39,14 @@ static int __cmd_buildid_list(void) | |||
39 | int err = -1; | 39 | int err = -1; |
40 | struct perf_session *session; | 40 | struct perf_session *session; |
41 | 41 | ||
42 | session = perf_session__new(input_name, O_RDONLY, force); | 42 | session = perf_session__new(input_name, O_RDONLY, force, false); |
43 | if (session == NULL) | 43 | if (session == NULL) |
44 | return -1; | 44 | return -1; |
45 | 45 | ||
46 | if (with_hits) | 46 | if (with_hits) |
47 | perf_session__process_events(session, &build_id__mark_dso_hit_ops); | 47 | perf_session__process_events(session, &build_id__mark_dso_hit_ops); |
48 | 48 | ||
49 | dsos__fprintf_buildid(stdout, with_hits); | 49 | perf_session__fprintf_dsos_buildid(session, stdout, with_hits); |
50 | 50 | ||
51 | perf_session__delete(session); | 51 | perf_session__delete(session); |
52 | return err; | 52 | return err; |
diff --git a/tools/perf/builtin-diff.c b/tools/perf/builtin-diff.c index 1ea15d8aeed1..a6e2fdc7a04e 100644 --- a/tools/perf/builtin-diff.c +++ b/tools/perf/builtin-diff.c | |||
@@ -19,23 +19,15 @@ | |||
19 | static char const *input_old = "perf.data.old", | 19 | static char const *input_old = "perf.data.old", |
20 | *input_new = "perf.data"; | 20 | *input_new = "perf.data"; |
21 | static char diff__default_sort_order[] = "dso,symbol"; | 21 | static char diff__default_sort_order[] = "dso,symbol"; |
22 | static int force; | 22 | static bool force; |
23 | static bool show_displacement; | 23 | static bool show_displacement; |
24 | 24 | ||
25 | static int perf_session__add_hist_entry(struct perf_session *self, | 25 | static int hists__add_entry(struct hists *self, |
26 | struct addr_location *al, u64 count) | 26 | struct addr_location *al, u64 period) |
27 | { | 27 | { |
28 | bool hit; | 28 | if (__hists__add_entry(self, al, NULL, period) != NULL) |
29 | struct hist_entry *he = __perf_session__add_hist_entry(&self->hists, | 29 | return 0; |
30 | al, NULL, | 30 | return -ENOMEM; |
31 | count, &hit); | ||
32 | if (he == NULL) | ||
33 | return -ENOMEM; | ||
34 | |||
35 | if (hit) | ||
36 | he->count += count; | ||
37 | |||
38 | return 0; | ||
39 | } | 31 | } |
40 | 32 | ||
41 | static int diff__process_sample_event(event_t *event, struct perf_session *session) | 33 | static int diff__process_sample_event(event_t *event, struct perf_session *session) |
@@ -57,12 +49,12 @@ static int diff__process_sample_event(event_t *event, struct perf_session *sessi | |||
57 | 49 | ||
58 | event__parse_sample(event, session->sample_type, &data); | 50 | event__parse_sample(event, session->sample_type, &data); |
59 | 51 | ||
60 | if (perf_session__add_hist_entry(session, &al, data.period)) { | 52 | if (hists__add_entry(&session->hists, &al, data.period)) { |
61 | pr_warning("problem incrementing symbol count, skipping event\n"); | 53 | pr_warning("problem incrementing symbol period, skipping event\n"); |
62 | return -1; | 54 | return -1; |
63 | } | 55 | } |
64 | 56 | ||
65 | session->events_stats.total += data.period; | 57 | session->hists.stats.total_period += data.period; |
66 | return 0; | 58 | return 0; |
67 | } | 59 | } |
68 | 60 | ||
@@ -95,35 +87,34 @@ static void perf_session__insert_hist_entry_by_name(struct rb_root *root, | |||
95 | rb_insert_color(&he->rb_node, root); | 87 | rb_insert_color(&he->rb_node, root); |
96 | } | 88 | } |
97 | 89 | ||
98 | static void perf_session__resort_hist_entries(struct perf_session *self) | 90 | static void hists__resort_entries(struct hists *self) |
99 | { | 91 | { |
100 | unsigned long position = 1; | 92 | unsigned long position = 1; |
101 | struct rb_root tmp = RB_ROOT; | 93 | struct rb_root tmp = RB_ROOT; |
102 | struct rb_node *next = rb_first(&self->hists); | 94 | struct rb_node *next = rb_first(&self->entries); |
103 | 95 | ||
104 | while (next != NULL) { | 96 | while (next != NULL) { |
105 | struct hist_entry *n = rb_entry(next, struct hist_entry, rb_node); | 97 | struct hist_entry *n = rb_entry(next, struct hist_entry, rb_node); |
106 | 98 | ||
107 | next = rb_next(&n->rb_node); | 99 | next = rb_next(&n->rb_node); |
108 | rb_erase(&n->rb_node, &self->hists); | 100 | rb_erase(&n->rb_node, &self->entries); |
109 | n->position = position++; | 101 | n->position = position++; |
110 | perf_session__insert_hist_entry_by_name(&tmp, n); | 102 | perf_session__insert_hist_entry_by_name(&tmp, n); |
111 | } | 103 | } |
112 | 104 | ||
113 | self->hists = tmp; | 105 | self->entries = tmp; |
114 | } | 106 | } |
115 | 107 | ||
116 | static void perf_session__set_hist_entries_positions(struct perf_session *self) | 108 | static void hists__set_positions(struct hists *self) |
117 | { | 109 | { |
118 | perf_session__output_resort(&self->hists, self->events_stats.total); | 110 | hists__output_resort(self); |
119 | perf_session__resort_hist_entries(self); | 111 | hists__resort_entries(self); |
120 | } | 112 | } |
121 | 113 | ||
122 | static struct hist_entry * | 114 | static struct hist_entry *hists__find_entry(struct hists *self, |
123 | perf_session__find_hist_entry(struct perf_session *self, | 115 | struct hist_entry *he) |
124 | struct hist_entry *he) | ||
125 | { | 116 | { |
126 | struct rb_node *n = self->hists.rb_node; | 117 | struct rb_node *n = self->entries.rb_node; |
127 | 118 | ||
128 | while (n) { | 119 | while (n) { |
129 | struct hist_entry *iter = rb_entry(n, struct hist_entry, rb_node); | 120 | struct hist_entry *iter = rb_entry(n, struct hist_entry, rb_node); |
@@ -140,14 +131,13 @@ perf_session__find_hist_entry(struct perf_session *self, | |||
140 | return NULL; | 131 | return NULL; |
141 | } | 132 | } |
142 | 133 | ||
143 | static void perf_session__match_hists(struct perf_session *old_session, | 134 | static void hists__match(struct hists *older, struct hists *newer) |
144 | struct perf_session *new_session) | ||
145 | { | 135 | { |
146 | struct rb_node *nd; | 136 | struct rb_node *nd; |
147 | 137 | ||
148 | for (nd = rb_first(&new_session->hists); nd; nd = rb_next(nd)) { | 138 | for (nd = rb_first(&newer->entries); nd; nd = rb_next(nd)) { |
149 | struct hist_entry *pos = rb_entry(nd, struct hist_entry, rb_node); | 139 | struct hist_entry *pos = rb_entry(nd, struct hist_entry, rb_node); |
150 | pos->pair = perf_session__find_hist_entry(old_session, pos); | 140 | pos->pair = hists__find_entry(older, pos); |
151 | } | 141 | } |
152 | } | 142 | } |
153 | 143 | ||
@@ -156,8 +146,8 @@ static int __cmd_diff(void) | |||
156 | int ret, i; | 146 | int ret, i; |
157 | struct perf_session *session[2]; | 147 | struct perf_session *session[2]; |
158 | 148 | ||
159 | session[0] = perf_session__new(input_old, O_RDONLY, force); | 149 | session[0] = perf_session__new(input_old, O_RDONLY, force, false); |
160 | session[1] = perf_session__new(input_new, O_RDONLY, force); | 150 | session[1] = perf_session__new(input_new, O_RDONLY, force, false); |
161 | if (session[0] == NULL || session[1] == NULL) | 151 | if (session[0] == NULL || session[1] == NULL) |
162 | return -ENOMEM; | 152 | return -ENOMEM; |
163 | 153 | ||
@@ -167,15 +157,13 @@ static int __cmd_diff(void) | |||
167 | goto out_delete; | 157 | goto out_delete; |
168 | } | 158 | } |
169 | 159 | ||
170 | perf_session__output_resort(&session[1]->hists, | 160 | hists__output_resort(&session[1]->hists); |
171 | session[1]->events_stats.total); | ||
172 | if (show_displacement) | 161 | if (show_displacement) |
173 | perf_session__set_hist_entries_positions(session[0]); | 162 | hists__set_positions(&session[0]->hists); |
174 | 163 | ||
175 | perf_session__match_hists(session[0], session[1]); | 164 | hists__match(&session[0]->hists, &session[1]->hists); |
176 | perf_session__fprintf_hists(&session[1]->hists, session[0], | 165 | hists__fprintf(&session[1]->hists, &session[0]->hists, |
177 | show_displacement, stdout, | 166 | show_displacement, stdout); |
178 | session[1]->events_stats.total); | ||
179 | out_delete: | 167 | out_delete: |
180 | for (i = 0; i < 2; ++i) | 168 | for (i = 0; i < 2; ++i) |
181 | perf_session__delete(session[i]); | 169 | perf_session__delete(session[i]); |
@@ -188,7 +176,7 @@ static const char * const diff_usage[] = { | |||
188 | }; | 176 | }; |
189 | 177 | ||
190 | static const struct option options[] = { | 178 | static const struct option options[] = { |
191 | OPT_BOOLEAN('v', "verbose", &verbose, | 179 | OPT_INCR('v', "verbose", &verbose, |
192 | "be more verbose (show symbol address, etc)"), | 180 | "be more verbose (show symbol address, etc)"), |
193 | OPT_BOOLEAN('m', "displacement", &show_displacement, | 181 | OPT_BOOLEAN('m', "displacement", &show_displacement, |
194 | "Show position displacement relative to baseline"), | 182 | "Show position displacement relative to baseline"), |
@@ -225,6 +213,10 @@ int cmd_diff(int argc, const char **argv, const char *prefix __used) | |||
225 | input_new = argv[1]; | 213 | input_new = argv[1]; |
226 | } else | 214 | } else |
227 | input_new = argv[0]; | 215 | input_new = argv[0]; |
216 | } else if (symbol_conf.default_guest_vmlinux_name || | ||
217 | symbol_conf.default_guest_kallsyms) { | ||
218 | input_old = "perf.data.host"; | ||
219 | input_new = "perf.data.guest"; | ||
228 | } | 220 | } |
229 | 221 | ||
230 | symbol_conf.exclude_other = false; | 222 | symbol_conf.exclude_other = false; |
diff --git a/tools/perf/builtin-help.c b/tools/perf/builtin-help.c index 215b584007b1..81e3ecc40fc7 100644 --- a/tools/perf/builtin-help.c +++ b/tools/perf/builtin-help.c | |||
@@ -29,7 +29,7 @@ enum help_format { | |||
29 | HELP_FORMAT_WEB, | 29 | HELP_FORMAT_WEB, |
30 | }; | 30 | }; |
31 | 31 | ||
32 | static int show_all = 0; | 32 | static bool show_all = false; |
33 | static enum help_format help_format = HELP_FORMAT_MAN; | 33 | static enum help_format help_format = HELP_FORMAT_MAN; |
34 | static struct option builtin_help_options[] = { | 34 | static struct option builtin_help_options[] = { |
35 | OPT_BOOLEAN('a', "all", &show_all, "print all available commands"), | 35 | OPT_BOOLEAN('a', "all", &show_all, "print all available commands"), |
diff --git a/tools/perf/builtin-inject.c b/tools/perf/builtin-inject.c new file mode 100644 index 000000000000..8e3e47b064ce --- /dev/null +++ b/tools/perf/builtin-inject.c | |||
@@ -0,0 +1,228 @@ | |||
1 | /* | ||
2 | * builtin-inject.c | ||
3 | * | ||
4 | * Builtin inject command: Examine the live mode (stdin) event stream | ||
5 | * and repipe it to stdout while optionally injecting additional | ||
6 | * events into it. | ||
7 | */ | ||
8 | #include "builtin.h" | ||
9 | |||
10 | #include "perf.h" | ||
11 | #include "util/session.h" | ||
12 | #include "util/debug.h" | ||
13 | |||
14 | #include "util/parse-options.h" | ||
15 | |||
16 | static char const *input_name = "-"; | ||
17 | static bool inject_build_ids; | ||
18 | |||
19 | static int event__repipe(event_t *event __used, | ||
20 | struct perf_session *session __used) | ||
21 | { | ||
22 | uint32_t size; | ||
23 | void *buf = event; | ||
24 | |||
25 | size = event->header.size; | ||
26 | |||
27 | while (size) { | ||
28 | int ret = write(STDOUT_FILENO, buf, size); | ||
29 | if (ret < 0) | ||
30 | return -errno; | ||
31 | |||
32 | size -= ret; | ||
33 | buf += ret; | ||
34 | } | ||
35 | |||
36 | return 0; | ||
37 | } | ||
38 | |||
39 | static int event__repipe_mmap(event_t *self, struct perf_session *session) | ||
40 | { | ||
41 | int err; | ||
42 | |||
43 | err = event__process_mmap(self, session); | ||
44 | event__repipe(self, session); | ||
45 | |||
46 | return err; | ||
47 | } | ||
48 | |||
49 | static int event__repipe_task(event_t *self, struct perf_session *session) | ||
50 | { | ||
51 | int err; | ||
52 | |||
53 | err = event__process_task(self, session); | ||
54 | event__repipe(self, session); | ||
55 | |||
56 | return err; | ||
57 | } | ||
58 | |||
59 | static int event__repipe_tracing_data(event_t *self, | ||
60 | struct perf_session *session) | ||
61 | { | ||
62 | int err; | ||
63 | |||
64 | event__repipe(self, session); | ||
65 | err = event__process_tracing_data(self, session); | ||
66 | |||
67 | return err; | ||
68 | } | ||
69 | |||
70 | static int dso__read_build_id(struct dso *self) | ||
71 | { | ||
72 | if (self->has_build_id) | ||
73 | return 0; | ||
74 | |||
75 | if (filename__read_build_id(self->long_name, self->build_id, | ||
76 | sizeof(self->build_id)) > 0) { | ||
77 | self->has_build_id = true; | ||
78 | return 0; | ||
79 | } | ||
80 | |||
81 | return -1; | ||
82 | } | ||
83 | |||
84 | static int dso__inject_build_id(struct dso *self, struct perf_session *session) | ||
85 | { | ||
86 | u16 misc = PERF_RECORD_MISC_USER; | ||
87 | struct machine *machine; | ||
88 | int err; | ||
89 | |||
90 | if (dso__read_build_id(self) < 0) { | ||
91 | pr_debug("no build_id found for %s\n", self->long_name); | ||
92 | return -1; | ||
93 | } | ||
94 | |||
95 | machine = perf_session__find_host_machine(session); | ||
96 | if (machine == NULL) { | ||
97 | pr_err("Can't find machine for session\n"); | ||
98 | return -1; | ||
99 | } | ||
100 | |||
101 | if (self->kernel) | ||
102 | misc = PERF_RECORD_MISC_KERNEL; | ||
103 | |||
104 | err = event__synthesize_build_id(self, misc, event__repipe, | ||
105 | machine, session); | ||
106 | if (err) { | ||
107 | pr_err("Can't synthesize build_id event for %s\n", self->long_name); | ||
108 | return -1; | ||
109 | } | ||
110 | |||
111 | return 0; | ||
112 | } | ||
113 | |||
114 | static int event__inject_buildid(event_t *event, struct perf_session *session) | ||
115 | { | ||
116 | struct addr_location al; | ||
117 | struct thread *thread; | ||
118 | u8 cpumode; | ||
119 | |||
120 | cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK; | ||
121 | |||
122 | thread = perf_session__findnew(session, event->ip.pid); | ||
123 | if (thread == NULL) { | ||
124 | pr_err("problem processing %d event, skipping it.\n", | ||
125 | event->header.type); | ||
126 | goto repipe; | ||
127 | } | ||
128 | |||
129 | thread__find_addr_map(thread, session, cpumode, MAP__FUNCTION, | ||
130 | event->ip.pid, event->ip.ip, &al); | ||
131 | |||
132 | if (al.map != NULL) { | ||
133 | if (!al.map->dso->hit) { | ||
134 | al.map->dso->hit = 1; | ||
135 | if (map__load(al.map, NULL) >= 0) { | ||
136 | dso__inject_build_id(al.map->dso, session); | ||
137 | /* | ||
138 | * If this fails, too bad, let the other side | ||
139 | * account this as unresolved. | ||
140 | */ | ||
141 | } else | ||
142 | pr_warning("no symbols found in %s, maybe " | ||
143 | "install a debug package?\n", | ||
144 | al.map->dso->long_name); | ||
145 | } | ||
146 | } | ||
147 | |||
148 | repipe: | ||
149 | event__repipe(event, session); | ||
150 | return 0; | ||
151 | } | ||
152 | |||
153 | struct perf_event_ops inject_ops = { | ||
154 | .sample = event__repipe, | ||
155 | .mmap = event__repipe, | ||
156 | .comm = event__repipe, | ||
157 | .fork = event__repipe, | ||
158 | .exit = event__repipe, | ||
159 | .lost = event__repipe, | ||
160 | .read = event__repipe, | ||
161 | .throttle = event__repipe, | ||
162 | .unthrottle = event__repipe, | ||
163 | .attr = event__repipe, | ||
164 | .event_type = event__repipe, | ||
165 | .tracing_data = event__repipe, | ||
166 | .build_id = event__repipe, | ||
167 | }; | ||
168 | |||
169 | extern volatile int session_done; | ||
170 | |||
171 | static void sig_handler(int sig __attribute__((__unused__))) | ||
172 | { | ||
173 | session_done = 1; | ||
174 | } | ||
175 | |||
176 | static int __cmd_inject(void) | ||
177 | { | ||
178 | struct perf_session *session; | ||
179 | int ret = -EINVAL; | ||
180 | |||
181 | signal(SIGINT, sig_handler); | ||
182 | |||
183 | if (inject_build_ids) { | ||
184 | inject_ops.sample = event__inject_buildid; | ||
185 | inject_ops.mmap = event__repipe_mmap; | ||
186 | inject_ops.fork = event__repipe_task; | ||
187 | inject_ops.tracing_data = event__repipe_tracing_data; | ||
188 | } | ||
189 | |||
190 | session = perf_session__new(input_name, O_RDONLY, false, true); | ||
191 | if (session == NULL) | ||
192 | return -ENOMEM; | ||
193 | |||
194 | ret = perf_session__process_events(session, &inject_ops); | ||
195 | |||
196 | perf_session__delete(session); | ||
197 | |||
198 | return ret; | ||
199 | } | ||
200 | |||
201 | static const char * const report_usage[] = { | ||
202 | "perf inject [<options>]", | ||
203 | NULL | ||
204 | }; | ||
205 | |||
206 | static const struct option options[] = { | ||
207 | OPT_BOOLEAN('b', "build-ids", &inject_build_ids, | ||
208 | "Inject build-ids into the output stream"), | ||
209 | OPT_INCR('v', "verbose", &verbose, | ||
210 | "be more verbose (show build ids, etc)"), | ||
211 | OPT_END() | ||
212 | }; | ||
213 | |||
214 | int cmd_inject(int argc, const char **argv, const char *prefix __used) | ||
215 | { | ||
216 | argc = parse_options(argc, argv, options, report_usage, 0); | ||
217 | |||
218 | /* | ||
219 | * Any (unrecognized) arguments left? | ||
220 | */ | ||
221 | if (argc) | ||
222 | usage_with_options(report_usage, options); | ||
223 | |||
224 | if (symbol__init() < 0) | ||
225 | return -1; | ||
226 | |||
227 | return __cmd_inject(); | ||
228 | } | ||
diff --git a/tools/perf/builtin-kmem.c b/tools/perf/builtin-kmem.c index 924a9518931a..31f60a2535e0 100644 --- a/tools/perf/builtin-kmem.c +++ b/tools/perf/builtin-kmem.c | |||
@@ -335,8 +335,9 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
335 | } | 335 | } |
336 | 336 | ||
337 | static struct perf_event_ops event_ops = { | 337 | static struct perf_event_ops event_ops = { |
338 | .sample = process_sample_event, | 338 | .sample = process_sample_event, |
339 | .comm = event__process_comm, | 339 | .comm = event__process_comm, |
340 | .ordered_samples = true, | ||
340 | }; | 341 | }; |
341 | 342 | ||
342 | static double fragmentation(unsigned long n_req, unsigned long n_alloc) | 343 | static double fragmentation(unsigned long n_req, unsigned long n_alloc) |
@@ -351,6 +352,7 @@ static void __print_result(struct rb_root *root, struct perf_session *session, | |||
351 | int n_lines, int is_caller) | 352 | int n_lines, int is_caller) |
352 | { | 353 | { |
353 | struct rb_node *next; | 354 | struct rb_node *next; |
355 | struct machine *machine; | ||
354 | 356 | ||
355 | printf("%.102s\n", graph_dotted_line); | 357 | printf("%.102s\n", graph_dotted_line); |
356 | printf(" %-34s |", is_caller ? "Callsite": "Alloc Ptr"); | 358 | printf(" %-34s |", is_caller ? "Callsite": "Alloc Ptr"); |
@@ -359,23 +361,29 @@ static void __print_result(struct rb_root *root, struct perf_session *session, | |||
359 | 361 | ||
360 | next = rb_first(root); | 362 | next = rb_first(root); |
361 | 363 | ||
364 | machine = perf_session__find_host_machine(session); | ||
365 | if (!machine) { | ||
366 | pr_err("__print_result: couldn't find kernel information\n"); | ||
367 | return; | ||
368 | } | ||
362 | while (next && n_lines--) { | 369 | while (next && n_lines--) { |
363 | struct alloc_stat *data = rb_entry(next, struct alloc_stat, | 370 | struct alloc_stat *data = rb_entry(next, struct alloc_stat, |
364 | node); | 371 | node); |
365 | struct symbol *sym = NULL; | 372 | struct symbol *sym = NULL; |
373 | struct map *map; | ||
366 | char buf[BUFSIZ]; | 374 | char buf[BUFSIZ]; |
367 | u64 addr; | 375 | u64 addr; |
368 | 376 | ||
369 | if (is_caller) { | 377 | if (is_caller) { |
370 | addr = data->call_site; | 378 | addr = data->call_site; |
371 | if (!raw_ip) | 379 | if (!raw_ip) |
372 | sym = map_groups__find_function(&session->kmaps, addr, NULL); | 380 | sym = machine__find_kernel_function(machine, addr, &map, NULL); |
373 | } else | 381 | } else |
374 | addr = data->ptr; | 382 | addr = data->ptr; |
375 | 383 | ||
376 | if (sym != NULL) | 384 | if (sym != NULL) |
377 | snprintf(buf, sizeof(buf), "%s+%Lx", sym->name, | 385 | snprintf(buf, sizeof(buf), "%s+%Lx", sym->name, |
378 | addr - sym->start); | 386 | addr - map->unmap_ip(map, sym->start)); |
379 | else | 387 | else |
380 | snprintf(buf, sizeof(buf), "%#Lx", addr); | 388 | snprintf(buf, sizeof(buf), "%#Lx", addr); |
381 | printf(" %-34s |", buf); | 389 | printf(" %-34s |", buf); |
@@ -484,10 +492,13 @@ static void sort_result(void) | |||
484 | static int __cmd_kmem(void) | 492 | static int __cmd_kmem(void) |
485 | { | 493 | { |
486 | int err = -EINVAL; | 494 | int err = -EINVAL; |
487 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0); | 495 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0, false); |
488 | if (session == NULL) | 496 | if (session == NULL) |
489 | return -ENOMEM; | 497 | return -ENOMEM; |
490 | 498 | ||
499 | if (perf_session__create_kernel_maps(session) < 0) | ||
500 | goto out_delete; | ||
501 | |||
491 | if (!perf_session__has_traces(session, "kmem record")) | 502 | if (!perf_session__has_traces(session, "kmem record")) |
492 | goto out_delete; | 503 | goto out_delete; |
493 | 504 | ||
@@ -718,7 +729,6 @@ static const char *record_args[] = { | |||
718 | "record", | 729 | "record", |
719 | "-a", | 730 | "-a", |
720 | "-R", | 731 | "-R", |
721 | "-M", | ||
722 | "-f", | 732 | "-f", |
723 | "-c", "1", | 733 | "-c", "1", |
724 | "-e", "kmem:kmalloc", | 734 | "-e", "kmem:kmalloc", |
diff --git a/tools/perf/builtin-kvm.c b/tools/perf/builtin-kvm.c new file mode 100644 index 000000000000..a4c7cae45024 --- /dev/null +++ b/tools/perf/builtin-kvm.c | |||
@@ -0,0 +1,144 @@ | |||
1 | #include "builtin.h" | ||
2 | #include "perf.h" | ||
3 | |||
4 | #include "util/util.h" | ||
5 | #include "util/cache.h" | ||
6 | #include "util/symbol.h" | ||
7 | #include "util/thread.h" | ||
8 | #include "util/header.h" | ||
9 | #include "util/session.h" | ||
10 | |||
11 | #include "util/parse-options.h" | ||
12 | #include "util/trace-event.h" | ||
13 | |||
14 | #include "util/debug.h" | ||
15 | |||
16 | #include <sys/prctl.h> | ||
17 | |||
18 | #include <semaphore.h> | ||
19 | #include <pthread.h> | ||
20 | #include <math.h> | ||
21 | |||
22 | static char *file_name; | ||
23 | static char name_buffer[256]; | ||
24 | |||
25 | int perf_host = 1; | ||
26 | int perf_guest; | ||
27 | |||
28 | static const char * const kvm_usage[] = { | ||
29 | "perf kvm [<options>] {top|record|report|diff|buildid-list}", | ||
30 | NULL | ||
31 | }; | ||
32 | |||
33 | static const struct option kvm_options[] = { | ||
34 | OPT_STRING('i', "input", &file_name, "file", | ||
35 | "Input file name"), | ||
36 | OPT_STRING('o', "output", &file_name, "file", | ||
37 | "Output file name"), | ||
38 | OPT_BOOLEAN(0, "guest", &perf_guest, | ||
39 | "Collect guest os data"), | ||
40 | OPT_BOOLEAN(0, "host", &perf_host, | ||
41 | "Collect guest os data"), | ||
42 | OPT_STRING(0, "guestmount", &symbol_conf.guestmount, "directory", | ||
43 | "guest mount directory under which every guest os" | ||
44 | " instance has a subdir"), | ||
45 | OPT_STRING(0, "guestvmlinux", &symbol_conf.default_guest_vmlinux_name, | ||
46 | "file", "file saving guest os vmlinux"), | ||
47 | OPT_STRING(0, "guestkallsyms", &symbol_conf.default_guest_kallsyms, | ||
48 | "file", "file saving guest os /proc/kallsyms"), | ||
49 | OPT_STRING(0, "guestmodules", &symbol_conf.default_guest_modules, | ||
50 | "file", "file saving guest os /proc/modules"), | ||
51 | OPT_END() | ||
52 | }; | ||
53 | |||
54 | static int __cmd_record(int argc, const char **argv) | ||
55 | { | ||
56 | int rec_argc, i = 0, j; | ||
57 | const char **rec_argv; | ||
58 | |||
59 | rec_argc = argc + 2; | ||
60 | rec_argv = calloc(rec_argc + 1, sizeof(char *)); | ||
61 | rec_argv[i++] = strdup("record"); | ||
62 | rec_argv[i++] = strdup("-o"); | ||
63 | rec_argv[i++] = strdup(file_name); | ||
64 | for (j = 1; j < argc; j++, i++) | ||
65 | rec_argv[i] = argv[j]; | ||
66 | |||
67 | BUG_ON(i != rec_argc); | ||
68 | |||
69 | return cmd_record(i, rec_argv, NULL); | ||
70 | } | ||
71 | |||
72 | static int __cmd_report(int argc, const char **argv) | ||
73 | { | ||
74 | int rec_argc, i = 0, j; | ||
75 | const char **rec_argv; | ||
76 | |||
77 | rec_argc = argc + 2; | ||
78 | rec_argv = calloc(rec_argc + 1, sizeof(char *)); | ||
79 | rec_argv[i++] = strdup("report"); | ||
80 | rec_argv[i++] = strdup("-i"); | ||
81 | rec_argv[i++] = strdup(file_name); | ||
82 | for (j = 1; j < argc; j++, i++) | ||
83 | rec_argv[i] = argv[j]; | ||
84 | |||
85 | BUG_ON(i != rec_argc); | ||
86 | |||
87 | return cmd_report(i, rec_argv, NULL); | ||
88 | } | ||
89 | |||
90 | static int __cmd_buildid_list(int argc, const char **argv) | ||
91 | { | ||
92 | int rec_argc, i = 0, j; | ||
93 | const char **rec_argv; | ||
94 | |||
95 | rec_argc = argc + 2; | ||
96 | rec_argv = calloc(rec_argc + 1, sizeof(char *)); | ||
97 | rec_argv[i++] = strdup("buildid-list"); | ||
98 | rec_argv[i++] = strdup("-i"); | ||
99 | rec_argv[i++] = strdup(file_name); | ||
100 | for (j = 1; j < argc; j++, i++) | ||
101 | rec_argv[i] = argv[j]; | ||
102 | |||
103 | BUG_ON(i != rec_argc); | ||
104 | |||
105 | return cmd_buildid_list(i, rec_argv, NULL); | ||
106 | } | ||
107 | |||
108 | int cmd_kvm(int argc, const char **argv, const char *prefix __used) | ||
109 | { | ||
110 | perf_host = perf_guest = 0; | ||
111 | |||
112 | argc = parse_options(argc, argv, kvm_options, kvm_usage, | ||
113 | PARSE_OPT_STOP_AT_NON_OPTION); | ||
114 | if (!argc) | ||
115 | usage_with_options(kvm_usage, kvm_options); | ||
116 | |||
117 | if (!perf_host) | ||
118 | perf_guest = 1; | ||
119 | |||
120 | if (!file_name) { | ||
121 | if (perf_host && !perf_guest) | ||
122 | sprintf(name_buffer, "perf.data.host"); | ||
123 | else if (!perf_host && perf_guest) | ||
124 | sprintf(name_buffer, "perf.data.guest"); | ||
125 | else | ||
126 | sprintf(name_buffer, "perf.data.kvm"); | ||
127 | file_name = name_buffer; | ||
128 | } | ||
129 | |||
130 | if (!strncmp(argv[0], "rec", 3)) | ||
131 | return __cmd_record(argc, argv); | ||
132 | else if (!strncmp(argv[0], "rep", 3)) | ||
133 | return __cmd_report(argc, argv); | ||
134 | else if (!strncmp(argv[0], "diff", 4)) | ||
135 | return cmd_diff(argc, argv, NULL); | ||
136 | else if (!strncmp(argv[0], "top", 3)) | ||
137 | return cmd_top(argc, argv, NULL); | ||
138 | else if (!strncmp(argv[0], "buildid-list", 12)) | ||
139 | return __cmd_buildid_list(argc, argv); | ||
140 | else | ||
141 | usage_with_options(kvm_usage, kvm_options); | ||
142 | |||
143 | return 0; | ||
144 | } | ||
diff --git a/tools/perf/builtin-lock.c b/tools/perf/builtin-lock.c index e12c844df1e2..e18dfdc2948a 100644 --- a/tools/perf/builtin-lock.c +++ b/tools/perf/builtin-lock.c | |||
@@ -23,6 +23,8 @@ | |||
23 | #include <linux/list.h> | 23 | #include <linux/list.h> |
24 | #include <linux/hash.h> | 24 | #include <linux/hash.h> |
25 | 25 | ||
26 | static struct perf_session *session; | ||
27 | |||
26 | /* based on kernel/lockdep.c */ | 28 | /* based on kernel/lockdep.c */ |
27 | #define LOCKHASH_BITS 12 | 29 | #define LOCKHASH_BITS 12 |
28 | #define LOCKHASH_SIZE (1UL << LOCKHASH_BITS) | 30 | #define LOCKHASH_SIZE (1UL << LOCKHASH_BITS) |
@@ -32,9 +34,6 @@ static struct list_head lockhash_table[LOCKHASH_SIZE]; | |||
32 | #define __lockhashfn(key) hash_long((unsigned long)key, LOCKHASH_BITS) | 34 | #define __lockhashfn(key) hash_long((unsigned long)key, LOCKHASH_BITS) |
33 | #define lockhashentry(key) (lockhash_table + __lockhashfn((key))) | 35 | #define lockhashentry(key) (lockhash_table + __lockhashfn((key))) |
34 | 36 | ||
35 | #define LOCK_STATE_UNLOCKED 0 /* initial state */ | ||
36 | #define LOCK_STATE_LOCKED 1 | ||
37 | |||
38 | struct lock_stat { | 37 | struct lock_stat { |
39 | struct list_head hash_entry; | 38 | struct list_head hash_entry; |
40 | struct rb_node rb; /* used for sorting */ | 39 | struct rb_node rb; /* used for sorting */ |
@@ -47,20 +46,151 @@ struct lock_stat { | |||
47 | void *addr; /* address of lockdep_map, used as ID */ | 46 | void *addr; /* address of lockdep_map, used as ID */ |
48 | char *name; /* for strcpy(), we cannot use const */ | 47 | char *name; /* for strcpy(), we cannot use const */ |
49 | 48 | ||
50 | int state; | ||
51 | u64 prev_event_time; /* timestamp of previous event */ | ||
52 | |||
53 | unsigned int nr_acquired; | ||
54 | unsigned int nr_acquire; | 49 | unsigned int nr_acquire; |
50 | unsigned int nr_acquired; | ||
55 | unsigned int nr_contended; | 51 | unsigned int nr_contended; |
56 | unsigned int nr_release; | 52 | unsigned int nr_release; |
57 | 53 | ||
54 | unsigned int nr_readlock; | ||
55 | unsigned int nr_trylock; | ||
58 | /* these times are in nano sec. */ | 56 | /* these times are in nano sec. */ |
59 | u64 wait_time_total; | 57 | u64 wait_time_total; |
60 | u64 wait_time_min; | 58 | u64 wait_time_min; |
61 | u64 wait_time_max; | 59 | u64 wait_time_max; |
60 | |||
61 | int discard; /* flag of blacklist */ | ||
62 | }; | 62 | }; |
63 | 63 | ||
64 | /* | ||
65 | * States of lock_seq_stat | ||
66 | * | ||
67 | * UNINITIALIZED is required for detecting first event of acquire. | ||
68 | * As the nature of lock events, there is no guarantee | ||
69 | * that the first event for the locks are acquire, | ||
70 | * it can be acquired, contended or release. | ||
71 | */ | ||
72 | #define SEQ_STATE_UNINITIALIZED 0 /* initial state */ | ||
73 | #define SEQ_STATE_RELEASED 1 | ||
74 | #define SEQ_STATE_ACQUIRING 2 | ||
75 | #define SEQ_STATE_ACQUIRED 3 | ||
76 | #define SEQ_STATE_READ_ACQUIRED 4 | ||
77 | #define SEQ_STATE_CONTENDED 5 | ||
78 | |||
79 | /* | ||
80 | * MAX_LOCK_DEPTH | ||
81 | * Imported from include/linux/sched.h. | ||
82 | * Should this be synchronized? | ||
83 | */ | ||
84 | #define MAX_LOCK_DEPTH 48 | ||
85 | |||
86 | /* | ||
87 | * struct lock_seq_stat: | ||
88 | * Place to put on state of one lock sequence | ||
89 | * 1) acquire -> acquired -> release | ||
90 | * 2) acquire -> contended -> acquired -> release | ||
91 | * 3) acquire (with read or try) -> release | ||
92 | * 4) Are there other patterns? | ||
93 | */ | ||
94 | struct lock_seq_stat { | ||
95 | struct list_head list; | ||
96 | int state; | ||
97 | u64 prev_event_time; | ||
98 | void *addr; | ||
99 | |||
100 | int read_count; | ||
101 | }; | ||
102 | |||
103 | struct thread_stat { | ||
104 | struct rb_node rb; | ||
105 | |||
106 | u32 tid; | ||
107 | struct list_head seq_list; | ||
108 | }; | ||
109 | |||
110 | static struct rb_root thread_stats; | ||
111 | |||
112 | static struct thread_stat *thread_stat_find(u32 tid) | ||
113 | { | ||
114 | struct rb_node *node; | ||
115 | struct thread_stat *st; | ||
116 | |||
117 | node = thread_stats.rb_node; | ||
118 | while (node) { | ||
119 | st = container_of(node, struct thread_stat, rb); | ||
120 | if (st->tid == tid) | ||
121 | return st; | ||
122 | else if (tid < st->tid) | ||
123 | node = node->rb_left; | ||
124 | else | ||
125 | node = node->rb_right; | ||
126 | } | ||
127 | |||
128 | return NULL; | ||
129 | } | ||
130 | |||
131 | static void thread_stat_insert(struct thread_stat *new) | ||
132 | { | ||
133 | struct rb_node **rb = &thread_stats.rb_node; | ||
134 | struct rb_node *parent = NULL; | ||
135 | struct thread_stat *p; | ||
136 | |||
137 | while (*rb) { | ||
138 | p = container_of(*rb, struct thread_stat, rb); | ||
139 | parent = *rb; | ||
140 | |||
141 | if (new->tid < p->tid) | ||
142 | rb = &(*rb)->rb_left; | ||
143 | else if (new->tid > p->tid) | ||
144 | rb = &(*rb)->rb_right; | ||
145 | else | ||
146 | BUG_ON("inserting invalid thread_stat\n"); | ||
147 | } | ||
148 | |||
149 | rb_link_node(&new->rb, parent, rb); | ||
150 | rb_insert_color(&new->rb, &thread_stats); | ||
151 | } | ||
152 | |||
153 | static struct thread_stat *thread_stat_findnew_after_first(u32 tid) | ||
154 | { | ||
155 | struct thread_stat *st; | ||
156 | |||
157 | st = thread_stat_find(tid); | ||
158 | if (st) | ||
159 | return st; | ||
160 | |||
161 | st = zalloc(sizeof(struct thread_stat)); | ||
162 | if (!st) | ||
163 | die("memory allocation failed\n"); | ||
164 | |||
165 | st->tid = tid; | ||
166 | INIT_LIST_HEAD(&st->seq_list); | ||
167 | |||
168 | thread_stat_insert(st); | ||
169 | |||
170 | return st; | ||
171 | } | ||
172 | |||
173 | static struct thread_stat *thread_stat_findnew_first(u32 tid); | ||
174 | static struct thread_stat *(*thread_stat_findnew)(u32 tid) = | ||
175 | thread_stat_findnew_first; | ||
176 | |||
177 | static struct thread_stat *thread_stat_findnew_first(u32 tid) | ||
178 | { | ||
179 | struct thread_stat *st; | ||
180 | |||
181 | st = zalloc(sizeof(struct thread_stat)); | ||
182 | if (!st) | ||
183 | die("memory allocation failed\n"); | ||
184 | st->tid = tid; | ||
185 | INIT_LIST_HEAD(&st->seq_list); | ||
186 | |||
187 | rb_link_node(&st->rb, NULL, &thread_stats.rb_node); | ||
188 | rb_insert_color(&st->rb, &thread_stats); | ||
189 | |||
190 | thread_stat_findnew = thread_stat_findnew_after_first; | ||
191 | return st; | ||
192 | } | ||
193 | |||
64 | /* build simple key function one is bigger than two */ | 194 | /* build simple key function one is bigger than two */ |
65 | #define SINGLE_KEY(member) \ | 195 | #define SINGLE_KEY(member) \ |
66 | static int lock_stat_key_ ## member(struct lock_stat *one, \ | 196 | static int lock_stat_key_ ## member(struct lock_stat *one, \ |
@@ -175,8 +305,6 @@ static struct lock_stat *lock_stat_findnew(void *addr, const char *name) | |||
175 | goto alloc_failed; | 305 | goto alloc_failed; |
176 | strcpy(new->name, name); | 306 | strcpy(new->name, name); |
177 | 307 | ||
178 | /* LOCK_STATE_UNLOCKED == 0 isn't guaranteed forever */ | ||
179 | new->state = LOCK_STATE_UNLOCKED; | ||
180 | new->wait_time_min = ULLONG_MAX; | 308 | new->wait_time_min = ULLONG_MAX; |
181 | 309 | ||
182 | list_add(&new->hash_entry, entry); | 310 | list_add(&new->hash_entry, entry); |
@@ -188,8 +316,6 @@ alloc_failed: | |||
188 | 316 | ||
189 | static char const *input_name = "perf.data"; | 317 | static char const *input_name = "perf.data"; |
190 | 318 | ||
191 | static int profile_cpu = -1; | ||
192 | |||
193 | struct raw_event_sample { | 319 | struct raw_event_sample { |
194 | u32 size; | 320 | u32 size; |
195 | char data[0]; | 321 | char data[0]; |
@@ -198,6 +324,7 @@ struct raw_event_sample { | |||
198 | struct trace_acquire_event { | 324 | struct trace_acquire_event { |
199 | void *addr; | 325 | void *addr; |
200 | const char *name; | 326 | const char *name; |
327 | int flag; | ||
201 | }; | 328 | }; |
202 | 329 | ||
203 | struct trace_acquired_event { | 330 | struct trace_acquired_event { |
@@ -241,120 +368,258 @@ struct trace_lock_handler { | |||
241 | struct thread *thread); | 368 | struct thread *thread); |
242 | }; | 369 | }; |
243 | 370 | ||
371 | static struct lock_seq_stat *get_seq(struct thread_stat *ts, void *addr) | ||
372 | { | ||
373 | struct lock_seq_stat *seq; | ||
374 | |||
375 | list_for_each_entry(seq, &ts->seq_list, list) { | ||
376 | if (seq->addr == addr) | ||
377 | return seq; | ||
378 | } | ||
379 | |||
380 | seq = zalloc(sizeof(struct lock_seq_stat)); | ||
381 | if (!seq) | ||
382 | die("Not enough memory\n"); | ||
383 | seq->state = SEQ_STATE_UNINITIALIZED; | ||
384 | seq->addr = addr; | ||
385 | |||
386 | list_add(&seq->list, &ts->seq_list); | ||
387 | return seq; | ||
388 | } | ||
389 | |||
390 | enum broken_state { | ||
391 | BROKEN_ACQUIRE, | ||
392 | BROKEN_ACQUIRED, | ||
393 | BROKEN_CONTENDED, | ||
394 | BROKEN_RELEASE, | ||
395 | BROKEN_MAX, | ||
396 | }; | ||
397 | |||
398 | static int bad_hist[BROKEN_MAX]; | ||
399 | |||
400 | enum acquire_flags { | ||
401 | TRY_LOCK = 1, | ||
402 | READ_LOCK = 2, | ||
403 | }; | ||
404 | |||
244 | static void | 405 | static void |
245 | report_lock_acquire_event(struct trace_acquire_event *acquire_event, | 406 | report_lock_acquire_event(struct trace_acquire_event *acquire_event, |
246 | struct event *__event __used, | 407 | struct event *__event __used, |
247 | int cpu __used, | 408 | int cpu __used, |
248 | u64 timestamp, | 409 | u64 timestamp __used, |
249 | struct thread *thread __used) | 410 | struct thread *thread __used) |
250 | { | 411 | { |
251 | struct lock_stat *st; | 412 | struct lock_stat *ls; |
413 | struct thread_stat *ts; | ||
414 | struct lock_seq_stat *seq; | ||
415 | |||
416 | ls = lock_stat_findnew(acquire_event->addr, acquire_event->name); | ||
417 | if (ls->discard) | ||
418 | return; | ||
252 | 419 | ||
253 | st = lock_stat_findnew(acquire_event->addr, acquire_event->name); | 420 | ts = thread_stat_findnew(thread->pid); |
421 | seq = get_seq(ts, acquire_event->addr); | ||
254 | 422 | ||
255 | switch (st->state) { | 423 | switch (seq->state) { |
256 | case LOCK_STATE_UNLOCKED: | 424 | case SEQ_STATE_UNINITIALIZED: |
425 | case SEQ_STATE_RELEASED: | ||
426 | if (!acquire_event->flag) { | ||
427 | seq->state = SEQ_STATE_ACQUIRING; | ||
428 | } else { | ||
429 | if (acquire_event->flag & TRY_LOCK) | ||
430 | ls->nr_trylock++; | ||
431 | if (acquire_event->flag & READ_LOCK) | ||
432 | ls->nr_readlock++; | ||
433 | seq->state = SEQ_STATE_READ_ACQUIRED; | ||
434 | seq->read_count = 1; | ||
435 | ls->nr_acquired++; | ||
436 | } | ||
437 | break; | ||
438 | case SEQ_STATE_READ_ACQUIRED: | ||
439 | if (acquire_event->flag & READ_LOCK) { | ||
440 | seq->read_count++; | ||
441 | ls->nr_acquired++; | ||
442 | goto end; | ||
443 | } else { | ||
444 | goto broken; | ||
445 | } | ||
257 | break; | 446 | break; |
258 | case LOCK_STATE_LOCKED: | 447 | case SEQ_STATE_ACQUIRED: |
448 | case SEQ_STATE_ACQUIRING: | ||
449 | case SEQ_STATE_CONTENDED: | ||
450 | broken: | ||
451 | /* broken lock sequence, discard it */ | ||
452 | ls->discard = 1; | ||
453 | bad_hist[BROKEN_ACQUIRE]++; | ||
454 | list_del(&seq->list); | ||
455 | free(seq); | ||
456 | goto end; | ||
259 | break; | 457 | break; |
260 | default: | 458 | default: |
261 | BUG_ON(1); | 459 | BUG_ON("Unknown state of lock sequence found!\n"); |
262 | break; | 460 | break; |
263 | } | 461 | } |
264 | 462 | ||
265 | st->prev_event_time = timestamp; | 463 | ls->nr_acquire++; |
464 | seq->prev_event_time = timestamp; | ||
465 | end: | ||
466 | return; | ||
266 | } | 467 | } |
267 | 468 | ||
268 | static void | 469 | static void |
269 | report_lock_acquired_event(struct trace_acquired_event *acquired_event, | 470 | report_lock_acquired_event(struct trace_acquired_event *acquired_event, |
270 | struct event *__event __used, | 471 | struct event *__event __used, |
271 | int cpu __used, | 472 | int cpu __used, |
272 | u64 timestamp, | 473 | u64 timestamp __used, |
273 | struct thread *thread __used) | 474 | struct thread *thread __used) |
274 | { | 475 | { |
275 | struct lock_stat *st; | 476 | struct lock_stat *ls; |
477 | struct thread_stat *ts; | ||
478 | struct lock_seq_stat *seq; | ||
479 | u64 contended_term; | ||
480 | |||
481 | ls = lock_stat_findnew(acquired_event->addr, acquired_event->name); | ||
482 | if (ls->discard) | ||
483 | return; | ||
276 | 484 | ||
277 | st = lock_stat_findnew(acquired_event->addr, acquired_event->name); | 485 | ts = thread_stat_findnew(thread->pid); |
486 | seq = get_seq(ts, acquired_event->addr); | ||
278 | 487 | ||
279 | switch (st->state) { | 488 | switch (seq->state) { |
280 | case LOCK_STATE_UNLOCKED: | 489 | case SEQ_STATE_UNINITIALIZED: |
281 | st->state = LOCK_STATE_LOCKED; | 490 | /* orphan event, do nothing */ |
282 | st->nr_acquired++; | 491 | return; |
492 | case SEQ_STATE_ACQUIRING: | ||
493 | break; | ||
494 | case SEQ_STATE_CONTENDED: | ||
495 | contended_term = timestamp - seq->prev_event_time; | ||
496 | ls->wait_time_total += contended_term; | ||
497 | if (contended_term < ls->wait_time_min) | ||
498 | ls->wait_time_min = contended_term; | ||
499 | if (ls->wait_time_max < contended_term) | ||
500 | ls->wait_time_max = contended_term; | ||
283 | break; | 501 | break; |
284 | case LOCK_STATE_LOCKED: | 502 | case SEQ_STATE_RELEASED: |
503 | case SEQ_STATE_ACQUIRED: | ||
504 | case SEQ_STATE_READ_ACQUIRED: | ||
505 | /* broken lock sequence, discard it */ | ||
506 | ls->discard = 1; | ||
507 | bad_hist[BROKEN_ACQUIRED]++; | ||
508 | list_del(&seq->list); | ||
509 | free(seq); | ||
510 | goto end; | ||
285 | break; | 511 | break; |
512 | |||
286 | default: | 513 | default: |
287 | BUG_ON(1); | 514 | BUG_ON("Unknown state of lock sequence found!\n"); |
288 | break; | 515 | break; |
289 | } | 516 | } |
290 | 517 | ||
291 | st->prev_event_time = timestamp; | 518 | seq->state = SEQ_STATE_ACQUIRED; |
519 | ls->nr_acquired++; | ||
520 | seq->prev_event_time = timestamp; | ||
521 | end: | ||
522 | return; | ||
292 | } | 523 | } |
293 | 524 | ||
294 | static void | 525 | static void |
295 | report_lock_contended_event(struct trace_contended_event *contended_event, | 526 | report_lock_contended_event(struct trace_contended_event *contended_event, |
296 | struct event *__event __used, | 527 | struct event *__event __used, |
297 | int cpu __used, | 528 | int cpu __used, |
298 | u64 timestamp, | 529 | u64 timestamp __used, |
299 | struct thread *thread __used) | 530 | struct thread *thread __used) |
300 | { | 531 | { |
301 | struct lock_stat *st; | 532 | struct lock_stat *ls; |
533 | struct thread_stat *ts; | ||
534 | struct lock_seq_stat *seq; | ||
302 | 535 | ||
303 | st = lock_stat_findnew(contended_event->addr, contended_event->name); | 536 | ls = lock_stat_findnew(contended_event->addr, contended_event->name); |
537 | if (ls->discard) | ||
538 | return; | ||
304 | 539 | ||
305 | switch (st->state) { | 540 | ts = thread_stat_findnew(thread->pid); |
306 | case LOCK_STATE_UNLOCKED: | 541 | seq = get_seq(ts, contended_event->addr); |
542 | |||
543 | switch (seq->state) { | ||
544 | case SEQ_STATE_UNINITIALIZED: | ||
545 | /* orphan event, do nothing */ | ||
546 | return; | ||
547 | case SEQ_STATE_ACQUIRING: | ||
307 | break; | 548 | break; |
308 | case LOCK_STATE_LOCKED: | 549 | case SEQ_STATE_RELEASED: |
309 | st->nr_contended++; | 550 | case SEQ_STATE_ACQUIRED: |
551 | case SEQ_STATE_READ_ACQUIRED: | ||
552 | case SEQ_STATE_CONTENDED: | ||
553 | /* broken lock sequence, discard it */ | ||
554 | ls->discard = 1; | ||
555 | bad_hist[BROKEN_CONTENDED]++; | ||
556 | list_del(&seq->list); | ||
557 | free(seq); | ||
558 | goto end; | ||
310 | break; | 559 | break; |
311 | default: | 560 | default: |
312 | BUG_ON(1); | 561 | BUG_ON("Unknown state of lock sequence found!\n"); |
313 | break; | 562 | break; |
314 | } | 563 | } |
315 | 564 | ||
316 | st->prev_event_time = timestamp; | 565 | seq->state = SEQ_STATE_CONTENDED; |
566 | ls->nr_contended++; | ||
567 | seq->prev_event_time = timestamp; | ||
568 | end: | ||
569 | return; | ||
317 | } | 570 | } |
318 | 571 | ||
319 | static void | 572 | static void |
320 | report_lock_release_event(struct trace_release_event *release_event, | 573 | report_lock_release_event(struct trace_release_event *release_event, |
321 | struct event *__event __used, | 574 | struct event *__event __used, |
322 | int cpu __used, | 575 | int cpu __used, |
323 | u64 timestamp, | 576 | u64 timestamp __used, |
324 | struct thread *thread __used) | 577 | struct thread *thread __used) |
325 | { | 578 | { |
326 | struct lock_stat *st; | 579 | struct lock_stat *ls; |
327 | u64 hold_time; | 580 | struct thread_stat *ts; |
581 | struct lock_seq_stat *seq; | ||
328 | 582 | ||
329 | st = lock_stat_findnew(release_event->addr, release_event->name); | 583 | ls = lock_stat_findnew(release_event->addr, release_event->name); |
584 | if (ls->discard) | ||
585 | return; | ||
330 | 586 | ||
331 | switch (st->state) { | 587 | ts = thread_stat_findnew(thread->pid); |
332 | case LOCK_STATE_UNLOCKED: | 588 | seq = get_seq(ts, release_event->addr); |
333 | break; | ||
334 | case LOCK_STATE_LOCKED: | ||
335 | st->state = LOCK_STATE_UNLOCKED; | ||
336 | hold_time = timestamp - st->prev_event_time; | ||
337 | 589 | ||
338 | if (timestamp < st->prev_event_time) { | 590 | switch (seq->state) { |
339 | /* terribly, this can happen... */ | 591 | case SEQ_STATE_UNINITIALIZED: |
592 | goto end; | ||
593 | break; | ||
594 | case SEQ_STATE_ACQUIRED: | ||
595 | break; | ||
596 | case SEQ_STATE_READ_ACQUIRED: | ||
597 | seq->read_count--; | ||
598 | BUG_ON(seq->read_count < 0); | ||
599 | if (!seq->read_count) { | ||
600 | ls->nr_release++; | ||
340 | goto end; | 601 | goto end; |
341 | } | 602 | } |
342 | 603 | break; | |
343 | if (st->wait_time_min > hold_time) | 604 | case SEQ_STATE_ACQUIRING: |
344 | st->wait_time_min = hold_time; | 605 | case SEQ_STATE_CONTENDED: |
345 | if (st->wait_time_max < hold_time) | 606 | case SEQ_STATE_RELEASED: |
346 | st->wait_time_max = hold_time; | 607 | /* broken lock sequence, discard it */ |
347 | st->wait_time_total += hold_time; | 608 | ls->discard = 1; |
348 | 609 | bad_hist[BROKEN_RELEASE]++; | |
349 | st->nr_release++; | 610 | goto free_seq; |
350 | break; | 611 | break; |
351 | default: | 612 | default: |
352 | BUG_ON(1); | 613 | BUG_ON("Unknown state of lock sequence found!\n"); |
353 | break; | 614 | break; |
354 | } | 615 | } |
355 | 616 | ||
617 | ls->nr_release++; | ||
618 | free_seq: | ||
619 | list_del(&seq->list); | ||
620 | free(seq); | ||
356 | end: | 621 | end: |
357 | st->prev_event_time = timestamp; | 622 | return; |
358 | } | 623 | } |
359 | 624 | ||
360 | /* lock oriented handlers */ | 625 | /* lock oriented handlers */ |
@@ -381,6 +646,7 @@ process_lock_acquire_event(void *data, | |||
381 | tmp = raw_field_value(event, "lockdep_addr", data); | 646 | tmp = raw_field_value(event, "lockdep_addr", data); |
382 | memcpy(&acquire_event.addr, &tmp, sizeof(void *)); | 647 | memcpy(&acquire_event.addr, &tmp, sizeof(void *)); |
383 | acquire_event.name = (char *)raw_field_ptr(event, "name", data); | 648 | acquire_event.name = (char *)raw_field_ptr(event, "name", data); |
649 | acquire_event.flag = (int)raw_field_value(event, "flag", data); | ||
384 | 650 | ||
385 | if (trace_handler->acquire_event) | 651 | if (trace_handler->acquire_event) |
386 | trace_handler->acquire_event(&acquire_event, event, cpu, timestamp, thread); | 652 | trace_handler->acquire_event(&acquire_event, event, cpu, timestamp, thread); |
@@ -441,8 +707,7 @@ process_lock_release_event(void *data, | |||
441 | } | 707 | } |
442 | 708 | ||
443 | static void | 709 | static void |
444 | process_raw_event(void *data, int cpu, | 710 | process_raw_event(void *data, int cpu, u64 timestamp, struct thread *thread) |
445 | u64 timestamp, struct thread *thread) | ||
446 | { | 711 | { |
447 | struct event *event; | 712 | struct event *event; |
448 | int type; | 713 | int type; |
@@ -460,173 +725,19 @@ process_raw_event(void *data, int cpu, | |||
460 | process_lock_release_event(data, event, cpu, timestamp, thread); | 725 | process_lock_release_event(data, event, cpu, timestamp, thread); |
461 | } | 726 | } |
462 | 727 | ||
463 | struct raw_event_queue { | 728 | static void print_bad_events(int bad, int total) |
464 | u64 timestamp; | ||
465 | int cpu; | ||
466 | void *data; | ||
467 | struct thread *thread; | ||
468 | struct list_head list; | ||
469 | }; | ||
470 | |||
471 | static LIST_HEAD(raw_event_head); | ||
472 | |||
473 | #define FLUSH_PERIOD (5 * NSEC_PER_SEC) | ||
474 | |||
475 | static u64 flush_limit = ULLONG_MAX; | ||
476 | static u64 last_flush = 0; | ||
477 | struct raw_event_queue *last_inserted; | ||
478 | |||
479 | static void flush_raw_event_queue(u64 limit) | ||
480 | { | ||
481 | struct raw_event_queue *tmp, *iter; | ||
482 | |||
483 | list_for_each_entry_safe(iter, tmp, &raw_event_head, list) { | ||
484 | if (iter->timestamp > limit) | ||
485 | return; | ||
486 | |||
487 | if (iter == last_inserted) | ||
488 | last_inserted = NULL; | ||
489 | |||
490 | process_raw_event(iter->data, iter->cpu, iter->timestamp, | ||
491 | iter->thread); | ||
492 | |||
493 | last_flush = iter->timestamp; | ||
494 | list_del(&iter->list); | ||
495 | free(iter->data); | ||
496 | free(iter); | ||
497 | } | ||
498 | } | ||
499 | |||
500 | static void __queue_raw_event_end(struct raw_event_queue *new) | ||
501 | { | ||
502 | struct raw_event_queue *iter; | ||
503 | |||
504 | list_for_each_entry_reverse(iter, &raw_event_head, list) { | ||
505 | if (iter->timestamp < new->timestamp) { | ||
506 | list_add(&new->list, &iter->list); | ||
507 | return; | ||
508 | } | ||
509 | } | ||
510 | |||
511 | list_add(&new->list, &raw_event_head); | ||
512 | } | ||
513 | |||
514 | static void __queue_raw_event_before(struct raw_event_queue *new, | ||
515 | struct raw_event_queue *iter) | ||
516 | { | 729 | { |
517 | list_for_each_entry_continue_reverse(iter, &raw_event_head, list) { | 730 | /* Output for debug, this have to be removed */ |
518 | if (iter->timestamp < new->timestamp) { | 731 | int i; |
519 | list_add(&new->list, &iter->list); | 732 | const char *name[4] = |
520 | return; | 733 | { "acquire", "acquired", "contended", "release" }; |
521 | } | 734 | |
522 | } | 735 | pr_info("\n=== output for debug===\n\n"); |
523 | 736 | pr_info("bad: %d, total: %d\n", bad, total); | |
524 | list_add(&new->list, &raw_event_head); | 737 | pr_info("bad rate: %f %%\n", (double)bad / (double)total * 100); |
525 | } | 738 | pr_info("histogram of events caused bad sequence\n"); |
526 | 739 | for (i = 0; i < BROKEN_MAX; i++) | |
527 | static void __queue_raw_event_after(struct raw_event_queue *new, | 740 | pr_info(" %10s: %d\n", name[i], bad_hist[i]); |
528 | struct raw_event_queue *iter) | ||
529 | { | ||
530 | list_for_each_entry_continue(iter, &raw_event_head, list) { | ||
531 | if (iter->timestamp > new->timestamp) { | ||
532 | list_add_tail(&new->list, &iter->list); | ||
533 | return; | ||
534 | } | ||
535 | } | ||
536 | list_add_tail(&new->list, &raw_event_head); | ||
537 | } | ||
538 | |||
539 | /* The queue is ordered by time */ | ||
540 | static void __queue_raw_event(struct raw_event_queue *new) | ||
541 | { | ||
542 | if (!last_inserted) { | ||
543 | __queue_raw_event_end(new); | ||
544 | return; | ||
545 | } | ||
546 | |||
547 | /* | ||
548 | * Most of the time the current event has a timestamp | ||
549 | * very close to the last event inserted, unless we just switched | ||
550 | * to another event buffer. Having a sorting based on a list and | ||
551 | * on the last inserted event that is close to the current one is | ||
552 | * probably more efficient than an rbtree based sorting. | ||
553 | */ | ||
554 | if (last_inserted->timestamp >= new->timestamp) | ||
555 | __queue_raw_event_before(new, last_inserted); | ||
556 | else | ||
557 | __queue_raw_event_after(new, last_inserted); | ||
558 | } | ||
559 | |||
560 | static void queue_raw_event(void *data, int raw_size, int cpu, | ||
561 | u64 timestamp, struct thread *thread) | ||
562 | { | ||
563 | struct raw_event_queue *new; | ||
564 | |||
565 | if (flush_limit == ULLONG_MAX) | ||
566 | flush_limit = timestamp + FLUSH_PERIOD; | ||
567 | |||
568 | if (timestamp < last_flush) { | ||
569 | printf("Warning: Timestamp below last timeslice flush\n"); | ||
570 | return; | ||
571 | } | ||
572 | |||
573 | new = malloc(sizeof(*new)); | ||
574 | if (!new) | ||
575 | die("Not enough memory\n"); | ||
576 | |||
577 | new->timestamp = timestamp; | ||
578 | new->cpu = cpu; | ||
579 | new->thread = thread; | ||
580 | |||
581 | new->data = malloc(raw_size); | ||
582 | if (!new->data) | ||
583 | die("Not enough memory\n"); | ||
584 | |||
585 | memcpy(new->data, data, raw_size); | ||
586 | |||
587 | __queue_raw_event(new); | ||
588 | last_inserted = new; | ||
589 | |||
590 | /* | ||
591 | * We want to have a slice of events covering 2 * FLUSH_PERIOD | ||
592 | * If FLUSH_PERIOD is big enough, it ensures every events that occured | ||
593 | * in the first half of the timeslice have all been buffered and there | ||
594 | * are none remaining (we need that because of the weakly ordered | ||
595 | * event recording we have). Then once we reach the 2 * FLUSH_PERIOD | ||
596 | * timeslice, we flush the first half to be gentle with the memory | ||
597 | * (the second half can still get new events in the middle, so wait | ||
598 | * another period to flush it) | ||
599 | */ | ||
600 | if (new->timestamp > flush_limit && | ||
601 | new->timestamp - flush_limit > FLUSH_PERIOD) { | ||
602 | flush_limit += FLUSH_PERIOD; | ||
603 | flush_raw_event_queue(flush_limit); | ||
604 | } | ||
605 | } | ||
606 | |||
607 | static int process_sample_event(event_t *event, struct perf_session *session) | ||
608 | { | ||
609 | struct thread *thread; | ||
610 | struct sample_data data; | ||
611 | |||
612 | bzero(&data, sizeof(struct sample_data)); | ||
613 | event__parse_sample(event, session->sample_type, &data); | ||
614 | thread = perf_session__findnew(session, data.pid); | ||
615 | |||
616 | if (thread == NULL) { | ||
617 | pr_debug("problem processing %d event, skipping it.\n", | ||
618 | event->header.type); | ||
619 | return -1; | ||
620 | } | ||
621 | |||
622 | dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid); | ||
623 | |||
624 | if (profile_cpu != -1 && profile_cpu != (int) data.cpu) | ||
625 | return 0; | ||
626 | |||
627 | queue_raw_event(data.raw_data, data.raw_size, data.cpu, data.time, thread); | ||
628 | |||
629 | return 0; | ||
630 | } | 741 | } |
631 | 742 | ||
632 | /* TODO: various way to print, coloring, nano or milli sec */ | 743 | /* TODO: various way to print, coloring, nano or milli sec */ |
@@ -634,26 +745,30 @@ static void print_result(void) | |||
634 | { | 745 | { |
635 | struct lock_stat *st; | 746 | struct lock_stat *st; |
636 | char cut_name[20]; | 747 | char cut_name[20]; |
748 | int bad, total; | ||
637 | 749 | ||
638 | printf("%18s ", "ID"); | 750 | pr_info("%20s ", "Name"); |
639 | printf("%20s ", "Name"); | 751 | pr_info("%10s ", "acquired"); |
640 | printf("%10s ", "acquired"); | 752 | pr_info("%10s ", "contended"); |
641 | printf("%10s ", "contended"); | ||
642 | 753 | ||
643 | printf("%15s ", "total wait (ns)"); | 754 | pr_info("%15s ", "total wait (ns)"); |
644 | printf("%15s ", "max wait (ns)"); | 755 | pr_info("%15s ", "max wait (ns)"); |
645 | printf("%15s ", "min wait (ns)"); | 756 | pr_info("%15s ", "min wait (ns)"); |
646 | 757 | ||
647 | printf("\n\n"); | 758 | pr_info("\n\n"); |
648 | 759 | ||
760 | bad = total = 0; | ||
649 | while ((st = pop_from_result())) { | 761 | while ((st = pop_from_result())) { |
762 | total++; | ||
763 | if (st->discard) { | ||
764 | bad++; | ||
765 | continue; | ||
766 | } | ||
650 | bzero(cut_name, 20); | 767 | bzero(cut_name, 20); |
651 | 768 | ||
652 | printf("%p ", st->addr); | ||
653 | |||
654 | if (strlen(st->name) < 16) { | 769 | if (strlen(st->name) < 16) { |
655 | /* output raw name */ | 770 | /* output raw name */ |
656 | printf("%20s ", st->name); | 771 | pr_info("%20s ", st->name); |
657 | } else { | 772 | } else { |
658 | strncpy(cut_name, st->name, 16); | 773 | strncpy(cut_name, st->name, 16); |
659 | cut_name[16] = '.'; | 774 | cut_name[16] = '.'; |
@@ -661,18 +776,40 @@ static void print_result(void) | |||
661 | cut_name[18] = '.'; | 776 | cut_name[18] = '.'; |
662 | cut_name[19] = '\0'; | 777 | cut_name[19] = '\0'; |
663 | /* cut off name for saving output style */ | 778 | /* cut off name for saving output style */ |
664 | printf("%20s ", cut_name); | 779 | pr_info("%20s ", cut_name); |
665 | } | 780 | } |
666 | 781 | ||
667 | printf("%10u ", st->nr_acquired); | 782 | pr_info("%10u ", st->nr_acquired); |
668 | printf("%10u ", st->nr_contended); | 783 | pr_info("%10u ", st->nr_contended); |
669 | 784 | ||
670 | printf("%15llu ", st->wait_time_total); | 785 | pr_info("%15llu ", st->wait_time_total); |
671 | printf("%15llu ", st->wait_time_max); | 786 | pr_info("%15llu ", st->wait_time_max); |
672 | printf("%15llu ", st->wait_time_min == ULLONG_MAX ? | 787 | pr_info("%15llu ", st->wait_time_min == ULLONG_MAX ? |
673 | 0 : st->wait_time_min); | 788 | 0 : st->wait_time_min); |
674 | printf("\n"); | 789 | pr_info("\n"); |
675 | } | 790 | } |
791 | |||
792 | print_bad_events(bad, total); | ||
793 | } | ||
794 | |||
795 | static int info_threads; | ||
796 | static int info_map; | ||
797 | |||
798 | static void dump_threads(void) | ||
799 | { | ||
800 | struct thread_stat *st; | ||
801 | struct rb_node *node; | ||
802 | struct thread *t; | ||
803 | |||
804 | pr_info("%10s: comm\n", "Thread ID"); | ||
805 | |||
806 | node = rb_first(&thread_stats); | ||
807 | while (node) { | ||
808 | st = container_of(node, struct thread_stat, rb); | ||
809 | t = perf_session__findnew(session, st->tid); | ||
810 | pr_info("%10d: %s\n", st->tid, t->comm); | ||
811 | node = rb_next(node); | ||
812 | }; | ||
676 | } | 813 | } |
677 | 814 | ||
678 | static void dump_map(void) | 815 | static void dump_map(void) |
@@ -680,23 +817,53 @@ static void dump_map(void) | |||
680 | unsigned int i; | 817 | unsigned int i; |
681 | struct lock_stat *st; | 818 | struct lock_stat *st; |
682 | 819 | ||
820 | pr_info("Address of instance: name of class\n"); | ||
683 | for (i = 0; i < LOCKHASH_SIZE; i++) { | 821 | for (i = 0; i < LOCKHASH_SIZE; i++) { |
684 | list_for_each_entry(st, &lockhash_table[i], hash_entry) { | 822 | list_for_each_entry(st, &lockhash_table[i], hash_entry) { |
685 | printf("%p: %s\n", st->addr, st->name); | 823 | pr_info(" %p: %s\n", st->addr, st->name); |
686 | } | 824 | } |
687 | } | 825 | } |
688 | } | 826 | } |
689 | 827 | ||
828 | static void dump_info(void) | ||
829 | { | ||
830 | if (info_threads) | ||
831 | dump_threads(); | ||
832 | else if (info_map) | ||
833 | dump_map(); | ||
834 | else | ||
835 | die("Unknown type of information\n"); | ||
836 | } | ||
837 | |||
838 | static int process_sample_event(event_t *self, struct perf_session *s) | ||
839 | { | ||
840 | struct sample_data data; | ||
841 | struct thread *thread; | ||
842 | |||
843 | bzero(&data, sizeof(data)); | ||
844 | event__parse_sample(self, s->sample_type, &data); | ||
845 | |||
846 | thread = perf_session__findnew(s, data.tid); | ||
847 | if (thread == NULL) { | ||
848 | pr_debug("problem processing %d event, skipping it.\n", | ||
849 | self->header.type); | ||
850 | return -1; | ||
851 | } | ||
852 | |||
853 | process_raw_event(data.raw_data, data.cpu, data.time, thread); | ||
854 | |||
855 | return 0; | ||
856 | } | ||
857 | |||
690 | static struct perf_event_ops eops = { | 858 | static struct perf_event_ops eops = { |
691 | .sample = process_sample_event, | 859 | .sample = process_sample_event, |
692 | .comm = event__process_comm, | 860 | .comm = event__process_comm, |
861 | .ordered_samples = true, | ||
693 | }; | 862 | }; |
694 | 863 | ||
695 | static struct perf_session *session; | ||
696 | |||
697 | static int read_events(void) | 864 | static int read_events(void) |
698 | { | 865 | { |
699 | session = perf_session__new(input_name, O_RDONLY, 0); | 866 | session = perf_session__new(input_name, O_RDONLY, 0, false); |
700 | if (!session) | 867 | if (!session) |
701 | die("Initializing perf session failed\n"); | 868 | die("Initializing perf session failed\n"); |
702 | 869 | ||
@@ -720,7 +887,6 @@ static void __cmd_report(void) | |||
720 | setup_pager(); | 887 | setup_pager(); |
721 | select_key(); | 888 | select_key(); |
722 | read_events(); | 889 | read_events(); |
723 | flush_raw_event_queue(ULLONG_MAX); | ||
724 | sort_result(); | 890 | sort_result(); |
725 | print_result(); | 891 | print_result(); |
726 | } | 892 | } |
@@ -737,6 +903,19 @@ static const struct option report_options[] = { | |||
737 | OPT_END() | 903 | OPT_END() |
738 | }; | 904 | }; |
739 | 905 | ||
906 | static const char * const info_usage[] = { | ||
907 | "perf lock info [<options>]", | ||
908 | NULL | ||
909 | }; | ||
910 | |||
911 | static const struct option info_options[] = { | ||
912 | OPT_BOOLEAN('t', "threads", &info_threads, | ||
913 | "dump thread list in perf.data"), | ||
914 | OPT_BOOLEAN('m', "map", &info_map, | ||
915 | "map of lock instances (name:address table)"), | ||
916 | OPT_END() | ||
917 | }; | ||
918 | |||
740 | static const char * const lock_usage[] = { | 919 | static const char * const lock_usage[] = { |
741 | "perf lock [<options>] {record|trace|report}", | 920 | "perf lock [<options>] {record|trace|report}", |
742 | NULL | 921 | NULL |
@@ -744,14 +923,13 @@ static const char * const lock_usage[] = { | |||
744 | 923 | ||
745 | static const struct option lock_options[] = { | 924 | static const struct option lock_options[] = { |
746 | OPT_STRING('i', "input", &input_name, "file", "input file name"), | 925 | OPT_STRING('i', "input", &input_name, "file", "input file name"), |
747 | OPT_BOOLEAN('v', "verbose", &verbose, "be more verbose (show symbol address, etc)"), | 926 | OPT_INCR('v', "verbose", &verbose, "be more verbose (show symbol address, etc)"), |
748 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, "dump raw trace in ASCII"), | 927 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, "dump raw trace in ASCII"), |
749 | OPT_END() | 928 | OPT_END() |
750 | }; | 929 | }; |
751 | 930 | ||
752 | static const char *record_args[] = { | 931 | static const char *record_args[] = { |
753 | "record", | 932 | "record", |
754 | "-a", | ||
755 | "-R", | 933 | "-R", |
756 | "-f", | 934 | "-f", |
757 | "-m", "1024", | 935 | "-m", "1024", |
@@ -808,12 +986,18 @@ int cmd_lock(int argc, const char **argv, const char *prefix __used) | |||
808 | } else if (!strcmp(argv[0], "trace")) { | 986 | } else if (!strcmp(argv[0], "trace")) { |
809 | /* Aliased to 'perf trace' */ | 987 | /* Aliased to 'perf trace' */ |
810 | return cmd_trace(argc, argv, prefix); | 988 | return cmd_trace(argc, argv, prefix); |
811 | } else if (!strcmp(argv[0], "map")) { | 989 | } else if (!strcmp(argv[0], "info")) { |
990 | if (argc) { | ||
991 | argc = parse_options(argc, argv, | ||
992 | info_options, info_usage, 0); | ||
993 | if (argc) | ||
994 | usage_with_options(info_usage, info_options); | ||
995 | } | ||
812 | /* recycling report_lock_ops */ | 996 | /* recycling report_lock_ops */ |
813 | trace_handler = &report_lock_ops; | 997 | trace_handler = &report_lock_ops; |
814 | setup_pager(); | 998 | setup_pager(); |
815 | read_events(); | 999 | read_events(); |
816 | dump_map(); | 1000 | dump_info(); |
817 | } else { | 1001 | } else { |
818 | usage_with_options(lock_usage, lock_options); | 1002 | usage_with_options(lock_usage, lock_options); |
819 | } | 1003 | } |
diff --git a/tools/perf/builtin-probe.c b/tools/perf/builtin-probe.c index 152d6c9b1fa4..61c6d70732c9 100644 --- a/tools/perf/builtin-probe.c +++ b/tools/perf/builtin-probe.c | |||
@@ -36,13 +36,10 @@ | |||
36 | #include "builtin.h" | 36 | #include "builtin.h" |
37 | #include "util/util.h" | 37 | #include "util/util.h" |
38 | #include "util/strlist.h" | 38 | #include "util/strlist.h" |
39 | #include "util/event.h" | 39 | #include "util/symbol.h" |
40 | #include "util/debug.h" | 40 | #include "util/debug.h" |
41 | #include "util/debugfs.h" | 41 | #include "util/debugfs.h" |
42 | #include "util/symbol.h" | ||
43 | #include "util/thread.h" | ||
44 | #include "util/parse-options.h" | 42 | #include "util/parse-options.h" |
45 | #include "util/parse-events.h" /* For debugfs_path */ | ||
46 | #include "util/probe-finder.h" | 43 | #include "util/probe-finder.h" |
47 | #include "util/probe-event.h" | 44 | #include "util/probe-event.h" |
48 | 45 | ||
@@ -50,103 +47,84 @@ | |||
50 | 47 | ||
51 | /* Session management structure */ | 48 | /* Session management structure */ |
52 | static struct { | 49 | static struct { |
53 | bool need_dwarf; | ||
54 | bool list_events; | 50 | bool list_events; |
55 | bool force_add; | 51 | bool force_add; |
56 | bool show_lines; | 52 | bool show_lines; |
57 | int nr_probe; | 53 | int nevents; |
58 | struct probe_point probes[MAX_PROBES]; | 54 | struct perf_probe_event events[MAX_PROBES]; |
59 | struct strlist *dellist; | 55 | struct strlist *dellist; |
60 | struct map_groups kmap_groups; | ||
61 | struct map *kmaps[MAP__NR_TYPES]; | ||
62 | struct line_range line_range; | 56 | struct line_range line_range; |
63 | } session; | 57 | int max_probe_points; |
58 | } params; | ||
64 | 59 | ||
65 | 60 | ||
66 | /* Parse an event definition. Note that any error must die. */ | 61 | /* Parse an event definition. Note that any error must die. */ |
67 | static void parse_probe_event(const char *str) | 62 | static int parse_probe_event(const char *str) |
68 | { | 63 | { |
69 | struct probe_point *pp = &session.probes[session.nr_probe]; | 64 | struct perf_probe_event *pev = ¶ms.events[params.nevents]; |
65 | int ret; | ||
70 | 66 | ||
71 | pr_debug("probe-definition(%d): %s\n", session.nr_probe, str); | 67 | pr_debug("probe-definition(%d): %s\n", params.nevents, str); |
72 | if (++session.nr_probe == MAX_PROBES) | 68 | if (++params.nevents == MAX_PROBES) |
73 | die("Too many probes (> %d) are specified.", MAX_PROBES); | 69 | die("Too many probes (> %d) are specified.", MAX_PROBES); |
74 | 70 | ||
75 | /* Parse perf-probe event into probe_point */ | 71 | /* Parse a perf-probe command into event */ |
76 | parse_perf_probe_event(str, pp, &session.need_dwarf); | 72 | ret = parse_perf_probe_command(str, pev); |
73 | pr_debug("%d arguments\n", pev->nargs); | ||
77 | 74 | ||
78 | pr_debug("%d arguments\n", pp->nr_args); | 75 | return ret; |
79 | } | 76 | } |
80 | 77 | ||
81 | static void parse_probe_event_argv(int argc, const char **argv) | 78 | static int parse_probe_event_argv(int argc, const char **argv) |
82 | { | 79 | { |
83 | int i, len; | 80 | int i, len, ret; |
84 | char *buf; | 81 | char *buf; |
85 | 82 | ||
86 | /* Bind up rest arguments */ | 83 | /* Bind up rest arguments */ |
87 | len = 0; | 84 | len = 0; |
88 | for (i = 0; i < argc; i++) | 85 | for (i = 0; i < argc; i++) |
89 | len += strlen(argv[i]) + 1; | 86 | len += strlen(argv[i]) + 1; |
90 | buf = zalloc(len + 1); | 87 | buf = xzalloc(len + 1); |
91 | if (!buf) | ||
92 | die("Failed to allocate memory for binding arguments."); | ||
93 | len = 0; | 88 | len = 0; |
94 | for (i = 0; i < argc; i++) | 89 | for (i = 0; i < argc; i++) |
95 | len += sprintf(&buf[len], "%s ", argv[i]); | 90 | len += sprintf(&buf[len], "%s ", argv[i]); |
96 | parse_probe_event(buf); | 91 | ret = parse_probe_event(buf); |
97 | free(buf); | 92 | free(buf); |
93 | return ret; | ||
98 | } | 94 | } |
99 | 95 | ||
100 | static int opt_add_probe_event(const struct option *opt __used, | 96 | static int opt_add_probe_event(const struct option *opt __used, |
101 | const char *str, int unset __used) | 97 | const char *str, int unset __used) |
102 | { | 98 | { |
103 | if (str) | 99 | if (str) |
104 | parse_probe_event(str); | 100 | return parse_probe_event(str); |
105 | return 0; | 101 | else |
102 | return 0; | ||
106 | } | 103 | } |
107 | 104 | ||
108 | static int opt_del_probe_event(const struct option *opt __used, | 105 | static int opt_del_probe_event(const struct option *opt __used, |
109 | const char *str, int unset __used) | 106 | const char *str, int unset __used) |
110 | { | 107 | { |
111 | if (str) { | 108 | if (str) { |
112 | if (!session.dellist) | 109 | if (!params.dellist) |
113 | session.dellist = strlist__new(true, NULL); | 110 | params.dellist = strlist__new(true, NULL); |
114 | strlist__add(session.dellist, str); | 111 | strlist__add(params.dellist, str); |
115 | } | 112 | } |
116 | return 0; | 113 | return 0; |
117 | } | 114 | } |
118 | 115 | ||
119 | /* Currently just checking function name from symbol map */ | 116 | #ifdef DWARF_SUPPORT |
120 | static void evaluate_probe_point(struct probe_point *pp) | ||
121 | { | ||
122 | struct symbol *sym; | ||
123 | sym = map__find_symbol_by_name(session.kmaps[MAP__FUNCTION], | ||
124 | pp->function, NULL); | ||
125 | if (!sym) | ||
126 | die("Kernel symbol \'%s\' not found - probe not added.", | ||
127 | pp->function); | ||
128 | } | ||
129 | |||
130 | #ifndef NO_DWARF_SUPPORT | ||
131 | static int open_vmlinux(void) | ||
132 | { | ||
133 | if (map__load(session.kmaps[MAP__FUNCTION], NULL) < 0) { | ||
134 | pr_debug("Failed to load kernel map.\n"); | ||
135 | return -EINVAL; | ||
136 | } | ||
137 | pr_debug("Try to open %s\n", | ||
138 | session.kmaps[MAP__FUNCTION]->dso->long_name); | ||
139 | return open(session.kmaps[MAP__FUNCTION]->dso->long_name, O_RDONLY); | ||
140 | } | ||
141 | |||
142 | static int opt_show_lines(const struct option *opt __used, | 117 | static int opt_show_lines(const struct option *opt __used, |
143 | const char *str, int unset __used) | 118 | const char *str, int unset __used) |
144 | { | 119 | { |
120 | int ret = 0; | ||
121 | |||
145 | if (str) | 122 | if (str) |
146 | parse_line_range_desc(str, &session.line_range); | 123 | ret = parse_line_range_desc(str, ¶ms.line_range); |
147 | INIT_LIST_HEAD(&session.line_range.line_list); | 124 | INIT_LIST_HEAD(¶ms.line_range.line_list); |
148 | session.show_lines = true; | 125 | params.show_lines = true; |
149 | return 0; | 126 | |
127 | return ret; | ||
150 | } | 128 | } |
151 | #endif | 129 | #endif |
152 | 130 | ||
@@ -155,29 +133,25 @@ static const char * const probe_usage[] = { | |||
155 | "perf probe [<options>] --add 'PROBEDEF' [--add 'PROBEDEF' ...]", | 133 | "perf probe [<options>] --add 'PROBEDEF' [--add 'PROBEDEF' ...]", |
156 | "perf probe [<options>] --del '[GROUP:]EVENT' ...", | 134 | "perf probe [<options>] --del '[GROUP:]EVENT' ...", |
157 | "perf probe --list", | 135 | "perf probe --list", |
158 | #ifndef NO_DWARF_SUPPORT | 136 | #ifdef DWARF_SUPPORT |
159 | "perf probe --line 'LINEDESC'", | 137 | "perf probe --line 'LINEDESC'", |
160 | #endif | 138 | #endif |
161 | NULL | 139 | NULL |
162 | }; | 140 | }; |
163 | 141 | ||
164 | static const struct option options[] = { | 142 | static const struct option options[] = { |
165 | OPT_BOOLEAN('v', "verbose", &verbose, | 143 | OPT_INCR('v', "verbose", &verbose, |
166 | "be more verbose (show parsed arguments, etc)"), | 144 | "be more verbose (show parsed arguments, etc)"), |
167 | #ifndef NO_DWARF_SUPPORT | 145 | OPT_BOOLEAN('l', "list", ¶ms.list_events, |
168 | OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name, | ||
169 | "file", "vmlinux pathname"), | ||
170 | #endif | ||
171 | OPT_BOOLEAN('l', "list", &session.list_events, | ||
172 | "list up current probe events"), | 146 | "list up current probe events"), |
173 | OPT_CALLBACK('d', "del", NULL, "[GROUP:]EVENT", "delete a probe event.", | 147 | OPT_CALLBACK('d', "del", NULL, "[GROUP:]EVENT", "delete a probe event.", |
174 | opt_del_probe_event), | 148 | opt_del_probe_event), |
175 | OPT_CALLBACK('a', "add", NULL, | 149 | OPT_CALLBACK('a', "add", NULL, |
176 | #ifdef NO_DWARF_SUPPORT | 150 | #ifdef DWARF_SUPPORT |
177 | "[EVENT=]FUNC[+OFF|%return] [ARG ...]", | ||
178 | #else | ||
179 | "[EVENT=]FUNC[@SRC][+OFF|%return|:RL|;PT]|SRC:AL|SRC;PT" | 151 | "[EVENT=]FUNC[@SRC][+OFF|%return|:RL|;PT]|SRC:AL|SRC;PT" |
180 | " [ARG ...]", | 152 | " [[NAME=]ARG ...]", |
153 | #else | ||
154 | "[EVENT=]FUNC[+OFF|%return] [[NAME=]ARG ...]", | ||
181 | #endif | 155 | #endif |
182 | "probe point definition, where\n" | 156 | "probe point definition, where\n" |
183 | "\t\tGROUP:\tGroup name (optional)\n" | 157 | "\t\tGROUP:\tGroup name (optional)\n" |
@@ -185,51 +159,35 @@ static const struct option options[] = { | |||
185 | "\t\tFUNC:\tFunction name\n" | 159 | "\t\tFUNC:\tFunction name\n" |
186 | "\t\tOFF:\tOffset from function entry (in byte)\n" | 160 | "\t\tOFF:\tOffset from function entry (in byte)\n" |
187 | "\t\t%return:\tPut the probe at function return\n" | 161 | "\t\t%return:\tPut the probe at function return\n" |
188 | #ifdef NO_DWARF_SUPPORT | 162 | #ifdef DWARF_SUPPORT |
189 | "\t\tARG:\tProbe argument (only \n" | ||
190 | #else | ||
191 | "\t\tSRC:\tSource code path\n" | 163 | "\t\tSRC:\tSource code path\n" |
192 | "\t\tRL:\tRelative line number from function entry.\n" | 164 | "\t\tRL:\tRelative line number from function entry.\n" |
193 | "\t\tAL:\tAbsolute line number in file.\n" | 165 | "\t\tAL:\tAbsolute line number in file.\n" |
194 | "\t\tPT:\tLazy expression of line code.\n" | 166 | "\t\tPT:\tLazy expression of line code.\n" |
195 | "\t\tARG:\tProbe argument (local variable name or\n" | 167 | "\t\tARG:\tProbe argument (local variable name or\n" |
196 | #endif | ||
197 | "\t\t\tkprobe-tracer argument format.)\n", | 168 | "\t\t\tkprobe-tracer argument format.)\n", |
169 | #else | ||
170 | "\t\tARG:\tProbe argument (kprobe-tracer argument format.)\n", | ||
171 | #endif | ||
198 | opt_add_probe_event), | 172 | opt_add_probe_event), |
199 | OPT_BOOLEAN('f', "force", &session.force_add, "forcibly add events" | 173 | OPT_BOOLEAN('f', "force", ¶ms.force_add, "forcibly add events" |
200 | " with existing name"), | 174 | " with existing name"), |
201 | #ifndef NO_DWARF_SUPPORT | 175 | #ifdef DWARF_SUPPORT |
202 | OPT_CALLBACK('L', "line", NULL, | 176 | OPT_CALLBACK('L', "line", NULL, |
203 | "FUNC[:RLN[+NUM|:RLN2]]|SRC:ALN[+NUM|:ALN2]", | 177 | "FUNC[:RLN[+NUM|-RLN2]]|SRC:ALN[+NUM|-ALN2]", |
204 | "Show source code lines.", opt_show_lines), | 178 | "Show source code lines.", opt_show_lines), |
179 | OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name, | ||
180 | "file", "vmlinux pathname"), | ||
205 | #endif | 181 | #endif |
182 | OPT__DRY_RUN(&probe_event_dry_run), | ||
183 | OPT_INTEGER('\0', "max-probes", ¶ms.max_probe_points, | ||
184 | "Set how many probe points can be found for a probe."), | ||
206 | OPT_END() | 185 | OPT_END() |
207 | }; | 186 | }; |
208 | 187 | ||
209 | /* Initialize symbol maps for vmlinux */ | ||
210 | static void init_vmlinux(void) | ||
211 | { | ||
212 | symbol_conf.sort_by_name = true; | ||
213 | if (symbol_conf.vmlinux_name == NULL) | ||
214 | symbol_conf.try_vmlinux_path = true; | ||
215 | else | ||
216 | pr_debug("Use vmlinux: %s\n", symbol_conf.vmlinux_name); | ||
217 | if (symbol__init() < 0) | ||
218 | die("Failed to init symbol map."); | ||
219 | |||
220 | map_groups__init(&session.kmap_groups); | ||
221 | if (map_groups__create_kernel_maps(&session.kmap_groups, | ||
222 | session.kmaps) < 0) | ||
223 | die("Failed to create kernel maps."); | ||
224 | } | ||
225 | |||
226 | int cmd_probe(int argc, const char **argv, const char *prefix __used) | 188 | int cmd_probe(int argc, const char **argv, const char *prefix __used) |
227 | { | 189 | { |
228 | int i, ret; | 190 | int ret; |
229 | #ifndef NO_DWARF_SUPPORT | ||
230 | int fd; | ||
231 | #endif | ||
232 | struct probe_point *pp; | ||
233 | 191 | ||
234 | argc = parse_options(argc, argv, options, probe_usage, | 192 | argc = parse_options(argc, argv, options, probe_usage, |
235 | PARSE_OPT_STOP_AT_NON_OPTION); | 193 | PARSE_OPT_STOP_AT_NON_OPTION); |
@@ -238,123 +196,69 @@ int cmd_probe(int argc, const char **argv, const char *prefix __used) | |||
238 | pr_warning(" Error: '-' is not supported.\n"); | 196 | pr_warning(" Error: '-' is not supported.\n"); |
239 | usage_with_options(probe_usage, options); | 197 | usage_with_options(probe_usage, options); |
240 | } | 198 | } |
241 | parse_probe_event_argv(argc, argv); | 199 | ret = parse_probe_event_argv(argc, argv); |
200 | if (ret < 0) { | ||
201 | pr_err(" Error: Parse Error. (%d)\n", ret); | ||
202 | return ret; | ||
203 | } | ||
242 | } | 204 | } |
243 | 205 | ||
244 | if ((!session.nr_probe && !session.dellist && !session.list_events && | 206 | if (params.max_probe_points == 0) |
245 | !session.show_lines)) | 207 | params.max_probe_points = MAX_PROBES; |
246 | usage_with_options(probe_usage, options); | ||
247 | 208 | ||
248 | if (debugfs_valid_mountpoint(debugfs_path) < 0) | 209 | if ((!params.nevents && !params.dellist && !params.list_events && |
249 | die("Failed to find debugfs path."); | 210 | !params.show_lines)) |
211 | usage_with_options(probe_usage, options); | ||
250 | 212 | ||
251 | if (session.list_events) { | 213 | if (params.list_events) { |
252 | if (session.nr_probe != 0 || session.dellist) { | 214 | if (params.nevents != 0 || params.dellist) { |
253 | pr_warning(" Error: Don't use --list with" | 215 | pr_err(" Error: Don't use --list with --add/--del.\n"); |
254 | " --add/--del.\n"); | ||
255 | usage_with_options(probe_usage, options); | 216 | usage_with_options(probe_usage, options); |
256 | } | 217 | } |
257 | if (session.show_lines) { | 218 | if (params.show_lines) { |
258 | pr_warning(" Error: Don't use --list with --line.\n"); | 219 | pr_err(" Error: Don't use --list with --line.\n"); |
259 | usage_with_options(probe_usage, options); | 220 | usage_with_options(probe_usage, options); |
260 | } | 221 | } |
261 | show_perf_probe_events(); | 222 | ret = show_perf_probe_events(); |
262 | return 0; | 223 | if (ret < 0) |
224 | pr_err(" Error: Failed to show event list. (%d)\n", | ||
225 | ret); | ||
226 | return ret; | ||
263 | } | 227 | } |
264 | 228 | ||
265 | #ifndef NO_DWARF_SUPPORT | 229 | #ifdef DWARF_SUPPORT |
266 | if (session.show_lines) { | 230 | if (params.show_lines) { |
267 | if (session.nr_probe != 0 || session.dellist) { | 231 | if (params.nevents != 0 || params.dellist) { |
268 | pr_warning(" Error: Don't use --line with" | 232 | pr_warning(" Error: Don't use --line with" |
269 | " --add/--del.\n"); | 233 | " --add/--del.\n"); |
270 | usage_with_options(probe_usage, options); | 234 | usage_with_options(probe_usage, options); |
271 | } | 235 | } |
272 | init_vmlinux(); | ||
273 | fd = open_vmlinux(); | ||
274 | if (fd < 0) | ||
275 | die("Could not open debuginfo file."); | ||
276 | ret = find_line_range(fd, &session.line_range); | ||
277 | if (ret <= 0) | ||
278 | die("Source line is not found.\n"); | ||
279 | close(fd); | ||
280 | show_line_range(&session.line_range); | ||
281 | return 0; | ||
282 | } | ||
283 | #endif | ||
284 | 236 | ||
285 | if (session.dellist) { | 237 | ret = show_line_range(¶ms.line_range); |
286 | del_trace_kprobe_events(session.dellist); | 238 | if (ret < 0) |
287 | strlist__delete(session.dellist); | 239 | pr_err(" Error: Failed to show lines. (%d)\n", ret); |
288 | if (session.nr_probe == 0) | 240 | return ret; |
289 | return 0; | ||
290 | } | 241 | } |
242 | #endif | ||
291 | 243 | ||
292 | /* Add probes */ | 244 | if (params.dellist) { |
293 | init_vmlinux(); | 245 | ret = del_perf_probe_events(params.dellist); |
294 | 246 | strlist__delete(params.dellist); | |
295 | if (session.need_dwarf) | 247 | if (ret < 0) { |
296 | #ifdef NO_DWARF_SUPPORT | 248 | pr_err(" Error: Failed to delete events. (%d)\n", ret); |
297 | die("Debuginfo-analysis is not supported"); | 249 | return ret; |
298 | #else /* !NO_DWARF_SUPPORT */ | ||
299 | pr_debug("Some probes require debuginfo.\n"); | ||
300 | |||
301 | fd = open_vmlinux(); | ||
302 | if (fd < 0) { | ||
303 | if (session.need_dwarf) | ||
304 | die("Could not open debuginfo file."); | ||
305 | |||
306 | pr_debug("Could not open vmlinux/module file." | ||
307 | " Try to use symbols.\n"); | ||
308 | goto end_dwarf; | ||
309 | } | ||
310 | |||
311 | /* Searching probe points */ | ||
312 | for (i = 0; i < session.nr_probe; i++) { | ||
313 | pp = &session.probes[i]; | ||
314 | if (pp->found) | ||
315 | continue; | ||
316 | |||
317 | lseek(fd, SEEK_SET, 0); | ||
318 | ret = find_probe_point(fd, pp); | ||
319 | if (ret > 0) | ||
320 | continue; | ||
321 | if (ret == 0) { /* No error but failed to find probe point. */ | ||
322 | synthesize_perf_probe_point(pp); | ||
323 | die("Probe point '%s' not found. - probe not added.", | ||
324 | pp->probes[0]); | ||
325 | } | ||
326 | /* Error path */ | ||
327 | if (session.need_dwarf) { | ||
328 | if (ret == -ENOENT) | ||
329 | pr_warning("No dwarf info found in the vmlinux - please rebuild with CONFIG_DEBUG_INFO=y.\n"); | ||
330 | die("Could not analyze debuginfo."); | ||
331 | } | 250 | } |
332 | pr_debug("An error occurred in debuginfo analysis." | ||
333 | " Try to use symbols.\n"); | ||
334 | break; | ||
335 | } | 251 | } |
336 | close(fd); | ||
337 | |||
338 | end_dwarf: | ||
339 | #endif /* !NO_DWARF_SUPPORT */ | ||
340 | 252 | ||
341 | /* Synthesize probes without dwarf */ | 253 | if (params.nevents) { |
342 | for (i = 0; i < session.nr_probe; i++) { | 254 | ret = add_perf_probe_events(params.events, params.nevents, |
343 | pp = &session.probes[i]; | 255 | params.force_add, |
344 | if (pp->found) /* This probe is already found. */ | 256 | params.max_probe_points); |
345 | continue; | 257 | if (ret < 0) { |
346 | 258 | pr_err(" Error: Failed to add events. (%d)\n", ret); | |
347 | evaluate_probe_point(pp); | 259 | return ret; |
348 | ret = synthesize_trace_kprobe_event(pp); | 260 | } |
349 | if (ret == -E2BIG) | ||
350 | die("probe point definition becomes too long."); | ||
351 | else if (ret < 0) | ||
352 | die("Failed to synthesize a probe point."); | ||
353 | } | 261 | } |
354 | |||
355 | /* Settng up probe points */ | ||
356 | add_trace_kprobe_events(session.probes, session.nr_probe, | ||
357 | session.force_add); | ||
358 | return 0; | 262 | return 0; |
359 | } | 263 | } |
360 | 264 | ||
diff --git a/tools/perf/builtin-record.c b/tools/perf/builtin-record.c index 3b8b6387c47c..0f467cf7aa72 100644 --- a/tools/perf/builtin-record.c +++ b/tools/perf/builtin-record.c | |||
@@ -15,7 +15,6 @@ | |||
15 | #include "util/util.h" | 15 | #include "util/util.h" |
16 | #include "util/parse-options.h" | 16 | #include "util/parse-options.h" |
17 | #include "util/parse-events.h" | 17 | #include "util/parse-events.h" |
18 | #include "util/string.h" | ||
19 | 18 | ||
20 | #include "util/header.h" | 19 | #include "util/header.h" |
21 | #include "util/event.h" | 20 | #include "util/event.h" |
@@ -27,31 +26,41 @@ | |||
27 | #include <unistd.h> | 26 | #include <unistd.h> |
28 | #include <sched.h> | 27 | #include <sched.h> |
29 | 28 | ||
30 | static int fd[MAX_NR_CPUS][MAX_COUNTERS]; | 29 | enum write_mode_t { |
30 | WRITE_FORCE, | ||
31 | WRITE_APPEND | ||
32 | }; | ||
33 | |||
34 | static int *fd[MAX_NR_CPUS][MAX_COUNTERS]; | ||
31 | 35 | ||
36 | static unsigned int user_interval = UINT_MAX; | ||
32 | static long default_interval = 0; | 37 | static long default_interval = 0; |
33 | 38 | ||
34 | static int nr_cpus = 0; | 39 | static int nr_cpus = 0; |
35 | static unsigned int page_size; | 40 | static unsigned int page_size; |
36 | static unsigned int mmap_pages = 128; | 41 | static unsigned int mmap_pages = 128; |
42 | static unsigned int user_freq = UINT_MAX; | ||
37 | static int freq = 1000; | 43 | static int freq = 1000; |
38 | static int output; | 44 | static int output; |
45 | static int pipe_output = 0; | ||
39 | static const char *output_name = "perf.data"; | 46 | static const char *output_name = "perf.data"; |
40 | static int group = 0; | 47 | static int group = 0; |
41 | static unsigned int realtime_prio = 0; | 48 | static unsigned int realtime_prio = 0; |
42 | static int raw_samples = 0; | 49 | static bool raw_samples = false; |
43 | static int system_wide = 0; | 50 | static bool system_wide = false; |
44 | static int profile_cpu = -1; | 51 | static int profile_cpu = -1; |
45 | static pid_t target_pid = -1; | 52 | static pid_t target_pid = -1; |
53 | static pid_t target_tid = -1; | ||
54 | static pid_t *all_tids = NULL; | ||
55 | static int thread_num = 0; | ||
46 | static pid_t child_pid = -1; | 56 | static pid_t child_pid = -1; |
47 | static int inherit = 1; | 57 | static bool no_inherit = false; |
48 | static int force = 0; | 58 | static enum write_mode_t write_mode = WRITE_FORCE; |
49 | static int append_file = 0; | 59 | static bool call_graph = false; |
50 | static int call_graph = 0; | 60 | static bool inherit_stat = false; |
51 | static int inherit_stat = 0; | 61 | static bool no_samples = false; |
52 | static int no_samples = 0; | 62 | static bool sample_address = false; |
53 | static int sample_address = 0; | 63 | static bool multiplex = false; |
54 | static int multiplex = 0; | ||
55 | static int multiplex_fd = -1; | 64 | static int multiplex_fd = -1; |
56 | 65 | ||
57 | static long samples = 0; | 66 | static long samples = 0; |
@@ -60,7 +69,7 @@ static struct timeval this_read; | |||
60 | 69 | ||
61 | static u64 bytes_written = 0; | 70 | static u64 bytes_written = 0; |
62 | 71 | ||
63 | static struct pollfd event_array[MAX_NR_CPUS * MAX_COUNTERS]; | 72 | static struct pollfd *event_array; |
64 | 73 | ||
65 | static int nr_poll = 0; | 74 | static int nr_poll = 0; |
66 | static int nr_cpu = 0; | 75 | static int nr_cpu = 0; |
@@ -77,7 +86,7 @@ struct mmap_data { | |||
77 | unsigned int prev; | 86 | unsigned int prev; |
78 | }; | 87 | }; |
79 | 88 | ||
80 | static struct mmap_data mmap_array[MAX_NR_CPUS][MAX_COUNTERS]; | 89 | static struct mmap_data *mmap_array[MAX_NR_CPUS][MAX_COUNTERS]; |
81 | 90 | ||
82 | static unsigned long mmap_read_head(struct mmap_data *md) | 91 | static unsigned long mmap_read_head(struct mmap_data *md) |
83 | { | 92 | { |
@@ -101,6 +110,11 @@ static void mmap_write_tail(struct mmap_data *md, unsigned long tail) | |||
101 | pc->data_tail = tail; | 110 | pc->data_tail = tail; |
102 | } | 111 | } |
103 | 112 | ||
113 | static void advance_output(size_t size) | ||
114 | { | ||
115 | bytes_written += size; | ||
116 | } | ||
117 | |||
104 | static void write_output(void *buf, size_t size) | 118 | static void write_output(void *buf, size_t size) |
105 | { | 119 | { |
106 | while (size) { | 120 | while (size) { |
@@ -225,12 +239,13 @@ static struct perf_header_attr *get_header_attr(struct perf_event_attr *a, int n | |||
225 | return h_attr; | 239 | return h_attr; |
226 | } | 240 | } |
227 | 241 | ||
228 | static void create_counter(int counter, int cpu, pid_t pid) | 242 | static void create_counter(int counter, int cpu) |
229 | { | 243 | { |
230 | char *filter = filters[counter]; | 244 | char *filter = filters[counter]; |
231 | struct perf_event_attr *attr = attrs + counter; | 245 | struct perf_event_attr *attr = attrs + counter; |
232 | struct perf_header_attr *h_attr; | 246 | struct perf_header_attr *h_attr; |
233 | int track = !counter; /* only the first counter needs these */ | 247 | int track = !counter; /* only the first counter needs these */ |
248 | int thread_index; | ||
234 | int ret; | 249 | int ret; |
235 | struct { | 250 | struct { |
236 | u64 count; | 251 | u64 count; |
@@ -248,10 +263,19 @@ static void create_counter(int counter, int cpu, pid_t pid) | |||
248 | if (nr_counters > 1) | 263 | if (nr_counters > 1) |
249 | attr->sample_type |= PERF_SAMPLE_ID; | 264 | attr->sample_type |= PERF_SAMPLE_ID; |
250 | 265 | ||
251 | if (freq) { | 266 | /* |
252 | attr->sample_type |= PERF_SAMPLE_PERIOD; | 267 | * We default some events to a 1 default interval. But keep |
253 | attr->freq = 1; | 268 | * it a weak assumption overridable by the user. |
254 | attr->sample_freq = freq; | 269 | */ |
270 | if (!attr->sample_period || (user_freq != UINT_MAX && | ||
271 | user_interval != UINT_MAX)) { | ||
272 | if (freq) { | ||
273 | attr->sample_type |= PERF_SAMPLE_PERIOD; | ||
274 | attr->freq = 1; | ||
275 | attr->sample_freq = freq; | ||
276 | } else { | ||
277 | attr->sample_period = default_interval; | ||
278 | } | ||
255 | } | 279 | } |
256 | 280 | ||
257 | if (no_samples) | 281 | if (no_samples) |
@@ -274,119 +298,130 @@ static void create_counter(int counter, int cpu, pid_t pid) | |||
274 | 298 | ||
275 | attr->mmap = track; | 299 | attr->mmap = track; |
276 | attr->comm = track; | 300 | attr->comm = track; |
277 | attr->inherit = inherit; | 301 | attr->inherit = !no_inherit; |
278 | attr->disabled = 1; | 302 | if (target_pid == -1 && target_tid == -1 && !system_wide) { |
303 | attr->disabled = 1; | ||
304 | attr->enable_on_exec = 1; | ||
305 | } | ||
279 | 306 | ||
307 | for (thread_index = 0; thread_index < thread_num; thread_index++) { | ||
280 | try_again: | 308 | try_again: |
281 | fd[nr_cpu][counter] = sys_perf_event_open(attr, pid, cpu, group_fd, 0); | 309 | fd[nr_cpu][counter][thread_index] = sys_perf_event_open(attr, |
282 | 310 | all_tids[thread_index], cpu, group_fd, 0); | |
283 | if (fd[nr_cpu][counter] < 0) { | 311 | |
284 | int err = errno; | 312 | if (fd[nr_cpu][counter][thread_index] < 0) { |
285 | 313 | int err = errno; | |
286 | if (err == EPERM || err == EACCES) | 314 | |
287 | die("Permission error - are you root?\n"); | 315 | if (err == EPERM || err == EACCES) |
288 | else if (err == ENODEV && profile_cpu != -1) | 316 | die("Permission error - are you root?\n" |
289 | die("No such device - did you specify an out-of-range profile CPU?\n"); | 317 | "\t Consider tweaking" |
318 | " /proc/sys/kernel/perf_event_paranoid.\n"); | ||
319 | else if (err == ENODEV && profile_cpu != -1) { | ||
320 | die("No such device - did you specify" | ||
321 | " an out-of-range profile CPU?\n"); | ||
322 | } | ||
290 | 323 | ||
291 | /* | 324 | /* |
292 | * If it's cycles then fall back to hrtimer | 325 | * If it's cycles then fall back to hrtimer |
293 | * based cpu-clock-tick sw counter, which | 326 | * based cpu-clock-tick sw counter, which |
294 | * is always available even if no PMU support: | 327 | * is always available even if no PMU support: |
295 | */ | 328 | */ |
296 | if (attr->type == PERF_TYPE_HARDWARE | 329 | if (attr->type == PERF_TYPE_HARDWARE |
297 | && attr->config == PERF_COUNT_HW_CPU_CYCLES) { | 330 | && attr->config == PERF_COUNT_HW_CPU_CYCLES) { |
298 | 331 | ||
299 | if (verbose) | 332 | if (verbose) |
300 | warning(" ... trying to fall back to cpu-clock-ticks\n"); | 333 | warning(" ... trying to fall back to cpu-clock-ticks\n"); |
301 | attr->type = PERF_TYPE_SOFTWARE; | 334 | attr->type = PERF_TYPE_SOFTWARE; |
302 | attr->config = PERF_COUNT_SW_CPU_CLOCK; | 335 | attr->config = PERF_COUNT_SW_CPU_CLOCK; |
303 | goto try_again; | 336 | goto try_again; |
304 | } | 337 | } |
305 | printf("\n"); | 338 | printf("\n"); |
306 | error("perfcounter syscall returned with %d (%s)\n", | 339 | error("perfcounter syscall returned with %d (%s)\n", |
307 | fd[nr_cpu][counter], strerror(err)); | 340 | fd[nr_cpu][counter][thread_index], strerror(err)); |
308 | 341 | ||
309 | #if defined(__i386__) || defined(__x86_64__) | 342 | #if defined(__i386__) || defined(__x86_64__) |
310 | if (attr->type == PERF_TYPE_HARDWARE && err == EOPNOTSUPP) | 343 | if (attr->type == PERF_TYPE_HARDWARE && err == EOPNOTSUPP) |
311 | die("No hardware sampling interrupt available. No APIC? If so then you can boot the kernel with the \"lapic\" boot parameter to force-enable it.\n"); | 344 | die("No hardware sampling interrupt available." |
345 | " No APIC? If so then you can boot the kernel" | ||
346 | " with the \"lapic\" boot parameter to" | ||
347 | " force-enable it.\n"); | ||
312 | #endif | 348 | #endif |
313 | 349 | ||
314 | die("No CONFIG_PERF_EVENTS=y kernel support configured?\n"); | 350 | die("No CONFIG_PERF_EVENTS=y kernel support configured?\n"); |
315 | exit(-1); | 351 | exit(-1); |
316 | } | 352 | } |
317 | 353 | ||
318 | h_attr = get_header_attr(attr, counter); | 354 | h_attr = get_header_attr(attr, counter); |
319 | if (h_attr == NULL) | 355 | if (h_attr == NULL) |
320 | die("nomem\n"); | 356 | die("nomem\n"); |
321 | 357 | ||
322 | if (!file_new) { | 358 | if (!file_new) { |
323 | if (memcmp(&h_attr->attr, attr, sizeof(*attr))) { | 359 | if (memcmp(&h_attr->attr, attr, sizeof(*attr))) { |
324 | fprintf(stderr, "incompatible append\n"); | 360 | fprintf(stderr, "incompatible append\n"); |
325 | exit(-1); | 361 | exit(-1); |
362 | } | ||
326 | } | 363 | } |
327 | } | ||
328 | 364 | ||
329 | if (read(fd[nr_cpu][counter], &read_data, sizeof(read_data)) == -1) { | 365 | if (read(fd[nr_cpu][counter][thread_index], &read_data, sizeof(read_data)) == -1) { |
330 | perror("Unable to read perf file descriptor\n"); | 366 | perror("Unable to read perf file descriptor\n"); |
331 | exit(-1); | 367 | exit(-1); |
332 | } | 368 | } |
333 | 369 | ||
334 | if (perf_header_attr__add_id(h_attr, read_data.id) < 0) { | 370 | if (perf_header_attr__add_id(h_attr, read_data.id) < 0) { |
335 | pr_warning("Not enough memory to add id\n"); | 371 | pr_warning("Not enough memory to add id\n"); |
336 | exit(-1); | 372 | exit(-1); |
337 | } | 373 | } |
338 | 374 | ||
339 | assert(fd[nr_cpu][counter] >= 0); | 375 | assert(fd[nr_cpu][counter][thread_index] >= 0); |
340 | fcntl(fd[nr_cpu][counter], F_SETFL, O_NONBLOCK); | 376 | fcntl(fd[nr_cpu][counter][thread_index], F_SETFL, O_NONBLOCK); |
341 | 377 | ||
342 | /* | 378 | /* |
343 | * First counter acts as the group leader: | 379 | * First counter acts as the group leader: |
344 | */ | 380 | */ |
345 | if (group && group_fd == -1) | 381 | if (group && group_fd == -1) |
346 | group_fd = fd[nr_cpu][counter]; | 382 | group_fd = fd[nr_cpu][counter][thread_index]; |
347 | if (multiplex && multiplex_fd == -1) | 383 | if (multiplex && multiplex_fd == -1) |
348 | multiplex_fd = fd[nr_cpu][counter]; | 384 | multiplex_fd = fd[nr_cpu][counter][thread_index]; |
349 | 385 | ||
350 | if (multiplex && fd[nr_cpu][counter] != multiplex_fd) { | 386 | if (multiplex && fd[nr_cpu][counter][thread_index] != multiplex_fd) { |
351 | 387 | ||
352 | ret = ioctl(fd[nr_cpu][counter], PERF_EVENT_IOC_SET_OUTPUT, multiplex_fd); | 388 | ret = ioctl(fd[nr_cpu][counter][thread_index], PERF_EVENT_IOC_SET_OUTPUT, multiplex_fd); |
353 | assert(ret != -1); | 389 | assert(ret != -1); |
354 | } else { | 390 | } else { |
355 | event_array[nr_poll].fd = fd[nr_cpu][counter]; | 391 | event_array[nr_poll].fd = fd[nr_cpu][counter][thread_index]; |
356 | event_array[nr_poll].events = POLLIN; | 392 | event_array[nr_poll].events = POLLIN; |
357 | nr_poll++; | 393 | nr_poll++; |
358 | 394 | ||
359 | mmap_array[nr_cpu][counter].counter = counter; | 395 | mmap_array[nr_cpu][counter][thread_index].counter = counter; |
360 | mmap_array[nr_cpu][counter].prev = 0; | 396 | mmap_array[nr_cpu][counter][thread_index].prev = 0; |
361 | mmap_array[nr_cpu][counter].mask = mmap_pages*page_size - 1; | 397 | mmap_array[nr_cpu][counter][thread_index].mask = mmap_pages*page_size - 1; |
362 | mmap_array[nr_cpu][counter].base = mmap(NULL, (mmap_pages+1)*page_size, | 398 | mmap_array[nr_cpu][counter][thread_index].base = mmap(NULL, (mmap_pages+1)*page_size, |
363 | PROT_READ|PROT_WRITE, MAP_SHARED, fd[nr_cpu][counter], 0); | 399 | PROT_READ|PROT_WRITE, MAP_SHARED, fd[nr_cpu][counter][thread_index], 0); |
364 | if (mmap_array[nr_cpu][counter].base == MAP_FAILED) { | 400 | if (mmap_array[nr_cpu][counter][thread_index].base == MAP_FAILED) { |
365 | error("failed to mmap with %d (%s)\n", errno, strerror(errno)); | 401 | error("failed to mmap with %d (%s)\n", errno, strerror(errno)); |
366 | exit(-1); | 402 | exit(-1); |
403 | } | ||
367 | } | 404 | } |
368 | } | ||
369 | 405 | ||
370 | if (filter != NULL) { | 406 | if (filter != NULL) { |
371 | ret = ioctl(fd[nr_cpu][counter], | 407 | ret = ioctl(fd[nr_cpu][counter][thread_index], |
372 | PERF_EVENT_IOC_SET_FILTER, filter); | 408 | PERF_EVENT_IOC_SET_FILTER, filter); |
373 | if (ret) { | 409 | if (ret) { |
374 | error("failed to set filter with %d (%s)\n", errno, | 410 | error("failed to set filter with %d (%s)\n", errno, |
375 | strerror(errno)); | 411 | strerror(errno)); |
376 | exit(-1); | 412 | exit(-1); |
413 | } | ||
377 | } | 414 | } |
378 | } | 415 | } |
379 | |||
380 | ioctl(fd[nr_cpu][counter], PERF_EVENT_IOC_ENABLE); | ||
381 | } | 416 | } |
382 | 417 | ||
383 | static void open_counters(int cpu, pid_t pid) | 418 | static void open_counters(int cpu) |
384 | { | 419 | { |
385 | int counter; | 420 | int counter; |
386 | 421 | ||
387 | group_fd = -1; | 422 | group_fd = -1; |
388 | for (counter = 0; counter < nr_counters; counter++) | 423 | for (counter = 0; counter < nr_counters; counter++) |
389 | create_counter(counter, cpu, pid); | 424 | create_counter(counter, cpu); |
390 | 425 | ||
391 | nr_cpu++; | 426 | nr_cpu++; |
392 | } | 427 | } |
@@ -406,10 +441,80 @@ static int process_buildids(void) | |||
406 | 441 | ||
407 | static void atexit_header(void) | 442 | static void atexit_header(void) |
408 | { | 443 | { |
409 | session->header.data_size += bytes_written; | 444 | if (!pipe_output) { |
445 | session->header.data_size += bytes_written; | ||
446 | |||
447 | process_buildids(); | ||
448 | perf_header__write(&session->header, output, true); | ||
449 | } | ||
450 | } | ||
451 | |||
452 | static void event__synthesize_guest_os(struct machine *machine, void *data) | ||
453 | { | ||
454 | int err; | ||
455 | char *guest_kallsyms; | ||
456 | char path[PATH_MAX]; | ||
457 | struct perf_session *psession = data; | ||
458 | |||
459 | if (machine__is_host(machine)) | ||
460 | return; | ||
461 | |||
462 | /* | ||
463 | *As for guest kernel when processing subcommand record&report, | ||
464 | *we arrange module mmap prior to guest kernel mmap and trigger | ||
465 | *a preload dso because default guest module symbols are loaded | ||
466 | *from guest kallsyms instead of /lib/modules/XXX/XXX. This | ||
467 | *method is used to avoid symbol missing when the first addr is | ||
468 | *in module instead of in guest kernel. | ||
469 | */ | ||
470 | err = event__synthesize_modules(process_synthesized_event, | ||
471 | psession, machine); | ||
472 | if (err < 0) | ||
473 | pr_err("Couldn't record guest kernel [%d]'s reference" | ||
474 | " relocation symbol.\n", machine->pid); | ||
475 | |||
476 | if (machine__is_default_guest(machine)) | ||
477 | guest_kallsyms = (char *) symbol_conf.default_guest_kallsyms; | ||
478 | else { | ||
479 | sprintf(path, "%s/proc/kallsyms", machine->root_dir); | ||
480 | guest_kallsyms = path; | ||
481 | } | ||
482 | |||
483 | /* | ||
484 | * We use _stext for guest kernel because guest kernel's /proc/kallsyms | ||
485 | * have no _text sometimes. | ||
486 | */ | ||
487 | err = event__synthesize_kernel_mmap(process_synthesized_event, | ||
488 | psession, machine, "_text"); | ||
489 | if (err < 0) | ||
490 | err = event__synthesize_kernel_mmap(process_synthesized_event, | ||
491 | psession, machine, "_stext"); | ||
492 | if (err < 0) | ||
493 | pr_err("Couldn't record guest kernel [%d]'s reference" | ||
494 | " relocation symbol.\n", machine->pid); | ||
495 | } | ||
496 | |||
497 | static struct perf_event_header finished_round_event = { | ||
498 | .size = sizeof(struct perf_event_header), | ||
499 | .type = PERF_RECORD_FINISHED_ROUND, | ||
500 | }; | ||
501 | |||
502 | static void mmap_read_all(void) | ||
503 | { | ||
504 | int i, counter, thread; | ||
410 | 505 | ||
411 | process_buildids(); | 506 | for (i = 0; i < nr_cpu; i++) { |
412 | perf_header__write(&session->header, output, true); | 507 | for (counter = 0; counter < nr_counters; counter++) { |
508 | for (thread = 0; thread < thread_num; thread++) { | ||
509 | if (mmap_array[i][counter][thread].base) | ||
510 | mmap_read(&mmap_array[i][counter][thread]); | ||
511 | } | ||
512 | |||
513 | } | ||
514 | } | ||
515 | |||
516 | if (perf_header__has_feat(&session->header, HEADER_TRACE_INFO)) | ||
517 | write_output(&finished_round_event, sizeof(finished_round_event)); | ||
413 | } | 518 | } |
414 | 519 | ||
415 | static int __cmd_record(int argc, const char **argv) | 520 | static int __cmd_record(int argc, const char **argv) |
@@ -421,8 +526,9 @@ static int __cmd_record(int argc, const char **argv) | |||
421 | int err; | 526 | int err; |
422 | unsigned long waking = 0; | 527 | unsigned long waking = 0; |
423 | int child_ready_pipe[2], go_pipe[2]; | 528 | int child_ready_pipe[2], go_pipe[2]; |
424 | const bool forks = target_pid == -1 && argc > 0; | 529 | const bool forks = argc > 0; |
425 | char buf; | 530 | char buf; |
531 | struct machine *machine; | ||
426 | 532 | ||
427 | page_size = sysconf(_SC_PAGE_SIZE); | 533 | page_size = sysconf(_SC_PAGE_SIZE); |
428 | 534 | ||
@@ -435,70 +541,63 @@ static int __cmd_record(int argc, const char **argv) | |||
435 | exit(-1); | 541 | exit(-1); |
436 | } | 542 | } |
437 | 543 | ||
438 | if (!stat(output_name, &st) && st.st_size) { | 544 | if (!strcmp(output_name, "-")) |
439 | if (!force) { | 545 | pipe_output = 1; |
440 | if (!append_file) { | 546 | else if (!stat(output_name, &st) && st.st_size) { |
441 | pr_err("Error, output file %s exists, use -A " | 547 | if (write_mode == WRITE_FORCE) { |
442 | "to append or -f to overwrite.\n", | ||
443 | output_name); | ||
444 | exit(-1); | ||
445 | } | ||
446 | } else { | ||
447 | char oldname[PATH_MAX]; | 548 | char oldname[PATH_MAX]; |
448 | snprintf(oldname, sizeof(oldname), "%s.old", | 549 | snprintf(oldname, sizeof(oldname), "%s.old", |
449 | output_name); | 550 | output_name); |
450 | unlink(oldname); | 551 | unlink(oldname); |
451 | rename(output_name, oldname); | 552 | rename(output_name, oldname); |
452 | } | 553 | } |
453 | } else { | 554 | } else if (write_mode == WRITE_APPEND) { |
454 | append_file = 0; | 555 | write_mode = WRITE_FORCE; |
455 | } | 556 | } |
456 | 557 | ||
457 | flags = O_CREAT|O_RDWR; | 558 | flags = O_CREAT|O_RDWR; |
458 | if (append_file) | 559 | if (write_mode == WRITE_APPEND) |
459 | file_new = 0; | 560 | file_new = 0; |
460 | else | 561 | else |
461 | flags |= O_TRUNC; | 562 | flags |= O_TRUNC; |
462 | 563 | ||
463 | output = open(output_name, flags, S_IRUSR|S_IWUSR); | 564 | if (pipe_output) |
565 | output = STDOUT_FILENO; | ||
566 | else | ||
567 | output = open(output_name, flags, S_IRUSR | S_IWUSR); | ||
464 | if (output < 0) { | 568 | if (output < 0) { |
465 | perror("failed to create output file"); | 569 | perror("failed to create output file"); |
466 | exit(-1); | 570 | exit(-1); |
467 | } | 571 | } |
468 | 572 | ||
469 | session = perf_session__new(output_name, O_WRONLY, force); | 573 | session = perf_session__new(output_name, O_WRONLY, |
574 | write_mode == WRITE_FORCE, false); | ||
470 | if (session == NULL) { | 575 | if (session == NULL) { |
471 | pr_err("Not enough memory for reading perf file header\n"); | 576 | pr_err("Not enough memory for reading perf file header\n"); |
472 | return -1; | 577 | return -1; |
473 | } | 578 | } |
474 | 579 | ||
475 | if (!file_new) { | 580 | if (!file_new) { |
476 | err = perf_header__read(&session->header, output); | 581 | err = perf_header__read(session, output); |
477 | if (err < 0) | 582 | if (err < 0) |
478 | return err; | 583 | return err; |
479 | } | 584 | } |
480 | 585 | ||
481 | if (raw_samples) { | 586 | if (have_tracepoints(attrs, nr_counters)) |
482 | perf_header__set_feat(&session->header, HEADER_TRACE_INFO); | 587 | perf_header__set_feat(&session->header, HEADER_TRACE_INFO); |
483 | } else { | ||
484 | for (i = 0; i < nr_counters; i++) { | ||
485 | if (attrs[i].sample_type & PERF_SAMPLE_RAW) { | ||
486 | perf_header__set_feat(&session->header, HEADER_TRACE_INFO); | ||
487 | break; | ||
488 | } | ||
489 | } | ||
490 | } | ||
491 | 588 | ||
492 | atexit(atexit_header); | 589 | atexit(atexit_header); |
493 | 590 | ||
494 | if (forks) { | 591 | if (forks) { |
495 | pid = fork(); | 592 | child_pid = fork(); |
496 | if (pid < 0) { | 593 | if (pid < 0) { |
497 | perror("failed to fork"); | 594 | perror("failed to fork"); |
498 | exit(-1); | 595 | exit(-1); |
499 | } | 596 | } |
500 | 597 | ||
501 | if (!pid) { | 598 | if (!child_pid) { |
599 | if (pipe_output) | ||
600 | dup2(2, 1); | ||
502 | close(child_ready_pipe[0]); | 601 | close(child_ready_pipe[0]); |
503 | close(go_pipe[1]); | 602 | close(go_pipe[1]); |
504 | fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC); | 603 | fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC); |
@@ -527,10 +626,8 @@ static int __cmd_record(int argc, const char **argv) | |||
527 | exit(-1); | 626 | exit(-1); |
528 | } | 627 | } |
529 | 628 | ||
530 | child_pid = pid; | 629 | if (!system_wide && target_tid == -1 && target_pid == -1) |
531 | 630 | all_tids[0] = child_pid; | |
532 | if (!system_wide) | ||
533 | target_pid = pid; | ||
534 | 631 | ||
535 | close(child_ready_pipe[1]); | 632 | close(child_ready_pipe[1]); |
536 | close(go_pipe[0]); | 633 | close(go_pipe[0]); |
@@ -544,16 +641,19 @@ static int __cmd_record(int argc, const char **argv) | |||
544 | close(child_ready_pipe[0]); | 641 | close(child_ready_pipe[0]); |
545 | } | 642 | } |
546 | 643 | ||
547 | 644 | if ((!system_wide && no_inherit) || profile_cpu != -1) { | |
548 | if ((!system_wide && !inherit) || profile_cpu != -1) { | 645 | open_counters(profile_cpu); |
549 | open_counters(profile_cpu, target_pid); | ||
550 | } else { | 646 | } else { |
551 | nr_cpus = read_cpu_map(); | 647 | nr_cpus = read_cpu_map(); |
552 | for (i = 0; i < nr_cpus; i++) | 648 | for (i = 0; i < nr_cpus; i++) |
553 | open_counters(cpumap[i], target_pid); | 649 | open_counters(cpumap[i]); |
554 | } | 650 | } |
555 | 651 | ||
556 | if (file_new) { | 652 | if (pipe_output) { |
653 | err = perf_header__write_pipe(output); | ||
654 | if (err < 0) | ||
655 | return err; | ||
656 | } else if (file_new) { | ||
557 | err = perf_header__write(&session->header, output, false); | 657 | err = perf_header__write(&session->header, output, false); |
558 | if (err < 0) | 658 | if (err < 0) |
559 | return err; | 659 | return err; |
@@ -561,21 +661,70 @@ static int __cmd_record(int argc, const char **argv) | |||
561 | 661 | ||
562 | post_processing_offset = lseek(output, 0, SEEK_CUR); | 662 | post_processing_offset = lseek(output, 0, SEEK_CUR); |
563 | 663 | ||
664 | if (pipe_output) { | ||
665 | err = event__synthesize_attrs(&session->header, | ||
666 | process_synthesized_event, | ||
667 | session); | ||
668 | if (err < 0) { | ||
669 | pr_err("Couldn't synthesize attrs.\n"); | ||
670 | return err; | ||
671 | } | ||
672 | |||
673 | err = event__synthesize_event_types(process_synthesized_event, | ||
674 | session); | ||
675 | if (err < 0) { | ||
676 | pr_err("Couldn't synthesize event_types.\n"); | ||
677 | return err; | ||
678 | } | ||
679 | |||
680 | if (have_tracepoints(attrs, nr_counters)) { | ||
681 | /* | ||
682 | * FIXME err <= 0 here actually means that | ||
683 | * there were no tracepoints so its not really | ||
684 | * an error, just that we don't need to | ||
685 | * synthesize anything. We really have to | ||
686 | * return this more properly and also | ||
687 | * propagate errors that now are calling die() | ||
688 | */ | ||
689 | err = event__synthesize_tracing_data(output, attrs, | ||
690 | nr_counters, | ||
691 | process_synthesized_event, | ||
692 | session); | ||
693 | if (err <= 0) { | ||
694 | pr_err("Couldn't record tracing data.\n"); | ||
695 | return err; | ||
696 | } | ||
697 | advance_output(err); | ||
698 | } | ||
699 | } | ||
700 | |||
701 | machine = perf_session__find_host_machine(session); | ||
702 | if (!machine) { | ||
703 | pr_err("Couldn't find native kernel information.\n"); | ||
704 | return -1; | ||
705 | } | ||
706 | |||
564 | err = event__synthesize_kernel_mmap(process_synthesized_event, | 707 | err = event__synthesize_kernel_mmap(process_synthesized_event, |
565 | session, "_text"); | 708 | session, machine, "_text"); |
709 | if (err < 0) | ||
710 | err = event__synthesize_kernel_mmap(process_synthesized_event, | ||
711 | session, machine, "_stext"); | ||
566 | if (err < 0) { | 712 | if (err < 0) { |
567 | pr_err("Couldn't record kernel reference relocation symbol.\n"); | 713 | pr_err("Couldn't record kernel reference relocation symbol.\n"); |
568 | return err; | 714 | return err; |
569 | } | 715 | } |
570 | 716 | ||
571 | err = event__synthesize_modules(process_synthesized_event, session); | 717 | err = event__synthesize_modules(process_synthesized_event, |
718 | session, machine); | ||
572 | if (err < 0) { | 719 | if (err < 0) { |
573 | pr_err("Couldn't record kernel reference relocation symbol.\n"); | 720 | pr_err("Couldn't record kernel reference relocation symbol.\n"); |
574 | return err; | 721 | return err; |
575 | } | 722 | } |
723 | if (perf_guest) | ||
724 | perf_session__process_machines(session, event__synthesize_guest_os); | ||
576 | 725 | ||
577 | if (!system_wide && profile_cpu == -1) | 726 | if (!system_wide && profile_cpu == -1) |
578 | event__synthesize_thread(target_pid, process_synthesized_event, | 727 | event__synthesize_thread(target_tid, process_synthesized_event, |
579 | session); | 728 | session); |
580 | else | 729 | else |
581 | event__synthesize_threads(process_synthesized_event, session); | 730 | event__synthesize_threads(process_synthesized_event, session); |
@@ -598,13 +747,9 @@ static int __cmd_record(int argc, const char **argv) | |||
598 | 747 | ||
599 | for (;;) { | 748 | for (;;) { |
600 | int hits = samples; | 749 | int hits = samples; |
750 | int thread; | ||
601 | 751 | ||
602 | for (i = 0; i < nr_cpu; i++) { | 752 | mmap_read_all(); |
603 | for (counter = 0; counter < nr_counters; counter++) { | ||
604 | if (mmap_array[i][counter].base) | ||
605 | mmap_read(&mmap_array[i][counter]); | ||
606 | } | ||
607 | } | ||
608 | 753 | ||
609 | if (hits == samples) { | 754 | if (hits == samples) { |
610 | if (done) | 755 | if (done) |
@@ -615,8 +760,15 @@ static int __cmd_record(int argc, const char **argv) | |||
615 | 760 | ||
616 | if (done) { | 761 | if (done) { |
617 | for (i = 0; i < nr_cpu; i++) { | 762 | for (i = 0; i < nr_cpu; i++) { |
618 | for (counter = 0; counter < nr_counters; counter++) | 763 | for (counter = 0; |
619 | ioctl(fd[i][counter], PERF_EVENT_IOC_DISABLE); | 764 | counter < nr_counters; |
765 | counter++) { | ||
766 | for (thread = 0; | ||
767 | thread < thread_num; | ||
768 | thread++) | ||
769 | ioctl(fd[i][counter][thread], | ||
770 | PERF_EVENT_IOC_DISABLE); | ||
771 | } | ||
620 | } | 772 | } |
621 | } | 773 | } |
622 | } | 774 | } |
@@ -641,6 +793,8 @@ static const char * const record_usage[] = { | |||
641 | NULL | 793 | NULL |
642 | }; | 794 | }; |
643 | 795 | ||
796 | static bool force, append_file; | ||
797 | |||
644 | static const struct option options[] = { | 798 | static const struct option options[] = { |
645 | OPT_CALLBACK('e', "event", NULL, "event", | 799 | OPT_CALLBACK('e', "event", NULL, "event", |
646 | "event selector. use 'perf list' to list available events", | 800 | "event selector. use 'perf list' to list available events", |
@@ -648,7 +802,9 @@ static const struct option options[] = { | |||
648 | OPT_CALLBACK(0, "filter", NULL, "filter", | 802 | OPT_CALLBACK(0, "filter", NULL, "filter", |
649 | "event filter", parse_filter), | 803 | "event filter", parse_filter), |
650 | OPT_INTEGER('p', "pid", &target_pid, | 804 | OPT_INTEGER('p', "pid", &target_pid, |
651 | "record events on existing pid"), | 805 | "record events on existing process id"), |
806 | OPT_INTEGER('t', "tid", &target_tid, | ||
807 | "record events on existing thread id"), | ||
652 | OPT_INTEGER('r', "realtime", &realtime_prio, | 808 | OPT_INTEGER('r', "realtime", &realtime_prio, |
653 | "collect data with this RT SCHED_FIFO priority"), | 809 | "collect data with this RT SCHED_FIFO priority"), |
654 | OPT_BOOLEAN('R', "raw-samples", &raw_samples, | 810 | OPT_BOOLEAN('R', "raw-samples", &raw_samples, |
@@ -660,20 +816,20 @@ static const struct option options[] = { | |||
660 | OPT_INTEGER('C', "profile_cpu", &profile_cpu, | 816 | OPT_INTEGER('C', "profile_cpu", &profile_cpu, |
661 | "CPU to profile on"), | 817 | "CPU to profile on"), |
662 | OPT_BOOLEAN('f', "force", &force, | 818 | OPT_BOOLEAN('f', "force", &force, |
663 | "overwrite existing data file"), | 819 | "overwrite existing data file (deprecated)"), |
664 | OPT_LONG('c', "count", &default_interval, | 820 | OPT_LONG('c', "count", &user_interval, |
665 | "event period to sample"), | 821 | "event period to sample"), |
666 | OPT_STRING('o', "output", &output_name, "file", | 822 | OPT_STRING('o', "output", &output_name, "file", |
667 | "output file name"), | 823 | "output file name"), |
668 | OPT_BOOLEAN('i', "inherit", &inherit, | 824 | OPT_BOOLEAN('i', "no-inherit", &no_inherit, |
669 | "child tasks inherit counters"), | 825 | "child tasks do not inherit counters"), |
670 | OPT_INTEGER('F', "freq", &freq, | 826 | OPT_INTEGER('F', "freq", &user_freq, |
671 | "profile at this frequency"), | 827 | "profile at this frequency"), |
672 | OPT_INTEGER('m', "mmap-pages", &mmap_pages, | 828 | OPT_INTEGER('m', "mmap-pages", &mmap_pages, |
673 | "number of mmap data pages"), | 829 | "number of mmap data pages"), |
674 | OPT_BOOLEAN('g', "call-graph", &call_graph, | 830 | OPT_BOOLEAN('g', "call-graph", &call_graph, |
675 | "do call-graph (stack chain/backtrace) recording"), | 831 | "do call-graph (stack chain/backtrace) recording"), |
676 | OPT_BOOLEAN('v', "verbose", &verbose, | 832 | OPT_INCR('v', "verbose", &verbose, |
677 | "be more verbose (show counter open errors, etc)"), | 833 | "be more verbose (show counter open errors, etc)"), |
678 | OPT_BOOLEAN('s', "stat", &inherit_stat, | 834 | OPT_BOOLEAN('s', "stat", &inherit_stat, |
679 | "per thread counts"), | 835 | "per thread counts"), |
@@ -688,13 +844,24 @@ static const struct option options[] = { | |||
688 | 844 | ||
689 | int cmd_record(int argc, const char **argv, const char *prefix __used) | 845 | int cmd_record(int argc, const char **argv, const char *prefix __used) |
690 | { | 846 | { |
691 | int counter; | 847 | int i,j; |
692 | 848 | ||
693 | argc = parse_options(argc, argv, options, record_usage, | 849 | argc = parse_options(argc, argv, options, record_usage, |
694 | PARSE_OPT_STOP_AT_NON_OPTION); | 850 | PARSE_OPT_STOP_AT_NON_OPTION); |
695 | if (!argc && target_pid == -1 && !system_wide && profile_cpu == -1) | 851 | if (!argc && target_pid == -1 && target_tid == -1 && |
852 | !system_wide && profile_cpu == -1) | ||
696 | usage_with_options(record_usage, options); | 853 | usage_with_options(record_usage, options); |
697 | 854 | ||
855 | if (force && append_file) { | ||
856 | fprintf(stderr, "Can't overwrite and append at the same time." | ||
857 | " You need to choose between -f and -A"); | ||
858 | usage_with_options(record_usage, options); | ||
859 | } else if (append_file) { | ||
860 | write_mode = WRITE_APPEND; | ||
861 | } else { | ||
862 | write_mode = WRITE_FORCE; | ||
863 | } | ||
864 | |||
698 | symbol__init(); | 865 | symbol__init(); |
699 | 866 | ||
700 | if (!nr_counters) { | 867 | if (!nr_counters) { |
@@ -703,6 +870,42 @@ int cmd_record(int argc, const char **argv, const char *prefix __used) | |||
703 | attrs[0].config = PERF_COUNT_HW_CPU_CYCLES; | 870 | attrs[0].config = PERF_COUNT_HW_CPU_CYCLES; |
704 | } | 871 | } |
705 | 872 | ||
873 | if (target_pid != -1) { | ||
874 | target_tid = target_pid; | ||
875 | thread_num = find_all_tid(target_pid, &all_tids); | ||
876 | if (thread_num <= 0) { | ||
877 | fprintf(stderr, "Can't find all threads of pid %d\n", | ||
878 | target_pid); | ||
879 | usage_with_options(record_usage, options); | ||
880 | } | ||
881 | } else { | ||
882 | all_tids=malloc(sizeof(pid_t)); | ||
883 | if (!all_tids) | ||
884 | return -ENOMEM; | ||
885 | |||
886 | all_tids[0] = target_tid; | ||
887 | thread_num = 1; | ||
888 | } | ||
889 | |||
890 | for (i = 0; i < MAX_NR_CPUS; i++) { | ||
891 | for (j = 0; j < MAX_COUNTERS; j++) { | ||
892 | fd[i][j] = malloc(sizeof(int)*thread_num); | ||
893 | mmap_array[i][j] = zalloc( | ||
894 | sizeof(struct mmap_data)*thread_num); | ||
895 | if (!fd[i][j] || !mmap_array[i][j]) | ||
896 | return -ENOMEM; | ||
897 | } | ||
898 | } | ||
899 | event_array = malloc( | ||
900 | sizeof(struct pollfd)*MAX_NR_CPUS*MAX_COUNTERS*thread_num); | ||
901 | if (!event_array) | ||
902 | return -ENOMEM; | ||
903 | |||
904 | if (user_interval != UINT_MAX) | ||
905 | default_interval = user_interval; | ||
906 | if (user_freq != UINT_MAX) | ||
907 | freq = user_freq; | ||
908 | |||
706 | /* | 909 | /* |
707 | * User specified count overrides default frequency. | 910 | * User specified count overrides default frequency. |
708 | */ | 911 | */ |
@@ -715,12 +918,5 @@ int cmd_record(int argc, const char **argv, const char *prefix __used) | |||
715 | exit(EXIT_FAILURE); | 918 | exit(EXIT_FAILURE); |
716 | } | 919 | } |
717 | 920 | ||
718 | for (counter = 0; counter < nr_counters; counter++) { | ||
719 | if (attrs[counter].sample_period) | ||
720 | continue; | ||
721 | |||
722 | attrs[counter].sample_period = default_interval; | ||
723 | } | ||
724 | |||
725 | return __cmd_record(argc, argv); | 921 | return __cmd_record(argc, argv); |
726 | } | 922 | } |
diff --git a/tools/perf/builtin-report.c b/tools/perf/builtin-report.c index f815de25d0fc..68265120ee07 100644 --- a/tools/perf/builtin-report.c +++ b/tools/perf/builtin-report.c | |||
@@ -14,7 +14,6 @@ | |||
14 | #include "util/cache.h" | 14 | #include "util/cache.h" |
15 | #include <linux/rbtree.h> | 15 | #include <linux/rbtree.h> |
16 | #include "util/symbol.h" | 16 | #include "util/symbol.h" |
17 | #include "util/string.h" | ||
18 | #include "util/callchain.h" | 17 | #include "util/callchain.h" |
19 | #include "util/strlist.h" | 18 | #include "util/strlist.h" |
20 | #include "util/values.h" | 19 | #include "util/values.h" |
@@ -33,11 +32,11 @@ | |||
33 | 32 | ||
34 | static char const *input_name = "perf.data"; | 33 | static char const *input_name = "perf.data"; |
35 | 34 | ||
36 | static int force; | 35 | static bool force; |
37 | static bool hide_unresolved; | 36 | static bool hide_unresolved; |
38 | static bool dont_use_callchains; | 37 | static bool dont_use_callchains; |
39 | 38 | ||
40 | static int show_threads; | 39 | static bool show_threads; |
41 | static struct perf_read_values show_threads_values; | 40 | static struct perf_read_values show_threads_values; |
42 | 41 | ||
43 | static char default_pretty_printing_style[] = "normal"; | 42 | static char default_pretty_printing_style[] = "normal"; |
@@ -45,16 +44,17 @@ static char *pretty_printing_style = default_pretty_printing_style; | |||
45 | 44 | ||
46 | static char callchain_default_opt[] = "fractal,0.5"; | 45 | static char callchain_default_opt[] = "fractal,0.5"; |
47 | 46 | ||
48 | static struct event_stat_id *get_stats(struct perf_session *self, | 47 | static struct hists *perf_session__hists_findnew(struct perf_session *self, |
49 | u64 event_stream, u32 type, u64 config) | 48 | u64 event_stream, u32 type, |
49 | u64 config) | ||
50 | { | 50 | { |
51 | struct rb_node **p = &self->stats_by_id.rb_node; | 51 | struct rb_node **p = &self->hists_tree.rb_node; |
52 | struct rb_node *parent = NULL; | 52 | struct rb_node *parent = NULL; |
53 | struct event_stat_id *iter, *new; | 53 | struct hists *iter, *new; |
54 | 54 | ||
55 | while (*p != NULL) { | 55 | while (*p != NULL) { |
56 | parent = *p; | 56 | parent = *p; |
57 | iter = rb_entry(parent, struct event_stat_id, rb_node); | 57 | iter = rb_entry(parent, struct hists, rb_node); |
58 | if (iter->config == config) | 58 | if (iter->config == config) |
59 | return iter; | 59 | return iter; |
60 | 60 | ||
@@ -65,15 +65,15 @@ static struct event_stat_id *get_stats(struct perf_session *self, | |||
65 | p = &(*p)->rb_left; | 65 | p = &(*p)->rb_left; |
66 | } | 66 | } |
67 | 67 | ||
68 | new = malloc(sizeof(struct event_stat_id)); | 68 | new = malloc(sizeof(struct hists)); |
69 | if (new == NULL) | 69 | if (new == NULL) |
70 | return NULL; | 70 | return NULL; |
71 | memset(new, 0, sizeof(struct event_stat_id)); | 71 | memset(new, 0, sizeof(struct hists)); |
72 | new->event_stream = event_stream; | 72 | new->event_stream = event_stream; |
73 | new->config = config; | 73 | new->config = config; |
74 | new->type = type; | 74 | new->type = type; |
75 | rb_link_node(&new->rb_node, parent, p); | 75 | rb_link_node(&new->rb_node, parent, p); |
76 | rb_insert_color(&new->rb_node, &self->stats_by_id); | 76 | rb_insert_color(&new->rb_node, &self->hists_tree); |
77 | return new; | 77 | return new; |
78 | } | 78 | } |
79 | 79 | ||
@@ -81,70 +81,71 @@ static int perf_session__add_hist_entry(struct perf_session *self, | |||
81 | struct addr_location *al, | 81 | struct addr_location *al, |
82 | struct sample_data *data) | 82 | struct sample_data *data) |
83 | { | 83 | { |
84 | struct symbol **syms = NULL, *parent = NULL; | 84 | struct map_symbol *syms = NULL; |
85 | bool hit; | 85 | struct symbol *parent = NULL; |
86 | int err = -ENOMEM; | ||
86 | struct hist_entry *he; | 87 | struct hist_entry *he; |
87 | struct event_stat_id *stats; | 88 | struct hists *hists; |
88 | struct perf_event_attr *attr; | 89 | struct perf_event_attr *attr; |
89 | 90 | ||
90 | if ((sort__has_parent || symbol_conf.use_callchain) && data->callchain) | 91 | if ((sort__has_parent || symbol_conf.use_callchain) && data->callchain) { |
91 | syms = perf_session__resolve_callchain(self, al->thread, | 92 | syms = perf_session__resolve_callchain(self, al->thread, |
92 | data->callchain, &parent); | 93 | data->callchain, &parent); |
94 | if (syms == NULL) | ||
95 | return -ENOMEM; | ||
96 | } | ||
93 | 97 | ||
94 | attr = perf_header__find_attr(data->id, &self->header); | 98 | attr = perf_header__find_attr(data->id, &self->header); |
95 | if (attr) | 99 | if (attr) |
96 | stats = get_stats(self, data->id, attr->type, attr->config); | 100 | hists = perf_session__hists_findnew(self, data->id, attr->type, attr->config); |
97 | else | 101 | else |
98 | stats = get_stats(self, data->id, 0, 0); | 102 | hists = perf_session__hists_findnew(self, data->id, 0, 0); |
99 | if (stats == NULL) | 103 | if (hists == NULL) |
100 | return -ENOMEM; | 104 | goto out_free_syms; |
101 | he = __perf_session__add_hist_entry(&stats->hists, al, parent, | 105 | he = __hists__add_entry(hists, al, parent, data->period); |
102 | data->period, &hit); | ||
103 | if (he == NULL) | 106 | if (he == NULL) |
104 | return -ENOMEM; | 107 | goto out_free_syms; |
105 | 108 | err = 0; | |
106 | if (hit) | ||
107 | he->count += data->period; | ||
108 | |||
109 | if (symbol_conf.use_callchain) { | 109 | if (symbol_conf.use_callchain) { |
110 | if (!hit) | 110 | err = append_chain(he->callchain, data->callchain, syms); |
111 | callchain_init(&he->callchain); | 111 | if (err) |
112 | append_chain(&he->callchain, data->callchain, syms); | 112 | goto out_free_syms; |
113 | free(syms); | ||
114 | } | 113 | } |
115 | 114 | /* | |
116 | return 0; | 115 | * Only in the newt browser we are doing integrated annotation, |
117 | } | 116 | * so we don't allocated the extra space needed because the stdio |
118 | 117 | * code will not use it. | |
119 | static int validate_chain(struct ip_callchain *chain, event_t *event) | 118 | */ |
120 | { | 119 | if (use_browser) |
121 | unsigned int chain_size; | 120 | err = hist_entry__inc_addr_samples(he, al->addr); |
122 | 121 | out_free_syms: | |
123 | chain_size = event->header.size; | 122 | free(syms); |
124 | chain_size -= (unsigned long)&event->ip.__more_data - (unsigned long)event; | 123 | return err; |
125 | |||
126 | if (chain->nr*sizeof(u64) > chain_size) | ||
127 | return -1; | ||
128 | |||
129 | return 0; | ||
130 | } | 124 | } |
131 | 125 | ||
132 | static int add_event_total(struct perf_session *session, | 126 | static int add_event_total(struct perf_session *session, |
133 | struct sample_data *data, | 127 | struct sample_data *data, |
134 | struct perf_event_attr *attr) | 128 | struct perf_event_attr *attr) |
135 | { | 129 | { |
136 | struct event_stat_id *stats; | 130 | struct hists *hists; |
137 | 131 | ||
138 | if (attr) | 132 | if (attr) |
139 | stats = get_stats(session, data->id, attr->type, attr->config); | 133 | hists = perf_session__hists_findnew(session, data->id, |
134 | attr->type, attr->config); | ||
140 | else | 135 | else |
141 | stats = get_stats(session, data->id, 0, 0); | 136 | hists = perf_session__hists_findnew(session, data->id, 0, 0); |
142 | 137 | ||
143 | if (!stats) | 138 | if (!hists) |
144 | return -ENOMEM; | 139 | return -ENOMEM; |
145 | 140 | ||
146 | stats->stats.total += data->period; | 141 | hists->stats.total_period += data->period; |
147 | session->events_stats.total += data->period; | 142 | /* |
143 | * FIXME: add_event_total should be moved from here to | ||
144 | * perf_session__process_event so that the proper hist is passed to | ||
145 | * the event_op methods. | ||
146 | */ | ||
147 | hists__inc_nr_events(hists, PERF_RECORD_SAMPLE); | ||
148 | session->hists.stats.total_period += data->period; | ||
148 | return 0; | 149 | return 0; |
149 | } | 150 | } |
150 | 151 | ||
@@ -164,7 +165,7 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
164 | 165 | ||
165 | dump_printf("... chain: nr:%Lu\n", data.callchain->nr); | 166 | dump_printf("... chain: nr:%Lu\n", data.callchain->nr); |
166 | 167 | ||
167 | if (validate_chain(data.callchain, event) < 0) { | 168 | if (!ip_callchain__valid(data.callchain, event)) { |
168 | pr_debug("call-chain problem with event, " | 169 | pr_debug("call-chain problem with event, " |
169 | "skipping it.\n"); | 170 | "skipping it.\n"); |
170 | return 0; | 171 | return 0; |
@@ -187,14 +188,14 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
187 | return 0; | 188 | return 0; |
188 | 189 | ||
189 | if (perf_session__add_hist_entry(session, &al, &data)) { | 190 | if (perf_session__add_hist_entry(session, &al, &data)) { |
190 | pr_debug("problem incrementing symbol count, skipping event\n"); | 191 | pr_debug("problem incrementing symbol period, skipping event\n"); |
191 | return -1; | 192 | return -1; |
192 | } | 193 | } |
193 | 194 | ||
194 | attr = perf_header__find_attr(data.id, &session->header); | 195 | attr = perf_header__find_attr(data.id, &session->header); |
195 | 196 | ||
196 | if (add_event_total(session, &data, attr)) { | 197 | if (add_event_total(session, &data, attr)) { |
197 | pr_debug("problem adding event count\n"); | 198 | pr_debug("problem adding event period\n"); |
198 | return -1; | 199 | return -1; |
199 | } | 200 | } |
200 | 201 | ||
@@ -260,15 +261,43 @@ static struct perf_event_ops event_ops = { | |||
260 | .fork = event__process_task, | 261 | .fork = event__process_task, |
261 | .lost = event__process_lost, | 262 | .lost = event__process_lost, |
262 | .read = process_read_event, | 263 | .read = process_read_event, |
264 | .attr = event__process_attr, | ||
265 | .event_type = event__process_event_type, | ||
266 | .tracing_data = event__process_tracing_data, | ||
267 | .build_id = event__process_build_id, | ||
263 | }; | 268 | }; |
264 | 269 | ||
270 | extern volatile int session_done; | ||
271 | |||
272 | static void sig_handler(int sig __used) | ||
273 | { | ||
274 | session_done = 1; | ||
275 | } | ||
276 | |||
277 | static size_t hists__fprintf_nr_sample_events(struct hists *self, | ||
278 | const char *evname, FILE *fp) | ||
279 | { | ||
280 | size_t ret; | ||
281 | char unit; | ||
282 | unsigned long nr_events = self->stats.nr_events[PERF_RECORD_SAMPLE]; | ||
283 | |||
284 | nr_events = convert_unit(nr_events, &unit); | ||
285 | ret = fprintf(fp, "# Events: %lu%c", nr_events, unit); | ||
286 | if (evname != NULL) | ||
287 | ret += fprintf(fp, " %s", evname); | ||
288 | return ret + fprintf(fp, "\n#\n"); | ||
289 | } | ||
290 | |||
265 | static int __cmd_report(void) | 291 | static int __cmd_report(void) |
266 | { | 292 | { |
267 | int ret = -EINVAL; | 293 | int ret = -EINVAL; |
268 | struct perf_session *session; | 294 | struct perf_session *session; |
269 | struct rb_node *next; | 295 | struct rb_node *next; |
296 | const char *help = "For a higher level overview, try: perf report --sort comm,dso"; | ||
297 | |||
298 | signal(SIGINT, sig_handler); | ||
270 | 299 | ||
271 | session = perf_session__new(input_name, O_RDONLY, force); | 300 | session = perf_session__new(input_name, O_RDONLY, force, false); |
272 | if (session == NULL) | 301 | if (session == NULL) |
273 | return -ENOMEM; | 302 | return -ENOMEM; |
274 | 303 | ||
@@ -284,7 +313,7 @@ static int __cmd_report(void) | |||
284 | goto out_delete; | 313 | goto out_delete; |
285 | 314 | ||
286 | if (dump_trace) { | 315 | if (dump_trace) { |
287 | event__print_totals(); | 316 | perf_session__fprintf_nr_events(session, stdout); |
288 | goto out_delete; | 317 | goto out_delete; |
289 | } | 318 | } |
290 | 319 | ||
@@ -292,39 +321,42 @@ static int __cmd_report(void) | |||
292 | perf_session__fprintf(session, stdout); | 321 | perf_session__fprintf(session, stdout); |
293 | 322 | ||
294 | if (verbose > 2) | 323 | if (verbose > 2) |
295 | dsos__fprintf(stdout); | 324 | perf_session__fprintf_dsos(session, stdout); |
296 | 325 | ||
297 | next = rb_first(&session->stats_by_id); | 326 | next = rb_first(&session->hists_tree); |
298 | while (next) { | 327 | while (next) { |
299 | struct event_stat_id *stats; | 328 | struct hists *hists; |
300 | 329 | ||
301 | stats = rb_entry(next, struct event_stat_id, rb_node); | 330 | hists = rb_entry(next, struct hists, rb_node); |
302 | perf_session__collapse_resort(&stats->hists); | 331 | hists__collapse_resort(hists); |
303 | perf_session__output_resort(&stats->hists, stats->stats.total); | 332 | hists__output_resort(hists); |
304 | if (rb_first(&session->stats_by_id) == | 333 | if (use_browser) |
305 | rb_last(&session->stats_by_id)) | 334 | hists__browse(hists, help, input_name); |
306 | fprintf(stdout, "# Samples: %Ld\n#\n", | 335 | else { |
307 | stats->stats.total); | 336 | const char *evname = NULL; |
308 | else | 337 | if (rb_first(&session->hists.entries) != |
309 | fprintf(stdout, "# Samples: %Ld %s\n#\n", | 338 | rb_last(&session->hists.entries)) |
310 | stats->stats.total, | 339 | evname = __event_name(hists->type, hists->config); |
311 | __event_name(stats->type, stats->config)); | 340 | |
312 | 341 | hists__fprintf_nr_sample_events(hists, evname, stdout); | |
313 | perf_session__fprintf_hists(&stats->hists, NULL, false, stdout, | 342 | |
314 | stats->stats.total); | 343 | hists__fprintf(hists, NULL, false, stdout); |
315 | fprintf(stdout, "\n\n"); | 344 | fprintf(stdout, "\n\n"); |
316 | next = rb_next(&stats->rb_node); | 345 | } |
346 | |||
347 | next = rb_next(&hists->rb_node); | ||
317 | } | 348 | } |
318 | 349 | ||
319 | if (sort_order == default_sort_order && | 350 | if (!use_browser && sort_order == default_sort_order && |
320 | parent_pattern == default_parent_pattern) | 351 | parent_pattern == default_parent_pattern) { |
321 | fprintf(stdout, "#\n# (For a higher level overview, try: perf report --sort comm,dso)\n#\n"); | 352 | fprintf(stdout, "#\n# (%s)\n#\n", help); |
322 | 353 | ||
323 | if (show_threads) { | 354 | if (show_threads) { |
324 | bool raw_printing_style = !strcmp(pretty_printing_style, "raw"); | 355 | bool style = !strcmp(pretty_printing_style, "raw"); |
325 | perf_read_values_display(stdout, &show_threads_values, | 356 | perf_read_values_display(stdout, &show_threads_values, |
326 | raw_printing_style); | 357 | style); |
327 | perf_read_values_destroy(&show_threads_values); | 358 | perf_read_values_destroy(&show_threads_values); |
359 | } | ||
328 | } | 360 | } |
329 | out_delete: | 361 | out_delete: |
330 | perf_session__delete(session); | 362 | perf_session__delete(session); |
@@ -335,7 +367,7 @@ static int | |||
335 | parse_callchain_opt(const struct option *opt __used, const char *arg, | 367 | parse_callchain_opt(const struct option *opt __used, const char *arg, |
336 | int unset) | 368 | int unset) |
337 | { | 369 | { |
338 | char *tok; | 370 | char *tok, *tok2; |
339 | char *endptr; | 371 | char *endptr; |
340 | 372 | ||
341 | /* | 373 | /* |
@@ -380,10 +412,13 @@ parse_callchain_opt(const struct option *opt __used, const char *arg, | |||
380 | if (!tok) | 412 | if (!tok) |
381 | goto setup; | 413 | goto setup; |
382 | 414 | ||
415 | tok2 = strtok(NULL, ","); | ||
383 | callchain_param.min_percent = strtod(tok, &endptr); | 416 | callchain_param.min_percent = strtod(tok, &endptr); |
384 | if (tok == endptr) | 417 | if (tok == endptr) |
385 | return -1; | 418 | return -1; |
386 | 419 | ||
420 | if (tok2) | ||
421 | callchain_param.print_limit = strtod(tok2, &endptr); | ||
387 | setup: | 422 | setup: |
388 | if (register_callchain_param(&callchain_param) < 0) { | 423 | if (register_callchain_param(&callchain_param) < 0) { |
389 | fprintf(stderr, "Can't register callchain params\n"); | 424 | fprintf(stderr, "Can't register callchain params\n"); |
@@ -400,7 +435,7 @@ static const char * const report_usage[] = { | |||
400 | static const struct option options[] = { | 435 | static const struct option options[] = { |
401 | OPT_STRING('i', "input", &input_name, "file", | 436 | OPT_STRING('i', "input", &input_name, "file", |
402 | "input file name"), | 437 | "input file name"), |
403 | OPT_BOOLEAN('v', "verbose", &verbose, | 438 | OPT_INCR('v', "verbose", &verbose, |
404 | "be more verbose (show symbol address, etc)"), | 439 | "be more verbose (show symbol address, etc)"), |
405 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, | 440 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, |
406 | "dump raw trace in ASCII"), | 441 | "dump raw trace in ASCII"), |
@@ -419,12 +454,14 @@ static const struct option options[] = { | |||
419 | "sort by key(s): pid, comm, dso, symbol, parent"), | 454 | "sort by key(s): pid, comm, dso, symbol, parent"), |
420 | OPT_BOOLEAN('P', "full-paths", &symbol_conf.full_paths, | 455 | OPT_BOOLEAN('P', "full-paths", &symbol_conf.full_paths, |
421 | "Don't shorten the pathnames taking into account the cwd"), | 456 | "Don't shorten the pathnames taking into account the cwd"), |
457 | OPT_BOOLEAN(0, "showcpuutilization", &symbol_conf.show_cpu_utilization, | ||
458 | "Show sample percentage for different cpu modes"), | ||
422 | OPT_STRING('p', "parent", &parent_pattern, "regex", | 459 | OPT_STRING('p', "parent", &parent_pattern, "regex", |
423 | "regex filter to identify parent, see: '--sort parent'"), | 460 | "regex filter to identify parent, see: '--sort parent'"), |
424 | OPT_BOOLEAN('x', "exclude-other", &symbol_conf.exclude_other, | 461 | OPT_BOOLEAN('x', "exclude-other", &symbol_conf.exclude_other, |
425 | "Only display entries with parent-match"), | 462 | "Only display entries with parent-match"), |
426 | OPT_CALLBACK_DEFAULT('g', "call-graph", NULL, "output_type,min_percent", | 463 | OPT_CALLBACK_DEFAULT('g', "call-graph", NULL, "output_type,min_percent", |
427 | "Display callchains using output_type and min percent threshold. " | 464 | "Display callchains using output_type (graph, flat, fractal, or none) and min percent threshold. " |
428 | "Default: fractal,0.5", &parse_callchain_opt, callchain_default_opt), | 465 | "Default: fractal,0.5", &parse_callchain_opt, callchain_default_opt), |
429 | OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]", | 466 | OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]", |
430 | "only consider symbols in these dsos"), | 467 | "only consider symbols in these dsos"), |
@@ -447,7 +484,15 @@ int cmd_report(int argc, const char **argv, const char *prefix __used) | |||
447 | { | 484 | { |
448 | argc = parse_options(argc, argv, options, report_usage, 0); | 485 | argc = parse_options(argc, argv, options, report_usage, 0); |
449 | 486 | ||
450 | setup_pager(); | 487 | if (strcmp(input_name, "-") != 0) |
488 | setup_browser(); | ||
489 | /* | ||
490 | * Only in the newt browser we are doing integrated annotation, | ||
491 | * so don't allocate extra space that won't be used in the stdio | ||
492 | * implementation. | ||
493 | */ | ||
494 | if (use_browser) | ||
495 | symbol_conf.priv_size = sizeof(struct sym_priv); | ||
451 | 496 | ||
452 | if (symbol__init() < 0) | 497 | if (symbol__init() < 0) |
453 | return -1; | 498 | return -1; |
@@ -455,7 +500,8 @@ int cmd_report(int argc, const char **argv, const char *prefix __used) | |||
455 | setup_sorting(report_usage, options); | 500 | setup_sorting(report_usage, options); |
456 | 501 | ||
457 | if (parent_pattern != default_parent_pattern) { | 502 | if (parent_pattern != default_parent_pattern) { |
458 | sort_dimension__add("parent"); | 503 | if (sort_dimension__add("parent") < 0) |
504 | return -1; | ||
459 | sort_parent.elide = 1; | 505 | sort_parent.elide = 1; |
460 | } else | 506 | } else |
461 | symbol_conf.exclude_other = false; | 507 | symbol_conf.exclude_other = false; |
diff --git a/tools/perf/builtin-sched.c b/tools/perf/builtin-sched.c index 4f5a03e43444..be7bc9264710 100644 --- a/tools/perf/builtin-sched.c +++ b/tools/perf/builtin-sched.c | |||
@@ -68,10 +68,10 @@ enum sched_event_type { | |||
68 | 68 | ||
69 | struct sched_atom { | 69 | struct sched_atom { |
70 | enum sched_event_type type; | 70 | enum sched_event_type type; |
71 | int specific_wait; | ||
71 | u64 timestamp; | 72 | u64 timestamp; |
72 | u64 duration; | 73 | u64 duration; |
73 | unsigned long nr; | 74 | unsigned long nr; |
74 | int specific_wait; | ||
75 | sem_t *wait_sem; | 75 | sem_t *wait_sem; |
76 | struct task_desc *wakee; | 76 | struct task_desc *wakee; |
77 | }; | 77 | }; |
@@ -1641,30 +1641,26 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
1641 | return 0; | 1641 | return 0; |
1642 | } | 1642 | } |
1643 | 1643 | ||
1644 | static int process_lost_event(event_t *event __used, | ||
1645 | struct perf_session *session __used) | ||
1646 | { | ||
1647 | nr_lost_chunks++; | ||
1648 | nr_lost_events += event->lost.lost; | ||
1649 | |||
1650 | return 0; | ||
1651 | } | ||
1652 | |||
1653 | static struct perf_event_ops event_ops = { | 1644 | static struct perf_event_ops event_ops = { |
1654 | .sample = process_sample_event, | 1645 | .sample = process_sample_event, |
1655 | .comm = event__process_comm, | 1646 | .comm = event__process_comm, |
1656 | .lost = process_lost_event, | 1647 | .lost = event__process_lost, |
1648 | .ordered_samples = true, | ||
1657 | }; | 1649 | }; |
1658 | 1650 | ||
1659 | static int read_events(void) | 1651 | static int read_events(void) |
1660 | { | 1652 | { |
1661 | int err = -EINVAL; | 1653 | int err = -EINVAL; |
1662 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0); | 1654 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0, false); |
1663 | if (session == NULL) | 1655 | if (session == NULL) |
1664 | return -ENOMEM; | 1656 | return -ENOMEM; |
1665 | 1657 | ||
1666 | if (perf_session__has_traces(session, "record -R")) | 1658 | if (perf_session__has_traces(session, "record -R")) { |
1667 | err = perf_session__process_events(session, &event_ops); | 1659 | err = perf_session__process_events(session, &event_ops); |
1660 | nr_events = session->hists.stats.nr_events[0]; | ||
1661 | nr_lost_events = session->hists.stats.total_lost; | ||
1662 | nr_lost_chunks = session->hists.stats.nr_events[PERF_RECORD_LOST]; | ||
1663 | } | ||
1668 | 1664 | ||
1669 | perf_session__delete(session); | 1665 | perf_session__delete(session); |
1670 | return err; | 1666 | return err; |
@@ -1790,7 +1786,7 @@ static const char * const sched_usage[] = { | |||
1790 | static const struct option sched_options[] = { | 1786 | static const struct option sched_options[] = { |
1791 | OPT_STRING('i', "input", &input_name, "file", | 1787 | OPT_STRING('i', "input", &input_name, "file", |
1792 | "input file name"), | 1788 | "input file name"), |
1793 | OPT_BOOLEAN('v', "verbose", &verbose, | 1789 | OPT_INCR('v', "verbose", &verbose, |
1794 | "be more verbose (show symbol address, etc)"), | 1790 | "be more verbose (show symbol address, etc)"), |
1795 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, | 1791 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, |
1796 | "dump raw trace in ASCII"), | 1792 | "dump raw trace in ASCII"), |
@@ -1805,7 +1801,7 @@ static const char * const latency_usage[] = { | |||
1805 | static const struct option latency_options[] = { | 1801 | static const struct option latency_options[] = { |
1806 | OPT_STRING('s', "sort", &sort_order, "key[,key2...]", | 1802 | OPT_STRING('s', "sort", &sort_order, "key[,key2...]", |
1807 | "sort by key(s): runtime, switch, avg, max"), | 1803 | "sort by key(s): runtime, switch, avg, max"), |
1808 | OPT_BOOLEAN('v', "verbose", &verbose, | 1804 | OPT_INCR('v', "verbose", &verbose, |
1809 | "be more verbose (show symbol address, etc)"), | 1805 | "be more verbose (show symbol address, etc)"), |
1810 | OPT_INTEGER('C', "CPU", &profile_cpu, | 1806 | OPT_INTEGER('C', "CPU", &profile_cpu, |
1811 | "CPU to profile on"), | 1807 | "CPU to profile on"), |
@@ -1822,7 +1818,7 @@ static const char * const replay_usage[] = { | |||
1822 | static const struct option replay_options[] = { | 1818 | static const struct option replay_options[] = { |
1823 | OPT_INTEGER('r', "repeat", &replay_repeat, | 1819 | OPT_INTEGER('r', "repeat", &replay_repeat, |
1824 | "repeat the workload replay N times (-1: infinite)"), | 1820 | "repeat the workload replay N times (-1: infinite)"), |
1825 | OPT_BOOLEAN('v', "verbose", &verbose, | 1821 | OPT_INCR('v', "verbose", &verbose, |
1826 | "be more verbose (show symbol address, etc)"), | 1822 | "be more verbose (show symbol address, etc)"), |
1827 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, | 1823 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, |
1828 | "dump raw trace in ASCII"), | 1824 | "dump raw trace in ASCII"), |
@@ -1850,7 +1846,6 @@ static const char *record_args[] = { | |||
1850 | "record", | 1846 | "record", |
1851 | "-a", | 1847 | "-a", |
1852 | "-R", | 1848 | "-R", |
1853 | "-M", | ||
1854 | "-f", | 1849 | "-f", |
1855 | "-m", "1024", | 1850 | "-m", "1024", |
1856 | "-c", "1", | 1851 | "-c", "1", |
diff --git a/tools/perf/builtin-stat.c b/tools/perf/builtin-stat.c index 95db31cff6fd..ff8c413b7e73 100644 --- a/tools/perf/builtin-stat.c +++ b/tools/perf/builtin-stat.c | |||
@@ -46,6 +46,7 @@ | |||
46 | #include "util/debug.h" | 46 | #include "util/debug.h" |
47 | #include "util/header.h" | 47 | #include "util/header.h" |
48 | #include "util/cpumap.h" | 48 | #include "util/cpumap.h" |
49 | #include "util/thread.h" | ||
49 | 50 | ||
50 | #include <sys/prctl.h> | 51 | #include <sys/prctl.h> |
51 | #include <math.h> | 52 | #include <math.h> |
@@ -66,18 +67,21 @@ static struct perf_event_attr default_attrs[] = { | |||
66 | 67 | ||
67 | }; | 68 | }; |
68 | 69 | ||
69 | static int system_wide = 0; | 70 | static bool system_wide = false; |
70 | static unsigned int nr_cpus = 0; | 71 | static unsigned int nr_cpus = 0; |
71 | static int run_idx = 0; | 72 | static int run_idx = 0; |
72 | 73 | ||
73 | static int run_count = 1; | 74 | static int run_count = 1; |
74 | static int inherit = 1; | 75 | static bool no_inherit = false; |
75 | static int scale = 1; | 76 | static bool scale = true; |
76 | static pid_t target_pid = -1; | 77 | static pid_t target_pid = -1; |
78 | static pid_t target_tid = -1; | ||
79 | static pid_t *all_tids = NULL; | ||
80 | static int thread_num = 0; | ||
77 | static pid_t child_pid = -1; | 81 | static pid_t child_pid = -1; |
78 | static int null_run = 0; | 82 | static bool null_run = false; |
79 | 83 | ||
80 | static int fd[MAX_NR_CPUS][MAX_COUNTERS]; | 84 | static int *fd[MAX_NR_CPUS][MAX_COUNTERS]; |
81 | 85 | ||
82 | static int event_scaled[MAX_COUNTERS]; | 86 | static int event_scaled[MAX_COUNTERS]; |
83 | 87 | ||
@@ -140,9 +144,11 @@ struct stats runtime_branches_stats; | |||
140 | #define ERR_PERF_OPEN \ | 144 | #define ERR_PERF_OPEN \ |
141 | "Error: counter %d, sys_perf_event_open() syscall returned with %d (%s)\n" | 145 | "Error: counter %d, sys_perf_event_open() syscall returned with %d (%s)\n" |
142 | 146 | ||
143 | static void create_perf_stat_counter(int counter, int pid) | 147 | static int create_perf_stat_counter(int counter) |
144 | { | 148 | { |
145 | struct perf_event_attr *attr = attrs + counter; | 149 | struct perf_event_attr *attr = attrs + counter; |
150 | int thread; | ||
151 | int ncreated = 0; | ||
146 | 152 | ||
147 | if (scale) | 153 | if (scale) |
148 | attr->read_format = PERF_FORMAT_TOTAL_TIME_ENABLED | | 154 | attr->read_format = PERF_FORMAT_TOTAL_TIME_ENABLED | |
@@ -152,21 +158,33 @@ static void create_perf_stat_counter(int counter, int pid) | |||
152 | unsigned int cpu; | 158 | unsigned int cpu; |
153 | 159 | ||
154 | for (cpu = 0; cpu < nr_cpus; cpu++) { | 160 | for (cpu = 0; cpu < nr_cpus; cpu++) { |
155 | fd[cpu][counter] = sys_perf_event_open(attr, -1, cpumap[cpu], -1, 0); | 161 | fd[cpu][counter][0] = sys_perf_event_open(attr, |
156 | if (fd[cpu][counter] < 0 && verbose) | 162 | -1, cpumap[cpu], -1, 0); |
157 | fprintf(stderr, ERR_PERF_OPEN, counter, | 163 | if (fd[cpu][counter][0] < 0) |
158 | fd[cpu][counter], strerror(errno)); | 164 | pr_debug(ERR_PERF_OPEN, counter, |
165 | fd[cpu][counter][0], strerror(errno)); | ||
166 | else | ||
167 | ++ncreated; | ||
159 | } | 168 | } |
160 | } else { | 169 | } else { |
161 | attr->inherit = inherit; | 170 | attr->inherit = !no_inherit; |
162 | attr->disabled = 1; | 171 | if (target_pid == -1 && target_tid == -1) { |
163 | attr->enable_on_exec = 1; | 172 | attr->disabled = 1; |
164 | 173 | attr->enable_on_exec = 1; | |
165 | fd[0][counter] = sys_perf_event_open(attr, pid, -1, -1, 0); | 174 | } |
166 | if (fd[0][counter] < 0 && verbose) | 175 | for (thread = 0; thread < thread_num; thread++) { |
167 | fprintf(stderr, ERR_PERF_OPEN, counter, | 176 | fd[0][counter][thread] = sys_perf_event_open(attr, |
168 | fd[0][counter], strerror(errno)); | 177 | all_tids[thread], -1, -1, 0); |
178 | if (fd[0][counter][thread] < 0) | ||
179 | pr_debug(ERR_PERF_OPEN, counter, | ||
180 | fd[0][counter][thread], | ||
181 | strerror(errno)); | ||
182 | else | ||
183 | ++ncreated; | ||
184 | } | ||
169 | } | 185 | } |
186 | |||
187 | return ncreated; | ||
170 | } | 188 | } |
171 | 189 | ||
172 | /* | 190 | /* |
@@ -190,25 +208,28 @@ static void read_counter(int counter) | |||
190 | unsigned int cpu; | 208 | unsigned int cpu; |
191 | size_t res, nv; | 209 | size_t res, nv; |
192 | int scaled; | 210 | int scaled; |
193 | int i; | 211 | int i, thread; |
194 | 212 | ||
195 | count[0] = count[1] = count[2] = 0; | 213 | count[0] = count[1] = count[2] = 0; |
196 | 214 | ||
197 | nv = scale ? 3 : 1; | 215 | nv = scale ? 3 : 1; |
198 | for (cpu = 0; cpu < nr_cpus; cpu++) { | 216 | for (cpu = 0; cpu < nr_cpus; cpu++) { |
199 | if (fd[cpu][counter] < 0) | 217 | for (thread = 0; thread < thread_num; thread++) { |
200 | continue; | 218 | if (fd[cpu][counter][thread] < 0) |
201 | 219 | continue; | |
202 | res = read(fd[cpu][counter], single_count, nv * sizeof(u64)); | 220 | |
203 | assert(res == nv * sizeof(u64)); | 221 | res = read(fd[cpu][counter][thread], |
204 | 222 | single_count, nv * sizeof(u64)); | |
205 | close(fd[cpu][counter]); | 223 | assert(res == nv * sizeof(u64)); |
206 | fd[cpu][counter] = -1; | 224 | |
207 | 225 | close(fd[cpu][counter][thread]); | |
208 | count[0] += single_count[0]; | 226 | fd[cpu][counter][thread] = -1; |
209 | if (scale) { | 227 | |
210 | count[1] += single_count[1]; | 228 | count[0] += single_count[0]; |
211 | count[2] += single_count[2]; | 229 | if (scale) { |
230 | count[1] += single_count[1]; | ||
231 | count[2] += single_count[2]; | ||
232 | } | ||
212 | } | 233 | } |
213 | } | 234 | } |
214 | 235 | ||
@@ -250,10 +271,9 @@ static int run_perf_stat(int argc __used, const char **argv) | |||
250 | { | 271 | { |
251 | unsigned long long t0, t1; | 272 | unsigned long long t0, t1; |
252 | int status = 0; | 273 | int status = 0; |
253 | int counter; | 274 | int counter, ncreated = 0; |
254 | int pid = target_pid; | ||
255 | int child_ready_pipe[2], go_pipe[2]; | 275 | int child_ready_pipe[2], go_pipe[2]; |
256 | const bool forks = (target_pid == -1 && argc > 0); | 276 | const bool forks = (argc > 0); |
257 | char buf; | 277 | char buf; |
258 | 278 | ||
259 | if (!system_wide) | 279 | if (!system_wide) |
@@ -265,10 +285,10 @@ static int run_perf_stat(int argc __used, const char **argv) | |||
265 | } | 285 | } |
266 | 286 | ||
267 | if (forks) { | 287 | if (forks) { |
268 | if ((pid = fork()) < 0) | 288 | if ((child_pid = fork()) < 0) |
269 | perror("failed to fork"); | 289 | perror("failed to fork"); |
270 | 290 | ||
271 | if (!pid) { | 291 | if (!child_pid) { |
272 | close(child_ready_pipe[0]); | 292 | close(child_ready_pipe[0]); |
273 | close(go_pipe[1]); | 293 | close(go_pipe[1]); |
274 | fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC); | 294 | fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC); |
@@ -297,7 +317,8 @@ static int run_perf_stat(int argc __used, const char **argv) | |||
297 | exit(-1); | 317 | exit(-1); |
298 | } | 318 | } |
299 | 319 | ||
300 | child_pid = pid; | 320 | if (target_tid == -1 && target_pid == -1 && !system_wide) |
321 | all_tids[0] = child_pid; | ||
301 | 322 | ||
302 | /* | 323 | /* |
303 | * Wait for the child to be ready to exec. | 324 | * Wait for the child to be ready to exec. |
@@ -310,7 +331,16 @@ static int run_perf_stat(int argc __used, const char **argv) | |||
310 | } | 331 | } |
311 | 332 | ||
312 | for (counter = 0; counter < nr_counters; counter++) | 333 | for (counter = 0; counter < nr_counters; counter++) |
313 | create_perf_stat_counter(counter, pid); | 334 | ncreated += create_perf_stat_counter(counter); |
335 | |||
336 | if (ncreated == 0) { | ||
337 | pr_err("No permission to collect %sstats.\n" | ||
338 | "Consider tweaking /proc/sys/kernel/perf_event_paranoid.\n", | ||
339 | system_wide ? "system-wide " : ""); | ||
340 | if (child_pid != -1) | ||
341 | kill(child_pid, SIGTERM); | ||
342 | return -1; | ||
343 | } | ||
314 | 344 | ||
315 | /* | 345 | /* |
316 | * Enable counters and exec the command: | 346 | * Enable counters and exec the command: |
@@ -321,7 +351,7 @@ static int run_perf_stat(int argc __used, const char **argv) | |||
321 | close(go_pipe[1]); | 351 | close(go_pipe[1]); |
322 | wait(&status); | 352 | wait(&status); |
323 | } else { | 353 | } else { |
324 | while(!done); | 354 | while(!done) sleep(1); |
325 | } | 355 | } |
326 | 356 | ||
327 | t1 = rdclock(); | 357 | t1 = rdclock(); |
@@ -429,12 +459,14 @@ static void print_stat(int argc, const char **argv) | |||
429 | 459 | ||
430 | fprintf(stderr, "\n"); | 460 | fprintf(stderr, "\n"); |
431 | fprintf(stderr, " Performance counter stats for "); | 461 | fprintf(stderr, " Performance counter stats for "); |
432 | if(target_pid == -1) { | 462 | if(target_pid == -1 && target_tid == -1) { |
433 | fprintf(stderr, "\'%s", argv[0]); | 463 | fprintf(stderr, "\'%s", argv[0]); |
434 | for (i = 1; i < argc; i++) | 464 | for (i = 1; i < argc; i++) |
435 | fprintf(stderr, " %s", argv[i]); | 465 | fprintf(stderr, " %s", argv[i]); |
436 | }else | 466 | } else if (target_pid != -1) |
437 | fprintf(stderr, "task pid \'%d", target_pid); | 467 | fprintf(stderr, "process id \'%d", target_pid); |
468 | else | ||
469 | fprintf(stderr, "thread id \'%d", target_tid); | ||
438 | 470 | ||
439 | fprintf(stderr, "\'"); | 471 | fprintf(stderr, "\'"); |
440 | if (run_count > 1) | 472 | if (run_count > 1) |
@@ -459,7 +491,7 @@ static volatile int signr = -1; | |||
459 | 491 | ||
460 | static void skip_signal(int signo) | 492 | static void skip_signal(int signo) |
461 | { | 493 | { |
462 | if(target_pid != -1) | 494 | if(child_pid == -1) |
463 | done = 1; | 495 | done = 1; |
464 | 496 | ||
465 | signr = signo; | 497 | signr = signo; |
@@ -486,15 +518,17 @@ static const struct option options[] = { | |||
486 | OPT_CALLBACK('e', "event", NULL, "event", | 518 | OPT_CALLBACK('e', "event", NULL, "event", |
487 | "event selector. use 'perf list' to list available events", | 519 | "event selector. use 'perf list' to list available events", |
488 | parse_events), | 520 | parse_events), |
489 | OPT_BOOLEAN('i', "inherit", &inherit, | 521 | OPT_BOOLEAN('i', "no-inherit", &no_inherit, |
490 | "child tasks inherit counters"), | 522 | "child tasks do not inherit counters"), |
491 | OPT_INTEGER('p', "pid", &target_pid, | 523 | OPT_INTEGER('p', "pid", &target_pid, |
492 | "stat events on existing pid"), | 524 | "stat events on existing process id"), |
525 | OPT_INTEGER('t', "tid", &target_tid, | ||
526 | "stat events on existing thread id"), | ||
493 | OPT_BOOLEAN('a', "all-cpus", &system_wide, | 527 | OPT_BOOLEAN('a', "all-cpus", &system_wide, |
494 | "system-wide collection from all CPUs"), | 528 | "system-wide collection from all CPUs"), |
495 | OPT_BOOLEAN('c', "scale", &scale, | 529 | OPT_BOOLEAN('c', "scale", &scale, |
496 | "scale/normalize counters"), | 530 | "scale/normalize counters"), |
497 | OPT_BOOLEAN('v', "verbose", &verbose, | 531 | OPT_INCR('v', "verbose", &verbose, |
498 | "be more verbose (show counter open errors, etc)"), | 532 | "be more verbose (show counter open errors, etc)"), |
499 | OPT_INTEGER('r', "repeat", &run_count, | 533 | OPT_INTEGER('r', "repeat", &run_count, |
500 | "repeat command and print average + stddev (max: 100)"), | 534 | "repeat command and print average + stddev (max: 100)"), |
@@ -506,10 +540,11 @@ static const struct option options[] = { | |||
506 | int cmd_stat(int argc, const char **argv, const char *prefix __used) | 540 | int cmd_stat(int argc, const char **argv, const char *prefix __used) |
507 | { | 541 | { |
508 | int status; | 542 | int status; |
543 | int i,j; | ||
509 | 544 | ||
510 | argc = parse_options(argc, argv, options, stat_usage, | 545 | argc = parse_options(argc, argv, options, stat_usage, |
511 | PARSE_OPT_STOP_AT_NON_OPTION); | 546 | PARSE_OPT_STOP_AT_NON_OPTION); |
512 | if (!argc && target_pid == -1) | 547 | if (!argc && target_pid == -1 && target_tid == -1) |
513 | usage_with_options(stat_usage, options); | 548 | usage_with_options(stat_usage, options); |
514 | if (run_count <= 0) | 549 | if (run_count <= 0) |
515 | usage_with_options(stat_usage, options); | 550 | usage_with_options(stat_usage, options); |
@@ -525,6 +560,31 @@ int cmd_stat(int argc, const char **argv, const char *prefix __used) | |||
525 | else | 560 | else |
526 | nr_cpus = 1; | 561 | nr_cpus = 1; |
527 | 562 | ||
563 | if (target_pid != -1) { | ||
564 | target_tid = target_pid; | ||
565 | thread_num = find_all_tid(target_pid, &all_tids); | ||
566 | if (thread_num <= 0) { | ||
567 | fprintf(stderr, "Can't find all threads of pid %d\n", | ||
568 | target_pid); | ||
569 | usage_with_options(stat_usage, options); | ||
570 | } | ||
571 | } else { | ||
572 | all_tids=malloc(sizeof(pid_t)); | ||
573 | if (!all_tids) | ||
574 | return -ENOMEM; | ||
575 | |||
576 | all_tids[0] = target_tid; | ||
577 | thread_num = 1; | ||
578 | } | ||
579 | |||
580 | for (i = 0; i < MAX_NR_CPUS; i++) { | ||
581 | for (j = 0; j < MAX_COUNTERS; j++) { | ||
582 | fd[i][j] = malloc(sizeof(int)*thread_num); | ||
583 | if (!fd[i][j]) | ||
584 | return -ENOMEM; | ||
585 | } | ||
586 | } | ||
587 | |||
528 | /* | 588 | /* |
529 | * We dont want to block the signals - that would cause | 589 | * We dont want to block the signals - that would cause |
530 | * child tasks to inherit that and Ctrl-C would not work. | 590 | * child tasks to inherit that and Ctrl-C would not work. |
@@ -543,7 +603,8 @@ int cmd_stat(int argc, const char **argv, const char *prefix __used) | |||
543 | status = run_perf_stat(argc, argv); | 603 | status = run_perf_stat(argc, argv); |
544 | } | 604 | } |
545 | 605 | ||
546 | print_stat(argc, argv); | 606 | if (status != -1) |
607 | print_stat(argc, argv); | ||
547 | 608 | ||
548 | return status; | 609 | return status; |
549 | } | 610 | } |
diff --git a/tools/perf/builtin-test.c b/tools/perf/builtin-test.c new file mode 100644 index 000000000000..0339612e7385 --- /dev/null +++ b/tools/perf/builtin-test.c | |||
@@ -0,0 +1,281 @@ | |||
1 | /* | ||
2 | * builtin-test.c | ||
3 | * | ||
4 | * Builtin regression testing command: ever growing number of sanity tests | ||
5 | */ | ||
6 | #include "builtin.h" | ||
7 | |||
8 | #include "util/cache.h" | ||
9 | #include "util/debug.h" | ||
10 | #include "util/parse-options.h" | ||
11 | #include "util/session.h" | ||
12 | #include "util/symbol.h" | ||
13 | #include "util/thread.h" | ||
14 | |||
15 | static long page_size; | ||
16 | |||
17 | static int vmlinux_matches_kallsyms_filter(struct map *map __used, struct symbol *sym) | ||
18 | { | ||
19 | bool *visited = symbol__priv(sym); | ||
20 | *visited = true; | ||
21 | return 0; | ||
22 | } | ||
23 | |||
24 | static int test__vmlinux_matches_kallsyms(void) | ||
25 | { | ||
26 | int err = -1; | ||
27 | struct rb_node *nd; | ||
28 | struct symbol *sym; | ||
29 | struct map *kallsyms_map, *vmlinux_map; | ||
30 | struct machine kallsyms, vmlinux; | ||
31 | enum map_type type = MAP__FUNCTION; | ||
32 | struct ref_reloc_sym ref_reloc_sym = { .name = "_stext", }; | ||
33 | |||
34 | /* | ||
35 | * Step 1: | ||
36 | * | ||
37 | * Init the machines that will hold kernel, modules obtained from | ||
38 | * both vmlinux + .ko files and from /proc/kallsyms split by modules. | ||
39 | */ | ||
40 | machine__init(&kallsyms, "", HOST_KERNEL_ID); | ||
41 | machine__init(&vmlinux, "", HOST_KERNEL_ID); | ||
42 | |||
43 | /* | ||
44 | * Step 2: | ||
45 | * | ||
46 | * Create the kernel maps for kallsyms and the DSO where we will then | ||
47 | * load /proc/kallsyms. Also create the modules maps from /proc/modules | ||
48 | * and find the .ko files that match them in /lib/modules/`uname -r`/. | ||
49 | */ | ||
50 | if (machine__create_kernel_maps(&kallsyms) < 0) { | ||
51 | pr_debug("machine__create_kernel_maps "); | ||
52 | return -1; | ||
53 | } | ||
54 | |||
55 | /* | ||
56 | * Step 3: | ||
57 | * | ||
58 | * Load and split /proc/kallsyms into multiple maps, one per module. | ||
59 | */ | ||
60 | if (machine__load_kallsyms(&kallsyms, "/proc/kallsyms", type, NULL) <= 0) { | ||
61 | pr_debug("dso__load_kallsyms "); | ||
62 | goto out; | ||
63 | } | ||
64 | |||
65 | /* | ||
66 | * Step 4: | ||
67 | * | ||
68 | * kallsyms will be internally on demand sorted by name so that we can | ||
69 | * find the reference relocation * symbol, i.e. the symbol we will use | ||
70 | * to see if the running kernel was relocated by checking if it has the | ||
71 | * same value in the vmlinux file we load. | ||
72 | */ | ||
73 | kallsyms_map = machine__kernel_map(&kallsyms, type); | ||
74 | |||
75 | sym = map__find_symbol_by_name(kallsyms_map, ref_reloc_sym.name, NULL); | ||
76 | if (sym == NULL) { | ||
77 | pr_debug("dso__find_symbol_by_name "); | ||
78 | goto out; | ||
79 | } | ||
80 | |||
81 | ref_reloc_sym.addr = sym->start; | ||
82 | |||
83 | /* | ||
84 | * Step 5: | ||
85 | * | ||
86 | * Now repeat step 2, this time for the vmlinux file we'll auto-locate. | ||
87 | */ | ||
88 | if (machine__create_kernel_maps(&vmlinux) < 0) { | ||
89 | pr_debug("machine__create_kernel_maps "); | ||
90 | goto out; | ||
91 | } | ||
92 | |||
93 | vmlinux_map = machine__kernel_map(&vmlinux, type); | ||
94 | map__kmap(vmlinux_map)->ref_reloc_sym = &ref_reloc_sym; | ||
95 | |||
96 | /* | ||
97 | * Step 6: | ||
98 | * | ||
99 | * Locate a vmlinux file in the vmlinux path that has a buildid that | ||
100 | * matches the one of the running kernel. | ||
101 | * | ||
102 | * While doing that look if we find the ref reloc symbol, if we find it | ||
103 | * we'll have its ref_reloc_symbol.unrelocated_addr and then | ||
104 | * maps__reloc_vmlinux will notice and set proper ->[un]map_ip routines | ||
105 | * to fixup the symbols. | ||
106 | */ | ||
107 | if (machine__load_vmlinux_path(&vmlinux, type, | ||
108 | vmlinux_matches_kallsyms_filter) <= 0) { | ||
109 | pr_debug("machine__load_vmlinux_path "); | ||
110 | goto out; | ||
111 | } | ||
112 | |||
113 | err = 0; | ||
114 | /* | ||
115 | * Step 7: | ||
116 | * | ||
117 | * Now look at the symbols in the vmlinux DSO and check if we find all of them | ||
118 | * in the kallsyms dso. For the ones that are in both, check its names and | ||
119 | * end addresses too. | ||
120 | */ | ||
121 | for (nd = rb_first(&vmlinux_map->dso->symbols[type]); nd; nd = rb_next(nd)) { | ||
122 | struct symbol *pair; | ||
123 | |||
124 | sym = rb_entry(nd, struct symbol, rb_node); | ||
125 | pair = machine__find_kernel_symbol(&kallsyms, type, sym->start, NULL, NULL); | ||
126 | |||
127 | if (pair && pair->start == sym->start) { | ||
128 | next_pair: | ||
129 | if (strcmp(sym->name, pair->name) == 0) { | ||
130 | /* | ||
131 | * kallsyms don't have the symbol end, so we | ||
132 | * set that by using the next symbol start - 1, | ||
133 | * in some cases we get this up to a page | ||
134 | * wrong, trace_kmalloc when I was developing | ||
135 | * this code was one such example, 2106 bytes | ||
136 | * off the real size. More than that and we | ||
137 | * _really_ have a problem. | ||
138 | */ | ||
139 | s64 skew = sym->end - pair->end; | ||
140 | if (llabs(skew) < page_size) | ||
141 | continue; | ||
142 | |||
143 | pr_debug("%#Lx: diff end addr for %s v: %#Lx k: %#Lx\n", | ||
144 | sym->start, sym->name, sym->end, pair->end); | ||
145 | } else { | ||
146 | struct rb_node *nnd = rb_prev(&pair->rb_node); | ||
147 | |||
148 | if (nnd) { | ||
149 | struct symbol *next = rb_entry(nnd, struct symbol, rb_node); | ||
150 | |||
151 | if (next->start == sym->start) { | ||
152 | pair = next; | ||
153 | goto next_pair; | ||
154 | } | ||
155 | } | ||
156 | pr_debug("%#Lx: diff name v: %s k: %s\n", | ||
157 | sym->start, sym->name, pair->name); | ||
158 | } | ||
159 | } else | ||
160 | pr_debug("%#Lx: %s not on kallsyms\n", sym->start, sym->name); | ||
161 | |||
162 | err = -1; | ||
163 | } | ||
164 | |||
165 | if (!verbose) | ||
166 | goto out; | ||
167 | |||
168 | pr_info("Maps only in vmlinux:\n"); | ||
169 | |||
170 | for (nd = rb_first(&vmlinux.kmaps.maps[type]); nd; nd = rb_next(nd)) { | ||
171 | struct map *pos = rb_entry(nd, struct map, rb_node), *pair; | ||
172 | /* | ||
173 | * If it is the kernel, kallsyms is always "[kernel.kallsyms]", while | ||
174 | * the kernel will have the path for the vmlinux file being used, | ||
175 | * so use the short name, less descriptive but the same ("[kernel]" in | ||
176 | * both cases. | ||
177 | */ | ||
178 | pair = map_groups__find_by_name(&kallsyms.kmaps, type, | ||
179 | (pos->dso->kernel ? | ||
180 | pos->dso->short_name : | ||
181 | pos->dso->name)); | ||
182 | if (pair) | ||
183 | pair->priv = 1; | ||
184 | else | ||
185 | map__fprintf(pos, stderr); | ||
186 | } | ||
187 | |||
188 | pr_info("Maps in vmlinux with a different name in kallsyms:\n"); | ||
189 | |||
190 | for (nd = rb_first(&vmlinux.kmaps.maps[type]); nd; nd = rb_next(nd)) { | ||
191 | struct map *pos = rb_entry(nd, struct map, rb_node), *pair; | ||
192 | |||
193 | pair = map_groups__find(&kallsyms.kmaps, type, pos->start); | ||
194 | if (pair == NULL || pair->priv) | ||
195 | continue; | ||
196 | |||
197 | if (pair->start == pos->start) { | ||
198 | pair->priv = 1; | ||
199 | pr_info(" %Lx-%Lx %Lx %s in kallsyms as", | ||
200 | pos->start, pos->end, pos->pgoff, pos->dso->name); | ||
201 | if (pos->pgoff != pair->pgoff || pos->end != pair->end) | ||
202 | pr_info(": \n*%Lx-%Lx %Lx", | ||
203 | pair->start, pair->end, pair->pgoff); | ||
204 | pr_info(" %s\n", pair->dso->name); | ||
205 | pair->priv = 1; | ||
206 | } | ||
207 | } | ||
208 | |||
209 | pr_info("Maps only in kallsyms:\n"); | ||
210 | |||
211 | for (nd = rb_first(&kallsyms.kmaps.maps[type]); | ||
212 | nd; nd = rb_next(nd)) { | ||
213 | struct map *pos = rb_entry(nd, struct map, rb_node); | ||
214 | |||
215 | if (!pos->priv) | ||
216 | map__fprintf(pos, stderr); | ||
217 | } | ||
218 | out: | ||
219 | return err; | ||
220 | } | ||
221 | |||
222 | static struct test { | ||
223 | const char *desc; | ||
224 | int (*func)(void); | ||
225 | } tests[] = { | ||
226 | { | ||
227 | .desc = "vmlinux symtab matches kallsyms", | ||
228 | .func = test__vmlinux_matches_kallsyms, | ||
229 | }, | ||
230 | { | ||
231 | .func = NULL, | ||
232 | }, | ||
233 | }; | ||
234 | |||
235 | static int __cmd_test(void) | ||
236 | { | ||
237 | int i = 0; | ||
238 | |||
239 | page_size = sysconf(_SC_PAGE_SIZE); | ||
240 | |||
241 | while (tests[i].func) { | ||
242 | int err; | ||
243 | pr_info("%2d: %s:", i + 1, tests[i].desc); | ||
244 | pr_debug("\n--- start ---\n"); | ||
245 | err = tests[i].func(); | ||
246 | pr_debug("---- end ----\n%s:", tests[i].desc); | ||
247 | pr_info(" %s\n", err ? "FAILED!\n" : "Ok"); | ||
248 | ++i; | ||
249 | } | ||
250 | |||
251 | return 0; | ||
252 | } | ||
253 | |||
254 | static const char * const test_usage[] = { | ||
255 | "perf test [<options>]", | ||
256 | NULL, | ||
257 | }; | ||
258 | |||
259 | static const struct option test_options[] = { | ||
260 | OPT_BOOLEAN('v', "verbose", &verbose, | ||
261 | "be more verbose (show symbol address, etc)"), | ||
262 | OPT_END() | ||
263 | }; | ||
264 | |||
265 | int cmd_test(int argc, const char **argv, const char *prefix __used) | ||
266 | { | ||
267 | argc = parse_options(argc, argv, test_options, test_usage, 0); | ||
268 | if (argc) | ||
269 | usage_with_options(test_usage, test_options); | ||
270 | |||
271 | symbol_conf.priv_size = sizeof(int); | ||
272 | symbol_conf.sort_by_name = true; | ||
273 | symbol_conf.try_vmlinux_path = true; | ||
274 | |||
275 | if (symbol__init() < 0) | ||
276 | return -1; | ||
277 | |||
278 | setup_pager(); | ||
279 | |||
280 | return __cmd_test(); | ||
281 | } | ||
diff --git a/tools/perf/builtin-timechart.c b/tools/perf/builtin-timechart.c index 0d4d8ff7914b..5a52ed9fc10b 100644 --- a/tools/perf/builtin-timechart.c +++ b/tools/perf/builtin-timechart.c | |||
@@ -21,7 +21,6 @@ | |||
21 | #include "util/cache.h" | 21 | #include "util/cache.h" |
22 | #include <linux/rbtree.h> | 22 | #include <linux/rbtree.h> |
23 | #include "util/symbol.h" | 23 | #include "util/symbol.h" |
24 | #include "util/string.h" | ||
25 | #include "util/callchain.h" | 24 | #include "util/callchain.h" |
26 | #include "util/strlist.h" | 25 | #include "util/strlist.h" |
27 | 26 | ||
@@ -43,7 +42,7 @@ static u64 turbo_frequency; | |||
43 | 42 | ||
44 | static u64 first_time, last_time; | 43 | static u64 first_time, last_time; |
45 | 44 | ||
46 | static int power_only; | 45 | static bool power_only; |
47 | 46 | ||
48 | 47 | ||
49 | struct per_pid; | 48 | struct per_pid; |
@@ -78,8 +77,6 @@ struct per_pid { | |||
78 | 77 | ||
79 | struct per_pidcomm *all; | 78 | struct per_pidcomm *all; |
80 | struct per_pidcomm *current; | 79 | struct per_pidcomm *current; |
81 | |||
82 | int painted; | ||
83 | }; | 80 | }; |
84 | 81 | ||
85 | 82 | ||
@@ -146,9 +143,6 @@ struct wake_event { | |||
146 | static struct power_event *power_events; | 143 | static struct power_event *power_events; |
147 | static struct wake_event *wake_events; | 144 | static struct wake_event *wake_events; |
148 | 145 | ||
149 | struct sample_wrapper *all_samples; | ||
150 | |||
151 | |||
152 | struct process_filter; | 146 | struct process_filter; |
153 | struct process_filter { | 147 | struct process_filter { |
154 | char *name; | 148 | char *name; |
@@ -569,88 +563,6 @@ static void end_sample_processing(void) | |||
569 | } | 563 | } |
570 | } | 564 | } |
571 | 565 | ||
572 | static u64 sample_time(event_t *event, const struct perf_session *session) | ||
573 | { | ||
574 | int cursor; | ||
575 | |||
576 | cursor = 0; | ||
577 | if (session->sample_type & PERF_SAMPLE_IP) | ||
578 | cursor++; | ||
579 | if (session->sample_type & PERF_SAMPLE_TID) | ||
580 | cursor++; | ||
581 | if (session->sample_type & PERF_SAMPLE_TIME) | ||
582 | return event->sample.array[cursor]; | ||
583 | return 0; | ||
584 | } | ||
585 | |||
586 | |||
587 | /* | ||
588 | * We first queue all events, sorted backwards by insertion. | ||
589 | * The order will get flipped later. | ||
590 | */ | ||
591 | static int queue_sample_event(event_t *event, struct perf_session *session) | ||
592 | { | ||
593 | struct sample_wrapper *copy, *prev; | ||
594 | int size; | ||
595 | |||
596 | size = event->sample.header.size + sizeof(struct sample_wrapper) + 8; | ||
597 | |||
598 | copy = malloc(size); | ||
599 | if (!copy) | ||
600 | return 1; | ||
601 | |||
602 | memset(copy, 0, size); | ||
603 | |||
604 | copy->next = NULL; | ||
605 | copy->timestamp = sample_time(event, session); | ||
606 | |||
607 | memcpy(©->data, event, event->sample.header.size); | ||
608 | |||
609 | /* insert in the right place in the list */ | ||
610 | |||
611 | if (!all_samples) { | ||
612 | /* first sample ever */ | ||
613 | all_samples = copy; | ||
614 | return 0; | ||
615 | } | ||
616 | |||
617 | if (all_samples->timestamp < copy->timestamp) { | ||
618 | /* insert at the head of the list */ | ||
619 | copy->next = all_samples; | ||
620 | all_samples = copy; | ||
621 | return 0; | ||
622 | } | ||
623 | |||
624 | prev = all_samples; | ||
625 | while (prev->next) { | ||
626 | if (prev->next->timestamp < copy->timestamp) { | ||
627 | copy->next = prev->next; | ||
628 | prev->next = copy; | ||
629 | return 0; | ||
630 | } | ||
631 | prev = prev->next; | ||
632 | } | ||
633 | /* insert at the end of the list */ | ||
634 | prev->next = copy; | ||
635 | |||
636 | return 0; | ||
637 | } | ||
638 | |||
639 | static void sort_queued_samples(void) | ||
640 | { | ||
641 | struct sample_wrapper *cursor, *next; | ||
642 | |||
643 | cursor = all_samples; | ||
644 | all_samples = NULL; | ||
645 | |||
646 | while (cursor) { | ||
647 | next = cursor->next; | ||
648 | cursor->next = all_samples; | ||
649 | all_samples = cursor; | ||
650 | cursor = next; | ||
651 | } | ||
652 | } | ||
653 | |||
654 | /* | 566 | /* |
655 | * Sort the pid datastructure | 567 | * Sort the pid datastructure |
656 | */ | 568 | */ |
@@ -1014,31 +926,17 @@ static void write_svg_file(const char *filename) | |||
1014 | svg_close(); | 926 | svg_close(); |
1015 | } | 927 | } |
1016 | 928 | ||
1017 | static void process_samples(struct perf_session *session) | ||
1018 | { | ||
1019 | struct sample_wrapper *cursor; | ||
1020 | event_t *event; | ||
1021 | |||
1022 | sort_queued_samples(); | ||
1023 | |||
1024 | cursor = all_samples; | ||
1025 | while (cursor) { | ||
1026 | event = (void *)&cursor->data; | ||
1027 | cursor = cursor->next; | ||
1028 | process_sample_event(event, session); | ||
1029 | } | ||
1030 | } | ||
1031 | |||
1032 | static struct perf_event_ops event_ops = { | 929 | static struct perf_event_ops event_ops = { |
1033 | .comm = process_comm_event, | 930 | .comm = process_comm_event, |
1034 | .fork = process_fork_event, | 931 | .fork = process_fork_event, |
1035 | .exit = process_exit_event, | 932 | .exit = process_exit_event, |
1036 | .sample = queue_sample_event, | 933 | .sample = process_sample_event, |
934 | .ordered_samples = true, | ||
1037 | }; | 935 | }; |
1038 | 936 | ||
1039 | static int __cmd_timechart(void) | 937 | static int __cmd_timechart(void) |
1040 | { | 938 | { |
1041 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0); | 939 | struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0, false); |
1042 | int ret = -EINVAL; | 940 | int ret = -EINVAL; |
1043 | 941 | ||
1044 | if (session == NULL) | 942 | if (session == NULL) |
@@ -1051,8 +949,6 @@ static int __cmd_timechart(void) | |||
1051 | if (ret) | 949 | if (ret) |
1052 | goto out_delete; | 950 | goto out_delete; |
1053 | 951 | ||
1054 | process_samples(session); | ||
1055 | |||
1056 | end_sample_processing(); | 952 | end_sample_processing(); |
1057 | 953 | ||
1058 | sort_pids(); | 954 | sort_pids(); |
@@ -1075,7 +971,6 @@ static const char *record_args[] = { | |||
1075 | "record", | 971 | "record", |
1076 | "-a", | 972 | "-a", |
1077 | "-R", | 973 | "-R", |
1078 | "-M", | ||
1079 | "-f", | 974 | "-f", |
1080 | "-c", "1", | 975 | "-c", "1", |
1081 | "-e", "power:power_start", | 976 | "-e", "power:power_start", |
diff --git a/tools/perf/builtin-top.c b/tools/perf/builtin-top.c index 1f529321607e..ed9b5b6905fa 100644 --- a/tools/perf/builtin-top.c +++ b/tools/perf/builtin-top.c | |||
@@ -55,9 +55,9 @@ | |||
55 | #include <linux/unistd.h> | 55 | #include <linux/unistd.h> |
56 | #include <linux/types.h> | 56 | #include <linux/types.h> |
57 | 57 | ||
58 | static int fd[MAX_NR_CPUS][MAX_COUNTERS]; | 58 | static int *fd[MAX_NR_CPUS][MAX_COUNTERS]; |
59 | 59 | ||
60 | static int system_wide = 0; | 60 | static bool system_wide = false; |
61 | 61 | ||
62 | static int default_interval = 0; | 62 | static int default_interval = 0; |
63 | 63 | ||
@@ -65,18 +65,21 @@ static int count_filter = 5; | |||
65 | static int print_entries; | 65 | static int print_entries; |
66 | 66 | ||
67 | static int target_pid = -1; | 67 | static int target_pid = -1; |
68 | static int inherit = 0; | 68 | static int target_tid = -1; |
69 | static pid_t *all_tids = NULL; | ||
70 | static int thread_num = 0; | ||
71 | static bool inherit = false; | ||
69 | static int profile_cpu = -1; | 72 | static int profile_cpu = -1; |
70 | static int nr_cpus = 0; | 73 | static int nr_cpus = 0; |
71 | static unsigned int realtime_prio = 0; | 74 | static unsigned int realtime_prio = 0; |
72 | static int group = 0; | 75 | static bool group = false; |
73 | static unsigned int page_size; | 76 | static unsigned int page_size; |
74 | static unsigned int mmap_pages = 16; | 77 | static unsigned int mmap_pages = 16; |
75 | static int freq = 1000; /* 1 KHz */ | 78 | static int freq = 1000; /* 1 KHz */ |
76 | 79 | ||
77 | static int delay_secs = 2; | 80 | static int delay_secs = 2; |
78 | static int zero = 0; | 81 | static bool zero = false; |
79 | static int dump_symtab = 0; | 82 | static bool dump_symtab = false; |
80 | 83 | ||
81 | static bool hide_kernel_symbols = false; | 84 | static bool hide_kernel_symbols = false; |
82 | static bool hide_user_symbols = false; | 85 | static bool hide_user_symbols = false; |
@@ -133,7 +136,7 @@ static inline struct symbol *sym_entry__symbol(struct sym_entry *self) | |||
133 | return ((void *)self) + symbol_conf.priv_size; | 136 | return ((void *)self) + symbol_conf.priv_size; |
134 | } | 137 | } |
135 | 138 | ||
136 | static void get_term_dimensions(struct winsize *ws) | 139 | void get_term_dimensions(struct winsize *ws) |
137 | { | 140 | { |
138 | char *s = getenv("LINES"); | 141 | char *s = getenv("LINES"); |
139 | 142 | ||
@@ -169,7 +172,7 @@ static void sig_winch_handler(int sig __used) | |||
169 | update_print_entries(&winsize); | 172 | update_print_entries(&winsize); |
170 | } | 173 | } |
171 | 174 | ||
172 | static void parse_source(struct sym_entry *syme) | 175 | static int parse_source(struct sym_entry *syme) |
173 | { | 176 | { |
174 | struct symbol *sym; | 177 | struct symbol *sym; |
175 | struct sym_entry_source *source; | 178 | struct sym_entry_source *source; |
@@ -180,12 +183,21 @@ static void parse_source(struct sym_entry *syme) | |||
180 | u64 len; | 183 | u64 len; |
181 | 184 | ||
182 | if (!syme) | 185 | if (!syme) |
183 | return; | 186 | return -1; |
187 | |||
188 | sym = sym_entry__symbol(syme); | ||
189 | map = syme->map; | ||
190 | |||
191 | /* | ||
192 | * We can't annotate with just /proc/kallsyms | ||
193 | */ | ||
194 | if (map->dso->origin == DSO__ORIG_KERNEL) | ||
195 | return -1; | ||
184 | 196 | ||
185 | if (syme->src == NULL) { | 197 | if (syme->src == NULL) { |
186 | syme->src = zalloc(sizeof(*source)); | 198 | syme->src = zalloc(sizeof(*source)); |
187 | if (syme->src == NULL) | 199 | if (syme->src == NULL) |
188 | return; | 200 | return -1; |
189 | pthread_mutex_init(&syme->src->lock, NULL); | 201 | pthread_mutex_init(&syme->src->lock, NULL); |
190 | } | 202 | } |
191 | 203 | ||
@@ -195,9 +207,6 @@ static void parse_source(struct sym_entry *syme) | |||
195 | pthread_mutex_lock(&source->lock); | 207 | pthread_mutex_lock(&source->lock); |
196 | goto out_assign; | 208 | goto out_assign; |
197 | } | 209 | } |
198 | |||
199 | sym = sym_entry__symbol(syme); | ||
200 | map = syme->map; | ||
201 | path = map->dso->long_name; | 210 | path = map->dso->long_name; |
202 | 211 | ||
203 | len = sym->end - sym->start; | 212 | len = sym->end - sym->start; |
@@ -209,7 +218,7 @@ static void parse_source(struct sym_entry *syme) | |||
209 | 218 | ||
210 | file = popen(command, "r"); | 219 | file = popen(command, "r"); |
211 | if (!file) | 220 | if (!file) |
212 | return; | 221 | return -1; |
213 | 222 | ||
214 | pthread_mutex_lock(&source->lock); | 223 | pthread_mutex_lock(&source->lock); |
215 | source->lines_tail = &source->lines; | 224 | source->lines_tail = &source->lines; |
@@ -245,6 +254,7 @@ static void parse_source(struct sym_entry *syme) | |||
245 | out_assign: | 254 | out_assign: |
246 | sym_filter_entry = syme; | 255 | sym_filter_entry = syme; |
247 | pthread_mutex_unlock(&source->lock); | 256 | pthread_mutex_unlock(&source->lock); |
257 | return 0; | ||
248 | } | 258 | } |
249 | 259 | ||
250 | static void __zero_source_counters(struct sym_entry *syme) | 260 | static void __zero_source_counters(struct sym_entry *syme) |
@@ -410,7 +420,9 @@ static double sym_weight(const struct sym_entry *sym) | |||
410 | } | 420 | } |
411 | 421 | ||
412 | static long samples; | 422 | static long samples; |
413 | static long userspace_samples; | 423 | static long kernel_samples, us_samples; |
424 | static long exact_samples; | ||
425 | static long guest_us_samples, guest_kernel_samples; | ||
414 | static const char CONSOLE_CLEAR[] = "[H[2J"; | 426 | static const char CONSOLE_CLEAR[] = "[H[2J"; |
415 | 427 | ||
416 | static void __list_insert_active_sym(struct sym_entry *syme) | 428 | static void __list_insert_active_sym(struct sym_entry *syme) |
@@ -450,7 +462,11 @@ static void print_sym_table(void) | |||
450 | int printed = 0, j; | 462 | int printed = 0, j; |
451 | int counter, snap = !display_weighted ? sym_counter : 0; | 463 | int counter, snap = !display_weighted ? sym_counter : 0; |
452 | float samples_per_sec = samples/delay_secs; | 464 | float samples_per_sec = samples/delay_secs; |
453 | float ksamples_per_sec = (samples-userspace_samples)/delay_secs; | 465 | float ksamples_per_sec = kernel_samples/delay_secs; |
466 | float us_samples_per_sec = (us_samples)/delay_secs; | ||
467 | float guest_kernel_samples_per_sec = (guest_kernel_samples)/delay_secs; | ||
468 | float guest_us_samples_per_sec = (guest_us_samples)/delay_secs; | ||
469 | float esamples_percent = (100.0*exact_samples)/samples; | ||
454 | float sum_ksamples = 0.0; | 470 | float sum_ksamples = 0.0; |
455 | struct sym_entry *syme, *n; | 471 | struct sym_entry *syme, *n; |
456 | struct rb_root tmp = RB_ROOT; | 472 | struct rb_root tmp = RB_ROOT; |
@@ -458,7 +474,8 @@ static void print_sym_table(void) | |||
458 | int sym_width = 0, dso_width = 0, dso_short_width = 0; | 474 | int sym_width = 0, dso_width = 0, dso_short_width = 0; |
459 | const int win_width = winsize.ws_col - 1; | 475 | const int win_width = winsize.ws_col - 1; |
460 | 476 | ||
461 | samples = userspace_samples = 0; | 477 | samples = us_samples = kernel_samples = exact_samples = 0; |
478 | guest_kernel_samples = guest_us_samples = 0; | ||
462 | 479 | ||
463 | /* Sort the active symbols */ | 480 | /* Sort the active symbols */ |
464 | pthread_mutex_lock(&active_symbols_lock); | 481 | pthread_mutex_lock(&active_symbols_lock); |
@@ -489,9 +506,30 @@ static void print_sym_table(void) | |||
489 | puts(CONSOLE_CLEAR); | 506 | puts(CONSOLE_CLEAR); |
490 | 507 | ||
491 | printf("%-*.*s\n", win_width, win_width, graph_dotted_line); | 508 | printf("%-*.*s\n", win_width, win_width, graph_dotted_line); |
492 | printf( " PerfTop:%8.0f irqs/sec kernel:%4.1f%% [", | 509 | if (!perf_guest) { |
493 | samples_per_sec, | 510 | printf(" PerfTop:%8.0f irqs/sec kernel:%4.1f%%" |
494 | 100.0 - (100.0*((samples_per_sec-ksamples_per_sec)/samples_per_sec))); | 511 | " exact: %4.1f%% [", |
512 | samples_per_sec, | ||
513 | 100.0 - (100.0 * ((samples_per_sec - ksamples_per_sec) / | ||
514 | samples_per_sec)), | ||
515 | esamples_percent); | ||
516 | } else { | ||
517 | printf(" PerfTop:%8.0f irqs/sec kernel:%4.1f%% us:%4.1f%%" | ||
518 | " guest kernel:%4.1f%% guest us:%4.1f%%" | ||
519 | " exact: %4.1f%% [", | ||
520 | samples_per_sec, | ||
521 | 100.0 - (100.0 * ((samples_per_sec-ksamples_per_sec) / | ||
522 | samples_per_sec)), | ||
523 | 100.0 - (100.0 * ((samples_per_sec-us_samples_per_sec) / | ||
524 | samples_per_sec)), | ||
525 | 100.0 - (100.0 * ((samples_per_sec - | ||
526 | guest_kernel_samples_per_sec) / | ||
527 | samples_per_sec)), | ||
528 | 100.0 - (100.0 * ((samples_per_sec - | ||
529 | guest_us_samples_per_sec) / | ||
530 | samples_per_sec)), | ||
531 | esamples_percent); | ||
532 | } | ||
495 | 533 | ||
496 | if (nr_counters == 1 || !display_weighted) { | 534 | if (nr_counters == 1 || !display_weighted) { |
497 | printf("%Ld", (u64)attrs[0].sample_period); | 535 | printf("%Ld", (u64)attrs[0].sample_period); |
@@ -514,13 +552,15 @@ static void print_sym_table(void) | |||
514 | 552 | ||
515 | if (target_pid != -1) | 553 | if (target_pid != -1) |
516 | printf(" (target_pid: %d", target_pid); | 554 | printf(" (target_pid: %d", target_pid); |
555 | else if (target_tid != -1) | ||
556 | printf(" (target_tid: %d", target_tid); | ||
517 | else | 557 | else |
518 | printf(" (all"); | 558 | printf(" (all"); |
519 | 559 | ||
520 | if (profile_cpu != -1) | 560 | if (profile_cpu != -1) |
521 | printf(", cpu: %d)\n", profile_cpu); | 561 | printf(", cpu: %d)\n", profile_cpu); |
522 | else { | 562 | else { |
523 | if (target_pid != -1) | 563 | if (target_tid != -1) |
524 | printf(")\n"); | 564 | printf(")\n"); |
525 | else | 565 | else |
526 | printf(", %d CPUs)\n", nr_cpus); | 566 | printf(", %d CPUs)\n", nr_cpus); |
@@ -582,7 +622,6 @@ static void print_sym_table(void) | |||
582 | 622 | ||
583 | syme = rb_entry(nd, struct sym_entry, rb_node); | 623 | syme = rb_entry(nd, struct sym_entry, rb_node); |
584 | sym = sym_entry__symbol(syme); | 624 | sym = sym_entry__symbol(syme); |
585 | |||
586 | if (++printed > print_entries || (int)syme->snap_count < count_filter) | 625 | if (++printed > print_entries || (int)syme->snap_count < count_filter) |
587 | continue; | 626 | continue; |
588 | 627 | ||
@@ -746,7 +785,7 @@ static int key_mapped(int c) | |||
746 | return 0; | 785 | return 0; |
747 | } | 786 | } |
748 | 787 | ||
749 | static void handle_keypress(int c) | 788 | static void handle_keypress(struct perf_session *session, int c) |
750 | { | 789 | { |
751 | if (!key_mapped(c)) { | 790 | if (!key_mapped(c)) { |
752 | struct pollfd stdin_poll = { .fd = 0, .events = POLLIN }; | 791 | struct pollfd stdin_poll = { .fd = 0, .events = POLLIN }; |
@@ -815,7 +854,7 @@ static void handle_keypress(int c) | |||
815 | case 'Q': | 854 | case 'Q': |
816 | printf("exiting.\n"); | 855 | printf("exiting.\n"); |
817 | if (dump_symtab) | 856 | if (dump_symtab) |
818 | dsos__fprintf(stderr); | 857 | perf_session__fprintf_dsos(session, stderr); |
819 | exit(0); | 858 | exit(0); |
820 | case 's': | 859 | case 's': |
821 | prompt_symbol(&sym_filter_entry, "Enter details symbol"); | 860 | prompt_symbol(&sym_filter_entry, "Enter details symbol"); |
@@ -839,7 +878,7 @@ static void handle_keypress(int c) | |||
839 | display_weighted = ~display_weighted; | 878 | display_weighted = ~display_weighted; |
840 | break; | 879 | break; |
841 | case 'z': | 880 | case 'z': |
842 | zero = ~zero; | 881 | zero = !zero; |
843 | break; | 882 | break; |
844 | default: | 883 | default: |
845 | break; | 884 | break; |
@@ -851,6 +890,7 @@ static void *display_thread(void *arg __used) | |||
851 | struct pollfd stdin_poll = { .fd = 0, .events = POLLIN }; | 890 | struct pollfd stdin_poll = { .fd = 0, .events = POLLIN }; |
852 | struct termios tc, save; | 891 | struct termios tc, save; |
853 | int delay_msecs, c; | 892 | int delay_msecs, c; |
893 | struct perf_session *session = (struct perf_session *) arg; | ||
854 | 894 | ||
855 | tcgetattr(0, &save); | 895 | tcgetattr(0, &save); |
856 | tc = save; | 896 | tc = save; |
@@ -871,7 +911,7 @@ repeat: | |||
871 | c = getc(stdin); | 911 | c = getc(stdin); |
872 | tcsetattr(0, TCSAFLUSH, &save); | 912 | tcsetattr(0, TCSAFLUSH, &save); |
873 | 913 | ||
874 | handle_keypress(c); | 914 | handle_keypress(session, c); |
875 | goto repeat; | 915 | goto repeat; |
876 | 916 | ||
877 | return NULL; | 917 | return NULL; |
@@ -942,24 +982,48 @@ static void event__process_sample(const event_t *self, | |||
942 | u64 ip = self->ip.ip; | 982 | u64 ip = self->ip.ip; |
943 | struct sym_entry *syme; | 983 | struct sym_entry *syme; |
944 | struct addr_location al; | 984 | struct addr_location al; |
985 | struct machine *machine; | ||
945 | u8 origin = self->header.misc & PERF_RECORD_MISC_CPUMODE_MASK; | 986 | u8 origin = self->header.misc & PERF_RECORD_MISC_CPUMODE_MASK; |
946 | 987 | ||
947 | ++samples; | 988 | ++samples; |
948 | 989 | ||
949 | switch (origin) { | 990 | switch (origin) { |
950 | case PERF_RECORD_MISC_USER: | 991 | case PERF_RECORD_MISC_USER: |
951 | ++userspace_samples; | 992 | ++us_samples; |
952 | if (hide_user_symbols) | 993 | if (hide_user_symbols) |
953 | return; | 994 | return; |
995 | machine = perf_session__find_host_machine(session); | ||
954 | break; | 996 | break; |
955 | case PERF_RECORD_MISC_KERNEL: | 997 | case PERF_RECORD_MISC_KERNEL: |
998 | ++kernel_samples; | ||
956 | if (hide_kernel_symbols) | 999 | if (hide_kernel_symbols) |
957 | return; | 1000 | return; |
1001 | machine = perf_session__find_host_machine(session); | ||
1002 | break; | ||
1003 | case PERF_RECORD_MISC_GUEST_KERNEL: | ||
1004 | ++guest_kernel_samples; | ||
1005 | machine = perf_session__find_machine(session, self->ip.pid); | ||
958 | break; | 1006 | break; |
1007 | case PERF_RECORD_MISC_GUEST_USER: | ||
1008 | ++guest_us_samples; | ||
1009 | /* | ||
1010 | * TODO: we don't process guest user from host side | ||
1011 | * except simple counting. | ||
1012 | */ | ||
1013 | return; | ||
959 | default: | 1014 | default: |
960 | return; | 1015 | return; |
961 | } | 1016 | } |
962 | 1017 | ||
1018 | if (!machine && perf_guest) { | ||
1019 | pr_err("Can't find guest [%d]'s kernel information\n", | ||
1020 | self->ip.pid); | ||
1021 | return; | ||
1022 | } | ||
1023 | |||
1024 | if (self->header.misc & PERF_RECORD_MISC_EXACT_IP) | ||
1025 | exact_samples++; | ||
1026 | |||
963 | if (event__preprocess_sample(self, session, &al, symbol_filter) < 0 || | 1027 | if (event__preprocess_sample(self, session, &al, symbol_filter) < 0 || |
964 | al.filtered) | 1028 | al.filtered) |
965 | return; | 1029 | return; |
@@ -976,7 +1040,7 @@ static void event__process_sample(const event_t *self, | |||
976 | * --hide-kernel-symbols, even if the user specifies an | 1040 | * --hide-kernel-symbols, even if the user specifies an |
977 | * invalid --vmlinux ;-) | 1041 | * invalid --vmlinux ;-) |
978 | */ | 1042 | */ |
979 | if (al.map == session->vmlinux_maps[MAP__FUNCTION] && | 1043 | if (al.map == machine->vmlinux_maps[MAP__FUNCTION] && |
980 | RB_EMPTY_ROOT(&al.map->dso->symbols[MAP__FUNCTION])) { | 1044 | RB_EMPTY_ROOT(&al.map->dso->symbols[MAP__FUNCTION])) { |
981 | pr_err("The %s file can't be used\n", | 1045 | pr_err("The %s file can't be used\n", |
982 | symbol_conf.vmlinux_name); | 1046 | symbol_conf.vmlinux_name); |
@@ -990,7 +1054,17 @@ static void event__process_sample(const event_t *self, | |||
990 | if (sym_filter_entry_sched) { | 1054 | if (sym_filter_entry_sched) { |
991 | sym_filter_entry = sym_filter_entry_sched; | 1055 | sym_filter_entry = sym_filter_entry_sched; |
992 | sym_filter_entry_sched = NULL; | 1056 | sym_filter_entry_sched = NULL; |
993 | parse_source(sym_filter_entry); | 1057 | if (parse_source(sym_filter_entry) < 0) { |
1058 | struct symbol *sym = sym_entry__symbol(sym_filter_entry); | ||
1059 | |||
1060 | pr_err("Can't annotate %s", sym->name); | ||
1061 | if (sym_filter_entry->map->dso->origin == DSO__ORIG_KERNEL) { | ||
1062 | pr_err(": No vmlinux file was found in the path:\n"); | ||
1063 | vmlinux_path__fprintf(stderr); | ||
1064 | } else | ||
1065 | pr_err(".\n"); | ||
1066 | exit(1); | ||
1067 | } | ||
994 | } | 1068 | } |
995 | 1069 | ||
996 | syme = symbol__priv(al.sym); | 1070 | syme = symbol__priv(al.sym); |
@@ -1106,16 +1180,21 @@ static void perf_session__mmap_read_counter(struct perf_session *self, | |||
1106 | md->prev = old; | 1180 | md->prev = old; |
1107 | } | 1181 | } |
1108 | 1182 | ||
1109 | static struct pollfd event_array[MAX_NR_CPUS * MAX_COUNTERS]; | 1183 | static struct pollfd *event_array; |
1110 | static struct mmap_data mmap_array[MAX_NR_CPUS][MAX_COUNTERS]; | 1184 | static struct mmap_data *mmap_array[MAX_NR_CPUS][MAX_COUNTERS]; |
1111 | 1185 | ||
1112 | static void perf_session__mmap_read(struct perf_session *self) | 1186 | static void perf_session__mmap_read(struct perf_session *self) |
1113 | { | 1187 | { |
1114 | int i, counter; | 1188 | int i, counter, thread_index; |
1115 | 1189 | ||
1116 | for (i = 0; i < nr_cpus; i++) { | 1190 | for (i = 0; i < nr_cpus; i++) { |
1117 | for (counter = 0; counter < nr_counters; counter++) | 1191 | for (counter = 0; counter < nr_counters; counter++) |
1118 | perf_session__mmap_read_counter(self, &mmap_array[i][counter]); | 1192 | for (thread_index = 0; |
1193 | thread_index < thread_num; | ||
1194 | thread_index++) { | ||
1195 | perf_session__mmap_read_counter(self, | ||
1196 | &mmap_array[i][counter][thread_index]); | ||
1197 | } | ||
1119 | } | 1198 | } |
1120 | } | 1199 | } |
1121 | 1200 | ||
@@ -1126,9 +1205,10 @@ static void start_counter(int i, int counter) | |||
1126 | { | 1205 | { |
1127 | struct perf_event_attr *attr; | 1206 | struct perf_event_attr *attr; |
1128 | int cpu; | 1207 | int cpu; |
1208 | int thread_index; | ||
1129 | 1209 | ||
1130 | cpu = profile_cpu; | 1210 | cpu = profile_cpu; |
1131 | if (target_pid == -1 && profile_cpu == -1) | 1211 | if (target_tid == -1 && profile_cpu == -1) |
1132 | cpu = cpumap[i]; | 1212 | cpu = cpumap[i]; |
1133 | 1213 | ||
1134 | attr = attrs + counter; | 1214 | attr = attrs + counter; |
@@ -1144,55 +1224,58 @@ static void start_counter(int i, int counter) | |||
1144 | attr->inherit = (cpu < 0) && inherit; | 1224 | attr->inherit = (cpu < 0) && inherit; |
1145 | attr->mmap = 1; | 1225 | attr->mmap = 1; |
1146 | 1226 | ||
1227 | for (thread_index = 0; thread_index < thread_num; thread_index++) { | ||
1147 | try_again: | 1228 | try_again: |
1148 | fd[i][counter] = sys_perf_event_open(attr, target_pid, cpu, group_fd, 0); | 1229 | fd[i][counter][thread_index] = sys_perf_event_open(attr, |
1149 | 1230 | all_tids[thread_index], cpu, group_fd, 0); | |
1150 | if (fd[i][counter] < 0) { | 1231 | |
1151 | int err = errno; | 1232 | if (fd[i][counter][thread_index] < 0) { |
1233 | int err = errno; | ||
1234 | |||
1235 | if (err == EPERM || err == EACCES) | ||
1236 | die("No permission - are you root?\n"); | ||
1237 | /* | ||
1238 | * If it's cycles then fall back to hrtimer | ||
1239 | * based cpu-clock-tick sw counter, which | ||
1240 | * is always available even if no PMU support: | ||
1241 | */ | ||
1242 | if (attr->type == PERF_TYPE_HARDWARE | ||
1243 | && attr->config == PERF_COUNT_HW_CPU_CYCLES) { | ||
1244 | |||
1245 | if (verbose) | ||
1246 | warning(" ... trying to fall back to cpu-clock-ticks\n"); | ||
1247 | |||
1248 | attr->type = PERF_TYPE_SOFTWARE; | ||
1249 | attr->config = PERF_COUNT_SW_CPU_CLOCK; | ||
1250 | goto try_again; | ||
1251 | } | ||
1252 | printf("\n"); | ||
1253 | error("perfcounter syscall returned with %d (%s)\n", | ||
1254 | fd[i][counter][thread_index], strerror(err)); | ||
1255 | die("No CONFIG_PERF_EVENTS=y kernel support configured?\n"); | ||
1256 | exit(-1); | ||
1257 | } | ||
1258 | assert(fd[i][counter][thread_index] >= 0); | ||
1259 | fcntl(fd[i][counter][thread_index], F_SETFL, O_NONBLOCK); | ||
1152 | 1260 | ||
1153 | if (err == EPERM || err == EACCES) | ||
1154 | die("No permission - are you root?\n"); | ||
1155 | /* | 1261 | /* |
1156 | * If it's cycles then fall back to hrtimer | 1262 | * First counter acts as the group leader: |
1157 | * based cpu-clock-tick sw counter, which | ||
1158 | * is always available even if no PMU support: | ||
1159 | */ | 1263 | */ |
1160 | if (attr->type == PERF_TYPE_HARDWARE | 1264 | if (group && group_fd == -1) |
1161 | && attr->config == PERF_COUNT_HW_CPU_CYCLES) { | 1265 | group_fd = fd[i][counter][thread_index]; |
1162 | 1266 | ||
1163 | if (verbose) | 1267 | event_array[nr_poll].fd = fd[i][counter][thread_index]; |
1164 | warning(" ... trying to fall back to cpu-clock-ticks\n"); | 1268 | event_array[nr_poll].events = POLLIN; |
1165 | 1269 | nr_poll++; | |
1166 | attr->type = PERF_TYPE_SOFTWARE; | 1270 | |
1167 | attr->config = PERF_COUNT_SW_CPU_CLOCK; | 1271 | mmap_array[i][counter][thread_index].counter = counter; |
1168 | goto try_again; | 1272 | mmap_array[i][counter][thread_index].prev = 0; |
1169 | } | 1273 | mmap_array[i][counter][thread_index].mask = mmap_pages*page_size - 1; |
1170 | printf("\n"); | 1274 | mmap_array[i][counter][thread_index].base = mmap(NULL, (mmap_pages+1)*page_size, |
1171 | error("perfcounter syscall returned with %d (%s)\n", | 1275 | PROT_READ, MAP_SHARED, fd[i][counter][thread_index], 0); |
1172 | fd[i][counter], strerror(err)); | 1276 | if (mmap_array[i][counter][thread_index].base == MAP_FAILED) |
1173 | die("No CONFIG_PERF_EVENTS=y kernel support configured?\n"); | 1277 | die("failed to mmap with %d (%s)\n", errno, strerror(errno)); |
1174 | exit(-1); | ||
1175 | } | 1278 | } |
1176 | assert(fd[i][counter] >= 0); | ||
1177 | fcntl(fd[i][counter], F_SETFL, O_NONBLOCK); | ||
1178 | |||
1179 | /* | ||
1180 | * First counter acts as the group leader: | ||
1181 | */ | ||
1182 | if (group && group_fd == -1) | ||
1183 | group_fd = fd[i][counter]; | ||
1184 | |||
1185 | event_array[nr_poll].fd = fd[i][counter]; | ||
1186 | event_array[nr_poll].events = POLLIN; | ||
1187 | nr_poll++; | ||
1188 | |||
1189 | mmap_array[i][counter].counter = counter; | ||
1190 | mmap_array[i][counter].prev = 0; | ||
1191 | mmap_array[i][counter].mask = mmap_pages*page_size - 1; | ||
1192 | mmap_array[i][counter].base = mmap(NULL, (mmap_pages+1)*page_size, | ||
1193 | PROT_READ, MAP_SHARED, fd[i][counter], 0); | ||
1194 | if (mmap_array[i][counter].base == MAP_FAILED) | ||
1195 | die("failed to mmap with %d (%s)\n", errno, strerror(errno)); | ||
1196 | } | 1279 | } |
1197 | 1280 | ||
1198 | static int __cmd_top(void) | 1281 | static int __cmd_top(void) |
@@ -1204,12 +1287,12 @@ static int __cmd_top(void) | |||
1204 | * FIXME: perf_session__new should allow passing a O_MMAP, so that all this | 1287 | * FIXME: perf_session__new should allow passing a O_MMAP, so that all this |
1205 | * mmap reading, etc is encapsulated in it. Use O_WRONLY for now. | 1288 | * mmap reading, etc is encapsulated in it. Use O_WRONLY for now. |
1206 | */ | 1289 | */ |
1207 | struct perf_session *session = perf_session__new(NULL, O_WRONLY, false); | 1290 | struct perf_session *session = perf_session__new(NULL, O_WRONLY, false, false); |
1208 | if (session == NULL) | 1291 | if (session == NULL) |
1209 | return -ENOMEM; | 1292 | return -ENOMEM; |
1210 | 1293 | ||
1211 | if (target_pid != -1) | 1294 | if (target_tid != -1) |
1212 | event__synthesize_thread(target_pid, event__process, session); | 1295 | event__synthesize_thread(target_tid, event__process, session); |
1213 | else | 1296 | else |
1214 | event__synthesize_threads(event__process, session); | 1297 | event__synthesize_threads(event__process, session); |
1215 | 1298 | ||
@@ -1220,11 +1303,11 @@ static int __cmd_top(void) | |||
1220 | } | 1303 | } |
1221 | 1304 | ||
1222 | /* Wait for a minimal set of events before starting the snapshot */ | 1305 | /* Wait for a minimal set of events before starting the snapshot */ |
1223 | poll(event_array, nr_poll, 100); | 1306 | poll(&event_array[0], nr_poll, 100); |
1224 | 1307 | ||
1225 | perf_session__mmap_read(session); | 1308 | perf_session__mmap_read(session); |
1226 | 1309 | ||
1227 | if (pthread_create(&thread, NULL, display_thread, NULL)) { | 1310 | if (pthread_create(&thread, NULL, display_thread, session)) { |
1228 | printf("Could not create display thread.\n"); | 1311 | printf("Could not create display thread.\n"); |
1229 | exit(-1); | 1312 | exit(-1); |
1230 | } | 1313 | } |
@@ -1263,7 +1346,9 @@ static const struct option options[] = { | |||
1263 | OPT_INTEGER('c', "count", &default_interval, | 1346 | OPT_INTEGER('c', "count", &default_interval, |
1264 | "event period to sample"), | 1347 | "event period to sample"), |
1265 | OPT_INTEGER('p', "pid", &target_pid, | 1348 | OPT_INTEGER('p', "pid", &target_pid, |
1266 | "profile events on existing pid"), | 1349 | "profile events on existing process id"), |
1350 | OPT_INTEGER('t', "tid", &target_tid, | ||
1351 | "profile events on existing thread id"), | ||
1267 | OPT_BOOLEAN('a', "all-cpus", &system_wide, | 1352 | OPT_BOOLEAN('a', "all-cpus", &system_wide, |
1268 | "system-wide collection from all CPUs"), | 1353 | "system-wide collection from all CPUs"), |
1269 | OPT_INTEGER('C', "CPU", &profile_cpu, | 1354 | OPT_INTEGER('C', "CPU", &profile_cpu, |
@@ -1296,7 +1381,7 @@ static const struct option options[] = { | |||
1296 | "display this many functions"), | 1381 | "display this many functions"), |
1297 | OPT_BOOLEAN('U', "hide_user_symbols", &hide_user_symbols, | 1382 | OPT_BOOLEAN('U', "hide_user_symbols", &hide_user_symbols, |
1298 | "hide user symbols"), | 1383 | "hide user symbols"), |
1299 | OPT_BOOLEAN('v', "verbose", &verbose, | 1384 | OPT_INCR('v', "verbose", &verbose, |
1300 | "be more verbose (show counter open errors, etc)"), | 1385 | "be more verbose (show counter open errors, etc)"), |
1301 | OPT_END() | 1386 | OPT_END() |
1302 | }; | 1387 | }; |
@@ -1304,6 +1389,7 @@ static const struct option options[] = { | |||
1304 | int cmd_top(int argc, const char **argv, const char *prefix __used) | 1389 | int cmd_top(int argc, const char **argv, const char *prefix __used) |
1305 | { | 1390 | { |
1306 | int counter; | 1391 | int counter; |
1392 | int i,j; | ||
1307 | 1393 | ||
1308 | page_size = sysconf(_SC_PAGE_SIZE); | 1394 | page_size = sysconf(_SC_PAGE_SIZE); |
1309 | 1395 | ||
@@ -1311,8 +1397,39 @@ int cmd_top(int argc, const char **argv, const char *prefix __used) | |||
1311 | if (argc) | 1397 | if (argc) |
1312 | usage_with_options(top_usage, options); | 1398 | usage_with_options(top_usage, options); |
1313 | 1399 | ||
1400 | if (target_pid != -1) { | ||
1401 | target_tid = target_pid; | ||
1402 | thread_num = find_all_tid(target_pid, &all_tids); | ||
1403 | if (thread_num <= 0) { | ||
1404 | fprintf(stderr, "Can't find all threads of pid %d\n", | ||
1405 | target_pid); | ||
1406 | usage_with_options(top_usage, options); | ||
1407 | } | ||
1408 | } else { | ||
1409 | all_tids=malloc(sizeof(pid_t)); | ||
1410 | if (!all_tids) | ||
1411 | return -ENOMEM; | ||
1412 | |||
1413 | all_tids[0] = target_tid; | ||
1414 | thread_num = 1; | ||
1415 | } | ||
1416 | |||
1417 | for (i = 0; i < MAX_NR_CPUS; i++) { | ||
1418 | for (j = 0; j < MAX_COUNTERS; j++) { | ||
1419 | fd[i][j] = malloc(sizeof(int)*thread_num); | ||
1420 | mmap_array[i][j] = zalloc( | ||
1421 | sizeof(struct mmap_data)*thread_num); | ||
1422 | if (!fd[i][j] || !mmap_array[i][j]) | ||
1423 | return -ENOMEM; | ||
1424 | } | ||
1425 | } | ||
1426 | event_array = malloc( | ||
1427 | sizeof(struct pollfd)*MAX_NR_CPUS*MAX_COUNTERS*thread_num); | ||
1428 | if (!event_array) | ||
1429 | return -ENOMEM; | ||
1430 | |||
1314 | /* CPU and PID are mutually exclusive */ | 1431 | /* CPU and PID are mutually exclusive */ |
1315 | if (target_pid != -1 && profile_cpu != -1) { | 1432 | if (target_tid > 0 && profile_cpu != -1) { |
1316 | printf("WARNING: PID switch overriding CPU\n"); | 1433 | printf("WARNING: PID switch overriding CPU\n"); |
1317 | sleep(1); | 1434 | sleep(1); |
1318 | profile_cpu = -1; | 1435 | profile_cpu = -1; |
@@ -1353,7 +1470,7 @@ int cmd_top(int argc, const char **argv, const char *prefix __used) | |||
1353 | attrs[counter].sample_period = default_interval; | 1470 | attrs[counter].sample_period = default_interval; |
1354 | } | 1471 | } |
1355 | 1472 | ||
1356 | if (target_pid != -1 || profile_cpu != -1) | 1473 | if (target_tid != -1 || profile_cpu != -1) |
1357 | nr_cpus = 1; | 1474 | nr_cpus = 1; |
1358 | else | 1475 | else |
1359 | nr_cpus = read_cpu_map(); | 1476 | nr_cpus = read_cpu_map(); |
diff --git a/tools/perf/builtin-trace.c b/tools/perf/builtin-trace.c index 407041d20de0..dddf3f01b5ab 100644 --- a/tools/perf/builtin-trace.c +++ b/tools/perf/builtin-trace.c | |||
@@ -11,6 +11,8 @@ | |||
11 | 11 | ||
12 | static char const *script_name; | 12 | static char const *script_name; |
13 | static char const *generate_script_lang; | 13 | static char const *generate_script_lang; |
14 | static bool debug_ordering; | ||
15 | static u64 last_timestamp; | ||
14 | 16 | ||
15 | static int default_start_script(const char *script __unused, | 17 | static int default_start_script(const char *script __unused, |
16 | int argc __unused, | 18 | int argc __unused, |
@@ -51,6 +53,8 @@ static void setup_scripting(void) | |||
51 | 53 | ||
52 | static int cleanup_scripting(void) | 54 | static int cleanup_scripting(void) |
53 | { | 55 | { |
56 | pr_debug("\nperf trace script stopped\n"); | ||
57 | |||
54 | return scripting_ops->stop_script(); | 58 | return scripting_ops->stop_script(); |
55 | } | 59 | } |
56 | 60 | ||
@@ -87,6 +91,14 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
87 | } | 91 | } |
88 | 92 | ||
89 | if (session->sample_type & PERF_SAMPLE_RAW) { | 93 | if (session->sample_type & PERF_SAMPLE_RAW) { |
94 | if (debug_ordering) { | ||
95 | if (data.time < last_timestamp) { | ||
96 | pr_err("Samples misordered, previous: %llu " | ||
97 | "this: %llu\n", last_timestamp, | ||
98 | data.time); | ||
99 | } | ||
100 | last_timestamp = data.time; | ||
101 | } | ||
90 | /* | 102 | /* |
91 | * FIXME: better resolve from pid from the struct trace_entry | 103 | * FIXME: better resolve from pid from the struct trace_entry |
92 | * field, although it should be the same than this perf | 104 | * field, although it should be the same than this perf |
@@ -97,17 +109,31 @@ static int process_sample_event(event_t *event, struct perf_session *session) | |||
97 | data.time, thread->comm); | 109 | data.time, thread->comm); |
98 | } | 110 | } |
99 | 111 | ||
100 | session->events_stats.total += data.period; | 112 | session->hists.stats.total_period += data.period; |
101 | return 0; | 113 | return 0; |
102 | } | 114 | } |
103 | 115 | ||
104 | static struct perf_event_ops event_ops = { | 116 | static struct perf_event_ops event_ops = { |
105 | .sample = process_sample_event, | 117 | .sample = process_sample_event, |
106 | .comm = event__process_comm, | 118 | .comm = event__process_comm, |
119 | .attr = event__process_attr, | ||
120 | .event_type = event__process_event_type, | ||
121 | .tracing_data = event__process_tracing_data, | ||
122 | .build_id = event__process_build_id, | ||
123 | .ordered_samples = true, | ||
107 | }; | 124 | }; |
108 | 125 | ||
126 | extern volatile int session_done; | ||
127 | |||
128 | static void sig_handler(int sig __unused) | ||
129 | { | ||
130 | session_done = 1; | ||
131 | } | ||
132 | |||
109 | static int __cmd_trace(struct perf_session *session) | 133 | static int __cmd_trace(struct perf_session *session) |
110 | { | 134 | { |
135 | signal(SIGINT, sig_handler); | ||
136 | |||
111 | return perf_session__process_events(session, &event_ops); | 137 | return perf_session__process_events(session, &event_ops); |
112 | } | 138 | } |
113 | 139 | ||
@@ -505,7 +531,7 @@ static const char * const trace_usage[] = { | |||
505 | static const struct option options[] = { | 531 | static const struct option options[] = { |
506 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, | 532 | OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, |
507 | "dump raw trace in ASCII"), | 533 | "dump raw trace in ASCII"), |
508 | OPT_BOOLEAN('v', "verbose", &verbose, | 534 | OPT_INCR('v', "verbose", &verbose, |
509 | "be more verbose (show symbol address, etc)"), | 535 | "be more verbose (show symbol address, etc)"), |
510 | OPT_BOOLEAN('L', "Latency", &latency_format, | 536 | OPT_BOOLEAN('L', "Latency", &latency_format, |
511 | "show latency attributes (irqs/preemption disabled, etc)"), | 537 | "show latency attributes (irqs/preemption disabled, etc)"), |
@@ -518,6 +544,8 @@ static const struct option options[] = { | |||
518 | "generate perf-trace.xx script in specified language"), | 544 | "generate perf-trace.xx script in specified language"), |
519 | OPT_STRING('i', "input", &input_name, "file", | 545 | OPT_STRING('i', "input", &input_name, "file", |
520 | "input file name"), | 546 | "input file name"), |
547 | OPT_BOOLEAN('d', "debug-ordering", &debug_ordering, | ||
548 | "check that samples time ordering is monotonic"), | ||
521 | 549 | ||
522 | OPT_END() | 550 | OPT_END() |
523 | }; | 551 | }; |
@@ -548,6 +576,65 @@ int cmd_trace(int argc, const char **argv, const char *prefix __used) | |||
548 | suffix = REPORT_SUFFIX; | 576 | suffix = REPORT_SUFFIX; |
549 | } | 577 | } |
550 | 578 | ||
579 | if (!suffix && argc >= 2 && strncmp(argv[1], "-", strlen("-")) != 0) { | ||
580 | char *record_script_path, *report_script_path; | ||
581 | int live_pipe[2]; | ||
582 | pid_t pid; | ||
583 | |||
584 | record_script_path = get_script_path(argv[1], RECORD_SUFFIX); | ||
585 | if (!record_script_path) { | ||
586 | fprintf(stderr, "record script not found\n"); | ||
587 | return -1; | ||
588 | } | ||
589 | |||
590 | report_script_path = get_script_path(argv[1], REPORT_SUFFIX); | ||
591 | if (!report_script_path) { | ||
592 | fprintf(stderr, "report script not found\n"); | ||
593 | return -1; | ||
594 | } | ||
595 | |||
596 | if (pipe(live_pipe) < 0) { | ||
597 | perror("failed to create pipe"); | ||
598 | exit(-1); | ||
599 | } | ||
600 | |||
601 | pid = fork(); | ||
602 | if (pid < 0) { | ||
603 | perror("failed to fork"); | ||
604 | exit(-1); | ||
605 | } | ||
606 | |||
607 | if (!pid) { | ||
608 | dup2(live_pipe[1], 1); | ||
609 | close(live_pipe[0]); | ||
610 | |||
611 | __argv = malloc(5 * sizeof(const char *)); | ||
612 | __argv[0] = "/bin/sh"; | ||
613 | __argv[1] = record_script_path; | ||
614 | __argv[2] = "-o"; | ||
615 | __argv[3] = "-"; | ||
616 | __argv[4] = NULL; | ||
617 | |||
618 | execvp("/bin/sh", (char **)__argv); | ||
619 | exit(-1); | ||
620 | } | ||
621 | |||
622 | dup2(live_pipe[0], 0); | ||
623 | close(live_pipe[1]); | ||
624 | |||
625 | __argv = malloc((argc + 3) * sizeof(const char *)); | ||
626 | __argv[0] = "/bin/sh"; | ||
627 | __argv[1] = report_script_path; | ||
628 | for (i = 2; i < argc; i++) | ||
629 | __argv[i] = argv[i]; | ||
630 | __argv[i++] = "-i"; | ||
631 | __argv[i++] = "-"; | ||
632 | __argv[i++] = NULL; | ||
633 | |||
634 | execvp("/bin/sh", (char **)__argv); | ||
635 | exit(-1); | ||
636 | } | ||
637 | |||
551 | if (suffix) { | 638 | if (suffix) { |
552 | script_path = get_script_path(argv[2], suffix); | 639 | script_path = get_script_path(argv[2], suffix); |
553 | if (!script_path) { | 640 | if (!script_path) { |
@@ -576,11 +663,12 @@ int cmd_trace(int argc, const char **argv, const char *prefix __used) | |||
576 | if (!script_name) | 663 | if (!script_name) |
577 | setup_pager(); | 664 | setup_pager(); |
578 | 665 | ||
579 | session = perf_session__new(input_name, O_RDONLY, 0); | 666 | session = perf_session__new(input_name, O_RDONLY, 0, false); |
580 | if (session == NULL) | 667 | if (session == NULL) |
581 | return -ENOMEM; | 668 | return -ENOMEM; |
582 | 669 | ||
583 | if (!perf_session__has_traces(session, "record -R")) | 670 | if (strcmp(input_name, "-") && |
671 | !perf_session__has_traces(session, "record -R")) | ||
584 | return -EINVAL; | 672 | return -EINVAL; |
585 | 673 | ||
586 | if (generate_script_lang) { | 674 | if (generate_script_lang) { |
@@ -617,6 +705,7 @@ int cmd_trace(int argc, const char **argv, const char *prefix __used) | |||
617 | err = scripting_ops->start_script(script_name, argc, argv); | 705 | err = scripting_ops->start_script(script_name, argc, argv); |
618 | if (err) | 706 | if (err) |
619 | goto out; | 707 | goto out; |
708 | pr_debug("perf trace started with script %s\n\n", script_name); | ||
620 | } | 709 | } |
621 | 710 | ||
622 | err = __cmd_trace(session); | 711 | err = __cmd_trace(session); |
diff --git a/tools/perf/builtin.h b/tools/perf/builtin.h index 10fe49e7048a..921245b28583 100644 --- a/tools/perf/builtin.h +++ b/tools/perf/builtin.h | |||
@@ -32,5 +32,8 @@ extern int cmd_version(int argc, const char **argv, const char *prefix); | |||
32 | extern int cmd_probe(int argc, const char **argv, const char *prefix); | 32 | extern int cmd_probe(int argc, const char **argv, const char *prefix); |
33 | extern int cmd_kmem(int argc, const char **argv, const char *prefix); | 33 | extern int cmd_kmem(int argc, const char **argv, const char *prefix); |
34 | extern int cmd_lock(int argc, const char **argv, const char *prefix); | 34 | extern int cmd_lock(int argc, const char **argv, const char *prefix); |
35 | extern int cmd_kvm(int argc, const char **argv, const char *prefix); | ||
36 | extern int cmd_test(int argc, const char **argv, const char *prefix); | ||
37 | extern int cmd_inject(int argc, const char **argv, const char *prefix); | ||
35 | 38 | ||
36 | #endif | 39 | #endif |
diff --git a/tools/perf/command-list.txt b/tools/perf/command-list.txt index db6ee94d4a8e..949d77fc0b97 100644 --- a/tools/perf/command-list.txt +++ b/tools/perf/command-list.txt | |||
@@ -8,6 +8,7 @@ perf-bench mainporcelain common | |||
8 | perf-buildid-cache mainporcelain common | 8 | perf-buildid-cache mainporcelain common |
9 | perf-buildid-list mainporcelain common | 9 | perf-buildid-list mainporcelain common |
10 | perf-diff mainporcelain common | 10 | perf-diff mainporcelain common |
11 | perf-inject mainporcelain common | ||
11 | perf-list mainporcelain common | 12 | perf-list mainporcelain common |
12 | perf-sched mainporcelain common | 13 | perf-sched mainporcelain common |
13 | perf-record mainporcelain common | 14 | perf-record mainporcelain common |
@@ -19,3 +20,5 @@ perf-trace mainporcelain common | |||
19 | perf-probe mainporcelain common | 20 | perf-probe mainporcelain common |
20 | perf-kmem mainporcelain common | 21 | perf-kmem mainporcelain common |
21 | perf-lock mainporcelain common | 22 | perf-lock mainporcelain common |
23 | perf-kvm mainporcelain common | ||
24 | perf-test mainporcelain common | ||
diff --git a/tools/perf/perf-archive.sh b/tools/perf/perf-archive.sh index 910468e6e01c..2e7a4f417e20 100644 --- a/tools/perf/perf-archive.sh +++ b/tools/perf/perf-archive.sh | |||
@@ -30,4 +30,7 @@ done | |||
30 | 30 | ||
31 | tar cfj $PERF_DATA.tar.bz2 -C $DEBUGDIR -T $MANIFEST | 31 | tar cfj $PERF_DATA.tar.bz2 -C $DEBUGDIR -T $MANIFEST |
32 | rm -f $MANIFEST $BUILDIDS | 32 | rm -f $MANIFEST $BUILDIDS |
33 | echo -e "Now please run:\n" | ||
34 | echo -e "$ tar xvf $PERF_DATA.tar.bz2 -C ~/.debug\n" | ||
35 | echo "wherever you need to run 'perf report' on." | ||
33 | exit 0 | 36 | exit 0 |
diff --git a/tools/perf/perf.c b/tools/perf/perf.c index cd32c200cdb3..08e0e5d2b50e 100644 --- a/tools/perf/perf.c +++ b/tools/perf/perf.c | |||
@@ -13,9 +13,10 @@ | |||
13 | #include "util/quote.h" | 13 | #include "util/quote.h" |
14 | #include "util/run-command.h" | 14 | #include "util/run-command.h" |
15 | #include "util/parse-events.h" | 15 | #include "util/parse-events.h" |
16 | #include "util/string.h" | ||
17 | #include "util/debugfs.h" | 16 | #include "util/debugfs.h" |
18 | 17 | ||
18 | bool use_browser; | ||
19 | |||
19 | const char perf_usage_string[] = | 20 | const char perf_usage_string[] = |
20 | "perf [--version] [--help] COMMAND [ARGS]"; | 21 | "perf [--version] [--help] COMMAND [ARGS]"; |
21 | 22 | ||
@@ -262,6 +263,8 @@ static int run_builtin(struct cmd_struct *p, int argc, const char **argv) | |||
262 | set_debugfs_path(); | 263 | set_debugfs_path(); |
263 | 264 | ||
264 | status = p->fn(argc, argv, prefix); | 265 | status = p->fn(argc, argv, prefix); |
266 | exit_browser(status); | ||
267 | |||
265 | if (status) | 268 | if (status) |
266 | return status & 0xff; | 269 | return status & 0xff; |
267 | 270 | ||
@@ -304,6 +307,9 @@ static void handle_internal_command(int argc, const char **argv) | |||
304 | { "probe", cmd_probe, 0 }, | 307 | { "probe", cmd_probe, 0 }, |
305 | { "kmem", cmd_kmem, 0 }, | 308 | { "kmem", cmd_kmem, 0 }, |
306 | { "lock", cmd_lock, 0 }, | 309 | { "lock", cmd_lock, 0 }, |
310 | { "kvm", cmd_kvm, 0 }, | ||
311 | { "test", cmd_test, 0 }, | ||
312 | { "inject", cmd_inject, 0 }, | ||
307 | }; | 313 | }; |
308 | unsigned int i; | 314 | unsigned int i; |
309 | static const char ext[] = STRIP_EXTENSION; | 315 | static const char ext[] = STRIP_EXTENSION; |
diff --git a/tools/perf/perf.h b/tools/perf/perf.h index 6fb379bc1d1f..02821febb704 100644 --- a/tools/perf/perf.h +++ b/tools/perf/perf.h | |||
@@ -1,6 +1,10 @@ | |||
1 | #ifndef _PERF_PERF_H | 1 | #ifndef _PERF_PERF_H |
2 | #define _PERF_PERF_H | 2 | #define _PERF_PERF_H |
3 | 3 | ||
4 | struct winsize; | ||
5 | |||
6 | void get_term_dimensions(struct winsize *ws); | ||
7 | |||
4 | #if defined(__i386__) | 8 | #if defined(__i386__) |
5 | #include "../../arch/x86/include/asm/unistd.h" | 9 | #include "../../arch/x86/include/asm/unistd.h" |
6 | #define rmb() asm volatile("lock; addl $0,0(%%esp)" ::: "memory") | 10 | #define rmb() asm volatile("lock; addl $0,0(%%esp)" ::: "memory") |
@@ -102,8 +106,6 @@ static inline unsigned long long rdclock(void) | |||
102 | #define __user | 106 | #define __user |
103 | #define asmlinkage | 107 | #define asmlinkage |
104 | 108 | ||
105 | #define __used __attribute__((__unused__)) | ||
106 | |||
107 | #define unlikely(x) __builtin_expect(!!(x), 0) | 109 | #define unlikely(x) __builtin_expect(!!(x), 0) |
108 | #define min(x, y) ({ \ | 110 | #define min(x, y) ({ \ |
109 | typeof(x) _min1 = (x); \ | 111 | typeof(x) _min1 = (x); \ |
@@ -129,4 +131,6 @@ struct ip_callchain { | |||
129 | u64 ips[0]; | 131 | u64 ips[0]; |
130 | }; | 132 | }; |
131 | 133 | ||
134 | extern int perf_host, perf_guest; | ||
135 | |||
132 | #endif | 136 | #endif |
diff --git a/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm b/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm index f869c48dc9b0..d94b40c8ac85 100644 --- a/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm +++ b/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm | |||
@@ -15,6 +15,7 @@ our @EXPORT_OK = ( @{ $EXPORT_TAGS{'all'} } ); | |||
15 | 15 | ||
16 | our @EXPORT = qw( | 16 | our @EXPORT = qw( |
17 | avg nsecs nsecs_secs nsecs_nsecs nsecs_usecs print_nsecs | 17 | avg nsecs nsecs_secs nsecs_nsecs nsecs_usecs print_nsecs |
18 | clear_term | ||
18 | ); | 19 | ); |
19 | 20 | ||
20 | our $VERSION = '0.01'; | 21 | our $VERSION = '0.01'; |
@@ -55,6 +56,11 @@ sub nsecs_str { | |||
55 | return $str; | 56 | return $str; |
56 | } | 57 | } |
57 | 58 | ||
59 | sub clear_term | ||
60 | { | ||
61 | print "\x1b[H\x1b[2J"; | ||
62 | } | ||
63 | |||
58 | 1; | 64 | 1; |
59 | __END__ | 65 | __END__ |
60 | =head1 NAME | 66 | =head1 NAME |
diff --git a/tools/perf/scripts/perl/bin/check-perf-trace-record b/tools/perf/scripts/perl/bin/check-perf-trace-record index e6cb1474f8e8..423ad6aed056 100644 --- a/tools/perf/scripts/perl/bin/check-perf-trace-record +++ b/tools/perf/scripts/perl/bin/check-perf-trace-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e kmem:kmalloc -e irq:softirq_entry -e kmem:kfree | 2 | perf record -a -e kmem:kmalloc -e irq:softirq_entry -e kmem:kfree |
diff --git a/tools/perf/scripts/perl/bin/failed-syscalls-record b/tools/perf/scripts/perl/bin/failed-syscalls-record index f8885d389e6f..eb5846bcb565 100644 --- a/tools/perf/scripts/perl/bin/failed-syscalls-record +++ b/tools/perf/scripts/perl/bin/failed-syscalls-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e raw_syscalls:sys_exit | 2 | perf record -a -e raw_syscalls:sys_exit $@ |
diff --git a/tools/perf/scripts/perl/bin/failed-syscalls-report b/tools/perf/scripts/perl/bin/failed-syscalls-report index 8bfc660e5056..e3a5e55d54ff 100644 --- a/tools/perf/scripts/perl/bin/failed-syscalls-report +++ b/tools/perf/scripts/perl/bin/failed-syscalls-report | |||
@@ -1,4 +1,10 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide failed syscalls | 2 | # description: system-wide failed syscalls |
3 | # args: [comm] | 3 | # args: [comm] |
4 | perf trace -s ~/libexec/perf-core/scripts/perl/failed-syscalls.pl $1 | 4 | if [ $# -gt 0 ] ; then |
5 | if ! expr match "$1" "-" > /dev/null ; then | ||
6 | comm=$1 | ||
7 | shift | ||
8 | fi | ||
9 | fi | ||
10 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/failed-syscalls.pl $comm | ||
diff --git a/tools/perf/scripts/perl/bin/rw-by-file-record b/tools/perf/scripts/perl/bin/rw-by-file-record index b25056ebf963..5bfaae5a6cba 100644 --- a/tools/perf/scripts/perl/bin/rw-by-file-record +++ b/tools/perf/scripts/perl/bin/rw-by-file-record | |||
@@ -1,2 +1,3 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e syscalls:sys_enter_read -e syscalls:sys_enter_write | 2 | perf record -a -e syscalls:sys_enter_read -e syscalls:sys_enter_write $@ |
3 | |||
diff --git a/tools/perf/scripts/perl/bin/rw-by-file-report b/tools/perf/scripts/perl/bin/rw-by-file-report index eddb9ccce6a5..d83070b7eeb5 100644 --- a/tools/perf/scripts/perl/bin/rw-by-file-report +++ b/tools/perf/scripts/perl/bin/rw-by-file-report | |||
@@ -1,7 +1,13 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: r/w activity for a program, by file | 2 | # description: r/w activity for a program, by file |
3 | # args: <comm> | 3 | # args: <comm> |
4 | perf trace -s ~/libexec/perf-core/scripts/perl/rw-by-file.pl $1 | 4 | if [ $# -lt 1 ] ; then |
5 | echo "usage: rw-by-file <comm>" | ||
6 | exit | ||
7 | fi | ||
8 | comm=$1 | ||
9 | shift | ||
10 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/rw-by-file.pl $comm | ||
5 | 11 | ||
6 | 12 | ||
7 | 13 | ||
diff --git a/tools/perf/scripts/perl/bin/rw-by-pid-record b/tools/perf/scripts/perl/bin/rw-by-pid-record index 8903979c5b6c..6e0b2f7755ac 100644 --- a/tools/perf/scripts/perl/bin/rw-by-pid-record +++ b/tools/perf/scripts/perl/bin/rw-by-pid-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e syscalls:sys_enter_read -e syscalls:sys_exit_read -e syscalls:sys_enter_write -e syscalls:sys_exit_write | 2 | perf record -a -e syscalls:sys_enter_read -e syscalls:sys_exit_read -e syscalls:sys_enter_write -e syscalls:sys_exit_write $@ |
diff --git a/tools/perf/scripts/perl/bin/rw-by-pid-report b/tools/perf/scripts/perl/bin/rw-by-pid-report index 7f44c25cc857..7ef46983f62f 100644 --- a/tools/perf/scripts/perl/bin/rw-by-pid-report +++ b/tools/perf/scripts/perl/bin/rw-by-pid-report | |||
@@ -1,6 +1,6 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide r/w activity | 2 | # description: system-wide r/w activity |
3 | perf trace -s ~/libexec/perf-core/scripts/perl/rw-by-pid.pl | 3 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/rw-by-pid.pl |
4 | 4 | ||
5 | 5 | ||
6 | 6 | ||
diff --git a/tools/perf/scripts/perl/bin/rwtop-record b/tools/perf/scripts/perl/bin/rwtop-record new file mode 100644 index 000000000000..6e0b2f7755ac --- /dev/null +++ b/tools/perf/scripts/perl/bin/rwtop-record | |||
@@ -0,0 +1,2 @@ | |||
1 | #!/bin/bash | ||
2 | perf record -a -e syscalls:sys_enter_read -e syscalls:sys_exit_read -e syscalls:sys_enter_write -e syscalls:sys_exit_write $@ | ||
diff --git a/tools/perf/scripts/perl/bin/rwtop-report b/tools/perf/scripts/perl/bin/rwtop-report new file mode 100644 index 000000000000..93e698cd3f38 --- /dev/null +++ b/tools/perf/scripts/perl/bin/rwtop-report | |||
@@ -0,0 +1,23 @@ | |||
1 | #!/bin/bash | ||
2 | # description: system-wide r/w top | ||
3 | # args: [interval] | ||
4 | n_args=0 | ||
5 | for i in "$@" | ||
6 | do | ||
7 | if expr match "$i" "-" > /dev/null ; then | ||
8 | break | ||
9 | fi | ||
10 | n_args=$(( $n_args + 1 )) | ||
11 | done | ||
12 | if [ "$n_args" -gt 1 ] ; then | ||
13 | echo "usage: rwtop-report [interval]" | ||
14 | exit | ||
15 | fi | ||
16 | if [ "$n_args" -gt 0 ] ; then | ||
17 | interval=$1 | ||
18 | shift | ||
19 | fi | ||
20 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/rwtop.pl $interval | ||
21 | |||
22 | |||
23 | |||
diff --git a/tools/perf/scripts/perl/bin/wakeup-latency-record b/tools/perf/scripts/perl/bin/wakeup-latency-record index 6abedda911a4..9f2acaaae9f0 100644 --- a/tools/perf/scripts/perl/bin/wakeup-latency-record +++ b/tools/perf/scripts/perl/bin/wakeup-latency-record | |||
@@ -1,5 +1,5 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e sched:sched_switch -e sched:sched_wakeup | 2 | perf record -a -e sched:sched_switch -e sched:sched_wakeup $@ |
3 | 3 | ||
4 | 4 | ||
5 | 5 | ||
diff --git a/tools/perf/scripts/perl/bin/wakeup-latency-report b/tools/perf/scripts/perl/bin/wakeup-latency-report index fce3adcb3249..a0d898f9ca1d 100644 --- a/tools/perf/scripts/perl/bin/wakeup-latency-report +++ b/tools/perf/scripts/perl/bin/wakeup-latency-report | |||
@@ -1,6 +1,6 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide min/max/avg wakeup latency | 2 | # description: system-wide min/max/avg wakeup latency |
3 | perf trace -s ~/libexec/perf-core/scripts/perl/wakeup-latency.pl | 3 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/wakeup-latency.pl |
4 | 4 | ||
5 | 5 | ||
6 | 6 | ||
diff --git a/tools/perf/scripts/perl/bin/workqueue-stats-record b/tools/perf/scripts/perl/bin/workqueue-stats-record index fce6637b19ba..85301f2471ff 100644 --- a/tools/perf/scripts/perl/bin/workqueue-stats-record +++ b/tools/perf/scripts/perl/bin/workqueue-stats-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e workqueue:workqueue_creation -e workqueue:workqueue_destruction -e workqueue:workqueue_execution -e workqueue:workqueue_insertion | 2 | perf record -a -e workqueue:workqueue_creation -e workqueue:workqueue_destruction -e workqueue:workqueue_execution -e workqueue:workqueue_insertion $@ |
diff --git a/tools/perf/scripts/perl/bin/workqueue-stats-report b/tools/perf/scripts/perl/bin/workqueue-stats-report index 71cfbd182fb9..35081132ef97 100644 --- a/tools/perf/scripts/perl/bin/workqueue-stats-report +++ b/tools/perf/scripts/perl/bin/workqueue-stats-report | |||
@@ -1,6 +1,6 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: workqueue stats (ins/exe/create/destroy) | 2 | # description: workqueue stats (ins/exe/create/destroy) |
3 | perf trace -s ~/libexec/perf-core/scripts/perl/workqueue-stats.pl | 3 | perf trace $@ -s ~/libexec/perf-core/scripts/perl/workqueue-stats.pl |
4 | 4 | ||
5 | 5 | ||
6 | 6 | ||
diff --git a/tools/perf/scripts/perl/failed-syscalls.pl b/tools/perf/scripts/perl/failed-syscalls.pl index c18e7e27a84b..94bc25a347eb 100644 --- a/tools/perf/scripts/perl/failed-syscalls.pl +++ b/tools/perf/scripts/perl/failed-syscalls.pl | |||
@@ -11,6 +11,8 @@ use Perf::Trace::Core; | |||
11 | use Perf::Trace::Context; | 11 | use Perf::Trace::Context; |
12 | use Perf::Trace::Util; | 12 | use Perf::Trace::Util; |
13 | 13 | ||
14 | my $for_comm = shift; | ||
15 | |||
14 | my %failed_syscalls; | 16 | my %failed_syscalls; |
15 | 17 | ||
16 | sub raw_syscalls::sys_exit | 18 | sub raw_syscalls::sys_exit |
@@ -33,6 +35,8 @@ sub trace_end | |||
33 | 35 | ||
34 | foreach my $comm (sort {$failed_syscalls{$b} <=> $failed_syscalls{$a}} | 36 | foreach my $comm (sort {$failed_syscalls{$b} <=> $failed_syscalls{$a}} |
35 | keys %failed_syscalls) { | 37 | keys %failed_syscalls) { |
36 | printf("%-20s %10s\n", $comm, $failed_syscalls{$comm}); | 38 | next if ($for_comm && $comm ne $for_comm); |
39 | |||
40 | printf("%-20s %10s\n", $comm, $failed_syscalls{$comm}); | ||
37 | } | 41 | } |
38 | } | 42 | } |
diff --git a/tools/perf/scripts/perl/rw-by-pid.pl b/tools/perf/scripts/perl/rw-by-pid.pl index da601fae1a00..9db23c9daf55 100644 --- a/tools/perf/scripts/perl/rw-by-pid.pl +++ b/tools/perf/scripts/perl/rw-by-pid.pl | |||
@@ -79,12 +79,12 @@ sub trace_end | |||
79 | printf("%6s %-20s %10s %10s %10s\n", "------", "--------------------", | 79 | printf("%6s %-20s %10s %10s %10s\n", "------", "--------------------", |
80 | "-----------", "----------", "----------"); | 80 | "-----------", "----------", "----------"); |
81 | 81 | ||
82 | foreach my $pid (sort {$reads{$b}{bytes_read} <=> | 82 | foreach my $pid (sort { ($reads{$b}{bytes_read} || 0) <=> |
83 | $reads{$a}{bytes_read}} keys %reads) { | 83 | ($reads{$a}{bytes_read} || 0) } keys %reads) { |
84 | my $comm = $reads{$pid}{comm}; | 84 | my $comm = $reads{$pid}{comm} || ""; |
85 | my $total_reads = $reads{$pid}{total_reads}; | 85 | my $total_reads = $reads{$pid}{total_reads} || 0; |
86 | my $bytes_requested = $reads{$pid}{bytes_requested}; | 86 | my $bytes_requested = $reads{$pid}{bytes_requested} || 0; |
87 | my $bytes_read = $reads{$pid}{bytes_read}; | 87 | my $bytes_read = $reads{$pid}{bytes_read} || 0; |
88 | 88 | ||
89 | printf("%6s %-20s %10s %10s %10s\n", $pid, $comm, | 89 | printf("%6s %-20s %10s %10s %10s\n", $pid, $comm, |
90 | $total_reads, $bytes_requested, $bytes_read); | 90 | $total_reads, $bytes_requested, $bytes_read); |
@@ -96,16 +96,23 @@ sub trace_end | |||
96 | printf("%6s %20s %6s %10s\n", "------", "--------------------", | 96 | printf("%6s %20s %6s %10s\n", "------", "--------------------", |
97 | "------", "----------"); | 97 | "------", "----------"); |
98 | 98 | ||
99 | foreach my $pid (keys %reads) { | 99 | my @errcounts = (); |
100 | my $comm = $reads{$pid}{comm}; | ||
101 | foreach my $err (sort {$reads{$b}{comm} cmp $reads{$a}{comm}} | ||
102 | keys %{$reads{$pid}{errors}}) { | ||
103 | my $errors = $reads{$pid}{errors}{$err}; | ||
104 | 100 | ||
105 | printf("%6d %-20s %6d %10s\n", $pid, $comm, $err, $errors); | 101 | foreach my $pid (keys %reads) { |
102 | foreach my $error (keys %{$reads{$pid}{errors}}) { | ||
103 | my $comm = $reads{$pid}{comm} || ""; | ||
104 | my $errcount = $reads{$pid}{errors}{$error} || 0; | ||
105 | push @errcounts, [$pid, $comm, $error, $errcount]; | ||
106 | } | 106 | } |
107 | } | 107 | } |
108 | 108 | ||
109 | @errcounts = sort { $b->[3] <=> $a->[3] } @errcounts; | ||
110 | |||
111 | for my $i (0 .. $#errcounts) { | ||
112 | printf("%6d %-20s %6d %10s\n", $errcounts[$i][0], | ||
113 | $errcounts[$i][1], $errcounts[$i][2], $errcounts[$i][3]); | ||
114 | } | ||
115 | |||
109 | printf("\nwrite counts by pid:\n\n"); | 116 | printf("\nwrite counts by pid:\n\n"); |
110 | 117 | ||
111 | printf("%6s %20s %10s %10s\n", "pid", "comm", | 118 | printf("%6s %20s %10s %10s\n", "pid", "comm", |
@@ -113,11 +120,11 @@ sub trace_end | |||
113 | printf("%6s %-20s %10s %10s\n", "------", "--------------------", | 120 | printf("%6s %-20s %10s %10s\n", "------", "--------------------", |
114 | "-----------", "----------"); | 121 | "-----------", "----------"); |
115 | 122 | ||
116 | foreach my $pid (sort {$writes{$b}{bytes_written} <=> | 123 | foreach my $pid (sort { ($writes{$b}{bytes_written} || 0) <=> |
117 | $writes{$a}{bytes_written}} keys %writes) { | 124 | ($writes{$a}{bytes_written} || 0)} keys %writes) { |
118 | my $comm = $writes{$pid}{comm}; | 125 | my $comm = $writes{$pid}{comm} || ""; |
119 | my $total_writes = $writes{$pid}{total_writes}; | 126 | my $total_writes = $writes{$pid}{total_writes} || 0; |
120 | my $bytes_written = $writes{$pid}{bytes_written}; | 127 | my $bytes_written = $writes{$pid}{bytes_written} || 0; |
121 | 128 | ||
122 | printf("%6s %-20s %10s %10s\n", $pid, $comm, | 129 | printf("%6s %-20s %10s %10s\n", $pid, $comm, |
123 | $total_writes, $bytes_written); | 130 | $total_writes, $bytes_written); |
@@ -129,16 +136,23 @@ sub trace_end | |||
129 | printf("%6s %20s %6s %10s\n", "------", "--------------------", | 136 | printf("%6s %20s %6s %10s\n", "------", "--------------------", |
130 | "------", "----------"); | 137 | "------", "----------"); |
131 | 138 | ||
132 | foreach my $pid (keys %writes) { | 139 | @errcounts = (); |
133 | my $comm = $writes{$pid}{comm}; | ||
134 | foreach my $err (sort {$writes{$b}{comm} cmp $writes{$a}{comm}} | ||
135 | keys %{$writes{$pid}{errors}}) { | ||
136 | my $errors = $writes{$pid}{errors}{$err}; | ||
137 | 140 | ||
138 | printf("%6d %-20s %6d %10s\n", $pid, $comm, $err, $errors); | 141 | foreach my $pid (keys %writes) { |
142 | foreach my $error (keys %{$writes{$pid}{errors}}) { | ||
143 | my $comm = $writes{$pid}{comm} || ""; | ||
144 | my $errcount = $writes{$pid}{errors}{$error} || 0; | ||
145 | push @errcounts, [$pid, $comm, $error, $errcount]; | ||
139 | } | 146 | } |
140 | } | 147 | } |
141 | 148 | ||
149 | @errcounts = sort { $b->[3] <=> $a->[3] } @errcounts; | ||
150 | |||
151 | for my $i (0 .. $#errcounts) { | ||
152 | printf("%6d %-20s %6d %10s\n", $errcounts[$i][0], | ||
153 | $errcounts[$i][1], $errcounts[$i][2], $errcounts[$i][3]); | ||
154 | } | ||
155 | |||
142 | print_unhandled(); | 156 | print_unhandled(); |
143 | } | 157 | } |
144 | 158 | ||
diff --git a/tools/perf/scripts/perl/rwtop.pl b/tools/perf/scripts/perl/rwtop.pl new file mode 100644 index 000000000000..4bb3ecd33472 --- /dev/null +++ b/tools/perf/scripts/perl/rwtop.pl | |||
@@ -0,0 +1,199 @@ | |||
1 | #!/usr/bin/perl -w | ||
2 | # (c) 2010, Tom Zanussi <tzanussi@gmail.com> | ||
3 | # Licensed under the terms of the GNU GPL License version 2 | ||
4 | |||
5 | # read/write top | ||
6 | # | ||
7 | # Periodically displays system-wide r/w call activity, broken down by | ||
8 | # pid. If an [interval] arg is specified, the display will be | ||
9 | # refreshed every [interval] seconds. The default interval is 3 | ||
10 | # seconds. | ||
11 | |||
12 | use 5.010000; | ||
13 | use strict; | ||
14 | use warnings; | ||
15 | |||
16 | use lib "$ENV{'PERF_EXEC_PATH'}/scripts/perl/Perf-Trace-Util/lib"; | ||
17 | use lib "./Perf-Trace-Util/lib"; | ||
18 | use Perf::Trace::Core; | ||
19 | use Perf::Trace::Util; | ||
20 | |||
21 | my $default_interval = 3; | ||
22 | my $nlines = 20; | ||
23 | my $print_thread; | ||
24 | my $print_pending = 0; | ||
25 | |||
26 | my %reads; | ||
27 | my %writes; | ||
28 | |||
29 | my $interval = shift; | ||
30 | if (!$interval) { | ||
31 | $interval = $default_interval; | ||
32 | } | ||
33 | |||
34 | sub syscalls::sys_exit_read | ||
35 | { | ||
36 | my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs, | ||
37 | $common_pid, $common_comm, | ||
38 | $nr, $ret) = @_; | ||
39 | |||
40 | print_check(); | ||
41 | |||
42 | if ($ret > 0) { | ||
43 | $reads{$common_pid}{bytes_read} += $ret; | ||
44 | } else { | ||
45 | if (!defined ($reads{$common_pid}{bytes_read})) { | ||
46 | $reads{$common_pid}{bytes_read} = 0; | ||
47 | } | ||
48 | $reads{$common_pid}{errors}{$ret}++; | ||
49 | } | ||
50 | } | ||
51 | |||
52 | sub syscalls::sys_enter_read | ||
53 | { | ||
54 | my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs, | ||
55 | $common_pid, $common_comm, | ||
56 | $nr, $fd, $buf, $count) = @_; | ||
57 | |||
58 | print_check(); | ||
59 | |||
60 | $reads{$common_pid}{bytes_requested} += $count; | ||
61 | $reads{$common_pid}{total_reads}++; | ||
62 | $reads{$common_pid}{comm} = $common_comm; | ||
63 | } | ||
64 | |||
65 | sub syscalls::sys_exit_write | ||
66 | { | ||
67 | my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs, | ||
68 | $common_pid, $common_comm, | ||
69 | $nr, $ret) = @_; | ||
70 | |||
71 | print_check(); | ||
72 | |||
73 | if ($ret <= 0) { | ||
74 | $writes{$common_pid}{errors}{$ret}++; | ||
75 | } | ||
76 | } | ||
77 | |||
78 | sub syscalls::sys_enter_write | ||
79 | { | ||
80 | my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs, | ||
81 | $common_pid, $common_comm, | ||
82 | $nr, $fd, $buf, $count) = @_; | ||
83 | |||
84 | print_check(); | ||
85 | |||
86 | $writes{$common_pid}{bytes_written} += $count; | ||
87 | $writes{$common_pid}{total_writes}++; | ||
88 | $writes{$common_pid}{comm} = $common_comm; | ||
89 | } | ||
90 | |||
91 | sub trace_begin | ||
92 | { | ||
93 | $SIG{ALRM} = \&set_print_pending; | ||
94 | alarm 1; | ||
95 | } | ||
96 | |||
97 | sub trace_end | ||
98 | { | ||
99 | print_unhandled(); | ||
100 | print_totals(); | ||
101 | } | ||
102 | |||
103 | sub print_check() | ||
104 | { | ||
105 | if ($print_pending == 1) { | ||
106 | $print_pending = 0; | ||
107 | print_totals(); | ||
108 | } | ||
109 | } | ||
110 | |||
111 | sub set_print_pending() | ||
112 | { | ||
113 | $print_pending = 1; | ||
114 | alarm $interval; | ||
115 | } | ||
116 | |||
117 | sub print_totals | ||
118 | { | ||
119 | my $count; | ||
120 | |||
121 | $count = 0; | ||
122 | |||
123 | clear_term(); | ||
124 | |||
125 | printf("\nread counts by pid:\n\n"); | ||
126 | |||
127 | printf("%6s %20s %10s %10s %10s\n", "pid", "comm", | ||
128 | "# reads", "bytes_req", "bytes_read"); | ||
129 | printf("%6s %-20s %10s %10s %10s\n", "------", "--------------------", | ||
130 | "----------", "----------", "----------"); | ||
131 | |||
132 | foreach my $pid (sort { ($reads{$b}{bytes_read} || 0) <=> | ||
133 | ($reads{$a}{bytes_read} || 0) } keys %reads) { | ||
134 | my $comm = $reads{$pid}{comm} || ""; | ||
135 | my $total_reads = $reads{$pid}{total_reads} || 0; | ||
136 | my $bytes_requested = $reads{$pid}{bytes_requested} || 0; | ||
137 | my $bytes_read = $reads{$pid}{bytes_read} || 0; | ||
138 | |||
139 | printf("%6s %-20s %10s %10s %10s\n", $pid, $comm, | ||
140 | $total_reads, $bytes_requested, $bytes_read); | ||
141 | |||
142 | if (++$count == $nlines) { | ||
143 | last; | ||
144 | } | ||
145 | } | ||
146 | |||
147 | $count = 0; | ||
148 | |||
149 | printf("\nwrite counts by pid:\n\n"); | ||
150 | |||
151 | printf("%6s %20s %10s %13s\n", "pid", "comm", | ||
152 | "# writes", "bytes_written"); | ||
153 | printf("%6s %-20s %10s %13s\n", "------", "--------------------", | ||
154 | "----------", "-------------"); | ||
155 | |||
156 | foreach my $pid (sort { ($writes{$b}{bytes_written} || 0) <=> | ||
157 | ($writes{$a}{bytes_written} || 0)} keys %writes) { | ||
158 | my $comm = $writes{$pid}{comm} || ""; | ||
159 | my $total_writes = $writes{$pid}{total_writes} || 0; | ||
160 | my $bytes_written = $writes{$pid}{bytes_written} || 0; | ||
161 | |||
162 | printf("%6s %-20s %10s %13s\n", $pid, $comm, | ||
163 | $total_writes, $bytes_written); | ||
164 | |||
165 | if (++$count == $nlines) { | ||
166 | last; | ||
167 | } | ||
168 | } | ||
169 | |||
170 | %reads = (); | ||
171 | %writes = (); | ||
172 | } | ||
173 | |||
174 | my %unhandled; | ||
175 | |||
176 | sub print_unhandled | ||
177 | { | ||
178 | if ((scalar keys %unhandled) == 0) { | ||
179 | return; | ||
180 | } | ||
181 | |||
182 | print "\nunhandled events:\n\n"; | ||
183 | |||
184 | printf("%-40s %10s\n", "event", "count"); | ||
185 | printf("%-40s %10s\n", "----------------------------------------", | ||
186 | "-----------"); | ||
187 | |||
188 | foreach my $event_name (keys %unhandled) { | ||
189 | printf("%-40s %10d\n", $event_name, $unhandled{$event_name}); | ||
190 | } | ||
191 | } | ||
192 | |||
193 | sub trace_unhandled | ||
194 | { | ||
195 | my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs, | ||
196 | $common_pid, $common_comm) = @_; | ||
197 | |||
198 | $unhandled{$event_name}++; | ||
199 | } | ||
diff --git a/tools/perf/scripts/perl/wakeup-latency.pl b/tools/perf/scripts/perl/wakeup-latency.pl index ed58ef284e23..d9143dcec6c6 100644 --- a/tools/perf/scripts/perl/wakeup-latency.pl +++ b/tools/perf/scripts/perl/wakeup-latency.pl | |||
@@ -22,8 +22,8 @@ my %last_wakeup; | |||
22 | 22 | ||
23 | my $max_wakeup_latency; | 23 | my $max_wakeup_latency; |
24 | my $min_wakeup_latency; | 24 | my $min_wakeup_latency; |
25 | my $total_wakeup_latency; | 25 | my $total_wakeup_latency = 0; |
26 | my $total_wakeups; | 26 | my $total_wakeups = 0; |
27 | 27 | ||
28 | sub sched::sched_switch | 28 | sub sched::sched_switch |
29 | { | 29 | { |
@@ -67,8 +67,12 @@ sub trace_end | |||
67 | { | 67 | { |
68 | printf("wakeup_latency stats:\n\n"); | 68 | printf("wakeup_latency stats:\n\n"); |
69 | print "total_wakeups: $total_wakeups\n"; | 69 | print "total_wakeups: $total_wakeups\n"; |
70 | printf("avg_wakeup_latency (ns): %u\n", | 70 | if ($total_wakeups) { |
71 | avg($total_wakeup_latency, $total_wakeups)); | 71 | printf("avg_wakeup_latency (ns): %u\n", |
72 | avg($total_wakeup_latency, $total_wakeups)); | ||
73 | } else { | ||
74 | printf("avg_wakeup_latency (ns): N/A\n"); | ||
75 | } | ||
72 | printf("min_wakeup_latency (ns): %u\n", $min_wakeup_latency); | 76 | printf("min_wakeup_latency (ns): %u\n", $min_wakeup_latency); |
73 | printf("max_wakeup_latency (ns): %u\n", $max_wakeup_latency); | 77 | printf("max_wakeup_latency (ns): %u\n", $max_wakeup_latency); |
74 | 78 | ||
diff --git a/tools/perf/scripts/perl/workqueue-stats.pl b/tools/perf/scripts/perl/workqueue-stats.pl index 511302c8a494..b84b12699b70 100644 --- a/tools/perf/scripts/perl/workqueue-stats.pl +++ b/tools/perf/scripts/perl/workqueue-stats.pl | |||
@@ -71,9 +71,9 @@ sub trace_end | |||
71 | printf("%3s %6s %6s\t%-20s\n", "---", "---", "----", "----"); | 71 | printf("%3s %6s %6s\t%-20s\n", "---", "---", "----", "----"); |
72 | foreach my $pidhash (@cpus) { | 72 | foreach my $pidhash (@cpus) { |
73 | while ((my $pid, my $wqhash) = each %$pidhash) { | 73 | while ((my $pid, my $wqhash) = each %$pidhash) { |
74 | my $ins = $$wqhash{'inserted'}; | 74 | my $ins = $$wqhash{'inserted'} || 0; |
75 | my $exe = $$wqhash{'executed'}; | 75 | my $exe = $$wqhash{'executed'} || 0; |
76 | my $comm = $$wqhash{'comm'}; | 76 | my $comm = $$wqhash{'comm'} || ""; |
77 | if ($ins || $exe) { | 77 | if ($ins || $exe) { |
78 | printf("%3u %6u %6u\t%-20s\n", $cpu, $ins, $exe, $comm); | 78 | printf("%3u %6u %6u\t%-20s\n", $cpu, $ins, $exe, $comm); |
79 | } | 79 | } |
@@ -87,9 +87,9 @@ sub trace_end | |||
87 | printf("%3s %6s %6s\t%-20s\n", "---", "-------", "---------", "----"); | 87 | printf("%3s %6s %6s\t%-20s\n", "---", "-------", "---------", "----"); |
88 | foreach my $pidhash (@cpus) { | 88 | foreach my $pidhash (@cpus) { |
89 | while ((my $pid, my $wqhash) = each %$pidhash) { | 89 | while ((my $pid, my $wqhash) = each %$pidhash) { |
90 | my $created = $$wqhash{'created'}; | 90 | my $created = $$wqhash{'created'} || 0; |
91 | my $destroyed = $$wqhash{'destroyed'}; | 91 | my $destroyed = $$wqhash{'destroyed'} || 0; |
92 | my $comm = $$wqhash{'comm'}; | 92 | my $comm = $$wqhash{'comm'} || ""; |
93 | if ($created || $destroyed) { | 93 | if ($created || $destroyed) { |
94 | printf("%3u %6u %6u\t%-20s\n", $cpu, $created, $destroyed, | 94 | printf("%3u %6u %6u\t%-20s\n", $cpu, $created, $destroyed, |
95 | $comm); | 95 | $comm); |
diff --git a/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py b/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py index 83e91435ed09..9689bc0acd9f 100644 --- a/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py +++ b/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py | |||
@@ -23,3 +23,6 @@ def nsecs_nsecs(nsecs): | |||
23 | def nsecs_str(nsecs): | 23 | def nsecs_str(nsecs): |
24 | str = "%5u.%09u" % (nsecs_secs(nsecs), nsecs_nsecs(nsecs)), | 24 | str = "%5u.%09u" % (nsecs_secs(nsecs), nsecs_nsecs(nsecs)), |
25 | return str | 25 | return str |
26 | |||
27 | def clear_term(): | ||
28 | print("\x1b[H\x1b[2J") | ||
diff --git a/tools/perf/scripts/python/bin/failed-syscalls-by-pid-record b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-record index f8885d389e6f..eb5846bcb565 100644 --- a/tools/perf/scripts/python/bin/failed-syscalls-by-pid-record +++ b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e raw_syscalls:sys_exit | 2 | perf record -a -e raw_syscalls:sys_exit $@ |
diff --git a/tools/perf/scripts/python/bin/failed-syscalls-by-pid-report b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-report index 1e0c0a860c87..30293545fcc2 100644 --- a/tools/perf/scripts/python/bin/failed-syscalls-by-pid-report +++ b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-report | |||
@@ -1,4 +1,10 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide failed syscalls, by pid | 2 | # description: system-wide failed syscalls, by pid |
3 | # args: [comm] | 3 | # args: [comm] |
4 | perf trace -s ~/libexec/perf-core/scripts/python/failed-syscalls-by-pid.py $1 | 4 | if [ $# -gt 0 ] ; then |
5 | if ! expr match "$1" "-" > /dev/null ; then | ||
6 | comm=$1 | ||
7 | shift | ||
8 | fi | ||
9 | fi | ||
10 | perf trace $@ -s ~/libexec/perf-core/scripts/python/failed-syscalls-by-pid.py $comm | ||
diff --git a/tools/perf/scripts/python/bin/sctop-record b/tools/perf/scripts/python/bin/sctop-record new file mode 100644 index 000000000000..1fc5998b721d --- /dev/null +++ b/tools/perf/scripts/python/bin/sctop-record | |||
@@ -0,0 +1,2 @@ | |||
1 | #!/bin/bash | ||
2 | perf record -a -e raw_syscalls:sys_enter $@ | ||
diff --git a/tools/perf/scripts/python/bin/sctop-report b/tools/perf/scripts/python/bin/sctop-report new file mode 100644 index 000000000000..b01c842ae7b4 --- /dev/null +++ b/tools/perf/scripts/python/bin/sctop-report | |||
@@ -0,0 +1,24 @@ | |||
1 | #!/bin/bash | ||
2 | # description: syscall top | ||
3 | # args: [comm] [interval] | ||
4 | n_args=0 | ||
5 | for i in "$@" | ||
6 | do | ||
7 | if expr match "$i" "-" > /dev/null ; then | ||
8 | break | ||
9 | fi | ||
10 | n_args=$(( $n_args + 1 )) | ||
11 | done | ||
12 | if [ "$n_args" -gt 2 ] ; then | ||
13 | echo "usage: sctop-report [comm] [interval]" | ||
14 | exit | ||
15 | fi | ||
16 | if [ "$n_args" -gt 1 ] ; then | ||
17 | comm=$1 | ||
18 | interval=$2 | ||
19 | shift 2 | ||
20 | elif [ "$n_args" -gt 0 ] ; then | ||
21 | interval=$1 | ||
22 | shift | ||
23 | fi | ||
24 | perf trace $@ -s ~/libexec/perf-core/scripts/python/sctop.py $comm $interval | ||
diff --git a/tools/perf/scripts/python/bin/syscall-counts-by-pid-record b/tools/perf/scripts/python/bin/syscall-counts-by-pid-record index 45a8c50359da..1fc5998b721d 100644 --- a/tools/perf/scripts/python/bin/syscall-counts-by-pid-record +++ b/tools/perf/scripts/python/bin/syscall-counts-by-pid-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e raw_syscalls:sys_enter | 2 | perf record -a -e raw_syscalls:sys_enter $@ |
diff --git a/tools/perf/scripts/python/bin/syscall-counts-by-pid-report b/tools/perf/scripts/python/bin/syscall-counts-by-pid-report index f8044d192271..9e9d8ddd72ce 100644 --- a/tools/perf/scripts/python/bin/syscall-counts-by-pid-report +++ b/tools/perf/scripts/python/bin/syscall-counts-by-pid-report | |||
@@ -1,4 +1,10 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide syscall counts, by pid | 2 | # description: system-wide syscall counts, by pid |
3 | # args: [comm] | 3 | # args: [comm] |
4 | perf trace -s ~/libexec/perf-core/scripts/python/syscall-counts-by-pid.py $1 | 4 | if [ $# -gt 0 ] ; then |
5 | if ! expr match "$1" "-" > /dev/null ; then | ||
6 | comm=$1 | ||
7 | shift | ||
8 | fi | ||
9 | fi | ||
10 | perf trace $@ -s ~/libexec/perf-core/scripts/python/syscall-counts-by-pid.py $comm | ||
diff --git a/tools/perf/scripts/python/bin/syscall-counts-record b/tools/perf/scripts/python/bin/syscall-counts-record index 45a8c50359da..1fc5998b721d 100644 --- a/tools/perf/scripts/python/bin/syscall-counts-record +++ b/tools/perf/scripts/python/bin/syscall-counts-record | |||
@@ -1,2 +1,2 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | perf record -c 1 -f -a -M -R -e raw_syscalls:sys_enter | 2 | perf record -a -e raw_syscalls:sys_enter $@ |
diff --git a/tools/perf/scripts/python/bin/syscall-counts-report b/tools/perf/scripts/python/bin/syscall-counts-report index a366aa61612f..dc076b618796 100644 --- a/tools/perf/scripts/python/bin/syscall-counts-report +++ b/tools/perf/scripts/python/bin/syscall-counts-report | |||
@@ -1,4 +1,10 @@ | |||
1 | #!/bin/bash | 1 | #!/bin/bash |
2 | # description: system-wide syscall counts | 2 | # description: system-wide syscall counts |
3 | # args: [comm] | 3 | # args: [comm] |
4 | perf trace -s ~/libexec/perf-core/scripts/python/syscall-counts.py $1 | 4 | if [ $# -gt 0 ] ; then |
5 | if ! expr match "$1" "-" > /dev/null ; then | ||
6 | comm=$1 | ||
7 | shift | ||
8 | fi | ||
9 | fi | ||
10 | perf trace $@ -s ~/libexec/perf-core/scripts/python/syscall-counts.py $comm | ||
diff --git a/tools/perf/scripts/python/sctop.py b/tools/perf/scripts/python/sctop.py new file mode 100644 index 000000000000..6cafad40c296 --- /dev/null +++ b/tools/perf/scripts/python/sctop.py | |||
@@ -0,0 +1,78 @@ | |||
1 | # system call top | ||
2 | # (c) 2010, Tom Zanussi <tzanussi@gmail.com> | ||
3 | # Licensed under the terms of the GNU GPL License version 2 | ||
4 | # | ||
5 | # Periodically displays system-wide system call totals, broken down by | ||
6 | # syscall. If a [comm] arg is specified, only syscalls called by | ||
7 | # [comm] are displayed. If an [interval] arg is specified, the display | ||
8 | # will be refreshed every [interval] seconds. The default interval is | ||
9 | # 3 seconds. | ||
10 | |||
11 | import thread | ||
12 | import time | ||
13 | import os | ||
14 | import sys | ||
15 | |||
16 | sys.path.append(os.environ['PERF_EXEC_PATH'] + \ | ||
17 | '/scripts/python/Perf-Trace-Util/lib/Perf/Trace') | ||
18 | |||
19 | from perf_trace_context import * | ||
20 | from Core import * | ||
21 | from Util import * | ||
22 | |||
23 | usage = "perf trace -s syscall-counts.py [comm] [interval]\n"; | ||
24 | |||
25 | for_comm = None | ||
26 | default_interval = 3 | ||
27 | interval = default_interval | ||
28 | |||
29 | if len(sys.argv) > 3: | ||
30 | sys.exit(usage) | ||
31 | |||
32 | if len(sys.argv) > 2: | ||
33 | for_comm = sys.argv[1] | ||
34 | interval = int(sys.argv[2]) | ||
35 | elif len(sys.argv) > 1: | ||
36 | try: | ||
37 | interval = int(sys.argv[1]) | ||
38 | except ValueError: | ||
39 | for_comm = sys.argv[1] | ||
40 | interval = default_interval | ||
41 | |||
42 | syscalls = autodict() | ||
43 | |||
44 | def trace_begin(): | ||
45 | thread.start_new_thread(print_syscall_totals, (interval,)) | ||
46 | pass | ||
47 | |||
48 | def raw_syscalls__sys_enter(event_name, context, common_cpu, | ||
49 | common_secs, common_nsecs, common_pid, common_comm, | ||
50 | id, args): | ||
51 | if for_comm is not None: | ||
52 | if common_comm != for_comm: | ||
53 | return | ||
54 | try: | ||
55 | syscalls[id] += 1 | ||
56 | except TypeError: | ||
57 | syscalls[id] = 1 | ||
58 | |||
59 | def print_syscall_totals(interval): | ||
60 | while 1: | ||
61 | clear_term() | ||
62 | if for_comm is not None: | ||
63 | print "\nsyscall events for %s:\n\n" % (for_comm), | ||
64 | else: | ||
65 | print "\nsyscall events:\n\n", | ||
66 | |||
67 | print "%-40s %10s\n" % ("event", "count"), | ||
68 | print "%-40s %10s\n" % ("----------------------------------------", \ | ||
69 | "----------"), | ||
70 | |||
71 | for id, val in sorted(syscalls.iteritems(), key = lambda(k, v): (v, k), \ | ||
72 | reverse = True): | ||
73 | try: | ||
74 | print "%-40d %10d\n" % (id, val), | ||
75 | except TypeError: | ||
76 | pass | ||
77 | syscalls.clear() | ||
78 | time.sleep(interval) | ||
diff --git a/tools/perf/util/PERF-VERSION-GEN b/tools/perf/util/PERF-VERSION-GEN index 54552a00a117..49ece7921914 100755 --- a/tools/perf/util/PERF-VERSION-GEN +++ b/tools/perf/util/PERF-VERSION-GEN | |||
@@ -1,6 +1,10 @@ | |||
1 | #!/bin/sh | 1 | #!/bin/sh |
2 | 2 | ||
3 | GVF=PERF-VERSION-FILE | 3 | if [ $# -eq 1 ] ; then |
4 | OUTPUT=$1 | ||
5 | fi | ||
6 | |||
7 | GVF=${OUTPUT}PERF-VERSION-FILE | ||
4 | DEF_VER=v0.0.2.PERF | 8 | DEF_VER=v0.0.2.PERF |
5 | 9 | ||
6 | LF=' | 10 | LF=' |
diff --git a/tools/perf/util/bitmap.c b/tools/perf/util/bitmap.c new file mode 100644 index 000000000000..5e230acae1e9 --- /dev/null +++ b/tools/perf/util/bitmap.c | |||
@@ -0,0 +1,21 @@ | |||
1 | /* | ||
2 | * From lib/bitmap.c | ||
3 | * Helper functions for bitmap.h. | ||
4 | * | ||
5 | * This source code is licensed under the GNU General Public License, | ||
6 | * Version 2. See the file COPYING for more details. | ||
7 | */ | ||
8 | #include <linux/bitmap.h> | ||
9 | |||
10 | int __bitmap_weight(const unsigned long *bitmap, int bits) | ||
11 | { | ||
12 | int k, w = 0, lim = bits/BITS_PER_LONG; | ||
13 | |||
14 | for (k = 0; k < lim; k++) | ||
15 | w += hweight_long(bitmap[k]); | ||
16 | |||
17 | if (bits % BITS_PER_LONG) | ||
18 | w += hweight_long(bitmap[k] & BITMAP_LAST_WORD_MASK(bits)); | ||
19 | |||
20 | return w; | ||
21 | } | ||
diff --git a/tools/perf/util/build-id.c b/tools/perf/util/build-id.c index 04904b35ba81..0f60a3906808 100644 --- a/tools/perf/util/build-id.c +++ b/tools/perf/util/build-id.c | |||
@@ -24,7 +24,7 @@ static int build_id__mark_dso_hit(event_t *event, struct perf_session *session) | |||
24 | } | 24 | } |
25 | 25 | ||
26 | thread__find_addr_map(thread, session, cpumode, MAP__FUNCTION, | 26 | thread__find_addr_map(thread, session, cpumode, MAP__FUNCTION, |
27 | event->ip.ip, &al); | 27 | event->ip.pid, event->ip.ip, &al); |
28 | 28 | ||
29 | if (al.map != NULL) | 29 | if (al.map != NULL) |
30 | al.map->dso->hit = 1; | 30 | al.map->dso->hit = 1; |
diff --git a/tools/perf/util/cache.h b/tools/perf/util/cache.h index 918eb376abe3..4b9aab7f0405 100644 --- a/tools/perf/util/cache.h +++ b/tools/perf/util/cache.h | |||
@@ -1,6 +1,7 @@ | |||
1 | #ifndef __PERF_CACHE_H | 1 | #ifndef __PERF_CACHE_H |
2 | #define __PERF_CACHE_H | 2 | #define __PERF_CACHE_H |
3 | 3 | ||
4 | #include <stdbool.h> | ||
4 | #include "util.h" | 5 | #include "util.h" |
5 | #include "strbuf.h" | 6 | #include "strbuf.h" |
6 | #include "../perf.h" | 7 | #include "../perf.h" |
@@ -69,6 +70,19 @@ extern const char *pager_program; | |||
69 | extern int pager_in_use(void); | 70 | extern int pager_in_use(void); |
70 | extern int pager_use_color; | 71 | extern int pager_use_color; |
71 | 72 | ||
73 | extern bool use_browser; | ||
74 | |||
75 | #ifdef NO_NEWT_SUPPORT | ||
76 | static inline void setup_browser(void) | ||
77 | { | ||
78 | setup_pager(); | ||
79 | } | ||
80 | static inline void exit_browser(bool wait_for_ok __used) {} | ||
81 | #else | ||
82 | void setup_browser(void); | ||
83 | void exit_browser(bool wait_for_ok); | ||
84 | #endif | ||
85 | |||
72 | extern const char *editor_program; | 86 | extern const char *editor_program; |
73 | extern const char *excludes_file; | 87 | extern const char *excludes_file; |
74 | 88 | ||
diff --git a/tools/perf/util/callchain.c b/tools/perf/util/callchain.c index b3b71258272a..21a52e0a4435 100644 --- a/tools/perf/util/callchain.c +++ b/tools/perf/util/callchain.c | |||
@@ -1,5 +1,5 @@ | |||
1 | /* | 1 | /* |
2 | * Copyright (C) 2009, Frederic Weisbecker <fweisbec@gmail.com> | 2 | * Copyright (C) 2009-2010, Frederic Weisbecker <fweisbec@gmail.com> |
3 | * | 3 | * |
4 | * Handle the callchains from the stream in an ad-hoc radix tree and then | 4 | * Handle the callchains from the stream in an ad-hoc radix tree and then |
5 | * sort them in an rbtree. | 5 | * sort them in an rbtree. |
@@ -17,6 +17,13 @@ | |||
17 | 17 | ||
18 | #include "callchain.h" | 18 | #include "callchain.h" |
19 | 19 | ||
20 | bool ip_callchain__valid(struct ip_callchain *chain, event_t *event) | ||
21 | { | ||
22 | unsigned int chain_size = event->header.size; | ||
23 | chain_size -= (unsigned long)&event->ip.__more_data - (unsigned long)event; | ||
24 | return chain->nr * sizeof(u64) <= chain_size; | ||
25 | } | ||
26 | |||
20 | #define chain_for_each_child(child, parent) \ | 27 | #define chain_for_each_child(child, parent) \ |
21 | list_for_each_entry(child, &parent->children, brothers) | 28 | list_for_each_entry(child, &parent->children, brothers) |
22 | 29 | ||
@@ -160,7 +167,7 @@ create_child(struct callchain_node *parent, bool inherit_children) | |||
160 | { | 167 | { |
161 | struct callchain_node *new; | 168 | struct callchain_node *new; |
162 | 169 | ||
163 | new = malloc(sizeof(*new)); | 170 | new = zalloc(sizeof(*new)); |
164 | if (!new) { | 171 | if (!new) { |
165 | perror("not enough memory to create child for code path tree"); | 172 | perror("not enough memory to create child for code path tree"); |
166 | return NULL; | 173 | return NULL; |
@@ -183,25 +190,36 @@ create_child(struct callchain_node *parent, bool inherit_children) | |||
183 | return new; | 190 | return new; |
184 | } | 191 | } |
185 | 192 | ||
193 | |||
194 | struct resolved_ip { | ||
195 | u64 ip; | ||
196 | struct map_symbol ms; | ||
197 | }; | ||
198 | |||
199 | struct resolved_chain { | ||
200 | u64 nr; | ||
201 | struct resolved_ip ips[0]; | ||
202 | }; | ||
203 | |||
204 | |||
186 | /* | 205 | /* |
187 | * Fill the node with callchain values | 206 | * Fill the node with callchain values |
188 | */ | 207 | */ |
189 | static void | 208 | static void |
190 | fill_node(struct callchain_node *node, struct ip_callchain *chain, | 209 | fill_node(struct callchain_node *node, struct resolved_chain *chain, int start) |
191 | int start, struct symbol **syms) | ||
192 | { | 210 | { |
193 | unsigned int i; | 211 | unsigned int i; |
194 | 212 | ||
195 | for (i = start; i < chain->nr; i++) { | 213 | for (i = start; i < chain->nr; i++) { |
196 | struct callchain_list *call; | 214 | struct callchain_list *call; |
197 | 215 | ||
198 | call = malloc(sizeof(*call)); | 216 | call = zalloc(sizeof(*call)); |
199 | if (!call) { | 217 | if (!call) { |
200 | perror("not enough memory for the code path tree"); | 218 | perror("not enough memory for the code path tree"); |
201 | return; | 219 | return; |
202 | } | 220 | } |
203 | call->ip = chain->ips[i]; | 221 | call->ip = chain->ips[i].ip; |
204 | call->sym = syms[i]; | 222 | call->ms = chain->ips[i].ms; |
205 | list_add_tail(&call->list, &node->val); | 223 | list_add_tail(&call->list, &node->val); |
206 | } | 224 | } |
207 | node->val_nr = chain->nr - start; | 225 | node->val_nr = chain->nr - start; |
@@ -210,13 +228,13 @@ fill_node(struct callchain_node *node, struct ip_callchain *chain, | |||
210 | } | 228 | } |
211 | 229 | ||
212 | static void | 230 | static void |
213 | add_child(struct callchain_node *parent, struct ip_callchain *chain, | 231 | add_child(struct callchain_node *parent, struct resolved_chain *chain, |
214 | int start, struct symbol **syms) | 232 | int start) |
215 | { | 233 | { |
216 | struct callchain_node *new; | 234 | struct callchain_node *new; |
217 | 235 | ||
218 | new = create_child(parent, false); | 236 | new = create_child(parent, false); |
219 | fill_node(new, chain, start, syms); | 237 | fill_node(new, chain, start); |
220 | 238 | ||
221 | new->children_hit = 0; | 239 | new->children_hit = 0; |
222 | new->hit = 1; | 240 | new->hit = 1; |
@@ -228,9 +246,8 @@ add_child(struct callchain_node *parent, struct ip_callchain *chain, | |||
228 | * Then create another child to host the given callchain of new branch | 246 | * Then create another child to host the given callchain of new branch |
229 | */ | 247 | */ |
230 | static void | 248 | static void |
231 | split_add_child(struct callchain_node *parent, struct ip_callchain *chain, | 249 | split_add_child(struct callchain_node *parent, struct resolved_chain *chain, |
232 | struct callchain_list *to_split, int idx_parents, int idx_local, | 250 | struct callchain_list *to_split, int idx_parents, int idx_local) |
233 | struct symbol **syms) | ||
234 | { | 251 | { |
235 | struct callchain_node *new; | 252 | struct callchain_node *new; |
236 | struct list_head *old_tail; | 253 | struct list_head *old_tail; |
@@ -257,7 +274,7 @@ split_add_child(struct callchain_node *parent, struct ip_callchain *chain, | |||
257 | /* create a new child for the new branch if any */ | 274 | /* create a new child for the new branch if any */ |
258 | if (idx_total < chain->nr) { | 275 | if (idx_total < chain->nr) { |
259 | parent->hit = 0; | 276 | parent->hit = 0; |
260 | add_child(parent, chain, idx_total, syms); | 277 | add_child(parent, chain, idx_total); |
261 | parent->children_hit++; | 278 | parent->children_hit++; |
262 | } else { | 279 | } else { |
263 | parent->hit = 1; | 280 | parent->hit = 1; |
@@ -265,32 +282,33 @@ split_add_child(struct callchain_node *parent, struct ip_callchain *chain, | |||
265 | } | 282 | } |
266 | 283 | ||
267 | static int | 284 | static int |
268 | __append_chain(struct callchain_node *root, struct ip_callchain *chain, | 285 | __append_chain(struct callchain_node *root, struct resolved_chain *chain, |
269 | unsigned int start, struct symbol **syms); | 286 | unsigned int start); |
270 | 287 | ||
271 | static void | 288 | static void |
272 | __append_chain_children(struct callchain_node *root, struct ip_callchain *chain, | 289 | __append_chain_children(struct callchain_node *root, |
273 | struct symbol **syms, unsigned int start) | 290 | struct resolved_chain *chain, |
291 | unsigned int start) | ||
274 | { | 292 | { |
275 | struct callchain_node *rnode; | 293 | struct callchain_node *rnode; |
276 | 294 | ||
277 | /* lookup in childrens */ | 295 | /* lookup in childrens */ |
278 | chain_for_each_child(rnode, root) { | 296 | chain_for_each_child(rnode, root) { |
279 | unsigned int ret = __append_chain(rnode, chain, start, syms); | 297 | unsigned int ret = __append_chain(rnode, chain, start); |
280 | 298 | ||
281 | if (!ret) | 299 | if (!ret) |
282 | goto inc_children_hit; | 300 | goto inc_children_hit; |
283 | } | 301 | } |
284 | /* nothing in children, add to the current node */ | 302 | /* nothing in children, add to the current node */ |
285 | add_child(root, chain, start, syms); | 303 | add_child(root, chain, start); |
286 | 304 | ||
287 | inc_children_hit: | 305 | inc_children_hit: |
288 | root->children_hit++; | 306 | root->children_hit++; |
289 | } | 307 | } |
290 | 308 | ||
291 | static int | 309 | static int |
292 | __append_chain(struct callchain_node *root, struct ip_callchain *chain, | 310 | __append_chain(struct callchain_node *root, struct resolved_chain *chain, |
293 | unsigned int start, struct symbol **syms) | 311 | unsigned int start) |
294 | { | 312 | { |
295 | struct callchain_list *cnode; | 313 | struct callchain_list *cnode; |
296 | unsigned int i = start; | 314 | unsigned int i = start; |
@@ -302,13 +320,19 @@ __append_chain(struct callchain_node *root, struct ip_callchain *chain, | |||
302 | * anywhere inside a function. | 320 | * anywhere inside a function. |
303 | */ | 321 | */ |
304 | list_for_each_entry(cnode, &root->val, list) { | 322 | list_for_each_entry(cnode, &root->val, list) { |
323 | struct symbol *sym; | ||
324 | |||
305 | if (i == chain->nr) | 325 | if (i == chain->nr) |
306 | break; | 326 | break; |
307 | if (cnode->sym && syms[i]) { | 327 | |
308 | if (cnode->sym->start != syms[i]->start) | 328 | sym = chain->ips[i].ms.sym; |
329 | |||
330 | if (cnode->ms.sym && sym) { | ||
331 | if (cnode->ms.sym->start != sym->start) | ||
309 | break; | 332 | break; |
310 | } else if (cnode->ip != chain->ips[i]) | 333 | } else if (cnode->ip != chain->ips[i].ip) |
311 | break; | 334 | break; |
335 | |||
312 | if (!found) | 336 | if (!found) |
313 | found = true; | 337 | found = true; |
314 | i++; | 338 | i++; |
@@ -320,7 +344,7 @@ __append_chain(struct callchain_node *root, struct ip_callchain *chain, | |||
320 | 344 | ||
321 | /* we match only a part of the node. Split it and add the new chain */ | 345 | /* we match only a part of the node. Split it and add the new chain */ |
322 | if (i - start < root->val_nr) { | 346 | if (i - start < root->val_nr) { |
323 | split_add_child(root, chain, cnode, start, i - start, syms); | 347 | split_add_child(root, chain, cnode, start, i - start); |
324 | return 0; | 348 | return 0; |
325 | } | 349 | } |
326 | 350 | ||
@@ -331,15 +355,50 @@ __append_chain(struct callchain_node *root, struct ip_callchain *chain, | |||
331 | } | 355 | } |
332 | 356 | ||
333 | /* We match the node and still have a part remaining */ | 357 | /* We match the node and still have a part remaining */ |
334 | __append_chain_children(root, chain, syms, i); | 358 | __append_chain_children(root, chain, i); |
335 | 359 | ||
336 | return 0; | 360 | return 0; |
337 | } | 361 | } |
338 | 362 | ||
339 | void append_chain(struct callchain_node *root, struct ip_callchain *chain, | 363 | static void filter_context(struct ip_callchain *old, struct resolved_chain *new, |
340 | struct symbol **syms) | 364 | struct map_symbol *syms) |
341 | { | 365 | { |
366 | int i, j = 0; | ||
367 | |||
368 | for (i = 0; i < (int)old->nr; i++) { | ||
369 | if (old->ips[i] >= PERF_CONTEXT_MAX) | ||
370 | continue; | ||
371 | |||
372 | new->ips[j].ip = old->ips[i]; | ||
373 | new->ips[j].ms = syms[i]; | ||
374 | j++; | ||
375 | } | ||
376 | |||
377 | new->nr = j; | ||
378 | } | ||
379 | |||
380 | |||
381 | int append_chain(struct callchain_node *root, struct ip_callchain *chain, | ||
382 | struct map_symbol *syms) | ||
383 | { | ||
384 | struct resolved_chain *filtered; | ||
385 | |||
342 | if (!chain->nr) | 386 | if (!chain->nr) |
343 | return; | 387 | return 0; |
344 | __append_chain_children(root, chain, syms, 0); | 388 | |
389 | filtered = zalloc(sizeof(*filtered) + | ||
390 | chain->nr * sizeof(struct resolved_ip)); | ||
391 | if (!filtered) | ||
392 | return -ENOMEM; | ||
393 | |||
394 | filter_context(chain, filtered, syms); | ||
395 | |||
396 | if (!filtered->nr) | ||
397 | goto end; | ||
398 | |||
399 | __append_chain_children(root, filtered, 0); | ||
400 | end: | ||
401 | free(filtered); | ||
402 | |||
403 | return 0; | ||
345 | } | 404 | } |
diff --git a/tools/perf/util/callchain.h b/tools/perf/util/callchain.h index ad4626de4c2b..1cba1f5504e7 100644 --- a/tools/perf/util/callchain.h +++ b/tools/perf/util/callchain.h | |||
@@ -4,6 +4,7 @@ | |||
4 | #include "../perf.h" | 4 | #include "../perf.h" |
5 | #include <linux/list.h> | 5 | #include <linux/list.h> |
6 | #include <linux/rbtree.h> | 6 | #include <linux/rbtree.h> |
7 | #include "event.h" | ||
7 | #include "util.h" | 8 | #include "util.h" |
8 | #include "symbol.h" | 9 | #include "symbol.h" |
9 | 10 | ||
@@ -33,13 +34,14 @@ typedef void (*sort_chain_func_t)(struct rb_root *, struct callchain_node *, | |||
33 | 34 | ||
34 | struct callchain_param { | 35 | struct callchain_param { |
35 | enum chain_mode mode; | 36 | enum chain_mode mode; |
37 | u32 print_limit; | ||
36 | double min_percent; | 38 | double min_percent; |
37 | sort_chain_func_t sort; | 39 | sort_chain_func_t sort; |
38 | }; | 40 | }; |
39 | 41 | ||
40 | struct callchain_list { | 42 | struct callchain_list { |
41 | u64 ip; | 43 | u64 ip; |
42 | struct symbol *sym; | 44 | struct map_symbol ms; |
43 | struct list_head list; | 45 | struct list_head list; |
44 | }; | 46 | }; |
45 | 47 | ||
@@ -56,6 +58,8 @@ static inline u64 cumul_hits(struct callchain_node *node) | |||
56 | } | 58 | } |
57 | 59 | ||
58 | int register_callchain_param(struct callchain_param *param); | 60 | int register_callchain_param(struct callchain_param *param); |
59 | void append_chain(struct callchain_node *root, struct ip_callchain *chain, | 61 | int append_chain(struct callchain_node *root, struct ip_callchain *chain, |
60 | struct symbol **syms); | 62 | struct map_symbol *syms); |
63 | |||
64 | bool ip_callchain__valid(struct ip_callchain *chain, event_t *event); | ||
61 | #endif /* __PERF_CALLCHAIN_H */ | 65 | #endif /* __PERF_CALLCHAIN_H */ |
diff --git a/tools/perf/util/color.c b/tools/perf/util/color.c index e88bca55a599..e191eb9a667f 100644 --- a/tools/perf/util/color.c +++ b/tools/perf/util/color.c | |||
@@ -166,6 +166,31 @@ int perf_color_default_config(const char *var, const char *value, void *cb) | |||
166 | return perf_default_config(var, value, cb); | 166 | return perf_default_config(var, value, cb); |
167 | } | 167 | } |
168 | 168 | ||
169 | static int __color_vsnprintf(char *bf, size_t size, const char *color, | ||
170 | const char *fmt, va_list args, const char *trail) | ||
171 | { | ||
172 | int r = 0; | ||
173 | |||
174 | /* | ||
175 | * Auto-detect: | ||
176 | */ | ||
177 | if (perf_use_color_default < 0) { | ||
178 | if (isatty(1) || pager_in_use()) | ||
179 | perf_use_color_default = 1; | ||
180 | else | ||
181 | perf_use_color_default = 0; | ||
182 | } | ||
183 | |||
184 | if (perf_use_color_default && *color) | ||
185 | r += snprintf(bf, size, "%s", color); | ||
186 | r += vsnprintf(bf + r, size - r, fmt, args); | ||
187 | if (perf_use_color_default && *color) | ||
188 | r += snprintf(bf + r, size - r, "%s", PERF_COLOR_RESET); | ||
189 | if (trail) | ||
190 | r += snprintf(bf + r, size - r, "%s", trail); | ||
191 | return r; | ||
192 | } | ||
193 | |||
169 | static int __color_vfprintf(FILE *fp, const char *color, const char *fmt, | 194 | static int __color_vfprintf(FILE *fp, const char *color, const char *fmt, |
170 | va_list args, const char *trail) | 195 | va_list args, const char *trail) |
171 | { | 196 | { |
@@ -191,11 +216,28 @@ static int __color_vfprintf(FILE *fp, const char *color, const char *fmt, | |||
191 | return r; | 216 | return r; |
192 | } | 217 | } |
193 | 218 | ||
219 | int color_vsnprintf(char *bf, size_t size, const char *color, | ||
220 | const char *fmt, va_list args) | ||
221 | { | ||
222 | return __color_vsnprintf(bf, size, color, fmt, args, NULL); | ||
223 | } | ||
224 | |||
194 | int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args) | 225 | int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args) |
195 | { | 226 | { |
196 | return __color_vfprintf(fp, color, fmt, args, NULL); | 227 | return __color_vfprintf(fp, color, fmt, args, NULL); |
197 | } | 228 | } |
198 | 229 | ||
230 | int color_snprintf(char *bf, size_t size, const char *color, | ||
231 | const char *fmt, ...) | ||
232 | { | ||
233 | va_list args; | ||
234 | int r; | ||
235 | |||
236 | va_start(args, fmt); | ||
237 | r = color_vsnprintf(bf, size, color, fmt, args); | ||
238 | va_end(args); | ||
239 | return r; | ||
240 | } | ||
199 | 241 | ||
200 | int color_fprintf(FILE *fp, const char *color, const char *fmt, ...) | 242 | int color_fprintf(FILE *fp, const char *color, const char *fmt, ...) |
201 | { | 243 | { |
@@ -274,3 +316,9 @@ int percent_color_fprintf(FILE *fp, const char *fmt, double percent) | |||
274 | 316 | ||
275 | return r; | 317 | return r; |
276 | } | 318 | } |
319 | |||
320 | int percent_color_snprintf(char *bf, size_t size, const char *fmt, double percent) | ||
321 | { | ||
322 | const char *color = get_percent_color(percent); | ||
323 | return color_snprintf(bf, size, color, fmt, percent); | ||
324 | } | ||
diff --git a/tools/perf/util/color.h b/tools/perf/util/color.h index 24e8809210bb..dea082b79602 100644 --- a/tools/perf/util/color.h +++ b/tools/perf/util/color.h | |||
@@ -32,10 +32,14 @@ int perf_color_default_config(const char *var, const char *value, void *cb); | |||
32 | int perf_config_colorbool(const char *var, const char *value, int stdout_is_tty); | 32 | int perf_config_colorbool(const char *var, const char *value, int stdout_is_tty); |
33 | void color_parse(const char *value, const char *var, char *dst); | 33 | void color_parse(const char *value, const char *var, char *dst); |
34 | void color_parse_mem(const char *value, int len, const char *var, char *dst); | 34 | void color_parse_mem(const char *value, int len, const char *var, char *dst); |
35 | int color_vsnprintf(char *bf, size_t size, const char *color, | ||
36 | const char *fmt, va_list args); | ||
35 | int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args); | 37 | int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args); |
36 | int color_fprintf(FILE *fp, const char *color, const char *fmt, ...); | 38 | int color_fprintf(FILE *fp, const char *color, const char *fmt, ...); |
39 | int color_snprintf(char *bf, size_t size, const char *color, const char *fmt, ...); | ||
37 | int color_fprintf_ln(FILE *fp, const char *color, const char *fmt, ...); | 40 | int color_fprintf_ln(FILE *fp, const char *color, const char *fmt, ...); |
38 | int color_fwrite_lines(FILE *fp, const char *color, size_t count, const char *buf); | 41 | int color_fwrite_lines(FILE *fp, const char *color, size_t count, const char *buf); |
42 | int percent_color_snprintf(char *bf, size_t size, const char *fmt, double percent); | ||
39 | int percent_color_fprintf(FILE *fp, const char *fmt, double percent); | 43 | int percent_color_fprintf(FILE *fp, const char *fmt, double percent); |
40 | const char *get_percent_color(double percent); | 44 | const char *get_percent_color(double percent); |
41 | 45 | ||
diff --git a/tools/perf/util/debug.c b/tools/perf/util/debug.c index 0905600c3851..dd824cf3b628 100644 --- a/tools/perf/util/debug.c +++ b/tools/perf/util/debug.c | |||
@@ -6,13 +6,14 @@ | |||
6 | #include <stdarg.h> | 6 | #include <stdarg.h> |
7 | #include <stdio.h> | 7 | #include <stdio.h> |
8 | 8 | ||
9 | #include "cache.h" | ||
9 | #include "color.h" | 10 | #include "color.h" |
10 | #include "event.h" | 11 | #include "event.h" |
11 | #include "debug.h" | 12 | #include "debug.h" |
12 | #include "util.h" | 13 | #include "util.h" |
13 | 14 | ||
14 | int verbose = 0; | 15 | int verbose = 0; |
15 | int dump_trace = 0; | 16 | bool dump_trace = false; |
16 | 17 | ||
17 | int eprintf(int level, const char *fmt, ...) | 18 | int eprintf(int level, const char *fmt, ...) |
18 | { | 19 | { |
@@ -21,7 +22,10 @@ int eprintf(int level, const char *fmt, ...) | |||
21 | 22 | ||
22 | if (verbose >= level) { | 23 | if (verbose >= level) { |
23 | va_start(args, fmt); | 24 | va_start(args, fmt); |
24 | ret = vfprintf(stderr, fmt, args); | 25 | if (use_browser) |
26 | ret = browser__show_help(fmt, args); | ||
27 | else | ||
28 | ret = vfprintf(stderr, fmt, args); | ||
25 | va_end(args); | 29 | va_end(args); |
26 | } | 30 | } |
27 | 31 | ||
diff --git a/tools/perf/util/debug.h b/tools/perf/util/debug.h index c6c24c522dea..047ac3324ebe 100644 --- a/tools/perf/util/debug.h +++ b/tools/perf/util/debug.h | |||
@@ -2,14 +2,38 @@ | |||
2 | #ifndef __PERF_DEBUG_H | 2 | #ifndef __PERF_DEBUG_H |
3 | #define __PERF_DEBUG_H | 3 | #define __PERF_DEBUG_H |
4 | 4 | ||
5 | #include <stdbool.h> | ||
5 | #include "event.h" | 6 | #include "event.h" |
6 | 7 | ||
7 | extern int verbose; | 8 | extern int verbose; |
8 | extern int dump_trace; | 9 | extern bool dump_trace; |
9 | 10 | ||
10 | int eprintf(int level, | ||
11 | const char *fmt, ...) __attribute__((format(printf, 2, 3))); | ||
12 | int dump_printf(const char *fmt, ...) __attribute__((format(printf, 1, 2))); | 11 | int dump_printf(const char *fmt, ...) __attribute__((format(printf, 1, 2))); |
13 | void trace_event(event_t *event); | 12 | void trace_event(event_t *event); |
14 | 13 | ||
14 | struct ui_progress; | ||
15 | |||
16 | #ifdef NO_NEWT_SUPPORT | ||
17 | static inline int browser__show_help(const char *format __used, va_list ap __used) | ||
18 | { | ||
19 | return 0; | ||
20 | } | ||
21 | |||
22 | static inline struct ui_progress *ui_progress__new(const char *title __used, | ||
23 | u64 total __used) | ||
24 | { | ||
25 | return (struct ui_progress *)1; | ||
26 | } | ||
27 | |||
28 | static inline void ui_progress__update(struct ui_progress *self __used, | ||
29 | u64 curr __used) {} | ||
30 | |||
31 | static inline void ui_progress__delete(struct ui_progress *self __used) {} | ||
32 | #else | ||
33 | int browser__show_help(const char *format, va_list ap); | ||
34 | struct ui_progress *ui_progress__new(const char *title, u64 total); | ||
35 | void ui_progress__update(struct ui_progress *self, u64 curr); | ||
36 | void ui_progress__delete(struct ui_progress *self); | ||
37 | #endif | ||
38 | |||
15 | #endif /* __PERF_DEBUG_H */ | 39 | #endif /* __PERF_DEBUG_H */ |
diff --git a/tools/perf/util/event.c b/tools/perf/util/event.c index 705ec63548b4..50771b5813ee 100644 --- a/tools/perf/util/event.c +++ b/tools/perf/util/event.c | |||
@@ -7,6 +7,23 @@ | |||
7 | #include "strlist.h" | 7 | #include "strlist.h" |
8 | #include "thread.h" | 8 | #include "thread.h" |
9 | 9 | ||
10 | const char *event__name[] = { | ||
11 | [0] = "TOTAL", | ||
12 | [PERF_RECORD_MMAP] = "MMAP", | ||
13 | [PERF_RECORD_LOST] = "LOST", | ||
14 | [PERF_RECORD_COMM] = "COMM", | ||
15 | [PERF_RECORD_EXIT] = "EXIT", | ||
16 | [PERF_RECORD_THROTTLE] = "THROTTLE", | ||
17 | [PERF_RECORD_UNTHROTTLE] = "UNTHROTTLE", | ||
18 | [PERF_RECORD_FORK] = "FORK", | ||
19 | [PERF_RECORD_READ] = "READ", | ||
20 | [PERF_RECORD_SAMPLE] = "SAMPLE", | ||
21 | [PERF_RECORD_HEADER_ATTR] = "ATTR", | ||
22 | [PERF_RECORD_HEADER_EVENT_TYPE] = "EVENT_TYPE", | ||
23 | [PERF_RECORD_HEADER_TRACING_DATA] = "TRACING_DATA", | ||
24 | [PERF_RECORD_HEADER_BUILD_ID] = "BUILD_ID", | ||
25 | }; | ||
26 | |||
10 | static pid_t event__synthesize_comm(pid_t pid, int full, | 27 | static pid_t event__synthesize_comm(pid_t pid, int full, |
11 | event__handler_t process, | 28 | event__handler_t process, |
12 | struct perf_session *session) | 29 | struct perf_session *session) |
@@ -112,7 +129,11 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid, | |||
112 | event_t ev = { | 129 | event_t ev = { |
113 | .header = { | 130 | .header = { |
114 | .type = PERF_RECORD_MMAP, | 131 | .type = PERF_RECORD_MMAP, |
115 | .misc = 0, /* Just like the kernel, see kernel/perf_event.c __perf_event_mmap */ | 132 | /* |
133 | * Just like the kernel, see __perf_event_mmap | ||
134 | * in kernel/perf_event.c | ||
135 | */ | ||
136 | .misc = PERF_RECORD_MISC_USER, | ||
116 | }, | 137 | }, |
117 | }; | 138 | }; |
118 | int n; | 139 | int n; |
@@ -130,6 +151,7 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid, | |||
130 | continue; | 151 | continue; |
131 | pbf += n + 3; | 152 | pbf += n + 3; |
132 | if (*pbf == 'x') { /* vm_exec */ | 153 | if (*pbf == 'x') { /* vm_exec */ |
154 | u64 vm_pgoff; | ||
133 | char *execname = strchr(bf, '/'); | 155 | char *execname = strchr(bf, '/'); |
134 | 156 | ||
135 | /* Catch VDSO */ | 157 | /* Catch VDSO */ |
@@ -139,6 +161,14 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid, | |||
139 | if (execname == NULL) | 161 | if (execname == NULL) |
140 | continue; | 162 | continue; |
141 | 163 | ||
164 | pbf += 3; | ||
165 | n = hex2u64(pbf, &vm_pgoff); | ||
166 | /* pgoff is in bytes, not pages */ | ||
167 | if (n >= 0) | ||
168 | ev.mmap.pgoff = vm_pgoff << getpagesize(); | ||
169 | else | ||
170 | ev.mmap.pgoff = 0; | ||
171 | |||
142 | size = strlen(execname); | 172 | size = strlen(execname); |
143 | execname[size - 1] = '\0'; /* Remove \n */ | 173 | execname[size - 1] = '\0'; /* Remove \n */ |
144 | memcpy(ev.mmap.filename, execname, size); | 174 | memcpy(ev.mmap.filename, execname, size); |
@@ -158,11 +188,23 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid, | |||
158 | } | 188 | } |
159 | 189 | ||
160 | int event__synthesize_modules(event__handler_t process, | 190 | int event__synthesize_modules(event__handler_t process, |
161 | struct perf_session *session) | 191 | struct perf_session *session, |
192 | struct machine *machine) | ||
162 | { | 193 | { |
163 | struct rb_node *nd; | 194 | struct rb_node *nd; |
195 | struct map_groups *kmaps = &machine->kmaps; | ||
196 | u16 misc; | ||
197 | |||
198 | /* | ||
199 | * kernel uses 0 for user space maps, see kernel/perf_event.c | ||
200 | * __perf_event_mmap | ||
201 | */ | ||
202 | if (machine__is_host(machine)) | ||
203 | misc = PERF_RECORD_MISC_KERNEL; | ||
204 | else | ||
205 | misc = PERF_RECORD_MISC_GUEST_KERNEL; | ||
164 | 206 | ||
165 | for (nd = rb_first(&session->kmaps.maps[MAP__FUNCTION]); | 207 | for (nd = rb_first(&kmaps->maps[MAP__FUNCTION]); |
166 | nd; nd = rb_next(nd)) { | 208 | nd; nd = rb_next(nd)) { |
167 | event_t ev; | 209 | event_t ev; |
168 | size_t size; | 210 | size_t size; |
@@ -173,12 +215,13 @@ int event__synthesize_modules(event__handler_t process, | |||
173 | 215 | ||
174 | size = ALIGN(pos->dso->long_name_len + 1, sizeof(u64)); | 216 | size = ALIGN(pos->dso->long_name_len + 1, sizeof(u64)); |
175 | memset(&ev, 0, sizeof(ev)); | 217 | memset(&ev, 0, sizeof(ev)); |
176 | ev.mmap.header.misc = 1; /* kernel uses 0 for user space maps, see kernel/perf_event.c __perf_event_mmap */ | 218 | ev.mmap.header.misc = misc; |
177 | ev.mmap.header.type = PERF_RECORD_MMAP; | 219 | ev.mmap.header.type = PERF_RECORD_MMAP; |
178 | ev.mmap.header.size = (sizeof(ev.mmap) - | 220 | ev.mmap.header.size = (sizeof(ev.mmap) - |
179 | (sizeof(ev.mmap.filename) - size)); | 221 | (sizeof(ev.mmap.filename) - size)); |
180 | ev.mmap.start = pos->start; | 222 | ev.mmap.start = pos->start; |
181 | ev.mmap.len = pos->end - pos->start; | 223 | ev.mmap.len = pos->end - pos->start; |
224 | ev.mmap.pid = machine->pid; | ||
182 | 225 | ||
183 | memcpy(ev.mmap.filename, pos->dso->long_name, | 226 | memcpy(ev.mmap.filename, pos->dso->long_name, |
184 | pos->dso->long_name_len + 1); | 227 | pos->dso->long_name_len + 1); |
@@ -241,13 +284,18 @@ static int find_symbol_cb(void *arg, const char *name, char type, u64 start) | |||
241 | 284 | ||
242 | int event__synthesize_kernel_mmap(event__handler_t process, | 285 | int event__synthesize_kernel_mmap(event__handler_t process, |
243 | struct perf_session *session, | 286 | struct perf_session *session, |
287 | struct machine *machine, | ||
244 | const char *symbol_name) | 288 | const char *symbol_name) |
245 | { | 289 | { |
246 | size_t size; | 290 | size_t size; |
291 | const char *filename, *mmap_name; | ||
292 | char path[PATH_MAX]; | ||
293 | char name_buff[PATH_MAX]; | ||
294 | struct map *map; | ||
295 | |||
247 | event_t ev = { | 296 | event_t ev = { |
248 | .header = { | 297 | .header = { |
249 | .type = PERF_RECORD_MMAP, | 298 | .type = PERF_RECORD_MMAP, |
250 | .misc = 1, /* kernel uses 0 for user space maps, see kernel/perf_event.c __perf_event_mmap */ | ||
251 | }, | 299 | }, |
252 | }; | 300 | }; |
253 | /* | 301 | /* |
@@ -257,16 +305,37 @@ int event__synthesize_kernel_mmap(event__handler_t process, | |||
257 | */ | 305 | */ |
258 | struct process_symbol_args args = { .name = symbol_name, }; | 306 | struct process_symbol_args args = { .name = symbol_name, }; |
259 | 307 | ||
260 | if (kallsyms__parse("/proc/kallsyms", &args, find_symbol_cb) <= 0) | 308 | mmap_name = machine__mmap_name(machine, name_buff, sizeof(name_buff)); |
309 | if (machine__is_host(machine)) { | ||
310 | /* | ||
311 | * kernel uses PERF_RECORD_MISC_USER for user space maps, | ||
312 | * see kernel/perf_event.c __perf_event_mmap | ||
313 | */ | ||
314 | ev.header.misc = PERF_RECORD_MISC_KERNEL; | ||
315 | filename = "/proc/kallsyms"; | ||
316 | } else { | ||
317 | ev.header.misc = PERF_RECORD_MISC_GUEST_KERNEL; | ||
318 | if (machine__is_default_guest(machine)) | ||
319 | filename = (char *) symbol_conf.default_guest_kallsyms; | ||
320 | else { | ||
321 | sprintf(path, "%s/proc/kallsyms", machine->root_dir); | ||
322 | filename = path; | ||
323 | } | ||
324 | } | ||
325 | |||
326 | if (kallsyms__parse(filename, &args, find_symbol_cb) <= 0) | ||
261 | return -ENOENT; | 327 | return -ENOENT; |
262 | 328 | ||
329 | map = machine->vmlinux_maps[MAP__FUNCTION]; | ||
263 | size = snprintf(ev.mmap.filename, sizeof(ev.mmap.filename), | 330 | size = snprintf(ev.mmap.filename, sizeof(ev.mmap.filename), |
264 | "[kernel.kallsyms.%s]", symbol_name) + 1; | 331 | "%s%s", mmap_name, symbol_name) + 1; |
265 | size = ALIGN(size, sizeof(u64)); | 332 | size = ALIGN(size, sizeof(u64)); |
266 | ev.mmap.header.size = (sizeof(ev.mmap) - (sizeof(ev.mmap.filename) - size)); | 333 | ev.mmap.header.size = (sizeof(ev.mmap) - |
334 | (sizeof(ev.mmap.filename) - size)); | ||
267 | ev.mmap.pgoff = args.start; | 335 | ev.mmap.pgoff = args.start; |
268 | ev.mmap.start = session->vmlinux_maps[MAP__FUNCTION]->start; | 336 | ev.mmap.start = map->start; |
269 | ev.mmap.len = session->vmlinux_maps[MAP__FUNCTION]->end - ev.mmap.start ; | 337 | ev.mmap.len = map->end - ev.mmap.start; |
338 | ev.mmap.pid = machine->pid; | ||
270 | 339 | ||
271 | return process(&ev, session); | 340 | return process(&ev, session); |
272 | } | 341 | } |
@@ -316,26 +385,54 @@ int event__process_comm(event_t *self, struct perf_session *session) | |||
316 | int event__process_lost(event_t *self, struct perf_session *session) | 385 | int event__process_lost(event_t *self, struct perf_session *session) |
317 | { | 386 | { |
318 | dump_printf(": id:%Ld: lost:%Ld\n", self->lost.id, self->lost.lost); | 387 | dump_printf(": id:%Ld: lost:%Ld\n", self->lost.id, self->lost.lost); |
319 | session->events_stats.lost += self->lost.lost; | 388 | session->hists.stats.total_lost += self->lost.lost; |
320 | return 0; | 389 | return 0; |
321 | } | 390 | } |
322 | 391 | ||
323 | int event__process_mmap(event_t *self, struct perf_session *session) | 392 | static void event_set_kernel_mmap_len(struct map **maps, event_t *self) |
393 | { | ||
394 | maps[MAP__FUNCTION]->start = self->mmap.start; | ||
395 | maps[MAP__FUNCTION]->end = self->mmap.start + self->mmap.len; | ||
396 | /* | ||
397 | * Be a bit paranoid here, some perf.data file came with | ||
398 | * a zero sized synthesized MMAP event for the kernel. | ||
399 | */ | ||
400 | if (maps[MAP__FUNCTION]->end == 0) | ||
401 | maps[MAP__FUNCTION]->end = ~0UL; | ||
402 | } | ||
403 | |||
404 | static int event__process_kernel_mmap(event_t *self, | ||
405 | struct perf_session *session) | ||
324 | { | 406 | { |
325 | struct thread *thread; | ||
326 | struct map *map; | 407 | struct map *map; |
408 | char kmmap_prefix[PATH_MAX]; | ||
409 | struct machine *machine; | ||
410 | enum dso_kernel_type kernel_type; | ||
411 | bool is_kernel_mmap; | ||
412 | |||
413 | machine = perf_session__findnew_machine(session, self->mmap.pid); | ||
414 | if (!machine) { | ||
415 | pr_err("Can't find id %d's machine\n", self->mmap.pid); | ||
416 | goto out_problem; | ||
417 | } | ||
327 | 418 | ||
328 | dump_printf(" %d/%d: [%#Lx(%#Lx) @ %#Lx]: %s\n", | 419 | machine__mmap_name(machine, kmmap_prefix, sizeof(kmmap_prefix)); |
329 | self->mmap.pid, self->mmap.tid, self->mmap.start, | 420 | if (machine__is_host(machine)) |
330 | self->mmap.len, self->mmap.pgoff, self->mmap.filename); | 421 | kernel_type = DSO_TYPE_KERNEL; |
422 | else | ||
423 | kernel_type = DSO_TYPE_GUEST_KERNEL; | ||
331 | 424 | ||
332 | if (self->mmap.pid == 0) { | 425 | is_kernel_mmap = memcmp(self->mmap.filename, |
333 | static const char kmmap_prefix[] = "[kernel.kallsyms."; | 426 | kmmap_prefix, |
427 | strlen(kmmap_prefix)) == 0; | ||
428 | if (self->mmap.filename[0] == '/' || | ||
429 | (!is_kernel_mmap && self->mmap.filename[0] == '[')) { | ||
334 | 430 | ||
335 | if (self->mmap.filename[0] == '/') { | 431 | char short_module_name[1024]; |
336 | char short_module_name[1024]; | 432 | char *name, *dot; |
337 | char *name = strrchr(self->mmap.filename, '/'), *dot; | ||
338 | 433 | ||
434 | if (self->mmap.filename[0] == '/') { | ||
435 | name = strrchr(self->mmap.filename, '/'); | ||
339 | if (name == NULL) | 436 | if (name == NULL) |
340 | goto out_problem; | 437 | goto out_problem; |
341 | 438 | ||
@@ -343,58 +440,84 @@ int event__process_mmap(event_t *self, struct perf_session *session) | |||
343 | dot = strrchr(name, '.'); | 440 | dot = strrchr(name, '.'); |
344 | if (dot == NULL) | 441 | if (dot == NULL) |
345 | goto out_problem; | 442 | goto out_problem; |
346 | |||
347 | snprintf(short_module_name, sizeof(short_module_name), | 443 | snprintf(short_module_name, sizeof(short_module_name), |
348 | "[%.*s]", (int)(dot - name), name); | 444 | "[%.*s]", (int)(dot - name), name); |
349 | strxfrchar(short_module_name, '-', '_'); | 445 | strxfrchar(short_module_name, '-', '_'); |
350 | 446 | } else | |
351 | map = perf_session__new_module_map(session, | 447 | strcpy(short_module_name, self->mmap.filename); |
352 | self->mmap.start, | 448 | |
353 | self->mmap.filename); | 449 | map = machine__new_module(machine, self->mmap.start, |
354 | if (map == NULL) | 450 | self->mmap.filename); |
355 | goto out_problem; | 451 | if (map == NULL) |
356 | 452 | goto out_problem; | |
357 | name = strdup(short_module_name); | 453 | |
358 | if (name == NULL) | 454 | name = strdup(short_module_name); |
359 | goto out_problem; | 455 | if (name == NULL) |
360 | 456 | goto out_problem; | |
361 | map->dso->short_name = name; | 457 | |
362 | map->end = map->start + self->mmap.len; | 458 | map->dso->short_name = name; |
363 | } else if (memcmp(self->mmap.filename, kmmap_prefix, | 459 | map->end = map->start + self->mmap.len; |
364 | sizeof(kmmap_prefix) - 1) == 0) { | 460 | } else if (is_kernel_mmap) { |
365 | const char *symbol_name = (self->mmap.filename + | 461 | const char *symbol_name = (self->mmap.filename + |
366 | sizeof(kmmap_prefix) - 1); | 462 | strlen(kmmap_prefix)); |
463 | /* | ||
464 | * Should be there already, from the build-id table in | ||
465 | * the header. | ||
466 | */ | ||
467 | struct dso *kernel = __dsos__findnew(&machine->kernel_dsos, | ||
468 | kmmap_prefix); | ||
469 | if (kernel == NULL) | ||
470 | goto out_problem; | ||
471 | |||
472 | kernel->kernel = kernel_type; | ||
473 | if (__machine__create_kernel_maps(machine, kernel) < 0) | ||
474 | goto out_problem; | ||
475 | |||
476 | event_set_kernel_mmap_len(machine->vmlinux_maps, self); | ||
477 | perf_session__set_kallsyms_ref_reloc_sym(machine->vmlinux_maps, | ||
478 | symbol_name, | ||
479 | self->mmap.pgoff); | ||
480 | if (machine__is_default_guest(machine)) { | ||
367 | /* | 481 | /* |
368 | * Should be there already, from the build-id table in | 482 | * preload dso of guest kernel and modules |
369 | * the header. | ||
370 | */ | 483 | */ |
371 | struct dso *kernel = __dsos__findnew(&dsos__kernel, | 484 | dso__load(kernel, machine->vmlinux_maps[MAP__FUNCTION], |
372 | "[kernel.kallsyms]"); | 485 | NULL); |
373 | if (kernel == NULL) | 486 | } |
374 | goto out_problem; | 487 | } |
375 | 488 | return 0; | |
376 | kernel->kernel = 1; | 489 | out_problem: |
377 | if (__perf_session__create_kernel_maps(session, kernel) < 0) | 490 | return -1; |
378 | goto out_problem; | 491 | } |
379 | 492 | ||
380 | session->vmlinux_maps[MAP__FUNCTION]->start = self->mmap.start; | 493 | int event__process_mmap(event_t *self, struct perf_session *session) |
381 | session->vmlinux_maps[MAP__FUNCTION]->end = self->mmap.start + self->mmap.len; | 494 | { |
382 | /* | 495 | struct machine *machine; |
383 | * Be a bit paranoid here, some perf.data file came with | 496 | struct thread *thread; |
384 | * a zero sized synthesized MMAP event for the kernel. | 497 | struct map *map; |
385 | */ | 498 | u8 cpumode = self->header.misc & PERF_RECORD_MISC_CPUMODE_MASK; |
386 | if (session->vmlinux_maps[MAP__FUNCTION]->end == 0) | 499 | int ret = 0; |
387 | session->vmlinux_maps[MAP__FUNCTION]->end = ~0UL; | ||
388 | 500 | ||
389 | perf_session__set_kallsyms_ref_reloc_sym(session, symbol_name, | 501 | dump_printf(" %d/%d: [%#Lx(%#Lx) @ %#Lx]: %s\n", |
390 | self->mmap.pgoff); | 502 | self->mmap.pid, self->mmap.tid, self->mmap.start, |
391 | } | 503 | self->mmap.len, self->mmap.pgoff, self->mmap.filename); |
504 | |||
505 | if (cpumode == PERF_RECORD_MISC_GUEST_KERNEL || | ||
506 | cpumode == PERF_RECORD_MISC_KERNEL) { | ||
507 | ret = event__process_kernel_mmap(self, session); | ||
508 | if (ret < 0) | ||
509 | goto out_problem; | ||
392 | return 0; | 510 | return 0; |
393 | } | 511 | } |
394 | 512 | ||
513 | machine = perf_session__find_host_machine(session); | ||
514 | if (machine == NULL) | ||
515 | goto out_problem; | ||
395 | thread = perf_session__findnew(session, self->mmap.pid); | 516 | thread = perf_session__findnew(session, self->mmap.pid); |
396 | map = map__new(&self->mmap, MAP__FUNCTION, | 517 | map = map__new(&machine->user_dsos, self->mmap.start, |
397 | session->cwd, session->cwdlen); | 518 | self->mmap.len, self->mmap.pgoff, |
519 | self->mmap.pid, self->mmap.filename, | ||
520 | MAP__FUNCTION, session->cwd, session->cwdlen); | ||
398 | 521 | ||
399 | if (thread == NULL || map == NULL) | 522 | if (thread == NULL || map == NULL) |
400 | goto out_problem; | 523 | goto out_problem; |
@@ -434,22 +557,56 @@ int event__process_task(event_t *self, struct perf_session *session) | |||
434 | 557 | ||
435 | void thread__find_addr_map(struct thread *self, | 558 | void thread__find_addr_map(struct thread *self, |
436 | struct perf_session *session, u8 cpumode, | 559 | struct perf_session *session, u8 cpumode, |
437 | enum map_type type, u64 addr, | 560 | enum map_type type, pid_t pid, u64 addr, |
438 | struct addr_location *al) | 561 | struct addr_location *al) |
439 | { | 562 | { |
440 | struct map_groups *mg = &self->mg; | 563 | struct map_groups *mg = &self->mg; |
564 | struct machine *machine = NULL; | ||
441 | 565 | ||
442 | al->thread = self; | 566 | al->thread = self; |
443 | al->addr = addr; | 567 | al->addr = addr; |
568 | al->cpumode = cpumode; | ||
569 | al->filtered = false; | ||
444 | 570 | ||
445 | if (cpumode == PERF_RECORD_MISC_KERNEL) { | 571 | if (cpumode == PERF_RECORD_MISC_KERNEL && perf_host) { |
446 | al->level = 'k'; | 572 | al->level = 'k'; |
447 | mg = &session->kmaps; | 573 | machine = perf_session__find_host_machine(session); |
448 | } else if (cpumode == PERF_RECORD_MISC_USER) | 574 | if (machine == NULL) { |
575 | al->map = NULL; | ||
576 | return; | ||
577 | } | ||
578 | mg = &machine->kmaps; | ||
579 | } else if (cpumode == PERF_RECORD_MISC_USER && perf_host) { | ||
449 | al->level = '.'; | 580 | al->level = '.'; |
450 | else { | 581 | machine = perf_session__find_host_machine(session); |
451 | al->level = 'H'; | 582 | } else if (cpumode == PERF_RECORD_MISC_GUEST_KERNEL && perf_guest) { |
583 | al->level = 'g'; | ||
584 | machine = perf_session__find_machine(session, pid); | ||
585 | if (machine == NULL) { | ||
586 | al->map = NULL; | ||
587 | return; | ||
588 | } | ||
589 | mg = &machine->kmaps; | ||
590 | } else { | ||
591 | /* | ||
592 | * 'u' means guest os user space. | ||
593 | * TODO: We don't support guest user space. Might support late. | ||
594 | */ | ||
595 | if (cpumode == PERF_RECORD_MISC_GUEST_USER && perf_guest) | ||
596 | al->level = 'u'; | ||
597 | else | ||
598 | al->level = 'H'; | ||
452 | al->map = NULL; | 599 | al->map = NULL; |
600 | |||
601 | if ((cpumode == PERF_RECORD_MISC_GUEST_USER || | ||
602 | cpumode == PERF_RECORD_MISC_GUEST_KERNEL) && | ||
603 | !perf_guest) | ||
604 | al->filtered = true; | ||
605 | if ((cpumode == PERF_RECORD_MISC_USER || | ||
606 | cpumode == PERF_RECORD_MISC_KERNEL) && | ||
607 | !perf_host) | ||
608 | al->filtered = true; | ||
609 | |||
453 | return; | 610 | return; |
454 | } | 611 | } |
455 | try_again: | 612 | try_again: |
@@ -464,8 +621,10 @@ try_again: | |||
464 | * "[vdso]" dso, but for now lets use the old trick of looking | 621 | * "[vdso]" dso, but for now lets use the old trick of looking |
465 | * in the whole kernel symbol list. | 622 | * in the whole kernel symbol list. |
466 | */ | 623 | */ |
467 | if ((long long)al->addr < 0 && mg != &session->kmaps) { | 624 | if ((long long)al->addr < 0 && |
468 | mg = &session->kmaps; | 625 | cpumode == PERF_RECORD_MISC_KERNEL && |
626 | machine && mg != &machine->kmaps) { | ||
627 | mg = &machine->kmaps; | ||
469 | goto try_again; | 628 | goto try_again; |
470 | } | 629 | } |
471 | } else | 630 | } else |
@@ -474,11 +633,11 @@ try_again: | |||
474 | 633 | ||
475 | void thread__find_addr_location(struct thread *self, | 634 | void thread__find_addr_location(struct thread *self, |
476 | struct perf_session *session, u8 cpumode, | 635 | struct perf_session *session, u8 cpumode, |
477 | enum map_type type, u64 addr, | 636 | enum map_type type, pid_t pid, u64 addr, |
478 | struct addr_location *al, | 637 | struct addr_location *al, |
479 | symbol_filter_t filter) | 638 | symbol_filter_t filter) |
480 | { | 639 | { |
481 | thread__find_addr_map(self, session, cpumode, type, addr, al); | 640 | thread__find_addr_map(self, session, cpumode, type, pid, addr, al); |
482 | if (al->map != NULL) | 641 | if (al->map != NULL) |
483 | al->sym = map__find_symbol(al->map, al->addr, filter); | 642 | al->sym = map__find_symbol(al->map, al->addr, filter); |
484 | else | 643 | else |
@@ -490,8 +649,10 @@ static void dso__calc_col_width(struct dso *self) | |||
490 | if (!symbol_conf.col_width_list_str && !symbol_conf.field_sep && | 649 | if (!symbol_conf.col_width_list_str && !symbol_conf.field_sep && |
491 | (!symbol_conf.dso_list || | 650 | (!symbol_conf.dso_list || |
492 | strlist__has_entry(symbol_conf.dso_list, self->name))) { | 651 | strlist__has_entry(symbol_conf.dso_list, self->name))) { |
493 | unsigned int slen = strlen(self->name); | 652 | u16 slen = self->short_name_len; |
494 | if (slen > dsos__col_width) | 653 | if (verbose) |
654 | slen = self->long_name_len; | ||
655 | if (dsos__col_width < slen) | ||
495 | dsos__col_width = slen; | 656 | dsos__col_width = slen; |
496 | } | 657 | } |
497 | 658 | ||
@@ -512,31 +673,55 @@ int event__preprocess_sample(const event_t *self, struct perf_session *session, | |||
512 | goto out_filtered; | 673 | goto out_filtered; |
513 | 674 | ||
514 | dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid); | 675 | dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid); |
676 | /* | ||
677 | * Have we already created the kernel maps for the host machine? | ||
678 | * | ||
679 | * This should have happened earlier, when we processed the kernel MMAP | ||
680 | * events, but for older perf.data files there was no such thing, so do | ||
681 | * it now. | ||
682 | */ | ||
683 | if (cpumode == PERF_RECORD_MISC_KERNEL && | ||
684 | session->host_machine.vmlinux_maps[MAP__FUNCTION] == NULL) | ||
685 | machine__create_kernel_maps(&session->host_machine); | ||
515 | 686 | ||
516 | thread__find_addr_location(thread, session, cpumode, MAP__FUNCTION, | 687 | thread__find_addr_map(thread, session, cpumode, MAP__FUNCTION, |
517 | self->ip.ip, al, filter); | 688 | self->ip.pid, self->ip.ip, al); |
518 | dump_printf(" ...... dso: %s\n", | 689 | dump_printf(" ...... dso: %s\n", |
519 | al->map ? al->map->dso->long_name : | 690 | al->map ? al->map->dso->long_name : |
520 | al->level == 'H' ? "[hypervisor]" : "<not found>"); | 691 | al->level == 'H' ? "[hypervisor]" : "<not found>"); |
521 | /* | 692 | al->sym = NULL; |
522 | * We have to do this here as we may have a dso with no symbol hit that | 693 | |
523 | * has a name longer than the ones with symbols sampled. | 694 | if (al->map) { |
524 | */ | 695 | if (symbol_conf.dso_list && |
525 | if (al->map && !sort_dso.elide && !al->map->dso->slen_calculated) | 696 | (!al->map || !al->map->dso || |
526 | dso__calc_col_width(al->map->dso); | 697 | !(strlist__has_entry(symbol_conf.dso_list, |
527 | 698 | al->map->dso->short_name) || | |
528 | if (symbol_conf.dso_list && | 699 | (al->map->dso->short_name != al->map->dso->long_name && |
529 | (!al->map || !al->map->dso || | 700 | strlist__has_entry(symbol_conf.dso_list, |
530 | !(strlist__has_entry(symbol_conf.dso_list, al->map->dso->short_name) || | 701 | al->map->dso->long_name))))) |
531 | (al->map->dso->short_name != al->map->dso->long_name && | 702 | goto out_filtered; |
532 | strlist__has_entry(symbol_conf.dso_list, al->map->dso->long_name))))) | 703 | /* |
533 | goto out_filtered; | 704 | * We have to do this here as we may have a dso with no symbol |
705 | * hit that has a name longer than the ones with symbols | ||
706 | * sampled. | ||
707 | */ | ||
708 | if (!sort_dso.elide && !al->map->dso->slen_calculated) | ||
709 | dso__calc_col_width(al->map->dso); | ||
710 | |||
711 | al->sym = map__find_symbol(al->map, al->addr, filter); | ||
712 | } else { | ||
713 | const unsigned int unresolved_col_width = BITS_PER_LONG / 4; | ||
714 | |||
715 | if (dsos__col_width < unresolved_col_width && | ||
716 | !symbol_conf.col_width_list_str && !symbol_conf.field_sep && | ||
717 | !symbol_conf.dso_list) | ||
718 | dsos__col_width = unresolved_col_width; | ||
719 | } | ||
534 | 720 | ||
535 | if (symbol_conf.sym_list && al->sym && | 721 | if (symbol_conf.sym_list && al->sym && |
536 | !strlist__has_entry(symbol_conf.sym_list, al->sym->name)) | 722 | !strlist__has_entry(symbol_conf.sym_list, al->sym->name)) |
537 | goto out_filtered; | 723 | goto out_filtered; |
538 | 724 | ||
539 | al->filtered = false; | ||
540 | return 0; | 725 | return 0; |
541 | 726 | ||
542 | out_filtered: | 727 | out_filtered: |
@@ -570,6 +755,7 @@ int event__parse_sample(event_t *event, u64 type, struct sample_data *data) | |||
570 | array++; | 755 | array++; |
571 | } | 756 | } |
572 | 757 | ||
758 | data->id = -1ULL; | ||
573 | if (type & PERF_SAMPLE_ID) { | 759 | if (type & PERF_SAMPLE_ID) { |
574 | data->id = *array; | 760 | data->id = *array; |
575 | array++; | 761 | array++; |
diff --git a/tools/perf/util/event.h b/tools/perf/util/event.h index a33b94952e34..8577085db067 100644 --- a/tools/perf/util/event.h +++ b/tools/perf/util/event.h | |||
@@ -68,21 +68,54 @@ struct sample_data { | |||
68 | u64 addr; | 68 | u64 addr; |
69 | u64 id; | 69 | u64 id; |
70 | u64 stream_id; | 70 | u64 stream_id; |
71 | u32 cpu; | ||
72 | u64 period; | 71 | u64 period; |
73 | struct ip_callchain *callchain; | 72 | u32 cpu; |
74 | u32 raw_size; | 73 | u32 raw_size; |
75 | void *raw_data; | 74 | void *raw_data; |
75 | struct ip_callchain *callchain; | ||
76 | }; | 76 | }; |
77 | 77 | ||
78 | #define BUILD_ID_SIZE 20 | 78 | #define BUILD_ID_SIZE 20 |
79 | 79 | ||
80 | struct build_id_event { | 80 | struct build_id_event { |
81 | struct perf_event_header header; | 81 | struct perf_event_header header; |
82 | pid_t pid; | ||
82 | u8 build_id[ALIGN(BUILD_ID_SIZE, sizeof(u64))]; | 83 | u8 build_id[ALIGN(BUILD_ID_SIZE, sizeof(u64))]; |
83 | char filename[]; | 84 | char filename[]; |
84 | }; | 85 | }; |
85 | 86 | ||
87 | enum perf_user_event_type { /* above any possible kernel type */ | ||
88 | PERF_RECORD_HEADER_ATTR = 64, | ||
89 | PERF_RECORD_HEADER_EVENT_TYPE = 65, | ||
90 | PERF_RECORD_HEADER_TRACING_DATA = 66, | ||
91 | PERF_RECORD_HEADER_BUILD_ID = 67, | ||
92 | PERF_RECORD_FINISHED_ROUND = 68, | ||
93 | PERF_RECORD_HEADER_MAX | ||
94 | }; | ||
95 | |||
96 | struct attr_event { | ||
97 | struct perf_event_header header; | ||
98 | struct perf_event_attr attr; | ||
99 | u64 id[]; | ||
100 | }; | ||
101 | |||
102 | #define MAX_EVENT_NAME 64 | ||
103 | |||
104 | struct perf_trace_event_type { | ||
105 | u64 event_id; | ||
106 | char name[MAX_EVENT_NAME]; | ||
107 | }; | ||
108 | |||
109 | struct event_type_event { | ||
110 | struct perf_event_header header; | ||
111 | struct perf_trace_event_type event_type; | ||
112 | }; | ||
113 | |||
114 | struct tracing_data_event { | ||
115 | struct perf_event_header header; | ||
116 | u32 size; | ||
117 | }; | ||
118 | |||
86 | typedef union event_union { | 119 | typedef union event_union { |
87 | struct perf_event_header header; | 120 | struct perf_event_header header; |
88 | struct ip_event ip; | 121 | struct ip_event ip; |
@@ -92,22 +125,12 @@ typedef union event_union { | |||
92 | struct lost_event lost; | 125 | struct lost_event lost; |
93 | struct read_event read; | 126 | struct read_event read; |
94 | struct sample_event sample; | 127 | struct sample_event sample; |
128 | struct attr_event attr; | ||
129 | struct event_type_event event_type; | ||
130 | struct tracing_data_event tracing_data; | ||
131 | struct build_id_event build_id; | ||
95 | } event_t; | 132 | } event_t; |
96 | 133 | ||
97 | struct events_stats { | ||
98 | u64 total; | ||
99 | u64 lost; | ||
100 | }; | ||
101 | |||
102 | struct event_stat_id { | ||
103 | struct rb_node rb_node; | ||
104 | struct rb_root hists; | ||
105 | struct events_stats stats; | ||
106 | u64 config; | ||
107 | u64 event_stream; | ||
108 | u32 type; | ||
109 | }; | ||
110 | |||
111 | void event__print_totals(void); | 134 | void event__print_totals(void); |
112 | 135 | ||
113 | struct perf_session; | 136 | struct perf_session; |
@@ -119,10 +142,13 @@ int event__synthesize_thread(pid_t pid, event__handler_t process, | |||
119 | void event__synthesize_threads(event__handler_t process, | 142 | void event__synthesize_threads(event__handler_t process, |
120 | struct perf_session *session); | 143 | struct perf_session *session); |
121 | int event__synthesize_kernel_mmap(event__handler_t process, | 144 | int event__synthesize_kernel_mmap(event__handler_t process, |
122 | struct perf_session *session, | 145 | struct perf_session *session, |
123 | const char *symbol_name); | 146 | struct machine *machine, |
147 | const char *symbol_name); | ||
148 | |||
124 | int event__synthesize_modules(event__handler_t process, | 149 | int event__synthesize_modules(event__handler_t process, |
125 | struct perf_session *session); | 150 | struct perf_session *session, |
151 | struct machine *machine); | ||
126 | 152 | ||
127 | int event__process_comm(event_t *self, struct perf_session *session); | 153 | int event__process_comm(event_t *self, struct perf_session *session); |
128 | int event__process_lost(event_t *self, struct perf_session *session); | 154 | int event__process_lost(event_t *self, struct perf_session *session); |
@@ -134,4 +160,6 @@ int event__preprocess_sample(const event_t *self, struct perf_session *session, | |||
134 | struct addr_location *al, symbol_filter_t filter); | 160 | struct addr_location *al, symbol_filter_t filter); |
135 | int event__parse_sample(event_t *event, u64 type, struct sample_data *data); | 161 | int event__parse_sample(event_t *event, u64 type, struct sample_data *data); |
136 | 162 | ||
163 | extern const char *event__name[]; | ||
164 | |||
137 | #endif /* __PERF_RECORD_H */ | 165 | #endif /* __PERF_RECORD_H */ |
diff --git a/tools/perf/util/header.c b/tools/perf/util/header.c index 6c9aa16ee51f..8847bec64c54 100644 --- a/tools/perf/util/header.c +++ b/tools/perf/util/header.c | |||
@@ -99,13 +99,6 @@ int perf_header__add_attr(struct perf_header *self, | |||
99 | return 0; | 99 | return 0; |
100 | } | 100 | } |
101 | 101 | ||
102 | #define MAX_EVENT_NAME 64 | ||
103 | |||
104 | struct perf_trace_event_type { | ||
105 | u64 event_id; | ||
106 | char name[MAX_EVENT_NAME]; | ||
107 | }; | ||
108 | |||
109 | static int event_count; | 102 | static int event_count; |
110 | static struct perf_trace_event_type *events; | 103 | static struct perf_trace_event_type *events; |
111 | 104 | ||
@@ -197,7 +190,8 @@ static int write_padded(int fd, const void *bf, size_t count, | |||
197 | continue; \ | 190 | continue; \ |
198 | else | 191 | else |
199 | 192 | ||
200 | static int __dsos__write_buildid_table(struct list_head *head, u16 misc, int fd) | 193 | static int __dsos__write_buildid_table(struct list_head *head, pid_t pid, |
194 | u16 misc, int fd) | ||
201 | { | 195 | { |
202 | struct dso *pos; | 196 | struct dso *pos; |
203 | 197 | ||
@@ -212,6 +206,7 @@ static int __dsos__write_buildid_table(struct list_head *head, u16 misc, int fd) | |||
212 | len = ALIGN(len, NAME_ALIGN); | 206 | len = ALIGN(len, NAME_ALIGN); |
213 | memset(&b, 0, sizeof(b)); | 207 | memset(&b, 0, sizeof(b)); |
214 | memcpy(&b.build_id, pos->build_id, sizeof(pos->build_id)); | 208 | memcpy(&b.build_id, pos->build_id, sizeof(pos->build_id)); |
209 | b.pid = pid; | ||
215 | b.header.misc = misc; | 210 | b.header.misc = misc; |
216 | b.header.size = sizeof(b) + len; | 211 | b.header.size = sizeof(b) + len; |
217 | err = do_write(fd, &b, sizeof(b)); | 212 | err = do_write(fd, &b, sizeof(b)); |
@@ -226,13 +221,32 @@ static int __dsos__write_buildid_table(struct list_head *head, u16 misc, int fd) | |||
226 | return 0; | 221 | return 0; |
227 | } | 222 | } |
228 | 223 | ||
229 | static int dsos__write_buildid_table(int fd) | 224 | static int dsos__write_buildid_table(struct perf_header *header, int fd) |
230 | { | 225 | { |
231 | int err = __dsos__write_buildid_table(&dsos__kernel, | 226 | struct perf_session *session = container_of(header, |
232 | PERF_RECORD_MISC_KERNEL, fd); | 227 | struct perf_session, header); |
233 | if (err == 0) | 228 | struct rb_node *nd; |
234 | err = __dsos__write_buildid_table(&dsos__user, | 229 | int err = 0; |
235 | PERF_RECORD_MISC_USER, fd); | 230 | u16 kmisc, umisc; |
231 | |||
232 | for (nd = rb_first(&session->machines); nd; nd = rb_next(nd)) { | ||
233 | struct machine *pos = rb_entry(nd, struct machine, rb_node); | ||
234 | if (machine__is_host(pos)) { | ||
235 | kmisc = PERF_RECORD_MISC_KERNEL; | ||
236 | umisc = PERF_RECORD_MISC_USER; | ||
237 | } else { | ||
238 | kmisc = PERF_RECORD_MISC_GUEST_KERNEL; | ||
239 | umisc = PERF_RECORD_MISC_GUEST_USER; | ||
240 | } | ||
241 | |||
242 | err = __dsos__write_buildid_table(&pos->kernel_dsos, pos->pid, | ||
243 | kmisc, fd); | ||
244 | if (err == 0) | ||
245 | err = __dsos__write_buildid_table(&pos->user_dsos, | ||
246 | pos->pid, umisc, fd); | ||
247 | if (err) | ||
248 | break; | ||
249 | } | ||
236 | return err; | 250 | return err; |
237 | } | 251 | } |
238 | 252 | ||
@@ -349,9 +363,12 @@ static int __dsos__cache_build_ids(struct list_head *head, const char *debugdir) | |||
349 | return err; | 363 | return err; |
350 | } | 364 | } |
351 | 365 | ||
352 | static int dsos__cache_build_ids(void) | 366 | static int dsos__cache_build_ids(struct perf_header *self) |
353 | { | 367 | { |
354 | int err_kernel, err_user; | 368 | struct perf_session *session = container_of(self, |
369 | struct perf_session, header); | ||
370 | struct rb_node *nd; | ||
371 | int ret = 0; | ||
355 | char debugdir[PATH_MAX]; | 372 | char debugdir[PATH_MAX]; |
356 | 373 | ||
357 | snprintf(debugdir, sizeof(debugdir), "%s/%s", getenv("HOME"), | 374 | snprintf(debugdir, sizeof(debugdir), "%s/%s", getenv("HOME"), |
@@ -360,9 +377,28 @@ static int dsos__cache_build_ids(void) | |||
360 | if (mkdir(debugdir, 0755) != 0 && errno != EEXIST) | 377 | if (mkdir(debugdir, 0755) != 0 && errno != EEXIST) |
361 | return -1; | 378 | return -1; |
362 | 379 | ||
363 | err_kernel = __dsos__cache_build_ids(&dsos__kernel, debugdir); | 380 | for (nd = rb_first(&session->machines); nd; nd = rb_next(nd)) { |
364 | err_user = __dsos__cache_build_ids(&dsos__user, debugdir); | 381 | struct machine *pos = rb_entry(nd, struct machine, rb_node); |
365 | return err_kernel || err_user ? -1 : 0; | 382 | ret |= __dsos__cache_build_ids(&pos->kernel_dsos, debugdir); |
383 | ret |= __dsos__cache_build_ids(&pos->user_dsos, debugdir); | ||
384 | } | ||
385 | return ret ? -1 : 0; | ||
386 | } | ||
387 | |||
388 | static bool dsos__read_build_ids(struct perf_header *self, bool with_hits) | ||
389 | { | ||
390 | bool ret = false; | ||
391 | struct perf_session *session = container_of(self, | ||
392 | struct perf_session, header); | ||
393 | struct rb_node *nd; | ||
394 | |||
395 | for (nd = rb_first(&session->machines); nd; nd = rb_next(nd)) { | ||
396 | struct machine *pos = rb_entry(nd, struct machine, rb_node); | ||
397 | ret |= __dsos__read_build_ids(&pos->kernel_dsos, with_hits); | ||
398 | ret |= __dsos__read_build_ids(&pos->user_dsos, with_hits); | ||
399 | } | ||
400 | |||
401 | return ret; | ||
366 | } | 402 | } |
367 | 403 | ||
368 | static int perf_header__adds_write(struct perf_header *self, int fd) | 404 | static int perf_header__adds_write(struct perf_header *self, int fd) |
@@ -373,7 +409,7 @@ static int perf_header__adds_write(struct perf_header *self, int fd) | |||
373 | u64 sec_start; | 409 | u64 sec_start; |
374 | int idx = 0, err; | 410 | int idx = 0, err; |
375 | 411 | ||
376 | if (dsos__read_build_ids(true)) | 412 | if (dsos__read_build_ids(self, true)) |
377 | perf_header__set_feat(self, HEADER_BUILD_ID); | 413 | perf_header__set_feat(self, HEADER_BUILD_ID); |
378 | 414 | ||
379 | nr_sections = bitmap_weight(self->adds_features, HEADER_FEAT_BITS); | 415 | nr_sections = bitmap_weight(self->adds_features, HEADER_FEAT_BITS); |
@@ -400,7 +436,6 @@ static int perf_header__adds_write(struct perf_header *self, int fd) | |||
400 | trace_sec->size = lseek(fd, 0, SEEK_CUR) - trace_sec->offset; | 436 | trace_sec->size = lseek(fd, 0, SEEK_CUR) - trace_sec->offset; |
401 | } | 437 | } |
402 | 438 | ||
403 | |||
404 | if (perf_header__has_feat(self, HEADER_BUILD_ID)) { | 439 | if (perf_header__has_feat(self, HEADER_BUILD_ID)) { |
405 | struct perf_file_section *buildid_sec; | 440 | struct perf_file_section *buildid_sec; |
406 | 441 | ||
@@ -408,14 +443,14 @@ static int perf_header__adds_write(struct perf_header *self, int fd) | |||
408 | 443 | ||
409 | /* Write build-ids */ | 444 | /* Write build-ids */ |
410 | buildid_sec->offset = lseek(fd, 0, SEEK_CUR); | 445 | buildid_sec->offset = lseek(fd, 0, SEEK_CUR); |
411 | err = dsos__write_buildid_table(fd); | 446 | err = dsos__write_buildid_table(self, fd); |
412 | if (err < 0) { | 447 | if (err < 0) { |
413 | pr_debug("failed to write buildid table\n"); | 448 | pr_debug("failed to write buildid table\n"); |
414 | goto out_free; | 449 | goto out_free; |
415 | } | 450 | } |
416 | buildid_sec->size = lseek(fd, 0, SEEK_CUR) - | 451 | buildid_sec->size = lseek(fd, 0, SEEK_CUR) - |
417 | buildid_sec->offset; | 452 | buildid_sec->offset; |
418 | dsos__cache_build_ids(); | 453 | dsos__cache_build_ids(self); |
419 | } | 454 | } |
420 | 455 | ||
421 | lseek(fd, sec_start, SEEK_SET); | 456 | lseek(fd, sec_start, SEEK_SET); |
@@ -427,6 +462,25 @@ out_free: | |||
427 | return err; | 462 | return err; |
428 | } | 463 | } |
429 | 464 | ||
465 | int perf_header__write_pipe(int fd) | ||
466 | { | ||
467 | struct perf_pipe_file_header f_header; | ||
468 | int err; | ||
469 | |||
470 | f_header = (struct perf_pipe_file_header){ | ||
471 | .magic = PERF_MAGIC, | ||
472 | .size = sizeof(f_header), | ||
473 | }; | ||
474 | |||
475 | err = do_write(fd, &f_header, sizeof(f_header)); | ||
476 | if (err < 0) { | ||
477 | pr_debug("failed to write perf pipe header\n"); | ||
478 | return err; | ||
479 | } | ||
480 | |||
481 | return 0; | ||
482 | } | ||
483 | |||
430 | int perf_header__write(struct perf_header *self, int fd, bool at_exit) | 484 | int perf_header__write(struct perf_header *self, int fd, bool at_exit) |
431 | { | 485 | { |
432 | struct perf_file_header f_header; | 486 | struct perf_file_header f_header; |
@@ -518,25 +572,10 @@ int perf_header__write(struct perf_header *self, int fd, bool at_exit) | |||
518 | return 0; | 572 | return 0; |
519 | } | 573 | } |
520 | 574 | ||
521 | static int do_read(int fd, void *buf, size_t size) | ||
522 | { | ||
523 | while (size) { | ||
524 | int ret = read(fd, buf, size); | ||
525 | |||
526 | if (ret <= 0) | ||
527 | return -1; | ||
528 | |||
529 | size -= ret; | ||
530 | buf += ret; | ||
531 | } | ||
532 | |||
533 | return 0; | ||
534 | } | ||
535 | |||
536 | static int perf_header__getbuffer64(struct perf_header *self, | 575 | static int perf_header__getbuffer64(struct perf_header *self, |
537 | int fd, void *buf, size_t size) | 576 | int fd, void *buf, size_t size) |
538 | { | 577 | { |
539 | if (do_read(fd, buf, size)) | 578 | if (do_read(fd, buf, size) <= 0) |
540 | return -1; | 579 | return -1; |
541 | 580 | ||
542 | if (self->needs_swap) | 581 | if (self->needs_swap) |
@@ -592,7 +631,7 @@ int perf_file_header__read(struct perf_file_header *self, | |||
592 | { | 631 | { |
593 | lseek(fd, 0, SEEK_SET); | 632 | lseek(fd, 0, SEEK_SET); |
594 | 633 | ||
595 | if (do_read(fd, self, sizeof(*self)) || | 634 | if (do_read(fd, self, sizeof(*self)) <= 0 || |
596 | memcmp(&self->magic, __perf_magic, sizeof(self->magic))) | 635 | memcmp(&self->magic, __perf_magic, sizeof(self->magic))) |
597 | return -1; | 636 | return -1; |
598 | 637 | ||
@@ -636,6 +675,93 @@ int perf_file_header__read(struct perf_file_header *self, | |||
636 | return 0; | 675 | return 0; |
637 | } | 676 | } |
638 | 677 | ||
678 | static int __event_process_build_id(struct build_id_event *bev, | ||
679 | char *filename, | ||
680 | struct perf_session *session) | ||
681 | { | ||
682 | int err = -1; | ||
683 | struct list_head *head; | ||
684 | struct machine *machine; | ||
685 | u16 misc; | ||
686 | struct dso *dso; | ||
687 | enum dso_kernel_type dso_type; | ||
688 | |||
689 | machine = perf_session__findnew_machine(session, bev->pid); | ||
690 | if (!machine) | ||
691 | goto out; | ||
692 | |||
693 | misc = bev->header.misc & PERF_RECORD_MISC_CPUMODE_MASK; | ||
694 | |||
695 | switch (misc) { | ||
696 | case PERF_RECORD_MISC_KERNEL: | ||
697 | dso_type = DSO_TYPE_KERNEL; | ||
698 | head = &machine->kernel_dsos; | ||
699 | break; | ||
700 | case PERF_RECORD_MISC_GUEST_KERNEL: | ||
701 | dso_type = DSO_TYPE_GUEST_KERNEL; | ||
702 | head = &machine->kernel_dsos; | ||
703 | break; | ||
704 | case PERF_RECORD_MISC_USER: | ||
705 | case PERF_RECORD_MISC_GUEST_USER: | ||
706 | dso_type = DSO_TYPE_USER; | ||
707 | head = &machine->user_dsos; | ||
708 | break; | ||
709 | default: | ||
710 | goto out; | ||
711 | } | ||
712 | |||
713 | dso = __dsos__findnew(head, filename); | ||
714 | if (dso != NULL) { | ||
715 | char sbuild_id[BUILD_ID_SIZE * 2 + 1]; | ||
716 | |||
717 | dso__set_build_id(dso, &bev->build_id); | ||
718 | |||
719 | if (filename[0] == '[') | ||
720 | dso->kernel = dso_type; | ||
721 | |||
722 | build_id__sprintf(dso->build_id, sizeof(dso->build_id), | ||
723 | sbuild_id); | ||
724 | pr_debug("build id event received for %s: %s\n", | ||
725 | dso->long_name, sbuild_id); | ||
726 | } | ||
727 | |||
728 | err = 0; | ||
729 | out: | ||
730 | return err; | ||
731 | } | ||
732 | |||
733 | static int perf_header__read_build_ids(struct perf_header *self, | ||
734 | int input, u64 offset, u64 size) | ||
735 | { | ||
736 | struct perf_session *session = container_of(self, | ||
737 | struct perf_session, header); | ||
738 | struct build_id_event bev; | ||
739 | char filename[PATH_MAX]; | ||
740 | u64 limit = offset + size; | ||
741 | int err = -1; | ||
742 | |||
743 | while (offset < limit) { | ||
744 | ssize_t len; | ||
745 | |||
746 | if (read(input, &bev, sizeof(bev)) != sizeof(bev)) | ||
747 | goto out; | ||
748 | |||
749 | if (self->needs_swap) | ||
750 | perf_event_header__bswap(&bev.header); | ||
751 | |||
752 | len = bev.header.size - sizeof(bev); | ||
753 | if (read(input, filename, len) != len) | ||
754 | goto out; | ||
755 | |||
756 | __event_process_build_id(&bev, filename, session); | ||
757 | |||
758 | offset += bev.header.size; | ||
759 | } | ||
760 | err = 0; | ||
761 | out: | ||
762 | return err; | ||
763 | } | ||
764 | |||
639 | static int perf_file_section__process(struct perf_file_section *self, | 765 | static int perf_file_section__process(struct perf_file_section *self, |
640 | struct perf_header *ph, | 766 | struct perf_header *ph, |
641 | int feat, int fd) | 767 | int feat, int fd) |
@@ -648,7 +774,7 @@ static int perf_file_section__process(struct perf_file_section *self, | |||
648 | 774 | ||
649 | switch (feat) { | 775 | switch (feat) { |
650 | case HEADER_TRACE_INFO: | 776 | case HEADER_TRACE_INFO: |
651 | trace_report(fd); | 777 | trace_report(fd, false); |
652 | break; | 778 | break; |
653 | 779 | ||
654 | case HEADER_BUILD_ID: | 780 | case HEADER_BUILD_ID: |
@@ -662,13 +788,56 @@ static int perf_file_section__process(struct perf_file_section *self, | |||
662 | return 0; | 788 | return 0; |
663 | } | 789 | } |
664 | 790 | ||
665 | int perf_header__read(struct perf_header *self, int fd) | 791 | static int perf_file_header__read_pipe(struct perf_pipe_file_header *self, |
792 | struct perf_header *ph, int fd, | ||
793 | bool repipe) | ||
794 | { | ||
795 | if (do_read(fd, self, sizeof(*self)) <= 0 || | ||
796 | memcmp(&self->magic, __perf_magic, sizeof(self->magic))) | ||
797 | return -1; | ||
798 | |||
799 | if (repipe && do_write(STDOUT_FILENO, self, sizeof(*self)) < 0) | ||
800 | return -1; | ||
801 | |||
802 | if (self->size != sizeof(*self)) { | ||
803 | u64 size = bswap_64(self->size); | ||
804 | |||
805 | if (size != sizeof(*self)) | ||
806 | return -1; | ||
807 | |||
808 | ph->needs_swap = true; | ||
809 | } | ||
810 | |||
811 | return 0; | ||
812 | } | ||
813 | |||
814 | static int perf_header__read_pipe(struct perf_session *session, int fd) | ||
666 | { | 815 | { |
816 | struct perf_header *self = &session->header; | ||
817 | struct perf_pipe_file_header f_header; | ||
818 | |||
819 | if (perf_file_header__read_pipe(&f_header, self, fd, | ||
820 | session->repipe) < 0) { | ||
821 | pr_debug("incompatible file format\n"); | ||
822 | return -EINVAL; | ||
823 | } | ||
824 | |||
825 | session->fd = fd; | ||
826 | |||
827 | return 0; | ||
828 | } | ||
829 | |||
830 | int perf_header__read(struct perf_session *session, int fd) | ||
831 | { | ||
832 | struct perf_header *self = &session->header; | ||
667 | struct perf_file_header f_header; | 833 | struct perf_file_header f_header; |
668 | struct perf_file_attr f_attr; | 834 | struct perf_file_attr f_attr; |
669 | u64 f_id; | 835 | u64 f_id; |
670 | int nr_attrs, nr_ids, i, j; | 836 | int nr_attrs, nr_ids, i, j; |
671 | 837 | ||
838 | if (session->fd_pipe) | ||
839 | return perf_header__read_pipe(session, fd); | ||
840 | |||
672 | if (perf_file_header__read(&f_header, self, fd) < 0) { | 841 | if (perf_file_header__read(&f_header, self, fd) < 0) { |
673 | pr_debug("incompatible file format\n"); | 842 | pr_debug("incompatible file format\n"); |
674 | return -EINVAL; | 843 | return -EINVAL; |
@@ -753,6 +922,14 @@ perf_header__find_attr(u64 id, struct perf_header *header) | |||
753 | { | 922 | { |
754 | int i; | 923 | int i; |
755 | 924 | ||
925 | /* | ||
926 | * We set id to -1 if the data file doesn't contain sample | ||
927 | * ids. Check for this and avoid walking through the entire | ||
928 | * list of ids which may be large. | ||
929 | */ | ||
930 | if (id == -1ULL) | ||
931 | return NULL; | ||
932 | |||
756 | for (i = 0; i < header->attrs; i++) { | 933 | for (i = 0; i < header->attrs; i++) { |
757 | struct perf_header_attr *attr = header->attr[i]; | 934 | struct perf_header_attr *attr = header->attr[i]; |
758 | int j; | 935 | int j; |
@@ -765,3 +942,231 @@ perf_header__find_attr(u64 id, struct perf_header *header) | |||
765 | 942 | ||
766 | return NULL; | 943 | return NULL; |
767 | } | 944 | } |
945 | |||
946 | int event__synthesize_attr(struct perf_event_attr *attr, u16 ids, u64 *id, | ||
947 | event__handler_t process, | ||
948 | struct perf_session *session) | ||
949 | { | ||
950 | event_t *ev; | ||
951 | size_t size; | ||
952 | int err; | ||
953 | |||
954 | size = sizeof(struct perf_event_attr); | ||
955 | size = ALIGN(size, sizeof(u64)); | ||
956 | size += sizeof(struct perf_event_header); | ||
957 | size += ids * sizeof(u64); | ||
958 | |||
959 | ev = malloc(size); | ||
960 | |||
961 | ev->attr.attr = *attr; | ||
962 | memcpy(ev->attr.id, id, ids * sizeof(u64)); | ||
963 | |||
964 | ev->attr.header.type = PERF_RECORD_HEADER_ATTR; | ||
965 | ev->attr.header.size = size; | ||
966 | |||
967 | err = process(ev, session); | ||
968 | |||
969 | free(ev); | ||
970 | |||
971 | return err; | ||
972 | } | ||
973 | |||
974 | int event__synthesize_attrs(struct perf_header *self, | ||
975 | event__handler_t process, | ||
976 | struct perf_session *session) | ||
977 | { | ||
978 | struct perf_header_attr *attr; | ||
979 | int i, err = 0; | ||
980 | |||
981 | for (i = 0; i < self->attrs; i++) { | ||
982 | attr = self->attr[i]; | ||
983 | |||
984 | err = event__synthesize_attr(&attr->attr, attr->ids, attr->id, | ||
985 | process, session); | ||
986 | if (err) { | ||
987 | pr_debug("failed to create perf header attribute\n"); | ||
988 | return err; | ||
989 | } | ||
990 | } | ||
991 | |||
992 | return err; | ||
993 | } | ||
994 | |||
995 | int event__process_attr(event_t *self, struct perf_session *session) | ||
996 | { | ||
997 | struct perf_header_attr *attr; | ||
998 | unsigned int i, ids, n_ids; | ||
999 | |||
1000 | attr = perf_header_attr__new(&self->attr.attr); | ||
1001 | if (attr == NULL) | ||
1002 | return -ENOMEM; | ||
1003 | |||
1004 | ids = self->header.size; | ||
1005 | ids -= (void *)&self->attr.id - (void *)self; | ||
1006 | n_ids = ids / sizeof(u64); | ||
1007 | |||
1008 | for (i = 0; i < n_ids; i++) { | ||
1009 | if (perf_header_attr__add_id(attr, self->attr.id[i]) < 0) { | ||
1010 | perf_header_attr__delete(attr); | ||
1011 | return -ENOMEM; | ||
1012 | } | ||
1013 | } | ||
1014 | |||
1015 | if (perf_header__add_attr(&session->header, attr) < 0) { | ||
1016 | perf_header_attr__delete(attr); | ||
1017 | return -ENOMEM; | ||
1018 | } | ||
1019 | |||
1020 | perf_session__update_sample_type(session); | ||
1021 | |||
1022 | return 0; | ||
1023 | } | ||
1024 | |||
1025 | int event__synthesize_event_type(u64 event_id, char *name, | ||
1026 | event__handler_t process, | ||
1027 | struct perf_session *session) | ||
1028 | { | ||
1029 | event_t ev; | ||
1030 | size_t size = 0; | ||
1031 | int err = 0; | ||
1032 | |||
1033 | memset(&ev, 0, sizeof(ev)); | ||
1034 | |||
1035 | ev.event_type.event_type.event_id = event_id; | ||
1036 | memset(ev.event_type.event_type.name, 0, MAX_EVENT_NAME); | ||
1037 | strncpy(ev.event_type.event_type.name, name, MAX_EVENT_NAME - 1); | ||
1038 | |||
1039 | ev.event_type.header.type = PERF_RECORD_HEADER_EVENT_TYPE; | ||
1040 | size = strlen(name); | ||
1041 | size = ALIGN(size, sizeof(u64)); | ||
1042 | ev.event_type.header.size = sizeof(ev.event_type) - | ||
1043 | (sizeof(ev.event_type.event_type.name) - size); | ||
1044 | |||
1045 | err = process(&ev, session); | ||
1046 | |||
1047 | return err; | ||
1048 | } | ||
1049 | |||
1050 | int event__synthesize_event_types(event__handler_t process, | ||
1051 | struct perf_session *session) | ||
1052 | { | ||
1053 | struct perf_trace_event_type *type; | ||
1054 | int i, err = 0; | ||
1055 | |||
1056 | for (i = 0; i < event_count; i++) { | ||
1057 | type = &events[i]; | ||
1058 | |||
1059 | err = event__synthesize_event_type(type->event_id, type->name, | ||
1060 | process, session); | ||
1061 | if (err) { | ||
1062 | pr_debug("failed to create perf header event type\n"); | ||
1063 | return err; | ||
1064 | } | ||
1065 | } | ||
1066 | |||
1067 | return err; | ||
1068 | } | ||
1069 | |||
1070 | int event__process_event_type(event_t *self, | ||
1071 | struct perf_session *session __unused) | ||
1072 | { | ||
1073 | if (perf_header__push_event(self->event_type.event_type.event_id, | ||
1074 | self->event_type.event_type.name) < 0) | ||
1075 | return -ENOMEM; | ||
1076 | |||
1077 | return 0; | ||
1078 | } | ||
1079 | |||
1080 | int event__synthesize_tracing_data(int fd, struct perf_event_attr *pattrs, | ||
1081 | int nb_events, | ||
1082 | event__handler_t process, | ||
1083 | struct perf_session *session __unused) | ||
1084 | { | ||
1085 | event_t ev; | ||
1086 | ssize_t size = 0, aligned_size = 0, padding; | ||
1087 | int err = 0; | ||
1088 | |||
1089 | memset(&ev, 0, sizeof(ev)); | ||
1090 | |||
1091 | ev.tracing_data.header.type = PERF_RECORD_HEADER_TRACING_DATA; | ||
1092 | size = read_tracing_data_size(fd, pattrs, nb_events); | ||
1093 | if (size <= 0) | ||
1094 | return size; | ||
1095 | aligned_size = ALIGN(size, sizeof(u64)); | ||
1096 | padding = aligned_size - size; | ||
1097 | ev.tracing_data.header.size = sizeof(ev.tracing_data); | ||
1098 | ev.tracing_data.size = aligned_size; | ||
1099 | |||
1100 | process(&ev, session); | ||
1101 | |||
1102 | err = read_tracing_data(fd, pattrs, nb_events); | ||
1103 | write_padded(fd, NULL, 0, padding); | ||
1104 | |||
1105 | return aligned_size; | ||
1106 | } | ||
1107 | |||
1108 | int event__process_tracing_data(event_t *self, | ||
1109 | struct perf_session *session) | ||
1110 | { | ||
1111 | ssize_t size_read, padding, size = self->tracing_data.size; | ||
1112 | off_t offset = lseek(session->fd, 0, SEEK_CUR); | ||
1113 | char buf[BUFSIZ]; | ||
1114 | |||
1115 | /* setup for reading amidst mmap */ | ||
1116 | lseek(session->fd, offset + sizeof(struct tracing_data_event), | ||
1117 | SEEK_SET); | ||
1118 | |||
1119 | size_read = trace_report(session->fd, session->repipe); | ||
1120 | |||
1121 | padding = ALIGN(size_read, sizeof(u64)) - size_read; | ||
1122 | |||
1123 | if (read(session->fd, buf, padding) < 0) | ||
1124 | die("reading input file"); | ||
1125 | if (session->repipe) { | ||
1126 | int retw = write(STDOUT_FILENO, buf, padding); | ||
1127 | if (retw <= 0 || retw != padding) | ||
1128 | die("repiping tracing data padding"); | ||
1129 | } | ||
1130 | |||
1131 | if (size_read + padding != size) | ||
1132 | die("tracing data size mismatch"); | ||
1133 | |||
1134 | return size_read + padding; | ||
1135 | } | ||
1136 | |||
1137 | int event__synthesize_build_id(struct dso *pos, u16 misc, | ||
1138 | event__handler_t process, | ||
1139 | struct machine *machine, | ||
1140 | struct perf_session *session) | ||
1141 | { | ||
1142 | event_t ev; | ||
1143 | size_t len; | ||
1144 | int err = 0; | ||
1145 | |||
1146 | if (!pos->hit) | ||
1147 | return err; | ||
1148 | |||
1149 | memset(&ev, 0, sizeof(ev)); | ||
1150 | |||
1151 | len = pos->long_name_len + 1; | ||
1152 | len = ALIGN(len, NAME_ALIGN); | ||
1153 | memcpy(&ev.build_id.build_id, pos->build_id, sizeof(pos->build_id)); | ||
1154 | ev.build_id.header.type = PERF_RECORD_HEADER_BUILD_ID; | ||
1155 | ev.build_id.header.misc = misc; | ||
1156 | ev.build_id.pid = machine->pid; | ||
1157 | ev.build_id.header.size = sizeof(ev.build_id) + len; | ||
1158 | memcpy(&ev.build_id.filename, pos->long_name, pos->long_name_len); | ||
1159 | |||
1160 | err = process(&ev, session); | ||
1161 | |||
1162 | return err; | ||
1163 | } | ||
1164 | |||
1165 | int event__process_build_id(event_t *self, | ||
1166 | struct perf_session *session) | ||
1167 | { | ||
1168 | __event_process_build_id(&self->build_id, | ||
1169 | self->build_id.filename, | ||
1170 | session); | ||
1171 | return 0; | ||
1172 | } | ||
diff --git a/tools/perf/util/header.h b/tools/perf/util/header.h index 82a6af72d4cc..402ac2454cf8 100644 --- a/tools/perf/util/header.h +++ b/tools/perf/util/header.h | |||
@@ -39,6 +39,11 @@ struct perf_file_header { | |||
39 | DECLARE_BITMAP(adds_features, HEADER_FEAT_BITS); | 39 | DECLARE_BITMAP(adds_features, HEADER_FEAT_BITS); |
40 | }; | 40 | }; |
41 | 41 | ||
42 | struct perf_pipe_file_header { | ||
43 | u64 magic; | ||
44 | u64 size; | ||
45 | }; | ||
46 | |||
42 | struct perf_header; | 47 | struct perf_header; |
43 | 48 | ||
44 | int perf_file_header__read(struct perf_file_header *self, | 49 | int perf_file_header__read(struct perf_file_header *self, |
@@ -47,21 +52,22 @@ int perf_file_header__read(struct perf_file_header *self, | |||
47 | struct perf_header { | 52 | struct perf_header { |
48 | int frozen; | 53 | int frozen; |
49 | int attrs, size; | 54 | int attrs, size; |
55 | bool needs_swap; | ||
50 | struct perf_header_attr **attr; | 56 | struct perf_header_attr **attr; |
51 | s64 attr_offset; | 57 | s64 attr_offset; |
52 | u64 data_offset; | 58 | u64 data_offset; |
53 | u64 data_size; | 59 | u64 data_size; |
54 | u64 event_offset; | 60 | u64 event_offset; |
55 | u64 event_size; | 61 | u64 event_size; |
56 | bool needs_swap; | ||
57 | DECLARE_BITMAP(adds_features, HEADER_FEAT_BITS); | 62 | DECLARE_BITMAP(adds_features, HEADER_FEAT_BITS); |
58 | }; | 63 | }; |
59 | 64 | ||
60 | int perf_header__init(struct perf_header *self); | 65 | int perf_header__init(struct perf_header *self); |
61 | void perf_header__exit(struct perf_header *self); | 66 | void perf_header__exit(struct perf_header *self); |
62 | 67 | ||
63 | int perf_header__read(struct perf_header *self, int fd); | 68 | int perf_header__read(struct perf_session *session, int fd); |
64 | int perf_header__write(struct perf_header *self, int fd, bool at_exit); | 69 | int perf_header__write(struct perf_header *self, int fd, bool at_exit); |
70 | int perf_header__write_pipe(int fd); | ||
65 | 71 | ||
66 | int perf_header__add_attr(struct perf_header *self, | 72 | int perf_header__add_attr(struct perf_header *self, |
67 | struct perf_header_attr *attr); | 73 | struct perf_header_attr *attr); |
@@ -89,4 +95,33 @@ int build_id_cache__add_s(const char *sbuild_id, const char *debugdir, | |||
89 | const char *name, bool is_kallsyms); | 95 | const char *name, bool is_kallsyms); |
90 | int build_id_cache__remove_s(const char *sbuild_id, const char *debugdir); | 96 | int build_id_cache__remove_s(const char *sbuild_id, const char *debugdir); |
91 | 97 | ||
98 | int event__synthesize_attr(struct perf_event_attr *attr, u16 ids, u64 *id, | ||
99 | event__handler_t process, | ||
100 | struct perf_session *session); | ||
101 | int event__synthesize_attrs(struct perf_header *self, | ||
102 | event__handler_t process, | ||
103 | struct perf_session *session); | ||
104 | int event__process_attr(event_t *self, struct perf_session *session); | ||
105 | |||
106 | int event__synthesize_event_type(u64 event_id, char *name, | ||
107 | event__handler_t process, | ||
108 | struct perf_session *session); | ||
109 | int event__synthesize_event_types(event__handler_t process, | ||
110 | struct perf_session *session); | ||
111 | int event__process_event_type(event_t *self, | ||
112 | struct perf_session *session); | ||
113 | |||
114 | int event__synthesize_tracing_data(int fd, struct perf_event_attr *pattrs, | ||
115 | int nb_events, | ||
116 | event__handler_t process, | ||
117 | struct perf_session *session); | ||
118 | int event__process_tracing_data(event_t *self, | ||
119 | struct perf_session *session); | ||
120 | |||
121 | int event__synthesize_build_id(struct dso *pos, u16 misc, | ||
122 | event__handler_t process, | ||
123 | struct machine *machine, | ||
124 | struct perf_session *session); | ||
125 | int event__process_build_id(event_t *self, struct perf_session *session); | ||
126 | |||
92 | #endif /* __PERF_HEADER_H */ | 127 | #endif /* __PERF_HEADER_H */ |
diff --git a/tools/perf/util/hist.c b/tools/perf/util/hist.c index 2be33c7dbf03..f75c5f62401c 100644 --- a/tools/perf/util/hist.c +++ b/tools/perf/util/hist.c | |||
@@ -1,3 +1,4 @@ | |||
1 | #include "util.h" | ||
1 | #include "hist.h" | 2 | #include "hist.h" |
2 | #include "session.h" | 3 | #include "session.h" |
3 | #include "sort.h" | 4 | #include "sort.h" |
@@ -8,25 +9,69 @@ struct callchain_param callchain_param = { | |||
8 | .min_percent = 0.5 | 9 | .min_percent = 0.5 |
9 | }; | 10 | }; |
10 | 11 | ||
12 | static void hist_entry__add_cpumode_period(struct hist_entry *self, | ||
13 | unsigned int cpumode, u64 period) | ||
14 | { | ||
15 | switch (cpumode) { | ||
16 | case PERF_RECORD_MISC_KERNEL: | ||
17 | self->period_sys += period; | ||
18 | break; | ||
19 | case PERF_RECORD_MISC_USER: | ||
20 | self->period_us += period; | ||
21 | break; | ||
22 | case PERF_RECORD_MISC_GUEST_KERNEL: | ||
23 | self->period_guest_sys += period; | ||
24 | break; | ||
25 | case PERF_RECORD_MISC_GUEST_USER: | ||
26 | self->period_guest_us += period; | ||
27 | break; | ||
28 | default: | ||
29 | break; | ||
30 | } | ||
31 | } | ||
32 | |||
11 | /* | 33 | /* |
12 | * histogram, sorted on item, collects counts | 34 | * histogram, sorted on item, collects periods |
13 | */ | 35 | */ |
14 | 36 | ||
15 | struct hist_entry *__perf_session__add_hist_entry(struct rb_root *hists, | 37 | static struct hist_entry *hist_entry__new(struct hist_entry *template) |
16 | struct addr_location *al, | 38 | { |
17 | struct symbol *sym_parent, | 39 | size_t callchain_size = symbol_conf.use_callchain ? sizeof(struct callchain_node) : 0; |
18 | u64 count, bool *hit) | 40 | struct hist_entry *self = malloc(sizeof(*self) + callchain_size); |
41 | |||
42 | if (self != NULL) { | ||
43 | *self = *template; | ||
44 | self->nr_events = 1; | ||
45 | if (symbol_conf.use_callchain) | ||
46 | callchain_init(self->callchain); | ||
47 | } | ||
48 | |||
49 | return self; | ||
50 | } | ||
51 | |||
52 | static void hists__inc_nr_entries(struct hists *self, struct hist_entry *entry) | ||
19 | { | 53 | { |
20 | struct rb_node **p = &hists->rb_node; | 54 | if (entry->ms.sym && self->max_sym_namelen < entry->ms.sym->namelen) |
55 | self->max_sym_namelen = entry->ms.sym->namelen; | ||
56 | ++self->nr_entries; | ||
57 | } | ||
58 | |||
59 | struct hist_entry *__hists__add_entry(struct hists *self, | ||
60 | struct addr_location *al, | ||
61 | struct symbol *sym_parent, u64 period) | ||
62 | { | ||
63 | struct rb_node **p = &self->entries.rb_node; | ||
21 | struct rb_node *parent = NULL; | 64 | struct rb_node *parent = NULL; |
22 | struct hist_entry *he; | 65 | struct hist_entry *he; |
23 | struct hist_entry entry = { | 66 | struct hist_entry entry = { |
24 | .thread = al->thread, | 67 | .thread = al->thread, |
25 | .map = al->map, | 68 | .ms = { |
26 | .sym = al->sym, | 69 | .map = al->map, |
70 | .sym = al->sym, | ||
71 | }, | ||
27 | .ip = al->addr, | 72 | .ip = al->addr, |
28 | .level = al->level, | 73 | .level = al->level, |
29 | .count = count, | 74 | .period = period, |
30 | .parent = sym_parent, | 75 | .parent = sym_parent, |
31 | }; | 76 | }; |
32 | int cmp; | 77 | int cmp; |
@@ -38,8 +83,9 @@ struct hist_entry *__perf_session__add_hist_entry(struct rb_root *hists, | |||
38 | cmp = hist_entry__cmp(&entry, he); | 83 | cmp = hist_entry__cmp(&entry, he); |
39 | 84 | ||
40 | if (!cmp) { | 85 | if (!cmp) { |
41 | *hit = true; | 86 | he->period += period; |
42 | return he; | 87 | ++he->nr_events; |
88 | goto out; | ||
43 | } | 89 | } |
44 | 90 | ||
45 | if (cmp < 0) | 91 | if (cmp < 0) |
@@ -48,13 +94,14 @@ struct hist_entry *__perf_session__add_hist_entry(struct rb_root *hists, | |||
48 | p = &(*p)->rb_right; | 94 | p = &(*p)->rb_right; |
49 | } | 95 | } |
50 | 96 | ||
51 | he = malloc(sizeof(*he)); | 97 | he = hist_entry__new(&entry); |
52 | if (!he) | 98 | if (!he) |
53 | return NULL; | 99 | return NULL; |
54 | *he = entry; | ||
55 | rb_link_node(&he->rb_node, parent, p); | 100 | rb_link_node(&he->rb_node, parent, p); |
56 | rb_insert_color(&he->rb_node, hists); | 101 | rb_insert_color(&he->rb_node, &self->entries); |
57 | *hit = false; | 102 | hists__inc_nr_entries(self, he); |
103 | out: | ||
104 | hist_entry__add_cpumode_period(he, al->cpumode, period); | ||
58 | return he; | 105 | return he; |
59 | } | 106 | } |
60 | 107 | ||
@@ -65,7 +112,7 @@ hist_entry__cmp(struct hist_entry *left, struct hist_entry *right) | |||
65 | int64_t cmp = 0; | 112 | int64_t cmp = 0; |
66 | 113 | ||
67 | list_for_each_entry(se, &hist_entry__sort_list, list) { | 114 | list_for_each_entry(se, &hist_entry__sort_list, list) { |
68 | cmp = se->cmp(left, right); | 115 | cmp = se->se_cmp(left, right); |
69 | if (cmp) | 116 | if (cmp) |
70 | break; | 117 | break; |
71 | } | 118 | } |
@@ -82,7 +129,7 @@ hist_entry__collapse(struct hist_entry *left, struct hist_entry *right) | |||
82 | list_for_each_entry(se, &hist_entry__sort_list, list) { | 129 | list_for_each_entry(se, &hist_entry__sort_list, list) { |
83 | int64_t (*f)(struct hist_entry *, struct hist_entry *); | 130 | int64_t (*f)(struct hist_entry *, struct hist_entry *); |
84 | 131 | ||
85 | f = se->collapse ?: se->cmp; | 132 | f = se->se_collapse ?: se->se_cmp; |
86 | 133 | ||
87 | cmp = f(left, right); | 134 | cmp = f(left, right); |
88 | if (cmp) | 135 | if (cmp) |
@@ -101,7 +148,7 @@ void hist_entry__free(struct hist_entry *he) | |||
101 | * collapse the histogram | 148 | * collapse the histogram |
102 | */ | 149 | */ |
103 | 150 | ||
104 | static void collapse__insert_entry(struct rb_root *root, struct hist_entry *he) | 151 | static bool collapse__insert_entry(struct rb_root *root, struct hist_entry *he) |
105 | { | 152 | { |
106 | struct rb_node **p = &root->rb_node; | 153 | struct rb_node **p = &root->rb_node; |
107 | struct rb_node *parent = NULL; | 154 | struct rb_node *parent = NULL; |
@@ -115,9 +162,9 @@ static void collapse__insert_entry(struct rb_root *root, struct hist_entry *he) | |||
115 | cmp = hist_entry__collapse(iter, he); | 162 | cmp = hist_entry__collapse(iter, he); |
116 | 163 | ||
117 | if (!cmp) { | 164 | if (!cmp) { |
118 | iter->count += he->count; | 165 | iter->period += he->period; |
119 | hist_entry__free(he); | 166 | hist_entry__free(he); |
120 | return; | 167 | return false; |
121 | } | 168 | } |
122 | 169 | ||
123 | if (cmp < 0) | 170 | if (cmp < 0) |
@@ -128,9 +175,10 @@ static void collapse__insert_entry(struct rb_root *root, struct hist_entry *he) | |||
128 | 175 | ||
129 | rb_link_node(&he->rb_node, parent, p); | 176 | rb_link_node(&he->rb_node, parent, p); |
130 | rb_insert_color(&he->rb_node, root); | 177 | rb_insert_color(&he->rb_node, root); |
178 | return true; | ||
131 | } | 179 | } |
132 | 180 | ||
133 | void perf_session__collapse_resort(struct rb_root *hists) | 181 | void hists__collapse_resort(struct hists *self) |
134 | { | 182 | { |
135 | struct rb_root tmp; | 183 | struct rb_root tmp; |
136 | struct rb_node *next; | 184 | struct rb_node *next; |
@@ -140,72 +188,77 @@ void perf_session__collapse_resort(struct rb_root *hists) | |||
140 | return; | 188 | return; |
141 | 189 | ||
142 | tmp = RB_ROOT; | 190 | tmp = RB_ROOT; |
143 | next = rb_first(hists); | 191 | next = rb_first(&self->entries); |
192 | self->nr_entries = 0; | ||
193 | self->max_sym_namelen = 0; | ||
144 | 194 | ||
145 | while (next) { | 195 | while (next) { |
146 | n = rb_entry(next, struct hist_entry, rb_node); | 196 | n = rb_entry(next, struct hist_entry, rb_node); |
147 | next = rb_next(&n->rb_node); | 197 | next = rb_next(&n->rb_node); |
148 | 198 | ||
149 | rb_erase(&n->rb_node, hists); | 199 | rb_erase(&n->rb_node, &self->entries); |
150 | collapse__insert_entry(&tmp, n); | 200 | if (collapse__insert_entry(&tmp, n)) |
201 | hists__inc_nr_entries(self, n); | ||
151 | } | 202 | } |
152 | 203 | ||
153 | *hists = tmp; | 204 | self->entries = tmp; |
154 | } | 205 | } |
155 | 206 | ||
156 | /* | 207 | /* |
157 | * reverse the map, sort on count. | 208 | * reverse the map, sort on period. |
158 | */ | 209 | */ |
159 | 210 | ||
160 | static void perf_session__insert_output_hist_entry(struct rb_root *root, | 211 | static void __hists__insert_output_entry(struct rb_root *entries, |
161 | struct hist_entry *he, | 212 | struct hist_entry *he, |
162 | u64 min_callchain_hits) | 213 | u64 min_callchain_hits) |
163 | { | 214 | { |
164 | struct rb_node **p = &root->rb_node; | 215 | struct rb_node **p = &entries->rb_node; |
165 | struct rb_node *parent = NULL; | 216 | struct rb_node *parent = NULL; |
166 | struct hist_entry *iter; | 217 | struct hist_entry *iter; |
167 | 218 | ||
168 | if (symbol_conf.use_callchain) | 219 | if (symbol_conf.use_callchain) |
169 | callchain_param.sort(&he->sorted_chain, &he->callchain, | 220 | callchain_param.sort(&he->sorted_chain, he->callchain, |
170 | min_callchain_hits, &callchain_param); | 221 | min_callchain_hits, &callchain_param); |
171 | 222 | ||
172 | while (*p != NULL) { | 223 | while (*p != NULL) { |
173 | parent = *p; | 224 | parent = *p; |
174 | iter = rb_entry(parent, struct hist_entry, rb_node); | 225 | iter = rb_entry(parent, struct hist_entry, rb_node); |
175 | 226 | ||
176 | if (he->count > iter->count) | 227 | if (he->period > iter->period) |
177 | p = &(*p)->rb_left; | 228 | p = &(*p)->rb_left; |
178 | else | 229 | else |
179 | p = &(*p)->rb_right; | 230 | p = &(*p)->rb_right; |
180 | } | 231 | } |
181 | 232 | ||
182 | rb_link_node(&he->rb_node, parent, p); | 233 | rb_link_node(&he->rb_node, parent, p); |
183 | rb_insert_color(&he->rb_node, root); | 234 | rb_insert_color(&he->rb_node, entries); |
184 | } | 235 | } |
185 | 236 | ||
186 | void perf_session__output_resort(struct rb_root *hists, u64 total_samples) | 237 | void hists__output_resort(struct hists *self) |
187 | { | 238 | { |
188 | struct rb_root tmp; | 239 | struct rb_root tmp; |
189 | struct rb_node *next; | 240 | struct rb_node *next; |
190 | struct hist_entry *n; | 241 | struct hist_entry *n; |
191 | u64 min_callchain_hits; | 242 | u64 min_callchain_hits; |
192 | 243 | ||
193 | min_callchain_hits = | 244 | min_callchain_hits = self->stats.total_period * (callchain_param.min_percent / 100); |
194 | total_samples * (callchain_param.min_percent / 100); | ||
195 | 245 | ||
196 | tmp = RB_ROOT; | 246 | tmp = RB_ROOT; |
197 | next = rb_first(hists); | 247 | next = rb_first(&self->entries); |
248 | |||
249 | self->nr_entries = 0; | ||
250 | self->max_sym_namelen = 0; | ||
198 | 251 | ||
199 | while (next) { | 252 | while (next) { |
200 | n = rb_entry(next, struct hist_entry, rb_node); | 253 | n = rb_entry(next, struct hist_entry, rb_node); |
201 | next = rb_next(&n->rb_node); | 254 | next = rb_next(&n->rb_node); |
202 | 255 | ||
203 | rb_erase(&n->rb_node, hists); | 256 | rb_erase(&n->rb_node, &self->entries); |
204 | perf_session__insert_output_hist_entry(&tmp, n, | 257 | __hists__insert_output_entry(&tmp, n, min_callchain_hits); |
205 | min_callchain_hits); | 258 | hists__inc_nr_entries(self, n); |
206 | } | 259 | } |
207 | 260 | ||
208 | *hists = tmp; | 261 | self->entries = tmp; |
209 | } | 262 | } |
210 | 263 | ||
211 | static size_t callchain__fprintf_left_margin(FILE *fp, int left_margin) | 264 | static size_t callchain__fprintf_left_margin(FILE *fp, int left_margin) |
@@ -237,7 +290,7 @@ static size_t ipchain__fprintf_graph_line(FILE *fp, int depth, int depth_mask, | |||
237 | } | 290 | } |
238 | 291 | ||
239 | static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain, | 292 | static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain, |
240 | int depth, int depth_mask, int count, | 293 | int depth, int depth_mask, int period, |
241 | u64 total_samples, int hits, | 294 | u64 total_samples, int hits, |
242 | int left_margin) | 295 | int left_margin) |
243 | { | 296 | { |
@@ -250,7 +303,7 @@ static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain, | |||
250 | ret += fprintf(fp, "|"); | 303 | ret += fprintf(fp, "|"); |
251 | else | 304 | else |
252 | ret += fprintf(fp, " "); | 305 | ret += fprintf(fp, " "); |
253 | if (!count && i == depth - 1) { | 306 | if (!period && i == depth - 1) { |
254 | double percent; | 307 | double percent; |
255 | 308 | ||
256 | percent = hits * 100.0 / total_samples; | 309 | percent = hits * 100.0 / total_samples; |
@@ -258,8 +311,8 @@ static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain, | |||
258 | } else | 311 | } else |
259 | ret += fprintf(fp, "%s", " "); | 312 | ret += fprintf(fp, "%s", " "); |
260 | } | 313 | } |
261 | if (chain->sym) | 314 | if (chain->ms.sym) |
262 | ret += fprintf(fp, "%s\n", chain->sym->name); | 315 | ret += fprintf(fp, "%s\n", chain->ms.sym->name); |
263 | else | 316 | else |
264 | ret += fprintf(fp, "%p\n", (void *)(long)chain->ip); | 317 | ret += fprintf(fp, "%p\n", (void *)(long)chain->ip); |
265 | 318 | ||
@@ -278,7 +331,7 @@ static void init_rem_hits(void) | |||
278 | } | 331 | } |
279 | 332 | ||
280 | strcpy(rem_sq_bracket->name, "[...]"); | 333 | strcpy(rem_sq_bracket->name, "[...]"); |
281 | rem_hits.sym = rem_sq_bracket; | 334 | rem_hits.ms.sym = rem_sq_bracket; |
282 | } | 335 | } |
283 | 336 | ||
284 | static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | 337 | static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self, |
@@ -293,6 +346,7 @@ static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | |||
293 | u64 remaining; | 346 | u64 remaining; |
294 | size_t ret = 0; | 347 | size_t ret = 0; |
295 | int i; | 348 | int i; |
349 | uint entries_printed = 0; | ||
296 | 350 | ||
297 | if (callchain_param.mode == CHAIN_GRAPH_REL) | 351 | if (callchain_param.mode == CHAIN_GRAPH_REL) |
298 | new_total = self->children_hit; | 352 | new_total = self->children_hit; |
@@ -328,8 +382,6 @@ static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | |||
328 | left_margin); | 382 | left_margin); |
329 | i = 0; | 383 | i = 0; |
330 | list_for_each_entry(chain, &child->val, list) { | 384 | list_for_each_entry(chain, &child->val, list) { |
331 | if (chain->ip >= PERF_CONTEXT_MAX) | ||
332 | continue; | ||
333 | ret += ipchain__fprintf_graph(fp, chain, depth, | 385 | ret += ipchain__fprintf_graph(fp, chain, depth, |
334 | new_depth_mask, i++, | 386 | new_depth_mask, i++, |
335 | new_total, | 387 | new_total, |
@@ -341,6 +393,8 @@ static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | |||
341 | new_depth_mask | (1 << depth), | 393 | new_depth_mask | (1 << depth), |
342 | left_margin); | 394 | left_margin); |
343 | node = next; | 395 | node = next; |
396 | if (++entries_printed == callchain_param.print_limit) | ||
397 | break; | ||
344 | } | 398 | } |
345 | 399 | ||
346 | if (callchain_param.mode == CHAIN_GRAPH_REL && | 400 | if (callchain_param.mode == CHAIN_GRAPH_REL && |
@@ -366,11 +420,9 @@ static size_t callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | |||
366 | bool printed = false; | 420 | bool printed = false; |
367 | int i = 0; | 421 | int i = 0; |
368 | int ret = 0; | 422 | int ret = 0; |
423 | u32 entries_printed = 0; | ||
369 | 424 | ||
370 | list_for_each_entry(chain, &self->val, list) { | 425 | list_for_each_entry(chain, &self->val, list) { |
371 | if (chain->ip >= PERF_CONTEXT_MAX) | ||
372 | continue; | ||
373 | |||
374 | if (!i++ && sort__first_dimension == SORT_SYM) | 426 | if (!i++ && sort__first_dimension == SORT_SYM) |
375 | continue; | 427 | continue; |
376 | 428 | ||
@@ -385,10 +437,13 @@ static size_t callchain__fprintf_graph(FILE *fp, struct callchain_node *self, | |||
385 | } else | 437 | } else |
386 | ret += callchain__fprintf_left_margin(fp, left_margin); | 438 | ret += callchain__fprintf_left_margin(fp, left_margin); |
387 | 439 | ||
388 | if (chain->sym) | 440 | if (chain->ms.sym) |
389 | ret += fprintf(fp, " %s\n", chain->sym->name); | 441 | ret += fprintf(fp, " %s\n", chain->ms.sym->name); |
390 | else | 442 | else |
391 | ret += fprintf(fp, " %p\n", (void *)(long)chain->ip); | 443 | ret += fprintf(fp, " %p\n", (void *)(long)chain->ip); |
444 | |||
445 | if (++entries_printed == callchain_param.print_limit) | ||
446 | break; | ||
392 | } | 447 | } |
393 | 448 | ||
394 | ret += __callchain__fprintf_graph(fp, self, total_samples, 1, 1, left_margin); | 449 | ret += __callchain__fprintf_graph(fp, self, total_samples, 1, 1, left_margin); |
@@ -411,8 +466,8 @@ static size_t callchain__fprintf_flat(FILE *fp, struct callchain_node *self, | |||
411 | list_for_each_entry(chain, &self->val, list) { | 466 | list_for_each_entry(chain, &self->val, list) { |
412 | if (chain->ip >= PERF_CONTEXT_MAX) | 467 | if (chain->ip >= PERF_CONTEXT_MAX) |
413 | continue; | 468 | continue; |
414 | if (chain->sym) | 469 | if (chain->ms.sym) |
415 | ret += fprintf(fp, " %s\n", chain->sym->name); | 470 | ret += fprintf(fp, " %s\n", chain->ms.sym->name); |
416 | else | 471 | else |
417 | ret += fprintf(fp, " %p\n", | 472 | ret += fprintf(fp, " %p\n", |
418 | (void *)(long)chain->ip); | 473 | (void *)(long)chain->ip); |
@@ -427,6 +482,7 @@ static size_t hist_entry_callchain__fprintf(FILE *fp, struct hist_entry *self, | |||
427 | struct rb_node *rb_node; | 482 | struct rb_node *rb_node; |
428 | struct callchain_node *chain; | 483 | struct callchain_node *chain; |
429 | size_t ret = 0; | 484 | size_t ret = 0; |
485 | u32 entries_printed = 0; | ||
430 | 486 | ||
431 | rb_node = rb_first(&self->sorted_chain); | 487 | rb_node = rb_first(&self->sorted_chain); |
432 | while (rb_node) { | 488 | while (rb_node) { |
@@ -449,55 +505,88 @@ static size_t hist_entry_callchain__fprintf(FILE *fp, struct hist_entry *self, | |||
449 | break; | 505 | break; |
450 | } | 506 | } |
451 | ret += fprintf(fp, "\n"); | 507 | ret += fprintf(fp, "\n"); |
508 | if (++entries_printed == callchain_param.print_limit) | ||
509 | break; | ||
452 | rb_node = rb_next(rb_node); | 510 | rb_node = rb_next(rb_node); |
453 | } | 511 | } |
454 | 512 | ||
455 | return ret; | 513 | return ret; |
456 | } | 514 | } |
457 | 515 | ||
458 | static size_t hist_entry__fprintf(struct hist_entry *self, | 516 | int hist_entry__snprintf(struct hist_entry *self, char *s, size_t size, |
459 | struct perf_session *pair_session, | 517 | struct hists *pair_hists, bool show_displacement, |
460 | bool show_displacement, | 518 | long displacement, bool color, u64 session_total) |
461 | long displacement, FILE *fp, | ||
462 | u64 session_total) | ||
463 | { | 519 | { |
464 | struct sort_entry *se; | 520 | struct sort_entry *se; |
465 | u64 count, total; | 521 | u64 period, total, period_sys, period_us, period_guest_sys, period_guest_us; |
466 | const char *sep = symbol_conf.field_sep; | 522 | const char *sep = symbol_conf.field_sep; |
467 | size_t ret; | 523 | int ret; |
468 | 524 | ||
469 | if (symbol_conf.exclude_other && !self->parent) | 525 | if (symbol_conf.exclude_other && !self->parent) |
470 | return 0; | 526 | return 0; |
471 | 527 | ||
472 | if (pair_session) { | 528 | if (pair_hists) { |
473 | count = self->pair ? self->pair->count : 0; | 529 | period = self->pair ? self->pair->period : 0; |
474 | total = pair_session->events_stats.total; | 530 | total = pair_hists->stats.total_period; |
531 | period_sys = self->pair ? self->pair->period_sys : 0; | ||
532 | period_us = self->pair ? self->pair->period_us : 0; | ||
533 | period_guest_sys = self->pair ? self->pair->period_guest_sys : 0; | ||
534 | period_guest_us = self->pair ? self->pair->period_guest_us : 0; | ||
475 | } else { | 535 | } else { |
476 | count = self->count; | 536 | period = self->period; |
477 | total = session_total; | 537 | total = session_total; |
538 | period_sys = self->period_sys; | ||
539 | period_us = self->period_us; | ||
540 | period_guest_sys = self->period_guest_sys; | ||
541 | period_guest_us = self->period_guest_us; | ||
478 | } | 542 | } |
479 | 543 | ||
480 | if (total) | 544 | if (total) { |
481 | ret = percent_color_fprintf(fp, sep ? "%.2f" : " %6.2f%%", | 545 | if (color) |
482 | (count * 100.0) / total); | 546 | ret = percent_color_snprintf(s, size, |
483 | else | 547 | sep ? "%.2f" : " %6.2f%%", |
484 | ret = fprintf(fp, sep ? "%lld" : "%12lld ", count); | 548 | (period * 100.0) / total); |
549 | else | ||
550 | ret = snprintf(s, size, sep ? "%.2f" : " %6.2f%%", | ||
551 | (period * 100.0) / total); | ||
552 | if (symbol_conf.show_cpu_utilization) { | ||
553 | ret += percent_color_snprintf(s + ret, size - ret, | ||
554 | sep ? "%.2f" : " %6.2f%%", | ||
555 | (period_sys * 100.0) / total); | ||
556 | ret += percent_color_snprintf(s + ret, size - ret, | ||
557 | sep ? "%.2f" : " %6.2f%%", | ||
558 | (period_us * 100.0) / total); | ||
559 | if (perf_guest) { | ||
560 | ret += percent_color_snprintf(s + ret, | ||
561 | size - ret, | ||
562 | sep ? "%.2f" : " %6.2f%%", | ||
563 | (period_guest_sys * 100.0) / | ||
564 | total); | ||
565 | ret += percent_color_snprintf(s + ret, | ||
566 | size - ret, | ||
567 | sep ? "%.2f" : " %6.2f%%", | ||
568 | (period_guest_us * 100.0) / | ||
569 | total); | ||
570 | } | ||
571 | } | ||
572 | } else | ||
573 | ret = snprintf(s, size, sep ? "%lld" : "%12lld ", period); | ||
485 | 574 | ||
486 | if (symbol_conf.show_nr_samples) { | 575 | if (symbol_conf.show_nr_samples) { |
487 | if (sep) | 576 | if (sep) |
488 | fprintf(fp, "%c%lld", *sep, count); | 577 | ret += snprintf(s + ret, size - ret, "%c%lld", *sep, period); |
489 | else | 578 | else |
490 | fprintf(fp, "%11lld", count); | 579 | ret += snprintf(s + ret, size - ret, "%11lld", period); |
491 | } | 580 | } |
492 | 581 | ||
493 | if (pair_session) { | 582 | if (pair_hists) { |
494 | char bf[32]; | 583 | char bf[32]; |
495 | double old_percent = 0, new_percent = 0, diff; | 584 | double old_percent = 0, new_percent = 0, diff; |
496 | 585 | ||
497 | if (total > 0) | 586 | if (total > 0) |
498 | old_percent = (count * 100.0) / total; | 587 | old_percent = (period * 100.0) / total; |
499 | if (session_total > 0) | 588 | if (session_total > 0) |
500 | new_percent = (self->count * 100.0) / session_total; | 589 | new_percent = (self->period * 100.0) / session_total; |
501 | 590 | ||
502 | diff = new_percent - old_percent; | 591 | diff = new_percent - old_percent; |
503 | 592 | ||
@@ -507,9 +596,9 @@ static size_t hist_entry__fprintf(struct hist_entry *self, | |||
507 | snprintf(bf, sizeof(bf), " "); | 596 | snprintf(bf, sizeof(bf), " "); |
508 | 597 | ||
509 | if (sep) | 598 | if (sep) |
510 | ret += fprintf(fp, "%c%s", *sep, bf); | 599 | ret += snprintf(s + ret, size - ret, "%c%s", *sep, bf); |
511 | else | 600 | else |
512 | ret += fprintf(fp, "%11.11s", bf); | 601 | ret += snprintf(s + ret, size - ret, "%11.11s", bf); |
513 | 602 | ||
514 | if (show_displacement) { | 603 | if (show_displacement) { |
515 | if (displacement) | 604 | if (displacement) |
@@ -518,9 +607,9 @@ static size_t hist_entry__fprintf(struct hist_entry *self, | |||
518 | snprintf(bf, sizeof(bf), " "); | 607 | snprintf(bf, sizeof(bf), " "); |
519 | 608 | ||
520 | if (sep) | 609 | if (sep) |
521 | fprintf(fp, "%c%s", *sep, bf); | 610 | ret += snprintf(s + ret, size - ret, "%c%s", *sep, bf); |
522 | else | 611 | else |
523 | fprintf(fp, "%6.6s", bf); | 612 | ret += snprintf(s + ret, size - ret, "%6.6s", bf); |
524 | } | 613 | } |
525 | } | 614 | } |
526 | 615 | ||
@@ -528,33 +617,43 @@ static size_t hist_entry__fprintf(struct hist_entry *self, | |||
528 | if (se->elide) | 617 | if (se->elide) |
529 | continue; | 618 | continue; |
530 | 619 | ||
531 | fprintf(fp, "%s", sep ?: " "); | 620 | ret += snprintf(s + ret, size - ret, "%s", sep ?: " "); |
532 | ret += se->print(fp, self, se->width ? *se->width : 0); | 621 | ret += se->se_snprintf(self, s + ret, size - ret, |
622 | se->se_width ? *se->se_width : 0); | ||
533 | } | 623 | } |
534 | 624 | ||
535 | ret += fprintf(fp, "\n"); | 625 | return ret; |
626 | } | ||
536 | 627 | ||
537 | if (symbol_conf.use_callchain) { | 628 | int hist_entry__fprintf(struct hist_entry *self, struct hists *pair_hists, |
538 | int left_margin = 0; | 629 | bool show_displacement, long displacement, FILE *fp, |
630 | u64 session_total) | ||
631 | { | ||
632 | char bf[512]; | ||
633 | hist_entry__snprintf(self, bf, sizeof(bf), pair_hists, | ||
634 | show_displacement, displacement, | ||
635 | true, session_total); | ||
636 | return fprintf(fp, "%s\n", bf); | ||
637 | } | ||
539 | 638 | ||
540 | if (sort__first_dimension == SORT_COMM) { | 639 | static size_t hist_entry__fprintf_callchain(struct hist_entry *self, FILE *fp, |
541 | se = list_first_entry(&hist_entry__sort_list, typeof(*se), | 640 | u64 session_total) |
542 | list); | 641 | { |
543 | left_margin = se->width ? *se->width : 0; | 642 | int left_margin = 0; |
544 | left_margin -= thread__comm_len(self->thread); | ||
545 | } | ||
546 | 643 | ||
547 | hist_entry_callchain__fprintf(fp, self, session_total, | 644 | if (sort__first_dimension == SORT_COMM) { |
548 | left_margin); | 645 | struct sort_entry *se = list_first_entry(&hist_entry__sort_list, |
646 | typeof(*se), list); | ||
647 | left_margin = se->se_width ? *se->se_width : 0; | ||
648 | left_margin -= thread__comm_len(self->thread); | ||
549 | } | 649 | } |
550 | 650 | ||
551 | return ret; | 651 | return hist_entry_callchain__fprintf(fp, self, session_total, |
652 | left_margin); | ||
552 | } | 653 | } |
553 | 654 | ||
554 | size_t perf_session__fprintf_hists(struct rb_root *hists, | 655 | size_t hists__fprintf(struct hists *self, struct hists *pair, |
555 | struct perf_session *pair, | 656 | bool show_displacement, FILE *fp) |
556 | bool show_displacement, FILE *fp, | ||
557 | u64 session_total) | ||
558 | { | 657 | { |
559 | struct sort_entry *se; | 658 | struct sort_entry *se; |
560 | struct rb_node *nd; | 659 | struct rb_node *nd; |
@@ -576,6 +675,24 @@ size_t perf_session__fprintf_hists(struct rb_root *hists, | |||
576 | fputs(" Samples ", fp); | 675 | fputs(" Samples ", fp); |
577 | } | 676 | } |
578 | 677 | ||
678 | if (symbol_conf.show_cpu_utilization) { | ||
679 | if (sep) { | ||
680 | ret += fprintf(fp, "%csys", *sep); | ||
681 | ret += fprintf(fp, "%cus", *sep); | ||
682 | if (perf_guest) { | ||
683 | ret += fprintf(fp, "%cguest sys", *sep); | ||
684 | ret += fprintf(fp, "%cguest us", *sep); | ||
685 | } | ||
686 | } else { | ||
687 | ret += fprintf(fp, " sys "); | ||
688 | ret += fprintf(fp, " us "); | ||
689 | if (perf_guest) { | ||
690 | ret += fprintf(fp, " guest sys "); | ||
691 | ret += fprintf(fp, " guest us "); | ||
692 | } | ||
693 | } | ||
694 | } | ||
695 | |||
579 | if (pair) { | 696 | if (pair) { |
580 | if (sep) | 697 | if (sep) |
581 | ret += fprintf(fp, "%cDelta", *sep); | 698 | ret += fprintf(fp, "%cDelta", *sep); |
@@ -594,22 +711,22 @@ size_t perf_session__fprintf_hists(struct rb_root *hists, | |||
594 | if (se->elide) | 711 | if (se->elide) |
595 | continue; | 712 | continue; |
596 | if (sep) { | 713 | if (sep) { |
597 | fprintf(fp, "%c%s", *sep, se->header); | 714 | fprintf(fp, "%c%s", *sep, se->se_header); |
598 | continue; | 715 | continue; |
599 | } | 716 | } |
600 | width = strlen(se->header); | 717 | width = strlen(se->se_header); |
601 | if (se->width) { | 718 | if (se->se_width) { |
602 | if (symbol_conf.col_width_list_str) { | 719 | if (symbol_conf.col_width_list_str) { |
603 | if (col_width) { | 720 | if (col_width) { |
604 | *se->width = atoi(col_width); | 721 | *se->se_width = atoi(col_width); |
605 | col_width = strchr(col_width, ','); | 722 | col_width = strchr(col_width, ','); |
606 | if (col_width) | 723 | if (col_width) |
607 | ++col_width; | 724 | ++col_width; |
608 | } | 725 | } |
609 | } | 726 | } |
610 | width = *se->width = max(*se->width, width); | 727 | width = *se->se_width = max(*se->se_width, width); |
611 | } | 728 | } |
612 | fprintf(fp, " %*s", width, se->header); | 729 | fprintf(fp, " %*s", width, se->se_header); |
613 | } | 730 | } |
614 | fprintf(fp, "\n"); | 731 | fprintf(fp, "\n"); |
615 | 732 | ||
@@ -631,10 +748,10 @@ size_t perf_session__fprintf_hists(struct rb_root *hists, | |||
631 | continue; | 748 | continue; |
632 | 749 | ||
633 | fprintf(fp, " "); | 750 | fprintf(fp, " "); |
634 | if (se->width) | 751 | if (se->se_width) |
635 | width = *se->width; | 752 | width = *se->se_width; |
636 | else | 753 | else |
637 | width = strlen(se->header); | 754 | width = strlen(se->se_header); |
638 | for (i = 0; i < width; i++) | 755 | for (i = 0; i < width; i++) |
639 | fprintf(fp, "."); | 756 | fprintf(fp, "."); |
640 | } | 757 | } |
@@ -642,7 +759,7 @@ size_t perf_session__fprintf_hists(struct rb_root *hists, | |||
642 | fprintf(fp, "\n#\n"); | 759 | fprintf(fp, "\n#\n"); |
643 | 760 | ||
644 | print_entries: | 761 | print_entries: |
645 | for (nd = rb_first(hists); nd; nd = rb_next(nd)) { | 762 | for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) { |
646 | struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node); | 763 | struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node); |
647 | 764 | ||
648 | if (show_displacement) { | 765 | if (show_displacement) { |
@@ -654,10 +771,14 @@ print_entries: | |||
654 | ++position; | 771 | ++position; |
655 | } | 772 | } |
656 | ret += hist_entry__fprintf(h, pair, show_displacement, | 773 | ret += hist_entry__fprintf(h, pair, show_displacement, |
657 | displacement, fp, session_total); | 774 | displacement, fp, self->stats.total_period); |
658 | if (h->map == NULL && verbose > 1) { | 775 | |
776 | if (symbol_conf.use_callchain) | ||
777 | ret += hist_entry__fprintf_callchain(h, fp, self->stats.total_period); | ||
778 | |||
779 | if (h->ms.map == NULL && verbose > 1) { | ||
659 | __map_groups__fprintf_maps(&h->thread->mg, | 780 | __map_groups__fprintf_maps(&h->thread->mg, |
660 | MAP__FUNCTION, fp); | 781 | MAP__FUNCTION, verbose, fp); |
661 | fprintf(fp, "%.10s end\n", graph_dotted_line); | 782 | fprintf(fp, "%.10s end\n", graph_dotted_line); |
662 | } | 783 | } |
663 | } | 784 | } |
@@ -666,3 +787,271 @@ print_entries: | |||
666 | 787 | ||
667 | return ret; | 788 | return ret; |
668 | } | 789 | } |
790 | |||
791 | enum hist_filter { | ||
792 | HIST_FILTER__DSO, | ||
793 | HIST_FILTER__THREAD, | ||
794 | }; | ||
795 | |||
796 | void hists__filter_by_dso(struct hists *self, const struct dso *dso) | ||
797 | { | ||
798 | struct rb_node *nd; | ||
799 | |||
800 | self->nr_entries = self->stats.total_period = 0; | ||
801 | self->stats.nr_events[PERF_RECORD_SAMPLE] = 0; | ||
802 | self->max_sym_namelen = 0; | ||
803 | |||
804 | for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) { | ||
805 | struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node); | ||
806 | |||
807 | if (symbol_conf.exclude_other && !h->parent) | ||
808 | continue; | ||
809 | |||
810 | if (dso != NULL && (h->ms.map == NULL || h->ms.map->dso != dso)) { | ||
811 | h->filtered |= (1 << HIST_FILTER__DSO); | ||
812 | continue; | ||
813 | } | ||
814 | |||
815 | h->filtered &= ~(1 << HIST_FILTER__DSO); | ||
816 | if (!h->filtered) { | ||
817 | ++self->nr_entries; | ||
818 | self->stats.total_period += h->period; | ||
819 | self->stats.nr_events[PERF_RECORD_SAMPLE] += h->nr_events; | ||
820 | if (h->ms.sym && | ||
821 | self->max_sym_namelen < h->ms.sym->namelen) | ||
822 | self->max_sym_namelen = h->ms.sym->namelen; | ||
823 | } | ||
824 | } | ||
825 | } | ||
826 | |||
827 | void hists__filter_by_thread(struct hists *self, const struct thread *thread) | ||
828 | { | ||
829 | struct rb_node *nd; | ||
830 | |||
831 | self->nr_entries = self->stats.total_period = 0; | ||
832 | self->stats.nr_events[PERF_RECORD_SAMPLE] = 0; | ||
833 | self->max_sym_namelen = 0; | ||
834 | |||
835 | for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) { | ||
836 | struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node); | ||
837 | |||
838 | if (thread != NULL && h->thread != thread) { | ||
839 | h->filtered |= (1 << HIST_FILTER__THREAD); | ||
840 | continue; | ||
841 | } | ||
842 | h->filtered &= ~(1 << HIST_FILTER__THREAD); | ||
843 | if (!h->filtered) { | ||
844 | ++self->nr_entries; | ||
845 | self->stats.total_period += h->period; | ||
846 | self->stats.nr_events[PERF_RECORD_SAMPLE] += h->nr_events; | ||
847 | if (h->ms.sym && | ||
848 | self->max_sym_namelen < h->ms.sym->namelen) | ||
849 | self->max_sym_namelen = h->ms.sym->namelen; | ||
850 | } | ||
851 | } | ||
852 | } | ||
853 | |||
854 | static int symbol__alloc_hist(struct symbol *self) | ||
855 | { | ||
856 | struct sym_priv *priv = symbol__priv(self); | ||
857 | const int size = (sizeof(*priv->hist) + | ||
858 | (self->end - self->start) * sizeof(u64)); | ||
859 | |||
860 | priv->hist = zalloc(size); | ||
861 | return priv->hist == NULL ? -1 : 0; | ||
862 | } | ||
863 | |||
864 | int hist_entry__inc_addr_samples(struct hist_entry *self, u64 ip) | ||
865 | { | ||
866 | unsigned int sym_size, offset; | ||
867 | struct symbol *sym = self->ms.sym; | ||
868 | struct sym_priv *priv; | ||
869 | struct sym_hist *h; | ||
870 | |||
871 | if (!sym || !self->ms.map) | ||
872 | return 0; | ||
873 | |||
874 | priv = symbol__priv(sym); | ||
875 | if (priv->hist == NULL && symbol__alloc_hist(sym) < 0) | ||
876 | return -ENOMEM; | ||
877 | |||
878 | sym_size = sym->end - sym->start; | ||
879 | offset = ip - sym->start; | ||
880 | |||
881 | pr_debug3("%s: ip=%#Lx\n", __func__, self->ms.map->unmap_ip(self->ms.map, ip)); | ||
882 | |||
883 | if (offset >= sym_size) | ||
884 | return 0; | ||
885 | |||
886 | h = priv->hist; | ||
887 | h->sum++; | ||
888 | h->ip[offset]++; | ||
889 | |||
890 | pr_debug3("%#Lx %s: period++ [ip: %#Lx, %#Lx] => %Ld\n", self->ms.sym->start, | ||
891 | self->ms.sym->name, ip, ip - self->ms.sym->start, h->ip[offset]); | ||
892 | return 0; | ||
893 | } | ||
894 | |||
895 | static struct objdump_line *objdump_line__new(s64 offset, char *line) | ||
896 | { | ||
897 | struct objdump_line *self = malloc(sizeof(*self)); | ||
898 | |||
899 | if (self != NULL) { | ||
900 | self->offset = offset; | ||
901 | self->line = line; | ||
902 | } | ||
903 | |||
904 | return self; | ||
905 | } | ||
906 | |||
907 | void objdump_line__free(struct objdump_line *self) | ||
908 | { | ||
909 | free(self->line); | ||
910 | free(self); | ||
911 | } | ||
912 | |||
913 | static void objdump__add_line(struct list_head *head, struct objdump_line *line) | ||
914 | { | ||
915 | list_add_tail(&line->node, head); | ||
916 | } | ||
917 | |||
918 | struct objdump_line *objdump__get_next_ip_line(struct list_head *head, | ||
919 | struct objdump_line *pos) | ||
920 | { | ||
921 | list_for_each_entry_continue(pos, head, node) | ||
922 | if (pos->offset >= 0) | ||
923 | return pos; | ||
924 | |||
925 | return NULL; | ||
926 | } | ||
927 | |||
928 | static int hist_entry__parse_objdump_line(struct hist_entry *self, FILE *file, | ||
929 | struct list_head *head) | ||
930 | { | ||
931 | struct symbol *sym = self->ms.sym; | ||
932 | struct objdump_line *objdump_line; | ||
933 | char *line = NULL, *tmp, *tmp2, *c; | ||
934 | size_t line_len; | ||
935 | s64 line_ip, offset = -1; | ||
936 | |||
937 | if (getline(&line, &line_len, file) < 0) | ||
938 | return -1; | ||
939 | |||
940 | if (!line) | ||
941 | return -1; | ||
942 | |||
943 | while (line_len != 0 && isspace(line[line_len - 1])) | ||
944 | line[--line_len] = '\0'; | ||
945 | |||
946 | c = strchr(line, '\n'); | ||
947 | if (c) | ||
948 | *c = 0; | ||
949 | |||
950 | line_ip = -1; | ||
951 | |||
952 | /* | ||
953 | * Strip leading spaces: | ||
954 | */ | ||
955 | tmp = line; | ||
956 | while (*tmp) { | ||
957 | if (*tmp != ' ') | ||
958 | break; | ||
959 | tmp++; | ||
960 | } | ||
961 | |||
962 | if (*tmp) { | ||
963 | /* | ||
964 | * Parse hexadecimal addresses followed by ':' | ||
965 | */ | ||
966 | line_ip = strtoull(tmp, &tmp2, 16); | ||
967 | if (*tmp2 != ':') | ||
968 | line_ip = -1; | ||
969 | } | ||
970 | |||
971 | if (line_ip != -1) { | ||
972 | u64 start = map__rip_2objdump(self->ms.map, sym->start); | ||
973 | offset = line_ip - start; | ||
974 | } | ||
975 | |||
976 | objdump_line = objdump_line__new(offset, line); | ||
977 | if (objdump_line == NULL) { | ||
978 | free(line); | ||
979 | return -1; | ||
980 | } | ||
981 | objdump__add_line(head, objdump_line); | ||
982 | |||
983 | return 0; | ||
984 | } | ||
985 | |||
986 | int hist_entry__annotate(struct hist_entry *self, struct list_head *head) | ||
987 | { | ||
988 | struct symbol *sym = self->ms.sym; | ||
989 | struct map *map = self->ms.map; | ||
990 | struct dso *dso = map->dso; | ||
991 | const char *filename = dso->long_name; | ||
992 | char command[PATH_MAX * 2]; | ||
993 | FILE *file; | ||
994 | u64 len; | ||
995 | |||
996 | if (!filename) | ||
997 | return -1; | ||
998 | |||
999 | if (dso->origin == DSO__ORIG_KERNEL) { | ||
1000 | if (dso->annotate_warned) | ||
1001 | return 0; | ||
1002 | dso->annotate_warned = 1; | ||
1003 | pr_err("Can't annotate %s: No vmlinux file was found in the " | ||
1004 | "path:\n", sym->name); | ||
1005 | vmlinux_path__fprintf(stderr); | ||
1006 | return -1; | ||
1007 | } | ||
1008 | |||
1009 | pr_debug("%s: filename=%s, sym=%s, start=%#Lx, end=%#Lx\n", __func__, | ||
1010 | filename, sym->name, map->unmap_ip(map, sym->start), | ||
1011 | map->unmap_ip(map, sym->end)); | ||
1012 | |||
1013 | len = sym->end - sym->start; | ||
1014 | |||
1015 | pr_debug("annotating [%p] %30s : [%p] %30s\n", | ||
1016 | dso, dso->long_name, sym, sym->name); | ||
1017 | |||
1018 | snprintf(command, sizeof(command), | ||
1019 | "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s|expand", | ||
1020 | map__rip_2objdump(map, sym->start), | ||
1021 | map__rip_2objdump(map, sym->end), | ||
1022 | filename, filename); | ||
1023 | |||
1024 | pr_debug("Executing: %s\n", command); | ||
1025 | |||
1026 | file = popen(command, "r"); | ||
1027 | if (!file) | ||
1028 | return -1; | ||
1029 | |||
1030 | while (!feof(file)) | ||
1031 | if (hist_entry__parse_objdump_line(self, file, head) < 0) | ||
1032 | break; | ||
1033 | |||
1034 | pclose(file); | ||
1035 | return 0; | ||
1036 | } | ||
1037 | |||
1038 | void hists__inc_nr_events(struct hists *self, u32 type) | ||
1039 | { | ||
1040 | ++self->stats.nr_events[0]; | ||
1041 | ++self->stats.nr_events[type]; | ||
1042 | } | ||
1043 | |||
1044 | size_t hists__fprintf_nr_events(struct hists *self, FILE *fp) | ||
1045 | { | ||
1046 | int i; | ||
1047 | size_t ret = 0; | ||
1048 | |||
1049 | for (i = 0; i < PERF_RECORD_HEADER_MAX; ++i) { | ||
1050 | if (!event__name[i]) | ||
1051 | continue; | ||
1052 | ret += fprintf(fp, "%10s events: %10d\n", | ||
1053 | event__name[i], self->stats.nr_events[i]); | ||
1054 | } | ||
1055 | |||
1056 | return ret; | ||
1057 | } | ||
diff --git a/tools/perf/util/hist.h b/tools/perf/util/hist.h index 16f360cce5bf..6f17dcd8412c 100644 --- a/tools/perf/util/hist.h +++ b/tools/perf/util/hist.h | |||
@@ -6,24 +6,104 @@ | |||
6 | 6 | ||
7 | extern struct callchain_param callchain_param; | 7 | extern struct callchain_param callchain_param; |
8 | 8 | ||
9 | struct perf_session; | ||
10 | struct hist_entry; | 9 | struct hist_entry; |
11 | struct addr_location; | 10 | struct addr_location; |
12 | struct symbol; | 11 | struct symbol; |
13 | struct rb_root; | 12 | struct rb_root; |
14 | 13 | ||
15 | struct hist_entry *__perf_session__add_hist_entry(struct rb_root *hists, | 14 | struct objdump_line { |
16 | struct addr_location *al, | 15 | struct list_head node; |
17 | struct symbol *parent, | 16 | s64 offset; |
18 | u64 count, bool *hit); | 17 | char *line; |
18 | }; | ||
19 | |||
20 | void objdump_line__free(struct objdump_line *self); | ||
21 | struct objdump_line *objdump__get_next_ip_line(struct list_head *head, | ||
22 | struct objdump_line *pos); | ||
23 | |||
24 | struct sym_hist { | ||
25 | u64 sum; | ||
26 | u64 ip[0]; | ||
27 | }; | ||
28 | |||
29 | struct sym_ext { | ||
30 | struct rb_node node; | ||
31 | double percent; | ||
32 | char *path; | ||
33 | }; | ||
34 | |||
35 | struct sym_priv { | ||
36 | struct sym_hist *hist; | ||
37 | struct sym_ext *ext; | ||
38 | }; | ||
39 | |||
40 | /* | ||
41 | * The kernel collects the number of events it couldn't send in a stretch and | ||
42 | * when possible sends this number in a PERF_RECORD_LOST event. The number of | ||
43 | * such "chunks" of lost events is stored in .nr_events[PERF_RECORD_LOST] while | ||
44 | * total_lost tells exactly how many events the kernel in fact lost, i.e. it is | ||
45 | * the sum of all struct lost_event.lost fields reported. | ||
46 | * | ||
47 | * The total_period is needed because by default auto-freq is used, so | ||
48 | * multiplying nr_events[PERF_RECORD_SAMPLE] by a frequency isn't possible to get | ||
49 | * the total number of low level events, it is necessary to sum all struct | ||
50 | * sample_event.period and stash the result in total_period. | ||
51 | */ | ||
52 | struct events_stats { | ||
53 | u64 total_period; | ||
54 | u64 total_lost; | ||
55 | u32 nr_events[PERF_RECORD_HEADER_MAX]; | ||
56 | u32 nr_unknown_events; | ||
57 | }; | ||
58 | |||
59 | struct hists { | ||
60 | struct rb_node rb_node; | ||
61 | struct rb_root entries; | ||
62 | u64 nr_entries; | ||
63 | struct events_stats stats; | ||
64 | u64 config; | ||
65 | u64 event_stream; | ||
66 | u32 type; | ||
67 | u32 max_sym_namelen; | ||
68 | }; | ||
69 | |||
70 | struct hist_entry *__hists__add_entry(struct hists *self, | ||
71 | struct addr_location *al, | ||
72 | struct symbol *parent, u64 period); | ||
19 | extern int64_t hist_entry__cmp(struct hist_entry *, struct hist_entry *); | 73 | extern int64_t hist_entry__cmp(struct hist_entry *, struct hist_entry *); |
20 | extern int64_t hist_entry__collapse(struct hist_entry *, struct hist_entry *); | 74 | extern int64_t hist_entry__collapse(struct hist_entry *, struct hist_entry *); |
75 | int hist_entry__fprintf(struct hist_entry *self, struct hists *pair_hists, | ||
76 | bool show_displacement, long displacement, FILE *fp, | ||
77 | u64 total); | ||
78 | int hist_entry__snprintf(struct hist_entry *self, char *bf, size_t size, | ||
79 | struct hists *pair_hists, bool show_displacement, | ||
80 | long displacement, bool color, u64 total); | ||
21 | void hist_entry__free(struct hist_entry *); | 81 | void hist_entry__free(struct hist_entry *); |
22 | 82 | ||
23 | void perf_session__output_resort(struct rb_root *hists, u64 total_samples); | 83 | void hists__output_resort(struct hists *self); |
24 | void perf_session__collapse_resort(struct rb_root *hists); | 84 | void hists__collapse_resort(struct hists *self); |
25 | size_t perf_session__fprintf_hists(struct rb_root *hists, | 85 | |
26 | struct perf_session *pair, | 86 | void hists__inc_nr_events(struct hists *self, u32 type); |
27 | bool show_displacement, FILE *fp, | 87 | size_t hists__fprintf_nr_events(struct hists *self, FILE *fp); |
28 | u64 session_total); | 88 | |
89 | size_t hists__fprintf(struct hists *self, struct hists *pair, | ||
90 | bool show_displacement, FILE *fp); | ||
91 | |||
92 | int hist_entry__inc_addr_samples(struct hist_entry *self, u64 ip); | ||
93 | int hist_entry__annotate(struct hist_entry *self, struct list_head *head); | ||
94 | |||
95 | void hists__filter_by_dso(struct hists *self, const struct dso *dso); | ||
96 | void hists__filter_by_thread(struct hists *self, const struct thread *thread); | ||
97 | |||
98 | #ifdef NO_NEWT_SUPPORT | ||
99 | static inline int hists__browse(struct hists *self __used, | ||
100 | const char *helpline __used, | ||
101 | const char *input_name __used) | ||
102 | { | ||
103 | return 0; | ||
104 | } | ||
105 | #else | ||
106 | int hists__browse(struct hists *self, const char *helpline, | ||
107 | const char *input_name); | ||
108 | #endif | ||
29 | #endif /* __PERF_HIST_H */ | 109 | #endif /* __PERF_HIST_H */ |
diff --git a/tools/perf/util/hweight.c b/tools/perf/util/hweight.c new file mode 100644 index 000000000000..5c1d0d099f0d --- /dev/null +++ b/tools/perf/util/hweight.c | |||
@@ -0,0 +1,31 @@ | |||
1 | #include <linux/bitops.h> | ||
2 | |||
3 | /** | ||
4 | * hweightN - returns the hamming weight of an N-bit word | ||
5 | * @x: the word to weigh | ||
6 | * | ||
7 | * The Hamming Weight of a number is the total number of bits set in it. | ||
8 | */ | ||
9 | |||
10 | unsigned int hweight32(unsigned int w) | ||
11 | { | ||
12 | unsigned int res = w - ((w >> 1) & 0x55555555); | ||
13 | res = (res & 0x33333333) + ((res >> 2) & 0x33333333); | ||
14 | res = (res + (res >> 4)) & 0x0F0F0F0F; | ||
15 | res = res + (res >> 8); | ||
16 | return (res + (res >> 16)) & 0x000000FF; | ||
17 | } | ||
18 | |||
19 | unsigned long hweight64(__u64 w) | ||
20 | { | ||
21 | #if BITS_PER_LONG == 32 | ||
22 | return hweight32((unsigned int)(w >> 32)) + hweight32((unsigned int)w); | ||
23 | #elif BITS_PER_LONG == 64 | ||
24 | __u64 res = w - ((w >> 1) & 0x5555555555555555ul); | ||
25 | res = (res & 0x3333333333333333ul) + ((res >> 2) & 0x3333333333333333ul); | ||
26 | res = (res + (res >> 4)) & 0x0F0F0F0F0F0F0F0Ful; | ||
27 | res = res + (res >> 8); | ||
28 | res = res + (res >> 16); | ||
29 | return (res + (res >> 32)) & 0x00000000000000FFul; | ||
30 | #endif | ||
31 | } | ||
diff --git a/tools/perf/util/include/asm/bitops.h b/tools/perf/util/include/asm/bitops.h deleted file mode 100644 index 58e9817ffae0..000000000000 --- a/tools/perf/util/include/asm/bitops.h +++ /dev/null | |||
@@ -1,18 +0,0 @@ | |||
1 | #ifndef _PERF_ASM_BITOPS_H_ | ||
2 | #define _PERF_ASM_BITOPS_H_ | ||
3 | |||
4 | #include <sys/types.h> | ||
5 | #include "../../types.h" | ||
6 | #include <linux/compiler.h> | ||
7 | |||
8 | /* CHECKME: Not sure both always match */ | ||
9 | #define BITS_PER_LONG __WORDSIZE | ||
10 | |||
11 | #include "../../../../include/asm-generic/bitops/__fls.h" | ||
12 | #include "../../../../include/asm-generic/bitops/fls.h" | ||
13 | #include "../../../../include/asm-generic/bitops/fls64.h" | ||
14 | #include "../../../../include/asm-generic/bitops/__ffs.h" | ||
15 | #include "../../../../include/asm-generic/bitops/ffz.h" | ||
16 | #include "../../../../include/asm-generic/bitops/hweight.h" | ||
17 | |||
18 | #endif | ||
diff --git a/tools/perf/util/include/asm/hweight.h b/tools/perf/util/include/asm/hweight.h new file mode 100644 index 000000000000..36cf26d434a5 --- /dev/null +++ b/tools/perf/util/include/asm/hweight.h | |||
@@ -0,0 +1,8 @@ | |||
1 | #ifndef PERF_HWEIGHT_H | ||
2 | #define PERF_HWEIGHT_H | ||
3 | |||
4 | #include <linux/types.h> | ||
5 | unsigned int hweight32(unsigned int w); | ||
6 | unsigned long hweight64(__u64 w); | ||
7 | |||
8 | #endif /* PERF_HWEIGHT_H */ | ||
diff --git a/tools/perf/util/include/dwarf-regs.h b/tools/perf/util/include/dwarf-regs.h new file mode 100644 index 000000000000..cf6727e99c44 --- /dev/null +++ b/tools/perf/util/include/dwarf-regs.h | |||
@@ -0,0 +1,8 @@ | |||
1 | #ifndef _PERF_DWARF_REGS_H_ | ||
2 | #define _PERF_DWARF_REGS_H_ | ||
3 | |||
4 | #ifdef DWARF_SUPPORT | ||
5 | const char *get_arch_regstr(unsigned int n); | ||
6 | #endif | ||
7 | |||
8 | #endif | ||
diff --git a/tools/perf/util/include/linux/bitmap.h b/tools/perf/util/include/linux/bitmap.h index 94507639a8c4..eda4416efa0a 100644 --- a/tools/perf/util/include/linux/bitmap.h +++ b/tools/perf/util/include/linux/bitmap.h | |||
@@ -1,3 +1,35 @@ | |||
1 | #include "../../../../include/linux/bitmap.h" | 1 | #ifndef _PERF_BITOPS_H |
2 | #include "../../../../include/asm-generic/bitops/find.h" | 2 | #define _PERF_BITOPS_H |
3 | #include <linux/errno.h> | 3 | |
4 | #include <string.h> | ||
5 | #include <linux/bitops.h> | ||
6 | |||
7 | int __bitmap_weight(const unsigned long *bitmap, int bits); | ||
8 | |||
9 | #define BITMAP_LAST_WORD_MASK(nbits) \ | ||
10 | ( \ | ||
11 | ((nbits) % BITS_PER_LONG) ? \ | ||
12 | (1UL<<((nbits) % BITS_PER_LONG))-1 : ~0UL \ | ||
13 | ) | ||
14 | |||
15 | #define small_const_nbits(nbits) \ | ||
16 | (__builtin_constant_p(nbits) && (nbits) <= BITS_PER_LONG) | ||
17 | |||
18 | static inline void bitmap_zero(unsigned long *dst, int nbits) | ||
19 | { | ||
20 | if (small_const_nbits(nbits)) | ||
21 | *dst = 0UL; | ||
22 | else { | ||
23 | int len = BITS_TO_LONGS(nbits) * sizeof(unsigned long); | ||
24 | memset(dst, 0, len); | ||
25 | } | ||
26 | } | ||
27 | |||
28 | static inline int bitmap_weight(const unsigned long *src, int nbits) | ||
29 | { | ||
30 | if (small_const_nbits(nbits)) | ||
31 | return hweight_long(*src & BITMAP_LAST_WORD_MASK(nbits)); | ||
32 | return __bitmap_weight(src, nbits); | ||
33 | } | ||
34 | |||
35 | #endif /* _PERF_BITOPS_H */ | ||
diff --git a/tools/perf/util/include/linux/bitops.h b/tools/perf/util/include/linux/bitops.h index 8d63116e9435..bb4ac2e05385 100644 --- a/tools/perf/util/include/linux/bitops.h +++ b/tools/perf/util/include/linux/bitops.h | |||
@@ -1,13 +1,12 @@ | |||
1 | #ifndef _PERF_LINUX_BITOPS_H_ | 1 | #ifndef _PERF_LINUX_BITOPS_H_ |
2 | #define _PERF_LINUX_BITOPS_H_ | 2 | #define _PERF_LINUX_BITOPS_H_ |
3 | 3 | ||
4 | #define __KERNEL__ | 4 | #include <linux/kernel.h> |
5 | #include <asm/hweight.h> | ||
5 | 6 | ||
6 | #define CONFIG_GENERIC_FIND_NEXT_BIT | 7 | #define BITS_PER_LONG __WORDSIZE |
7 | #define CONFIG_GENERIC_FIND_FIRST_BIT | 8 | #define BITS_PER_BYTE 8 |
8 | #include "../../../../include/linux/bitops.h" | 9 | #define BITS_TO_LONGS(nr) DIV_ROUND_UP(nr, BITS_PER_BYTE * sizeof(long)) |
9 | |||
10 | #undef __KERNEL__ | ||
11 | 10 | ||
12 | static inline void set_bit(int nr, unsigned long *addr) | 11 | static inline void set_bit(int nr, unsigned long *addr) |
13 | { | 12 | { |
@@ -20,10 +19,9 @@ static __always_inline int test_bit(unsigned int nr, const unsigned long *addr) | |||
20 | (((unsigned long *)addr)[nr / BITS_PER_LONG])) != 0; | 19 | (((unsigned long *)addr)[nr / BITS_PER_LONG])) != 0; |
21 | } | 20 | } |
22 | 21 | ||
23 | unsigned long generic_find_next_zero_le_bit(const unsigned long *addr, unsigned | 22 | static inline unsigned long hweight_long(unsigned long w) |
24 | long size, unsigned long offset); | 23 | { |
25 | 24 | return sizeof(w) == 4 ? hweight32(w) : hweight64(w); | |
26 | unsigned long generic_find_next_le_bit(const unsigned long *addr, unsigned | 25 | } |
27 | long size, unsigned long offset); | ||
28 | 26 | ||
29 | #endif | 27 | #endif |
diff --git a/tools/perf/util/include/linux/compiler.h b/tools/perf/util/include/linux/compiler.h index dfb0713ed47f..791f9dd27ebf 100644 --- a/tools/perf/util/include/linux/compiler.h +++ b/tools/perf/util/include/linux/compiler.h | |||
@@ -7,4 +7,6 @@ | |||
7 | #define __user | 7 | #define __user |
8 | #define __attribute_const__ | 8 | #define __attribute_const__ |
9 | 9 | ||
10 | #define __used __attribute__((__unused__)) | ||
11 | |||
10 | #endif | 12 | #endif |
diff --git a/tools/perf/util/include/linux/kernel.h b/tools/perf/util/include/linux/kernel.h index f2611655ab51..388ab1bfd114 100644 --- a/tools/perf/util/include/linux/kernel.h +++ b/tools/perf/util/include/linux/kernel.h | |||
@@ -85,16 +85,19 @@ simple_strtoul(const char *nptr, char **endptr, int base) | |||
85 | return strtoul(nptr, endptr, base); | 85 | return strtoul(nptr, endptr, base); |
86 | } | 86 | } |
87 | 87 | ||
88 | int eprintf(int level, | ||
89 | const char *fmt, ...) __attribute__((format(printf, 2, 3))); | ||
90 | |||
88 | #ifndef pr_fmt | 91 | #ifndef pr_fmt |
89 | #define pr_fmt(fmt) fmt | 92 | #define pr_fmt(fmt) fmt |
90 | #endif | 93 | #endif |
91 | 94 | ||
92 | #define pr_err(fmt, ...) \ | 95 | #define pr_err(fmt, ...) \ |
93 | do { fprintf(stderr, pr_fmt(fmt), ##__VA_ARGS__); } while (0) | 96 | eprintf(0, pr_fmt(fmt), ##__VA_ARGS__) |
94 | #define pr_warning(fmt, ...) \ | 97 | #define pr_warning(fmt, ...) \ |
95 | do { fprintf(stderr, pr_fmt(fmt), ##__VA_ARGS__); } while (0) | 98 | eprintf(0, pr_fmt(fmt), ##__VA_ARGS__) |
96 | #define pr_info(fmt, ...) \ | 99 | #define pr_info(fmt, ...) \ |
97 | do { fprintf(stderr, pr_fmt(fmt), ##__VA_ARGS__); } while (0) | 100 | eprintf(0, pr_fmt(fmt), ##__VA_ARGS__) |
98 | #define pr_debug(fmt, ...) \ | 101 | #define pr_debug(fmt, ...) \ |
99 | eprintf(1, pr_fmt(fmt), ##__VA_ARGS__) | 102 | eprintf(1, pr_fmt(fmt), ##__VA_ARGS__) |
100 | #define pr_debugN(n, fmt, ...) \ | 103 | #define pr_debugN(n, fmt, ...) \ |
diff --git a/tools/perf/util/map.c b/tools/perf/util/map.c index e509cd59c67d..e672f2fef65b 100644 --- a/tools/perf/util/map.c +++ b/tools/perf/util/map.c | |||
@@ -1,9 +1,11 @@ | |||
1 | #include "event.h" | ||
2 | #include "symbol.h" | 1 | #include "symbol.h" |
2 | #include <errno.h> | ||
3 | #include <limits.h> | ||
3 | #include <stdlib.h> | 4 | #include <stdlib.h> |
4 | #include <string.h> | 5 | #include <string.h> |
5 | #include <stdio.h> | 6 | #include <stdio.h> |
6 | #include "debug.h" | 7 | #include <unistd.h> |
8 | #include "map.h" | ||
7 | 9 | ||
8 | const char *map_type__name[MAP__NR_TYPES] = { | 10 | const char *map_type__name[MAP__NR_TYPES] = { |
9 | [MAP__FUNCTION] = "Functions", | 11 | [MAP__FUNCTION] = "Functions", |
@@ -36,15 +38,16 @@ void map__init(struct map *self, enum map_type type, | |||
36 | self->map_ip = map__map_ip; | 38 | self->map_ip = map__map_ip; |
37 | self->unmap_ip = map__unmap_ip; | 39 | self->unmap_ip = map__unmap_ip; |
38 | RB_CLEAR_NODE(&self->rb_node); | 40 | RB_CLEAR_NODE(&self->rb_node); |
41 | self->groups = NULL; | ||
39 | } | 42 | } |
40 | 43 | ||
41 | struct map *map__new(struct mmap_event *event, enum map_type type, | 44 | struct map *map__new(struct list_head *dsos__list, u64 start, u64 len, |
42 | char *cwd, int cwdlen) | 45 | u64 pgoff, u32 pid, char *filename, |
46 | enum map_type type, char *cwd, int cwdlen) | ||
43 | { | 47 | { |
44 | struct map *self = malloc(sizeof(*self)); | 48 | struct map *self = malloc(sizeof(*self)); |
45 | 49 | ||
46 | if (self != NULL) { | 50 | if (self != NULL) { |
47 | const char *filename = event->filename; | ||
48 | char newfilename[PATH_MAX]; | 51 | char newfilename[PATH_MAX]; |
49 | struct dso *dso; | 52 | struct dso *dso; |
50 | int anon; | 53 | int anon; |
@@ -62,16 +65,15 @@ struct map *map__new(struct mmap_event *event, enum map_type type, | |||
62 | anon = is_anon_memory(filename); | 65 | anon = is_anon_memory(filename); |
63 | 66 | ||
64 | if (anon) { | 67 | if (anon) { |
65 | snprintf(newfilename, sizeof(newfilename), "/tmp/perf-%d.map", event->pid); | 68 | snprintf(newfilename, sizeof(newfilename), "/tmp/perf-%d.map", pid); |
66 | filename = newfilename; | 69 | filename = newfilename; |
67 | } | 70 | } |
68 | 71 | ||
69 | dso = dsos__findnew(filename); | 72 | dso = __dsos__findnew(dsos__list, filename); |
70 | if (dso == NULL) | 73 | if (dso == NULL) |
71 | goto out_delete; | 74 | goto out_delete; |
72 | 75 | ||
73 | map__init(self, type, event->start, event->start + event->len, | 76 | map__init(self, type, start, start + len, pgoff, dso); |
74 | event->pgoff, dso); | ||
75 | 77 | ||
76 | if (anon) { | 78 | if (anon) { |
77 | set_identity: | 79 | set_identity: |
@@ -235,3 +237,392 @@ u64 map__objdump_2ip(struct map *map, u64 addr) | |||
235 | map->unmap_ip(map, addr); /* RIP -> IP */ | 237 | map->unmap_ip(map, addr); /* RIP -> IP */ |
236 | return ip; | 238 | return ip; |
237 | } | 239 | } |
240 | |||
241 | void map_groups__init(struct map_groups *self) | ||
242 | { | ||
243 | int i; | ||
244 | for (i = 0; i < MAP__NR_TYPES; ++i) { | ||
245 | self->maps[i] = RB_ROOT; | ||
246 | INIT_LIST_HEAD(&self->removed_maps[i]); | ||
247 | } | ||
248 | self->machine = NULL; | ||
249 | } | ||
250 | |||
251 | void map_groups__flush(struct map_groups *self) | ||
252 | { | ||
253 | int type; | ||
254 | |||
255 | for (type = 0; type < MAP__NR_TYPES; type++) { | ||
256 | struct rb_root *root = &self->maps[type]; | ||
257 | struct rb_node *next = rb_first(root); | ||
258 | |||
259 | while (next) { | ||
260 | struct map *pos = rb_entry(next, struct map, rb_node); | ||
261 | next = rb_next(&pos->rb_node); | ||
262 | rb_erase(&pos->rb_node, root); | ||
263 | /* | ||
264 | * We may have references to this map, for | ||
265 | * instance in some hist_entry instances, so | ||
266 | * just move them to a separate list. | ||
267 | */ | ||
268 | list_add_tail(&pos->node, &self->removed_maps[pos->type]); | ||
269 | } | ||
270 | } | ||
271 | } | ||
272 | |||
273 | struct symbol *map_groups__find_symbol(struct map_groups *self, | ||
274 | enum map_type type, u64 addr, | ||
275 | struct map **mapp, | ||
276 | symbol_filter_t filter) | ||
277 | { | ||
278 | struct map *map = map_groups__find(self, type, addr); | ||
279 | |||
280 | if (map != NULL) { | ||
281 | if (mapp != NULL) | ||
282 | *mapp = map; | ||
283 | return map__find_symbol(map, map->map_ip(map, addr), filter); | ||
284 | } | ||
285 | |||
286 | return NULL; | ||
287 | } | ||
288 | |||
289 | struct symbol *map_groups__find_symbol_by_name(struct map_groups *self, | ||
290 | enum map_type type, | ||
291 | const char *name, | ||
292 | struct map **mapp, | ||
293 | symbol_filter_t filter) | ||
294 | { | ||
295 | struct rb_node *nd; | ||
296 | |||
297 | for (nd = rb_first(&self->maps[type]); nd; nd = rb_next(nd)) { | ||
298 | struct map *pos = rb_entry(nd, struct map, rb_node); | ||
299 | struct symbol *sym = map__find_symbol_by_name(pos, name, filter); | ||
300 | |||
301 | if (sym == NULL) | ||
302 | continue; | ||
303 | if (mapp != NULL) | ||
304 | *mapp = pos; | ||
305 | return sym; | ||
306 | } | ||
307 | |||
308 | return NULL; | ||
309 | } | ||
310 | |||
311 | size_t __map_groups__fprintf_maps(struct map_groups *self, | ||
312 | enum map_type type, int verbose, FILE *fp) | ||
313 | { | ||
314 | size_t printed = fprintf(fp, "%s:\n", map_type__name[type]); | ||
315 | struct rb_node *nd; | ||
316 | |||
317 | for (nd = rb_first(&self->maps[type]); nd; nd = rb_next(nd)) { | ||
318 | struct map *pos = rb_entry(nd, struct map, rb_node); | ||
319 | printed += fprintf(fp, "Map:"); | ||
320 | printed += map__fprintf(pos, fp); | ||
321 | if (verbose > 2) { | ||
322 | printed += dso__fprintf(pos->dso, type, fp); | ||
323 | printed += fprintf(fp, "--\n"); | ||
324 | } | ||
325 | } | ||
326 | |||
327 | return printed; | ||
328 | } | ||
329 | |||
330 | size_t map_groups__fprintf_maps(struct map_groups *self, int verbose, FILE *fp) | ||
331 | { | ||
332 | size_t printed = 0, i; | ||
333 | for (i = 0; i < MAP__NR_TYPES; ++i) | ||
334 | printed += __map_groups__fprintf_maps(self, i, verbose, fp); | ||
335 | return printed; | ||
336 | } | ||
337 | |||
338 | static size_t __map_groups__fprintf_removed_maps(struct map_groups *self, | ||
339 | enum map_type type, | ||
340 | int verbose, FILE *fp) | ||
341 | { | ||
342 | struct map *pos; | ||
343 | size_t printed = 0; | ||
344 | |||
345 | list_for_each_entry(pos, &self->removed_maps[type], node) { | ||
346 | printed += fprintf(fp, "Map:"); | ||
347 | printed += map__fprintf(pos, fp); | ||
348 | if (verbose > 1) { | ||
349 | printed += dso__fprintf(pos->dso, type, fp); | ||
350 | printed += fprintf(fp, "--\n"); | ||
351 | } | ||
352 | } | ||
353 | return printed; | ||
354 | } | ||
355 | |||
356 | static size_t map_groups__fprintf_removed_maps(struct map_groups *self, | ||
357 | int verbose, FILE *fp) | ||
358 | { | ||
359 | size_t printed = 0, i; | ||
360 | for (i = 0; i < MAP__NR_TYPES; ++i) | ||
361 | printed += __map_groups__fprintf_removed_maps(self, i, verbose, fp); | ||
362 | return printed; | ||
363 | } | ||
364 | |||
365 | size_t map_groups__fprintf(struct map_groups *self, int verbose, FILE *fp) | ||
366 | { | ||
367 | size_t printed = map_groups__fprintf_maps(self, verbose, fp); | ||
368 | printed += fprintf(fp, "Removed maps:\n"); | ||
369 | return printed + map_groups__fprintf_removed_maps(self, verbose, fp); | ||
370 | } | ||
371 | |||
372 | int map_groups__fixup_overlappings(struct map_groups *self, struct map *map, | ||
373 | int verbose, FILE *fp) | ||
374 | { | ||
375 | struct rb_root *root = &self->maps[map->type]; | ||
376 | struct rb_node *next = rb_first(root); | ||
377 | |||
378 | while (next) { | ||
379 | struct map *pos = rb_entry(next, struct map, rb_node); | ||
380 | next = rb_next(&pos->rb_node); | ||
381 | |||
382 | if (!map__overlap(pos, map)) | ||
383 | continue; | ||
384 | |||
385 | if (verbose >= 2) { | ||
386 | fputs("overlapping maps:\n", fp); | ||
387 | map__fprintf(map, fp); | ||
388 | map__fprintf(pos, fp); | ||
389 | } | ||
390 | |||
391 | rb_erase(&pos->rb_node, root); | ||
392 | /* | ||
393 | * We may have references to this map, for instance in some | ||
394 | * hist_entry instances, so just move them to a separate | ||
395 | * list. | ||
396 | */ | ||
397 | list_add_tail(&pos->node, &self->removed_maps[map->type]); | ||
398 | /* | ||
399 | * Now check if we need to create new maps for areas not | ||
400 | * overlapped by the new map: | ||
401 | */ | ||
402 | if (map->start > pos->start) { | ||
403 | struct map *before = map__clone(pos); | ||
404 | |||
405 | if (before == NULL) | ||
406 | return -ENOMEM; | ||
407 | |||
408 | before->end = map->start - 1; | ||
409 | map_groups__insert(self, before); | ||
410 | if (verbose >= 2) | ||
411 | map__fprintf(before, fp); | ||
412 | } | ||
413 | |||
414 | if (map->end < pos->end) { | ||
415 | struct map *after = map__clone(pos); | ||
416 | |||
417 | if (after == NULL) | ||
418 | return -ENOMEM; | ||
419 | |||
420 | after->start = map->end + 1; | ||
421 | map_groups__insert(self, after); | ||
422 | if (verbose >= 2) | ||
423 | map__fprintf(after, fp); | ||
424 | } | ||
425 | } | ||
426 | |||
427 | return 0; | ||
428 | } | ||
429 | |||
430 | /* | ||
431 | * XXX This should not really _copy_ te maps, but refcount them. | ||
432 | */ | ||
433 | int map_groups__clone(struct map_groups *self, | ||
434 | struct map_groups *parent, enum map_type type) | ||
435 | { | ||
436 | struct rb_node *nd; | ||
437 | for (nd = rb_first(&parent->maps[type]); nd; nd = rb_next(nd)) { | ||
438 | struct map *map = rb_entry(nd, struct map, rb_node); | ||
439 | struct map *new = map__clone(map); | ||
440 | if (new == NULL) | ||
441 | return -ENOMEM; | ||
442 | map_groups__insert(self, new); | ||
443 | } | ||
444 | return 0; | ||
445 | } | ||
446 | |||
447 | static u64 map__reloc_map_ip(struct map *map, u64 ip) | ||
448 | { | ||
449 | return ip + (s64)map->pgoff; | ||
450 | } | ||
451 | |||
452 | static u64 map__reloc_unmap_ip(struct map *map, u64 ip) | ||
453 | { | ||
454 | return ip - (s64)map->pgoff; | ||
455 | } | ||
456 | |||
457 | void map__reloc_vmlinux(struct map *self) | ||
458 | { | ||
459 | struct kmap *kmap = map__kmap(self); | ||
460 | s64 reloc; | ||
461 | |||
462 | if (!kmap->ref_reloc_sym || !kmap->ref_reloc_sym->unrelocated_addr) | ||
463 | return; | ||
464 | |||
465 | reloc = (kmap->ref_reloc_sym->unrelocated_addr - | ||
466 | kmap->ref_reloc_sym->addr); | ||
467 | |||
468 | if (!reloc) | ||
469 | return; | ||
470 | |||
471 | self->map_ip = map__reloc_map_ip; | ||
472 | self->unmap_ip = map__reloc_unmap_ip; | ||
473 | self->pgoff = reloc; | ||
474 | } | ||
475 | |||
476 | void maps__insert(struct rb_root *maps, struct map *map) | ||
477 | { | ||
478 | struct rb_node **p = &maps->rb_node; | ||
479 | struct rb_node *parent = NULL; | ||
480 | const u64 ip = map->start; | ||
481 | struct map *m; | ||
482 | |||
483 | while (*p != NULL) { | ||
484 | parent = *p; | ||
485 | m = rb_entry(parent, struct map, rb_node); | ||
486 | if (ip < m->start) | ||
487 | p = &(*p)->rb_left; | ||
488 | else | ||
489 | p = &(*p)->rb_right; | ||
490 | } | ||
491 | |||
492 | rb_link_node(&map->rb_node, parent, p); | ||
493 | rb_insert_color(&map->rb_node, maps); | ||
494 | } | ||
495 | |||
496 | struct map *maps__find(struct rb_root *maps, u64 ip) | ||
497 | { | ||
498 | struct rb_node **p = &maps->rb_node; | ||
499 | struct rb_node *parent = NULL; | ||
500 | struct map *m; | ||
501 | |||
502 | while (*p != NULL) { | ||
503 | parent = *p; | ||
504 | m = rb_entry(parent, struct map, rb_node); | ||
505 | if (ip < m->start) | ||
506 | p = &(*p)->rb_left; | ||
507 | else if (ip > m->end) | ||
508 | p = &(*p)->rb_right; | ||
509 | else | ||
510 | return m; | ||
511 | } | ||
512 | |||
513 | return NULL; | ||
514 | } | ||
515 | |||
516 | int machine__init(struct machine *self, const char *root_dir, pid_t pid) | ||
517 | { | ||
518 | map_groups__init(&self->kmaps); | ||
519 | RB_CLEAR_NODE(&self->rb_node); | ||
520 | INIT_LIST_HEAD(&self->user_dsos); | ||
521 | INIT_LIST_HEAD(&self->kernel_dsos); | ||
522 | |||
523 | self->kmaps.machine = self; | ||
524 | self->pid = pid; | ||
525 | self->root_dir = strdup(root_dir); | ||
526 | return self->root_dir == NULL ? -ENOMEM : 0; | ||
527 | } | ||
528 | |||
529 | struct machine *machines__add(struct rb_root *self, pid_t pid, | ||
530 | const char *root_dir) | ||
531 | { | ||
532 | struct rb_node **p = &self->rb_node; | ||
533 | struct rb_node *parent = NULL; | ||
534 | struct machine *pos, *machine = malloc(sizeof(*machine)); | ||
535 | |||
536 | if (!machine) | ||
537 | return NULL; | ||
538 | |||
539 | if (machine__init(machine, root_dir, pid) != 0) { | ||
540 | free(machine); | ||
541 | return NULL; | ||
542 | } | ||
543 | |||
544 | while (*p != NULL) { | ||
545 | parent = *p; | ||
546 | pos = rb_entry(parent, struct machine, rb_node); | ||
547 | if (pid < pos->pid) | ||
548 | p = &(*p)->rb_left; | ||
549 | else | ||
550 | p = &(*p)->rb_right; | ||
551 | } | ||
552 | |||
553 | rb_link_node(&machine->rb_node, parent, p); | ||
554 | rb_insert_color(&machine->rb_node, self); | ||
555 | |||
556 | return machine; | ||
557 | } | ||
558 | |||
559 | struct machine *machines__find(struct rb_root *self, pid_t pid) | ||
560 | { | ||
561 | struct rb_node **p = &self->rb_node; | ||
562 | struct rb_node *parent = NULL; | ||
563 | struct machine *machine; | ||
564 | struct machine *default_machine = NULL; | ||
565 | |||
566 | while (*p != NULL) { | ||
567 | parent = *p; | ||
568 | machine = rb_entry(parent, struct machine, rb_node); | ||
569 | if (pid < machine->pid) | ||
570 | p = &(*p)->rb_left; | ||
571 | else if (pid > machine->pid) | ||
572 | p = &(*p)->rb_right; | ||
573 | else | ||
574 | return machine; | ||
575 | if (!machine->pid) | ||
576 | default_machine = machine; | ||
577 | } | ||
578 | |||
579 | return default_machine; | ||
580 | } | ||
581 | |||
582 | struct machine *machines__findnew(struct rb_root *self, pid_t pid) | ||
583 | { | ||
584 | char path[PATH_MAX]; | ||
585 | const char *root_dir; | ||
586 | struct machine *machine = machines__find(self, pid); | ||
587 | |||
588 | if (!machine || machine->pid != pid) { | ||
589 | if (pid == HOST_KERNEL_ID || pid == DEFAULT_GUEST_KERNEL_ID) | ||
590 | root_dir = ""; | ||
591 | else { | ||
592 | if (!symbol_conf.guestmount) | ||
593 | goto out; | ||
594 | sprintf(path, "%s/%d", symbol_conf.guestmount, pid); | ||
595 | if (access(path, R_OK)) { | ||
596 | pr_err("Can't access file %s\n", path); | ||
597 | goto out; | ||
598 | } | ||
599 | root_dir = path; | ||
600 | } | ||
601 | machine = machines__add(self, pid, root_dir); | ||
602 | } | ||
603 | |||
604 | out: | ||
605 | return machine; | ||
606 | } | ||
607 | |||
608 | void machines__process(struct rb_root *self, machine__process_t process, void *data) | ||
609 | { | ||
610 | struct rb_node *nd; | ||
611 | |||
612 | for (nd = rb_first(self); nd; nd = rb_next(nd)) { | ||
613 | struct machine *pos = rb_entry(nd, struct machine, rb_node); | ||
614 | process(pos, data); | ||
615 | } | ||
616 | } | ||
617 | |||
618 | char *machine__mmap_name(struct machine *self, char *bf, size_t size) | ||
619 | { | ||
620 | if (machine__is_host(self)) | ||
621 | snprintf(bf, size, "[%s]", "kernel.kallsyms"); | ||
622 | else if (machine__is_default_guest(self)) | ||
623 | snprintf(bf, size, "[%s]", "guest.kernel.kallsyms"); | ||
624 | else | ||
625 | snprintf(bf, size, "[%s.%d]", "guest.kernel.kallsyms", self->pid); | ||
626 | |||
627 | return bf; | ||
628 | } | ||
diff --git a/tools/perf/util/map.h b/tools/perf/util/map.h index b756368076c6..f39134512829 100644 --- a/tools/perf/util/map.h +++ b/tools/perf/util/map.h | |||
@@ -4,7 +4,9 @@ | |||
4 | #include <linux/compiler.h> | 4 | #include <linux/compiler.h> |
5 | #include <linux/list.h> | 5 | #include <linux/list.h> |
6 | #include <linux/rbtree.h> | 6 | #include <linux/rbtree.h> |
7 | #include <linux/types.h> | 7 | #include <stdio.h> |
8 | #include <stdbool.h> | ||
9 | #include "types.h" | ||
8 | 10 | ||
9 | enum map_type { | 11 | enum map_type { |
10 | MAP__FUNCTION = 0, | 12 | MAP__FUNCTION = 0, |
@@ -18,6 +20,7 @@ extern const char *map_type__name[MAP__NR_TYPES]; | |||
18 | struct dso; | 20 | struct dso; |
19 | struct ref_reloc_sym; | 21 | struct ref_reloc_sym; |
20 | struct map_groups; | 22 | struct map_groups; |
23 | struct machine; | ||
21 | 24 | ||
22 | struct map { | 25 | struct map { |
23 | union { | 26 | union { |
@@ -27,6 +30,7 @@ struct map { | |||
27 | u64 start; | 30 | u64 start; |
28 | u64 end; | 31 | u64 end; |
29 | enum map_type type; | 32 | enum map_type type; |
33 | u32 priv; | ||
30 | u64 pgoff; | 34 | u64 pgoff; |
31 | 35 | ||
32 | /* ip -> dso rip */ | 36 | /* ip -> dso rip */ |
@@ -35,6 +39,7 @@ struct map { | |||
35 | u64 (*unmap_ip)(struct map *, u64); | 39 | u64 (*unmap_ip)(struct map *, u64); |
36 | 40 | ||
37 | struct dso *dso; | 41 | struct dso *dso; |
42 | struct map_groups *groups; | ||
38 | }; | 43 | }; |
39 | 44 | ||
40 | struct kmap { | 45 | struct kmap { |
@@ -42,6 +47,32 @@ struct kmap { | |||
42 | struct map_groups *kmaps; | 47 | struct map_groups *kmaps; |
43 | }; | 48 | }; |
44 | 49 | ||
50 | struct map_groups { | ||
51 | struct rb_root maps[MAP__NR_TYPES]; | ||
52 | struct list_head removed_maps[MAP__NR_TYPES]; | ||
53 | struct machine *machine; | ||
54 | }; | ||
55 | |||
56 | /* Native host kernel uses -1 as pid index in machine */ | ||
57 | #define HOST_KERNEL_ID (-1) | ||
58 | #define DEFAULT_GUEST_KERNEL_ID (0) | ||
59 | |||
60 | struct machine { | ||
61 | struct rb_node rb_node; | ||
62 | pid_t pid; | ||
63 | char *root_dir; | ||
64 | struct list_head user_dsos; | ||
65 | struct list_head kernel_dsos; | ||
66 | struct map_groups kmaps; | ||
67 | struct map *vmlinux_maps[MAP__NR_TYPES]; | ||
68 | }; | ||
69 | |||
70 | static inline | ||
71 | struct map *machine__kernel_map(struct machine *self, enum map_type type) | ||
72 | { | ||
73 | return self->vmlinux_maps[type]; | ||
74 | } | ||
75 | |||
45 | static inline struct kmap *map__kmap(struct map *self) | 76 | static inline struct kmap *map__kmap(struct map *self) |
46 | { | 77 | { |
47 | return (struct kmap *)(self + 1); | 78 | return (struct kmap *)(self + 1); |
@@ -68,14 +99,14 @@ u64 map__rip_2objdump(struct map *map, u64 rip); | |||
68 | u64 map__objdump_2ip(struct map *map, u64 addr); | 99 | u64 map__objdump_2ip(struct map *map, u64 addr); |
69 | 100 | ||
70 | struct symbol; | 101 | struct symbol; |
71 | struct mmap_event; | ||
72 | 102 | ||
73 | typedef int (*symbol_filter_t)(struct map *map, struct symbol *sym); | 103 | typedef int (*symbol_filter_t)(struct map *map, struct symbol *sym); |
74 | 104 | ||
75 | void map__init(struct map *self, enum map_type type, | 105 | void map__init(struct map *self, enum map_type type, |
76 | u64 start, u64 end, u64 pgoff, struct dso *dso); | 106 | u64 start, u64 end, u64 pgoff, struct dso *dso); |
77 | struct map *map__new(struct mmap_event *event, enum map_type, | 107 | struct map *map__new(struct list_head *dsos__list, u64 start, u64 len, |
78 | char *cwd, int cwdlen); | 108 | u64 pgoff, u32 pid, char *filename, |
109 | enum map_type type, char *cwd, int cwdlen); | ||
79 | void map__delete(struct map *self); | 110 | void map__delete(struct map *self); |
80 | struct map *map__clone(struct map *self); | 111 | struct map *map__clone(struct map *self); |
81 | int map__overlap(struct map *l, struct map *r); | 112 | int map__overlap(struct map *l, struct map *r); |
@@ -91,4 +122,96 @@ void map__fixup_end(struct map *self); | |||
91 | 122 | ||
92 | void map__reloc_vmlinux(struct map *self); | 123 | void map__reloc_vmlinux(struct map *self); |
93 | 124 | ||
125 | size_t __map_groups__fprintf_maps(struct map_groups *self, | ||
126 | enum map_type type, int verbose, FILE *fp); | ||
127 | void maps__insert(struct rb_root *maps, struct map *map); | ||
128 | struct map *maps__find(struct rb_root *maps, u64 addr); | ||
129 | void map_groups__init(struct map_groups *self); | ||
130 | int map_groups__clone(struct map_groups *self, | ||
131 | struct map_groups *parent, enum map_type type); | ||
132 | size_t map_groups__fprintf(struct map_groups *self, int verbose, FILE *fp); | ||
133 | size_t map_groups__fprintf_maps(struct map_groups *self, int verbose, FILE *fp); | ||
134 | |||
135 | typedef void (*machine__process_t)(struct machine *self, void *data); | ||
136 | |||
137 | void machines__process(struct rb_root *self, machine__process_t process, void *data); | ||
138 | struct machine *machines__add(struct rb_root *self, pid_t pid, | ||
139 | const char *root_dir); | ||
140 | struct machine *machines__find_host(struct rb_root *self); | ||
141 | struct machine *machines__find(struct rb_root *self, pid_t pid); | ||
142 | struct machine *machines__findnew(struct rb_root *self, pid_t pid); | ||
143 | char *machine__mmap_name(struct machine *self, char *bf, size_t size); | ||
144 | int machine__init(struct machine *self, const char *root_dir, pid_t pid); | ||
145 | |||
146 | /* | ||
147 | * Default guest kernel is defined by parameter --guestkallsyms | ||
148 | * and --guestmodules | ||
149 | */ | ||
150 | static inline bool machine__is_default_guest(struct machine *self) | ||
151 | { | ||
152 | return self ? self->pid == DEFAULT_GUEST_KERNEL_ID : false; | ||
153 | } | ||
154 | |||
155 | static inline bool machine__is_host(struct machine *self) | ||
156 | { | ||
157 | return self ? self->pid == HOST_KERNEL_ID : false; | ||
158 | } | ||
159 | |||
160 | static inline void map_groups__insert(struct map_groups *self, struct map *map) | ||
161 | { | ||
162 | maps__insert(&self->maps[map->type], map); | ||
163 | map->groups = self; | ||
164 | } | ||
165 | |||
166 | static inline struct map *map_groups__find(struct map_groups *self, | ||
167 | enum map_type type, u64 addr) | ||
168 | { | ||
169 | return maps__find(&self->maps[type], addr); | ||
170 | } | ||
171 | |||
172 | struct symbol *map_groups__find_symbol(struct map_groups *self, | ||
173 | enum map_type type, u64 addr, | ||
174 | struct map **mapp, | ||
175 | symbol_filter_t filter); | ||
176 | |||
177 | struct symbol *map_groups__find_symbol_by_name(struct map_groups *self, | ||
178 | enum map_type type, | ||
179 | const char *name, | ||
180 | struct map **mapp, | ||
181 | symbol_filter_t filter); | ||
182 | |||
183 | static inline | ||
184 | struct symbol *machine__find_kernel_symbol(struct machine *self, | ||
185 | enum map_type type, u64 addr, | ||
186 | struct map **mapp, | ||
187 | symbol_filter_t filter) | ||
188 | { | ||
189 | return map_groups__find_symbol(&self->kmaps, type, addr, mapp, filter); | ||
190 | } | ||
191 | |||
192 | static inline | ||
193 | struct symbol *machine__find_kernel_function(struct machine *self, u64 addr, | ||
194 | struct map **mapp, | ||
195 | symbol_filter_t filter) | ||
196 | { | ||
197 | return machine__find_kernel_symbol(self, MAP__FUNCTION, addr, mapp, filter); | ||
198 | } | ||
199 | |||
200 | static inline | ||
201 | struct symbol *map_groups__find_function_by_name(struct map_groups *self, | ||
202 | const char *name, struct map **mapp, | ||
203 | symbol_filter_t filter) | ||
204 | { | ||
205 | return map_groups__find_symbol_by_name(self, MAP__FUNCTION, name, mapp, filter); | ||
206 | } | ||
207 | |||
208 | int map_groups__fixup_overlappings(struct map_groups *self, struct map *map, | ||
209 | int verbose, FILE *fp); | ||
210 | |||
211 | struct map *map_groups__find_by_name(struct map_groups *self, | ||
212 | enum map_type type, const char *name); | ||
213 | struct map *machine__new_module(struct machine *self, u64 start, const char *filename); | ||
214 | |||
215 | void map_groups__flush(struct map_groups *self); | ||
216 | |||
94 | #endif /* __PERF_MAP_H */ | 217 | #endif /* __PERF_MAP_H */ |
diff --git a/tools/perf/util/newt.c b/tools/perf/util/newt.c new file mode 100644 index 000000000000..6974431d212f --- /dev/null +++ b/tools/perf/util/newt.c | |||
@@ -0,0 +1,1014 @@ | |||
1 | #define _GNU_SOURCE | ||
2 | #include <stdio.h> | ||
3 | #undef _GNU_SOURCE | ||
4 | |||
5 | #include <slang.h> | ||
6 | #include <stdlib.h> | ||
7 | #include <newt.h> | ||
8 | #include <sys/ttydefaults.h> | ||
9 | |||
10 | #include "cache.h" | ||
11 | #include "hist.h" | ||
12 | #include "pstack.h" | ||
13 | #include "session.h" | ||
14 | #include "sort.h" | ||
15 | #include "symbol.h" | ||
16 | |||
17 | struct ui_progress { | ||
18 | newtComponent form, scale; | ||
19 | }; | ||
20 | |||
21 | struct ui_progress *ui_progress__new(const char *title, u64 total) | ||
22 | { | ||
23 | struct ui_progress *self = malloc(sizeof(*self)); | ||
24 | |||
25 | if (self != NULL) { | ||
26 | int cols; | ||
27 | newtGetScreenSize(&cols, NULL); | ||
28 | cols -= 4; | ||
29 | newtCenteredWindow(cols, 1, title); | ||
30 | self->form = newtForm(NULL, NULL, 0); | ||
31 | if (self->form == NULL) | ||
32 | goto out_free_self; | ||
33 | self->scale = newtScale(0, 0, cols, total); | ||
34 | if (self->scale == NULL) | ||
35 | goto out_free_form; | ||
36 | newtFormAddComponent(self->form, self->scale); | ||
37 | newtRefresh(); | ||
38 | } | ||
39 | |||
40 | return self; | ||
41 | |||
42 | out_free_form: | ||
43 | newtFormDestroy(self->form); | ||
44 | out_free_self: | ||
45 | free(self); | ||
46 | return NULL; | ||
47 | } | ||
48 | |||
49 | void ui_progress__update(struct ui_progress *self, u64 curr) | ||
50 | { | ||
51 | newtScaleSet(self->scale, curr); | ||
52 | newtRefresh(); | ||
53 | } | ||
54 | |||
55 | void ui_progress__delete(struct ui_progress *self) | ||
56 | { | ||
57 | newtFormDestroy(self->form); | ||
58 | newtPopWindow(); | ||
59 | free(self); | ||
60 | } | ||
61 | |||
62 | static void ui_helpline__pop(void) | ||
63 | { | ||
64 | newtPopHelpLine(); | ||
65 | } | ||
66 | |||
67 | static void ui_helpline__push(const char *msg) | ||
68 | { | ||
69 | newtPushHelpLine(msg); | ||
70 | } | ||
71 | |||
72 | static void ui_helpline__vpush(const char *fmt, va_list ap) | ||
73 | { | ||
74 | char *s; | ||
75 | |||
76 | if (vasprintf(&s, fmt, ap) < 0) | ||
77 | vfprintf(stderr, fmt, ap); | ||
78 | else { | ||
79 | ui_helpline__push(s); | ||
80 | free(s); | ||
81 | } | ||
82 | } | ||
83 | |||
84 | static void ui_helpline__fpush(const char *fmt, ...) | ||
85 | { | ||
86 | va_list ap; | ||
87 | |||
88 | va_start(ap, fmt); | ||
89 | ui_helpline__vpush(fmt, ap); | ||
90 | va_end(ap); | ||
91 | } | ||
92 | |||
93 | static void ui_helpline__puts(const char *msg) | ||
94 | { | ||
95 | ui_helpline__pop(); | ||
96 | ui_helpline__push(msg); | ||
97 | } | ||
98 | |||
99 | static char browser__last_msg[1024]; | ||
100 | |||
101 | int browser__show_help(const char *format, va_list ap) | ||
102 | { | ||
103 | int ret; | ||
104 | static int backlog; | ||
105 | |||
106 | ret = vsnprintf(browser__last_msg + backlog, | ||
107 | sizeof(browser__last_msg) - backlog, format, ap); | ||
108 | backlog += ret; | ||
109 | |||
110 | if (browser__last_msg[backlog - 1] == '\n') { | ||
111 | ui_helpline__puts(browser__last_msg); | ||
112 | newtRefresh(); | ||
113 | backlog = 0; | ||
114 | } | ||
115 | |||
116 | return ret; | ||
117 | } | ||
118 | |||
119 | static void newt_form__set_exit_keys(newtComponent self) | ||
120 | { | ||
121 | newtFormAddHotKey(self, NEWT_KEY_ESCAPE); | ||
122 | newtFormAddHotKey(self, 'Q'); | ||
123 | newtFormAddHotKey(self, 'q'); | ||
124 | newtFormAddHotKey(self, CTRL('c')); | ||
125 | } | ||
126 | |||
127 | static newtComponent newt_form__new(void) | ||
128 | { | ||
129 | newtComponent self = newtForm(NULL, NULL, 0); | ||
130 | if (self) | ||
131 | newt_form__set_exit_keys(self); | ||
132 | return self; | ||
133 | } | ||
134 | |||
135 | static int popup_menu(int argc, char * const argv[]) | ||
136 | { | ||
137 | struct newtExitStruct es; | ||
138 | int i, rc = -1, max_len = 5; | ||
139 | newtComponent listbox, form = newt_form__new(); | ||
140 | |||
141 | if (form == NULL) | ||
142 | return -1; | ||
143 | |||
144 | listbox = newtListbox(0, 0, argc, NEWT_FLAG_RETURNEXIT); | ||
145 | if (listbox == NULL) | ||
146 | goto out_destroy_form; | ||
147 | |||
148 | newtFormAddComponent(form, listbox); | ||
149 | |||
150 | for (i = 0; i < argc; ++i) { | ||
151 | int len = strlen(argv[i]); | ||
152 | if (len > max_len) | ||
153 | max_len = len; | ||
154 | if (newtListboxAddEntry(listbox, argv[i], (void *)(long)i)) | ||
155 | goto out_destroy_form; | ||
156 | } | ||
157 | |||
158 | newtCenteredWindow(max_len, argc, NULL); | ||
159 | newtFormRun(form, &es); | ||
160 | rc = newtListboxGetCurrent(listbox) - NULL; | ||
161 | if (es.reason == NEWT_EXIT_HOTKEY) | ||
162 | rc = -1; | ||
163 | newtPopWindow(); | ||
164 | out_destroy_form: | ||
165 | newtFormDestroy(form); | ||
166 | return rc; | ||
167 | } | ||
168 | |||
169 | static bool dialog_yesno(const char *msg) | ||
170 | { | ||
171 | /* newtWinChoice should really be accepting const char pointers... */ | ||
172 | char yes[] = "Yes", no[] = "No"; | ||
173 | return newtWinChoice(NULL, yes, no, (char *)msg) == 1; | ||
174 | } | ||
175 | |||
176 | #define HE_COLORSET_TOP 50 | ||
177 | #define HE_COLORSET_MEDIUM 51 | ||
178 | #define HE_COLORSET_NORMAL 52 | ||
179 | #define HE_COLORSET_SELECTED 53 | ||
180 | #define HE_COLORSET_CODE 54 | ||
181 | |||
182 | static int ui_browser__percent_color(double percent, bool current) | ||
183 | { | ||
184 | if (current) | ||
185 | return HE_COLORSET_SELECTED; | ||
186 | if (percent >= MIN_RED) | ||
187 | return HE_COLORSET_TOP; | ||
188 | if (percent >= MIN_GREEN) | ||
189 | return HE_COLORSET_MEDIUM; | ||
190 | return HE_COLORSET_NORMAL; | ||
191 | } | ||
192 | |||
193 | struct ui_browser { | ||
194 | newtComponent form, sb; | ||
195 | u64 index, first_visible_entry_idx; | ||
196 | void *first_visible_entry, *entries; | ||
197 | u16 top, left, width, height; | ||
198 | void *priv; | ||
199 | u32 nr_entries; | ||
200 | }; | ||
201 | |||
202 | static void ui_browser__refresh_dimensions(struct ui_browser *self) | ||
203 | { | ||
204 | int cols, rows; | ||
205 | newtGetScreenSize(&cols, &rows); | ||
206 | |||
207 | if (self->width > cols - 4) | ||
208 | self->width = cols - 4; | ||
209 | self->height = rows - 5; | ||
210 | if (self->height > self->nr_entries) | ||
211 | self->height = self->nr_entries; | ||
212 | self->top = (rows - self->height) / 2; | ||
213 | self->left = (cols - self->width) / 2; | ||
214 | } | ||
215 | |||
216 | static void ui_browser__reset_index(struct ui_browser *self) | ||
217 | { | ||
218 | self->index = self->first_visible_entry_idx = 0; | ||
219 | self->first_visible_entry = NULL; | ||
220 | } | ||
221 | |||
222 | static int objdump_line__show(struct objdump_line *self, struct list_head *head, | ||
223 | int width, struct hist_entry *he, int len, | ||
224 | bool current_entry) | ||
225 | { | ||
226 | if (self->offset != -1) { | ||
227 | struct symbol *sym = he->ms.sym; | ||
228 | unsigned int hits = 0; | ||
229 | double percent = 0.0; | ||
230 | int color; | ||
231 | struct sym_priv *priv = symbol__priv(sym); | ||
232 | struct sym_ext *sym_ext = priv->ext; | ||
233 | struct sym_hist *h = priv->hist; | ||
234 | s64 offset = self->offset; | ||
235 | struct objdump_line *next = objdump__get_next_ip_line(head, self); | ||
236 | |||
237 | while (offset < (s64)len && | ||
238 | (next == NULL || offset < next->offset)) { | ||
239 | if (sym_ext) { | ||
240 | percent += sym_ext[offset].percent; | ||
241 | } else | ||
242 | hits += h->ip[offset]; | ||
243 | |||
244 | ++offset; | ||
245 | } | ||
246 | |||
247 | if (sym_ext == NULL && h->sum) | ||
248 | percent = 100.0 * hits / h->sum; | ||
249 | |||
250 | color = ui_browser__percent_color(percent, current_entry); | ||
251 | SLsmg_set_color(color); | ||
252 | SLsmg_printf(" %7.2f ", percent); | ||
253 | if (!current_entry) | ||
254 | SLsmg_set_color(HE_COLORSET_CODE); | ||
255 | } else { | ||
256 | int color = ui_browser__percent_color(0, current_entry); | ||
257 | SLsmg_set_color(color); | ||
258 | SLsmg_write_nstring(" ", 9); | ||
259 | } | ||
260 | |||
261 | SLsmg_write_char(':'); | ||
262 | SLsmg_write_nstring(" ", 8); | ||
263 | if (!*self->line) | ||
264 | SLsmg_write_nstring(" ", width - 18); | ||
265 | else | ||
266 | SLsmg_write_nstring(self->line, width - 18); | ||
267 | |||
268 | return 0; | ||
269 | } | ||
270 | |||
271 | static int ui_browser__refresh_entries(struct ui_browser *self) | ||
272 | { | ||
273 | struct objdump_line *pos; | ||
274 | struct list_head *head = self->entries; | ||
275 | struct hist_entry *he = self->priv; | ||
276 | int row = 0; | ||
277 | int len = he->ms.sym->end - he->ms.sym->start; | ||
278 | |||
279 | if (self->first_visible_entry == NULL || self->first_visible_entry == self->entries) | ||
280 | self->first_visible_entry = head->next; | ||
281 | |||
282 | pos = list_entry(self->first_visible_entry, struct objdump_line, node); | ||
283 | |||
284 | list_for_each_entry_from(pos, head, node) { | ||
285 | bool current_entry = (self->first_visible_entry_idx + row) == self->index; | ||
286 | SLsmg_gotorc(self->top + row, self->left); | ||
287 | objdump_line__show(pos, head, self->width, | ||
288 | he, len, current_entry); | ||
289 | if (++row == self->height) | ||
290 | break; | ||
291 | } | ||
292 | |||
293 | SLsmg_set_color(HE_COLORSET_NORMAL); | ||
294 | SLsmg_fill_region(self->top + row, self->left, | ||
295 | self->height - row, self->width, ' '); | ||
296 | |||
297 | return 0; | ||
298 | } | ||
299 | |||
300 | static int ui_browser__run(struct ui_browser *self, const char *title, | ||
301 | struct newtExitStruct *es) | ||
302 | { | ||
303 | if (self->form) { | ||
304 | newtFormDestroy(self->form); | ||
305 | newtPopWindow(); | ||
306 | } | ||
307 | |||
308 | ui_browser__refresh_dimensions(self); | ||
309 | newtCenteredWindow(self->width + 2, self->height, title); | ||
310 | self->form = newt_form__new(); | ||
311 | if (self->form == NULL) | ||
312 | return -1; | ||
313 | |||
314 | self->sb = newtVerticalScrollbar(self->width + 1, 0, self->height, | ||
315 | HE_COLORSET_NORMAL, | ||
316 | HE_COLORSET_SELECTED); | ||
317 | if (self->sb == NULL) | ||
318 | return -1; | ||
319 | |||
320 | newtFormAddHotKey(self->form, NEWT_KEY_UP); | ||
321 | newtFormAddHotKey(self->form, NEWT_KEY_DOWN); | ||
322 | newtFormAddHotKey(self->form, NEWT_KEY_PGUP); | ||
323 | newtFormAddHotKey(self->form, NEWT_KEY_PGDN); | ||
324 | newtFormAddHotKey(self->form, NEWT_KEY_HOME); | ||
325 | newtFormAddHotKey(self->form, NEWT_KEY_END); | ||
326 | newtFormAddHotKey(self->form, NEWT_KEY_LEFT); | ||
327 | |||
328 | if (ui_browser__refresh_entries(self) < 0) | ||
329 | return -1; | ||
330 | newtFormAddComponent(self->form, self->sb); | ||
331 | |||
332 | while (1) { | ||
333 | unsigned int offset; | ||
334 | |||
335 | newtFormRun(self->form, es); | ||
336 | |||
337 | if (es->reason != NEWT_EXIT_HOTKEY) | ||
338 | break; | ||
339 | switch (es->u.key) { | ||
340 | case NEWT_KEY_DOWN: | ||
341 | if (self->index == self->nr_entries - 1) | ||
342 | break; | ||
343 | ++self->index; | ||
344 | if (self->index == self->first_visible_entry_idx + self->height) { | ||
345 | struct list_head *pos = self->first_visible_entry; | ||
346 | ++self->first_visible_entry_idx; | ||
347 | self->first_visible_entry = pos->next; | ||
348 | } | ||
349 | break; | ||
350 | case NEWT_KEY_UP: | ||
351 | if (self->index == 0) | ||
352 | break; | ||
353 | --self->index; | ||
354 | if (self->index < self->first_visible_entry_idx) { | ||
355 | struct list_head *pos = self->first_visible_entry; | ||
356 | --self->first_visible_entry_idx; | ||
357 | self->first_visible_entry = pos->prev; | ||
358 | } | ||
359 | break; | ||
360 | case NEWT_KEY_PGDN: | ||
361 | if (self->first_visible_entry_idx + self->height > self->nr_entries - 1) | ||
362 | break; | ||
363 | |||
364 | offset = self->height; | ||
365 | if (self->index + offset > self->nr_entries - 1) | ||
366 | offset = self->nr_entries - 1 - self->index; | ||
367 | self->index += offset; | ||
368 | self->first_visible_entry_idx += offset; | ||
369 | |||
370 | while (offset--) { | ||
371 | struct list_head *pos = self->first_visible_entry; | ||
372 | self->first_visible_entry = pos->next; | ||
373 | } | ||
374 | |||
375 | break; | ||
376 | case NEWT_KEY_PGUP: | ||
377 | if (self->first_visible_entry_idx == 0) | ||
378 | break; | ||
379 | |||
380 | if (self->first_visible_entry_idx < self->height) | ||
381 | offset = self->first_visible_entry_idx; | ||
382 | else | ||
383 | offset = self->height; | ||
384 | |||
385 | self->index -= offset; | ||
386 | self->first_visible_entry_idx -= offset; | ||
387 | |||
388 | while (offset--) { | ||
389 | struct list_head *pos = self->first_visible_entry; | ||
390 | self->first_visible_entry = pos->prev; | ||
391 | } | ||
392 | break; | ||
393 | case NEWT_KEY_HOME: | ||
394 | ui_browser__reset_index(self); | ||
395 | break; | ||
396 | case NEWT_KEY_END: { | ||
397 | struct list_head *head = self->entries; | ||
398 | offset = self->height - 1; | ||
399 | |||
400 | if (offset > self->nr_entries) | ||
401 | offset = self->nr_entries; | ||
402 | |||
403 | self->index = self->first_visible_entry_idx = self->nr_entries - 1 - offset; | ||
404 | self->first_visible_entry = head->prev; | ||
405 | while (offset-- != 0) { | ||
406 | struct list_head *pos = self->first_visible_entry; | ||
407 | self->first_visible_entry = pos->prev; | ||
408 | } | ||
409 | } | ||
410 | break; | ||
411 | case NEWT_KEY_ESCAPE: | ||
412 | case NEWT_KEY_LEFT: | ||
413 | case CTRL('c'): | ||
414 | case 'Q': | ||
415 | case 'q': | ||
416 | return 0; | ||
417 | default: | ||
418 | continue; | ||
419 | } | ||
420 | if (ui_browser__refresh_entries(self) < 0) | ||
421 | return -1; | ||
422 | } | ||
423 | return 0; | ||
424 | } | ||
425 | |||
426 | /* | ||
427 | * When debugging newt problems it was useful to be able to "unroll" | ||
428 | * the calls to newtCheckBoxTreeAdd{Array,Item}, so that we can generate | ||
429 | * a source file with the sequence of calls to these methods, to then | ||
430 | * tweak the arrays to get the intended results, so I'm keeping this code | ||
431 | * here, may be useful again in the future. | ||
432 | */ | ||
433 | #undef NEWT_DEBUG | ||
434 | |||
435 | static void newt_checkbox_tree__add(newtComponent tree, const char *str, | ||
436 | void *priv, int *indexes) | ||
437 | { | ||
438 | #ifdef NEWT_DEBUG | ||
439 | /* Print the newtCheckboxTreeAddArray to tinker with its index arrays */ | ||
440 | int i = 0, len = 40 - strlen(str); | ||
441 | |||
442 | fprintf(stderr, | ||
443 | "\tnewtCheckboxTreeAddItem(tree, %*.*s\"%s\", (void *)%p, 0, ", | ||
444 | len, len, " ", str, priv); | ||
445 | while (indexes[i] != NEWT_ARG_LAST) { | ||
446 | if (indexes[i] != NEWT_ARG_APPEND) | ||
447 | fprintf(stderr, " %d,", indexes[i]); | ||
448 | else | ||
449 | fprintf(stderr, " %s,", "NEWT_ARG_APPEND"); | ||
450 | ++i; | ||
451 | } | ||
452 | fprintf(stderr, " %s", " NEWT_ARG_LAST);\n"); | ||
453 | fflush(stderr); | ||
454 | #endif | ||
455 | newtCheckboxTreeAddArray(tree, str, priv, 0, indexes); | ||
456 | } | ||
457 | |||
458 | static char *callchain_list__sym_name(struct callchain_list *self, | ||
459 | char *bf, size_t bfsize) | ||
460 | { | ||
461 | if (self->ms.sym) | ||
462 | return self->ms.sym->name; | ||
463 | |||
464 | snprintf(bf, bfsize, "%#Lx", self->ip); | ||
465 | return bf; | ||
466 | } | ||
467 | |||
468 | static void __callchain__append_graph_browser(struct callchain_node *self, | ||
469 | newtComponent tree, u64 total, | ||
470 | int *indexes, int depth) | ||
471 | { | ||
472 | struct rb_node *node; | ||
473 | u64 new_total, remaining; | ||
474 | int idx = 0; | ||
475 | |||
476 | if (callchain_param.mode == CHAIN_GRAPH_REL) | ||
477 | new_total = self->children_hit; | ||
478 | else | ||
479 | new_total = total; | ||
480 | |||
481 | remaining = new_total; | ||
482 | node = rb_first(&self->rb_root); | ||
483 | while (node) { | ||
484 | struct callchain_node *child = rb_entry(node, struct callchain_node, rb_node); | ||
485 | struct rb_node *next = rb_next(node); | ||
486 | u64 cumul = cumul_hits(child); | ||
487 | struct callchain_list *chain; | ||
488 | int first = true, printed = 0; | ||
489 | int chain_idx = -1; | ||
490 | remaining -= cumul; | ||
491 | |||
492 | indexes[depth] = NEWT_ARG_APPEND; | ||
493 | indexes[depth + 1] = NEWT_ARG_LAST; | ||
494 | |||
495 | list_for_each_entry(chain, &child->val, list) { | ||
496 | char ipstr[BITS_PER_LONG / 4 + 1], | ||
497 | *alloc_str = NULL; | ||
498 | const char *str = callchain_list__sym_name(chain, ipstr, sizeof(ipstr)); | ||
499 | |||
500 | if (first) { | ||
501 | double percent = cumul * 100.0 / new_total; | ||
502 | |||
503 | first = false; | ||
504 | if (asprintf(&alloc_str, "%2.2f%% %s", percent, str) < 0) | ||
505 | str = "Not enough memory!"; | ||
506 | else | ||
507 | str = alloc_str; | ||
508 | } else { | ||
509 | indexes[depth] = idx; | ||
510 | indexes[depth + 1] = NEWT_ARG_APPEND; | ||
511 | indexes[depth + 2] = NEWT_ARG_LAST; | ||
512 | ++chain_idx; | ||
513 | } | ||
514 | newt_checkbox_tree__add(tree, str, &chain->ms, indexes); | ||
515 | free(alloc_str); | ||
516 | ++printed; | ||
517 | } | ||
518 | |||
519 | indexes[depth] = idx; | ||
520 | if (chain_idx != -1) | ||
521 | indexes[depth + 1] = chain_idx; | ||
522 | if (printed != 0) | ||
523 | ++idx; | ||
524 | __callchain__append_graph_browser(child, tree, new_total, indexes, | ||
525 | depth + (chain_idx != -1 ? 2 : 1)); | ||
526 | node = next; | ||
527 | } | ||
528 | } | ||
529 | |||
530 | static void callchain__append_graph_browser(struct callchain_node *self, | ||
531 | newtComponent tree, u64 total, | ||
532 | int *indexes, int parent_idx) | ||
533 | { | ||
534 | struct callchain_list *chain; | ||
535 | int i = 0; | ||
536 | |||
537 | indexes[1] = NEWT_ARG_APPEND; | ||
538 | indexes[2] = NEWT_ARG_LAST; | ||
539 | |||
540 | list_for_each_entry(chain, &self->val, list) { | ||
541 | char ipstr[BITS_PER_LONG / 4 + 1], *str; | ||
542 | |||
543 | if (chain->ip >= PERF_CONTEXT_MAX) | ||
544 | continue; | ||
545 | |||
546 | if (!i++ && sort__first_dimension == SORT_SYM) | ||
547 | continue; | ||
548 | |||
549 | str = callchain_list__sym_name(chain, ipstr, sizeof(ipstr)); | ||
550 | newt_checkbox_tree__add(tree, str, &chain->ms, indexes); | ||
551 | } | ||
552 | |||
553 | indexes[1] = parent_idx; | ||
554 | indexes[2] = NEWT_ARG_APPEND; | ||
555 | indexes[3] = NEWT_ARG_LAST; | ||
556 | __callchain__append_graph_browser(self, tree, total, indexes, 2); | ||
557 | } | ||
558 | |||
559 | static void hist_entry__append_callchain_browser(struct hist_entry *self, | ||
560 | newtComponent tree, u64 total, int parent_idx) | ||
561 | { | ||
562 | struct rb_node *rb_node; | ||
563 | int indexes[1024] = { [0] = parent_idx, }; | ||
564 | int idx = 0; | ||
565 | struct callchain_node *chain; | ||
566 | |||
567 | rb_node = rb_first(&self->sorted_chain); | ||
568 | while (rb_node) { | ||
569 | chain = rb_entry(rb_node, struct callchain_node, rb_node); | ||
570 | switch (callchain_param.mode) { | ||
571 | case CHAIN_FLAT: | ||
572 | break; | ||
573 | case CHAIN_GRAPH_ABS: /* falldown */ | ||
574 | case CHAIN_GRAPH_REL: | ||
575 | callchain__append_graph_browser(chain, tree, total, indexes, idx++); | ||
576 | break; | ||
577 | case CHAIN_NONE: | ||
578 | default: | ||
579 | break; | ||
580 | } | ||
581 | rb_node = rb_next(rb_node); | ||
582 | } | ||
583 | } | ||
584 | |||
585 | static size_t hist_entry__append_browser(struct hist_entry *self, | ||
586 | newtComponent tree, u64 total) | ||
587 | { | ||
588 | char s[256]; | ||
589 | size_t ret; | ||
590 | |||
591 | if (symbol_conf.exclude_other && !self->parent) | ||
592 | return 0; | ||
593 | |||
594 | ret = hist_entry__snprintf(self, s, sizeof(s), NULL, | ||
595 | false, 0, false, total); | ||
596 | if (symbol_conf.use_callchain) { | ||
597 | int indexes[2]; | ||
598 | |||
599 | indexes[0] = NEWT_ARG_APPEND; | ||
600 | indexes[1] = NEWT_ARG_LAST; | ||
601 | newt_checkbox_tree__add(tree, s, &self->ms, indexes); | ||
602 | } else | ||
603 | newtListboxAppendEntry(tree, s, &self->ms); | ||
604 | |||
605 | return ret; | ||
606 | } | ||
607 | |||
608 | static void hist_entry__annotate_browser(struct hist_entry *self) | ||
609 | { | ||
610 | struct ui_browser browser; | ||
611 | struct newtExitStruct es; | ||
612 | struct objdump_line *pos, *n; | ||
613 | LIST_HEAD(head); | ||
614 | |||
615 | if (self->ms.sym == NULL) | ||
616 | return; | ||
617 | |||
618 | if (hist_entry__annotate(self, &head) < 0) | ||
619 | return; | ||
620 | |||
621 | ui_helpline__push("Press <- or ESC to exit"); | ||
622 | |||
623 | memset(&browser, 0, sizeof(browser)); | ||
624 | browser.entries = &head; | ||
625 | browser.priv = self; | ||
626 | list_for_each_entry(pos, &head, node) { | ||
627 | size_t line_len = strlen(pos->line); | ||
628 | if (browser.width < line_len) | ||
629 | browser.width = line_len; | ||
630 | ++browser.nr_entries; | ||
631 | } | ||
632 | |||
633 | browser.width += 18; /* Percentage */ | ||
634 | ui_browser__run(&browser, self->ms.sym->name, &es); | ||
635 | newtFormDestroy(browser.form); | ||
636 | newtPopWindow(); | ||
637 | list_for_each_entry_safe(pos, n, &head, node) { | ||
638 | list_del(&pos->node); | ||
639 | objdump_line__free(pos); | ||
640 | } | ||
641 | ui_helpline__pop(); | ||
642 | } | ||
643 | |||
644 | static const void *newt__symbol_tree_get_current(newtComponent self) | ||
645 | { | ||
646 | if (symbol_conf.use_callchain) | ||
647 | return newtCheckboxTreeGetCurrent(self); | ||
648 | return newtListboxGetCurrent(self); | ||
649 | } | ||
650 | |||
651 | static void hist_browser__selection(newtComponent self, void *data) | ||
652 | { | ||
653 | const struct map_symbol **symbol_ptr = data; | ||
654 | *symbol_ptr = newt__symbol_tree_get_current(self); | ||
655 | } | ||
656 | |||
657 | struct hist_browser { | ||
658 | newtComponent form, tree; | ||
659 | const struct map_symbol *selection; | ||
660 | }; | ||
661 | |||
662 | static struct hist_browser *hist_browser__new(void) | ||
663 | { | ||
664 | struct hist_browser *self = malloc(sizeof(*self)); | ||
665 | |||
666 | if (self != NULL) | ||
667 | self->form = NULL; | ||
668 | |||
669 | return self; | ||
670 | } | ||
671 | |||
672 | static void hist_browser__delete(struct hist_browser *self) | ||
673 | { | ||
674 | newtFormDestroy(self->form); | ||
675 | newtPopWindow(); | ||
676 | free(self); | ||
677 | } | ||
678 | |||
679 | static int hist_browser__populate(struct hist_browser *self, struct hists *hists, | ||
680 | const char *title) | ||
681 | { | ||
682 | int max_len = 0, idx, cols, rows; | ||
683 | struct ui_progress *progress; | ||
684 | struct rb_node *nd; | ||
685 | u64 curr_hist = 0; | ||
686 | char seq[] = ".", unit; | ||
687 | char str[256]; | ||
688 | unsigned long nr_events = hists->stats.nr_events[PERF_RECORD_SAMPLE]; | ||
689 | |||
690 | if (self->form) { | ||
691 | newtFormDestroy(self->form); | ||
692 | newtPopWindow(); | ||
693 | } | ||
694 | |||
695 | nr_events = convert_unit(nr_events, &unit); | ||
696 | snprintf(str, sizeof(str), "Events: %lu%c ", | ||
697 | nr_events, unit); | ||
698 | newtDrawRootText(0, 0, str); | ||
699 | |||
700 | newtGetScreenSize(NULL, &rows); | ||
701 | |||
702 | if (symbol_conf.use_callchain) | ||
703 | self->tree = newtCheckboxTreeMulti(0, 0, rows - 5, seq, | ||
704 | NEWT_FLAG_SCROLL); | ||
705 | else | ||
706 | self->tree = newtListbox(0, 0, rows - 5, | ||
707 | (NEWT_FLAG_SCROLL | | ||
708 | NEWT_FLAG_RETURNEXIT)); | ||
709 | |||
710 | newtComponentAddCallback(self->tree, hist_browser__selection, | ||
711 | &self->selection); | ||
712 | |||
713 | progress = ui_progress__new("Adding entries to the browser...", | ||
714 | hists->nr_entries); | ||
715 | if (progress == NULL) | ||
716 | return -1; | ||
717 | |||
718 | idx = 0; | ||
719 | for (nd = rb_first(&hists->entries); nd; nd = rb_next(nd)) { | ||
720 | struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node); | ||
721 | int len; | ||
722 | |||
723 | if (h->filtered) | ||
724 | continue; | ||
725 | |||
726 | len = hist_entry__append_browser(h, self->tree, hists->stats.total_period); | ||
727 | if (len > max_len) | ||
728 | max_len = len; | ||
729 | if (symbol_conf.use_callchain) | ||
730 | hist_entry__append_callchain_browser(h, self->tree, | ||
731 | hists->stats.total_period, idx++); | ||
732 | ++curr_hist; | ||
733 | if (curr_hist % 5) | ||
734 | ui_progress__update(progress, curr_hist); | ||
735 | } | ||
736 | |||
737 | ui_progress__delete(progress); | ||
738 | |||
739 | newtGetScreenSize(&cols, &rows); | ||
740 | |||
741 | if (max_len > cols) | ||
742 | max_len = cols - 3; | ||
743 | |||
744 | if (!symbol_conf.use_callchain) | ||
745 | newtListboxSetWidth(self->tree, max_len); | ||
746 | |||
747 | newtCenteredWindow(max_len + (symbol_conf.use_callchain ? 5 : 0), | ||
748 | rows - 5, title); | ||
749 | self->form = newt_form__new(); | ||
750 | if (self->form == NULL) | ||
751 | return -1; | ||
752 | |||
753 | newtFormAddHotKey(self->form, 'A'); | ||
754 | newtFormAddHotKey(self->form, 'a'); | ||
755 | newtFormAddHotKey(self->form, 'D'); | ||
756 | newtFormAddHotKey(self->form, 'd'); | ||
757 | newtFormAddHotKey(self->form, 'T'); | ||
758 | newtFormAddHotKey(self->form, 't'); | ||
759 | newtFormAddHotKey(self->form, NEWT_KEY_RIGHT); | ||
760 | newtFormAddHotKey(self->form, NEWT_KEY_LEFT); | ||
761 | newtFormAddComponents(self->form, self->tree, NULL); | ||
762 | self->selection = newt__symbol_tree_get_current(self->tree); | ||
763 | |||
764 | return 0; | ||
765 | } | ||
766 | |||
767 | static struct hist_entry *hist_browser__selected_entry(struct hist_browser *self) | ||
768 | { | ||
769 | int *indexes; | ||
770 | |||
771 | if (!symbol_conf.use_callchain) | ||
772 | goto out; | ||
773 | |||
774 | indexes = newtCheckboxTreeFindItem(self->tree, (void *)self->selection); | ||
775 | if (indexes) { | ||
776 | bool is_hist_entry = indexes[1] == NEWT_ARG_LAST; | ||
777 | free(indexes); | ||
778 | if (is_hist_entry) | ||
779 | goto out; | ||
780 | } | ||
781 | return NULL; | ||
782 | out: | ||
783 | return container_of(self->selection, struct hist_entry, ms); | ||
784 | } | ||
785 | |||
786 | static struct thread *hist_browser__selected_thread(struct hist_browser *self) | ||
787 | { | ||
788 | struct hist_entry *he = hist_browser__selected_entry(self); | ||
789 | return he ? he->thread : NULL; | ||
790 | } | ||
791 | |||
792 | static int hist_browser__title(char *bf, size_t size, const char *input_name, | ||
793 | const struct dso *dso, const struct thread *thread) | ||
794 | { | ||
795 | int printed = 0; | ||
796 | |||
797 | if (thread) | ||
798 | printed += snprintf(bf + printed, size - printed, | ||
799 | "Thread: %s(%d)", | ||
800 | (thread->comm_set ? thread->comm : ""), | ||
801 | thread->pid); | ||
802 | if (dso) | ||
803 | printed += snprintf(bf + printed, size - printed, | ||
804 | "%sDSO: %s", thread ? " " : "", | ||
805 | dso->short_name); | ||
806 | return printed ?: snprintf(bf, size, "Report: %s", input_name); | ||
807 | } | ||
808 | |||
809 | int hists__browse(struct hists *self, const char *helpline, const char *input_name) | ||
810 | { | ||
811 | struct hist_browser *browser = hist_browser__new(); | ||
812 | struct pstack *fstack = pstack__new(2); | ||
813 | const struct thread *thread_filter = NULL; | ||
814 | const struct dso *dso_filter = NULL; | ||
815 | struct newtExitStruct es; | ||
816 | char msg[160]; | ||
817 | int err = -1; | ||
818 | |||
819 | if (browser == NULL) | ||
820 | return -1; | ||
821 | |||
822 | fstack = pstack__new(2); | ||
823 | if (fstack == NULL) | ||
824 | goto out; | ||
825 | |||
826 | ui_helpline__push(helpline); | ||
827 | |||
828 | hist_browser__title(msg, sizeof(msg), input_name, | ||
829 | dso_filter, thread_filter); | ||
830 | if (hist_browser__populate(browser, self, msg) < 0) | ||
831 | goto out_free_stack; | ||
832 | |||
833 | while (1) { | ||
834 | const struct thread *thread; | ||
835 | const struct dso *dso; | ||
836 | char *options[16]; | ||
837 | int nr_options = 0, choice = 0, i, | ||
838 | annotate = -2, zoom_dso = -2, zoom_thread = -2; | ||
839 | |||
840 | newtFormRun(browser->form, &es); | ||
841 | |||
842 | thread = hist_browser__selected_thread(browser); | ||
843 | dso = browser->selection->map ? browser->selection->map->dso : NULL; | ||
844 | |||
845 | if (es.reason == NEWT_EXIT_HOTKEY) { | ||
846 | switch (toupper(es.u.key)) { | ||
847 | case 'A': | ||
848 | goto do_annotate; | ||
849 | case 'D': | ||
850 | goto zoom_dso; | ||
851 | case 'T': | ||
852 | goto zoom_thread; | ||
853 | default:; | ||
854 | } | ||
855 | if (toupper(es.u.key) == 'Q' || | ||
856 | es.u.key == CTRL('c')) | ||
857 | break; | ||
858 | if (es.u.key == NEWT_KEY_ESCAPE) { | ||
859 | if (dialog_yesno("Do you really want to exit?")) | ||
860 | break; | ||
861 | else | ||
862 | continue; | ||
863 | } | ||
864 | |||
865 | if (es.u.key == NEWT_KEY_LEFT) { | ||
866 | const void *top; | ||
867 | |||
868 | if (pstack__empty(fstack)) | ||
869 | continue; | ||
870 | top = pstack__pop(fstack); | ||
871 | if (top == &dso_filter) | ||
872 | goto zoom_out_dso; | ||
873 | if (top == &thread_filter) | ||
874 | goto zoom_out_thread; | ||
875 | continue; | ||
876 | } | ||
877 | } | ||
878 | |||
879 | if (browser->selection->sym != NULL && | ||
880 | asprintf(&options[nr_options], "Annotate %s", | ||
881 | browser->selection->sym->name) > 0) | ||
882 | annotate = nr_options++; | ||
883 | |||
884 | if (thread != NULL && | ||
885 | asprintf(&options[nr_options], "Zoom %s %s(%d) thread", | ||
886 | (thread_filter ? "out of" : "into"), | ||
887 | (thread->comm_set ? thread->comm : ""), | ||
888 | thread->pid) > 0) | ||
889 | zoom_thread = nr_options++; | ||
890 | |||
891 | if (dso != NULL && | ||
892 | asprintf(&options[nr_options], "Zoom %s %s DSO", | ||
893 | (dso_filter ? "out of" : "into"), | ||
894 | (dso->kernel ? "the Kernel" : dso->short_name)) > 0) | ||
895 | zoom_dso = nr_options++; | ||
896 | |||
897 | options[nr_options++] = (char *)"Exit"; | ||
898 | |||
899 | choice = popup_menu(nr_options, options); | ||
900 | |||
901 | for (i = 0; i < nr_options - 1; ++i) | ||
902 | free(options[i]); | ||
903 | |||
904 | if (choice == nr_options - 1) | ||
905 | break; | ||
906 | |||
907 | if (choice == -1) | ||
908 | continue; | ||
909 | |||
910 | if (choice == annotate) { | ||
911 | struct hist_entry *he; | ||
912 | do_annotate: | ||
913 | if (browser->selection->map->dso->origin == DSO__ORIG_KERNEL) { | ||
914 | ui_helpline__puts("No vmlinux file found, can't " | ||
915 | "annotate with just a " | ||
916 | "kallsyms file"); | ||
917 | continue; | ||
918 | } | ||
919 | |||
920 | he = hist_browser__selected_entry(browser); | ||
921 | if (he == NULL) | ||
922 | continue; | ||
923 | |||
924 | hist_entry__annotate_browser(he); | ||
925 | } else if (choice == zoom_dso) { | ||
926 | zoom_dso: | ||
927 | if (dso_filter) { | ||
928 | pstack__remove(fstack, &dso_filter); | ||
929 | zoom_out_dso: | ||
930 | ui_helpline__pop(); | ||
931 | dso_filter = NULL; | ||
932 | } else { | ||
933 | if (dso == NULL) | ||
934 | continue; | ||
935 | ui_helpline__fpush("To zoom out press <- or -> + \"Zoom out of %s DSO\"", | ||
936 | dso->kernel ? "the Kernel" : dso->short_name); | ||
937 | dso_filter = dso; | ||
938 | pstack__push(fstack, &dso_filter); | ||
939 | } | ||
940 | hists__filter_by_dso(self, dso_filter); | ||
941 | hist_browser__title(msg, sizeof(msg), input_name, | ||
942 | dso_filter, thread_filter); | ||
943 | if (hist_browser__populate(browser, self, msg) < 0) | ||
944 | goto out; | ||
945 | } else if (choice == zoom_thread) { | ||
946 | zoom_thread: | ||
947 | if (thread_filter) { | ||
948 | pstack__remove(fstack, &thread_filter); | ||
949 | zoom_out_thread: | ||
950 | ui_helpline__pop(); | ||
951 | thread_filter = NULL; | ||
952 | } else { | ||
953 | ui_helpline__fpush("To zoom out press <- or -> + \"Zoom out of %s(%d) thread\"", | ||
954 | thread->comm_set ? thread->comm : "", | ||
955 | thread->pid); | ||
956 | thread_filter = thread; | ||
957 | pstack__push(fstack, &thread_filter); | ||
958 | } | ||
959 | hists__filter_by_thread(self, thread_filter); | ||
960 | hist_browser__title(msg, sizeof(msg), input_name, | ||
961 | dso_filter, thread_filter); | ||
962 | if (hist_browser__populate(browser, self, msg) < 0) | ||
963 | goto out; | ||
964 | } | ||
965 | } | ||
966 | err = 0; | ||
967 | out_free_stack: | ||
968 | pstack__delete(fstack); | ||
969 | out: | ||
970 | hist_browser__delete(browser); | ||
971 | return err; | ||
972 | } | ||
973 | |||
/*
 * Foreground/background colour names for each HE_COLORSET_* id, handed to
 * SLtt_set_color() by setup_browser().
 */
static struct newtPercentTreeColors {
	const char *topColorFg, *topColorBg;
	const char *mediumColorFg, *mediumColorBg;
	const char *normalColorFg, *normalColorBg;
	const char *selColorFg, *selColorBg;
	const char *codeColorFg, *codeColorBg;
} defaultPercentTreeColors = {
	.topColorFg	= "red",	.topColorBg	= "lightgray",
	.mediumColorFg	= "green",	.mediumColorBg	= "lightgray",
	.normalColorFg	= "black",	.normalColorBg	= "lightgray",
	.selColorFg	= "lightgray",	.selColorBg	= "magenta",
	.codeColorFg	= "blue",	.codeColorBg	= "lightgray",
};
987 | |||
988 | void setup_browser(void) | ||
989 | { | ||
990 | struct newtPercentTreeColors *c = &defaultPercentTreeColors; | ||
991 | if (!isatty(1)) | ||
992 | return; | ||
993 | |||
994 | use_browser = true; | ||
995 | newtInit(); | ||
996 | newtCls(); | ||
997 | ui_helpline__puts(" "); | ||
998 | SLtt_set_color(HE_COLORSET_TOP, NULL, c->topColorFg, c->topColorBg); | ||
999 | SLtt_set_color(HE_COLORSET_MEDIUM, NULL, c->mediumColorFg, c->mediumColorBg); | ||
1000 | SLtt_set_color(HE_COLORSET_NORMAL, NULL, c->normalColorFg, c->normalColorBg); | ||
1001 | SLtt_set_color(HE_COLORSET_SELECTED, NULL, c->selColorFg, c->selColorBg); | ||
1002 | SLtt_set_color(HE_COLORSET_CODE, NULL, c->codeColorFg, c->codeColorBg); | ||
1003 | } | ||
1004 | |||
1005 | void exit_browser(bool wait_for_ok) | ||
1006 | { | ||
1007 | if (use_browser) { | ||
1008 | if (wait_for_ok) { | ||
1009 | char title[] = "Fatal Error", ok[] = "Ok"; | ||
1010 | newtWinMessage(title, ok, browser__last_msg); | ||
1011 | } | ||
1012 | newtFinished(); | ||
1013 | } | ||
1014 | } | ||
diff --git a/tools/perf/util/parse-events.c b/tools/perf/util/parse-events.c index 05d0c5c2030c..9bf0f402ca73 100644 --- a/tools/perf/util/parse-events.c +++ b/tools/perf/util/parse-events.c | |||
@@ -5,6 +5,7 @@ | |||
5 | #include "parse-events.h" | 5 | #include "parse-events.h" |
6 | #include "exec_cmd.h" | 6 | #include "exec_cmd.h" |
7 | #include "string.h" | 7 | #include "string.h" |
8 | #include "symbol.h" | ||
8 | #include "cache.h" | 9 | #include "cache.h" |
9 | #include "header.h" | 10 | #include "header.h" |
10 | #include "debugfs.h" | 11 | #include "debugfs.h" |
@@ -409,7 +410,6 @@ static enum event_result | |||
409 | parse_single_tracepoint_event(char *sys_name, | 410 | parse_single_tracepoint_event(char *sys_name, |
410 | const char *evt_name, | 411 | const char *evt_name, |
411 | unsigned int evt_length, | 412 | unsigned int evt_length, |
412 | char *flags, | ||
413 | struct perf_event_attr *attr, | 413 | struct perf_event_attr *attr, |
414 | const char **strp) | 414 | const char **strp) |
415 | { | 415 | { |
@@ -418,14 +418,6 @@ parse_single_tracepoint_event(char *sys_name, | |||
418 | u64 id; | 418 | u64 id; |
419 | int fd; | 419 | int fd; |
420 | 420 | ||
421 | if (flags) { | ||
422 | if (!strncmp(flags, "record", strlen(flags))) { | ||
423 | attr->sample_type |= PERF_SAMPLE_RAW; | ||
424 | attr->sample_type |= PERF_SAMPLE_TIME; | ||
425 | attr->sample_type |= PERF_SAMPLE_CPU; | ||
426 | } | ||
427 | } | ||
428 | |||
429 | snprintf(evt_path, MAXPATHLEN, "%s/%s/%s/id", debugfs_path, | 421 | snprintf(evt_path, MAXPATHLEN, "%s/%s/%s/id", debugfs_path, |
430 | sys_name, evt_name); | 422 | sys_name, evt_name); |
431 | 423 | ||
@@ -444,6 +436,13 @@ parse_single_tracepoint_event(char *sys_name, | |||
444 | attr->type = PERF_TYPE_TRACEPOINT; | 436 | attr->type = PERF_TYPE_TRACEPOINT; |
445 | *strp = evt_name + evt_length; | 437 | *strp = evt_name + evt_length; |
446 | 438 | ||
439 | attr->sample_type |= PERF_SAMPLE_RAW; | ||
440 | attr->sample_type |= PERF_SAMPLE_TIME; | ||
441 | attr->sample_type |= PERF_SAMPLE_CPU; | ||
442 | |||
443 | attr->sample_period = 1; | ||
444 | |||
445 | |||
447 | return EVT_HANDLED; | 446 | return EVT_HANDLED; |
448 | } | 447 | } |
449 | 448 | ||
@@ -532,8 +531,7 @@ static enum event_result parse_tracepoint_event(const char **strp, | |||
532 | flags); | 531 | flags); |
533 | } else | 532 | } else |
534 | return parse_single_tracepoint_event(sys_name, evt_name, | 533 | return parse_single_tracepoint_event(sys_name, evt_name, |
535 | evt_length, flags, | 534 | evt_length, attr, strp); |
536 | attr, strp); | ||
537 | } | 535 | } |
538 | 536 | ||
539 | static enum event_result | 537 | static enum event_result |
@@ -690,19 +688,29 @@ static enum event_result | |||
690 | parse_event_modifier(const char **strp, struct perf_event_attr *attr) | 688 | parse_event_modifier(const char **strp, struct perf_event_attr *attr) |
691 | { | 689 | { |
692 | const char *str = *strp; | 690 | const char *str = *strp; |
693 | int eu = 1, ek = 1, eh = 1; | 691 | int exclude = 0; |
692 | int eu = 0, ek = 0, eh = 0, precise = 0; | ||
694 | 693 | ||
695 | if (*str++ != ':') | 694 | if (*str++ != ':') |
696 | return 0; | 695 | return 0; |
697 | while (*str) { | 696 | while (*str) { |
698 | if (*str == 'u') | 697 | if (*str == 'u') { |
698 | if (!exclude) | ||
699 | exclude = eu = ek = eh = 1; | ||
699 | eu = 0; | 700 | eu = 0; |
700 | else if (*str == 'k') | 701 | } else if (*str == 'k') { |
702 | if (!exclude) | ||
703 | exclude = eu = ek = eh = 1; | ||
701 | ek = 0; | 704 | ek = 0; |
702 | else if (*str == 'h') | 705 | } else if (*str == 'h') { |
706 | if (!exclude) | ||
707 | exclude = eu = ek = eh = 1; | ||
703 | eh = 0; | 708 | eh = 0; |
704 | else | 709 | } else if (*str == 'p') { |
710 | precise++; | ||
711 | } else | ||
705 | break; | 712 | break; |
713 | |||
706 | ++str; | 714 | ++str; |
707 | } | 715 | } |
708 | if (str >= *strp + 2) { | 716 | if (str >= *strp + 2) { |
@@ -710,6 +718,7 @@ parse_event_modifier(const char **strp, struct perf_event_attr *attr) | |||
710 | attr->exclude_user = eu; | 718 | attr->exclude_user = eu; |
711 | attr->exclude_kernel = ek; | 719 | attr->exclude_kernel = ek; |
712 | attr->exclude_hv = eh; | 720 | attr->exclude_hv = eh; |
721 | attr->precise_ip = precise; | ||
713 | return 1; | 722 | return 1; |
714 | } | 723 | } |
715 | return 0; | 724 | return 0; |
@@ -934,7 +943,8 @@ void print_events(void) | |||
934 | 943 | ||
935 | printf("\n"); | 944 | printf("\n"); |
936 | printf(" %-42s [%s]\n", | 945 | printf(" %-42s [%s]\n", |
937 | "rNNN", event_type_descriptors[PERF_TYPE_RAW]); | 946 | "rNNN (see 'perf list --help' on how to encode it)", |
947 | event_type_descriptors[PERF_TYPE_RAW]); | ||
938 | printf("\n"); | 948 | printf("\n"); |
939 | 949 | ||
940 | printf(" %-42s [%s]\n", | 950 | printf(" %-42s [%s]\n", |
diff --git a/tools/perf/util/parse-events.h b/tools/perf/util/parse-events.h index b8c1f64bc935..fc4ab3fe877a 100644 --- a/tools/perf/util/parse-events.h +++ b/tools/perf/util/parse-events.h | |||
@@ -13,6 +13,7 @@ struct tracepoint_path { | |||
13 | }; | 13 | }; |
14 | 14 | ||
15 | extern struct tracepoint_path *tracepoint_id_to_path(u64 config); | 15 | extern struct tracepoint_path *tracepoint_id_to_path(u64 config); |
16 | extern bool have_tracepoints(struct perf_event_attr *pattrs, int nb_events); | ||
16 | 17 | ||
17 | extern int nr_counters; | 18 | extern int nr_counters; |
18 | 19 | ||
diff --git a/tools/perf/util/parse-options.c b/tools/perf/util/parse-options.c index efebd5b476b3..ed887642460c 100644 --- a/tools/perf/util/parse-options.c +++ b/tools/perf/util/parse-options.c | |||
@@ -49,6 +49,7 @@ static int get_value(struct parse_opt_ctx_t *p, | |||
49 | break; | 49 | break; |
50 | /* FALLTHROUGH */ | 50 | /* FALLTHROUGH */ |
51 | case OPTION_BOOLEAN: | 51 | case OPTION_BOOLEAN: |
52 | case OPTION_INCR: | ||
52 | case OPTION_BIT: | 53 | case OPTION_BIT: |
53 | case OPTION_SET_INT: | 54 | case OPTION_SET_INT: |
54 | case OPTION_SET_PTR: | 55 | case OPTION_SET_PTR: |
@@ -73,6 +74,10 @@ static int get_value(struct parse_opt_ctx_t *p, | |||
73 | return 0; | 74 | return 0; |
74 | 75 | ||
75 | case OPTION_BOOLEAN: | 76 | case OPTION_BOOLEAN: |
77 | *(bool *)opt->value = unset ? false : true; | ||
78 | return 0; | ||
79 | |||
80 | case OPTION_INCR: | ||
76 | *(int *)opt->value = unset ? 0 : *(int *)opt->value + 1; | 81 | *(int *)opt->value = unset ? 0 : *(int *)opt->value + 1; |
77 | return 0; | 82 | return 0; |
78 | 83 | ||
@@ -478,6 +483,7 @@ int usage_with_options_internal(const char * const *usagestr, | |||
478 | case OPTION_GROUP: | 483 | case OPTION_GROUP: |
479 | case OPTION_BIT: | 484 | case OPTION_BIT: |
480 | case OPTION_BOOLEAN: | 485 | case OPTION_BOOLEAN: |
486 | case OPTION_INCR: | ||
481 | case OPTION_SET_INT: | 487 | case OPTION_SET_INT: |
482 | case OPTION_SET_PTR: | 488 | case OPTION_SET_PTR: |
483 | case OPTION_LONG: | 489 | case OPTION_LONG: |
@@ -500,6 +506,7 @@ int usage_with_options_internal(const char * const *usagestr, | |||
500 | void usage_with_options(const char * const *usagestr, | 506 | void usage_with_options(const char * const *usagestr, |
501 | const struct option *opts) | 507 | const struct option *opts) |
502 | { | 508 | { |
509 | exit_browser(false); | ||
503 | usage_with_options_internal(usagestr, opts, 0); | 510 | usage_with_options_internal(usagestr, opts, 0); |
504 | exit(129); | 511 | exit(129); |
505 | } | 512 | } |
diff --git a/tools/perf/util/parse-options.h b/tools/perf/util/parse-options.h index 948805af43c2..b2da725f102a 100644 --- a/tools/perf/util/parse-options.h +++ b/tools/perf/util/parse-options.h | |||
@@ -8,7 +8,8 @@ enum parse_opt_type { | |||
8 | OPTION_GROUP, | 8 | OPTION_GROUP, |
9 | /* options with no arguments */ | 9 | /* options with no arguments */ |
10 | OPTION_BIT, | 10 | OPTION_BIT, |
11 | OPTION_BOOLEAN, /* _INCR would have been a better name */ | 11 | OPTION_BOOLEAN, |
12 | OPTION_INCR, | ||
12 | OPTION_SET_INT, | 13 | OPTION_SET_INT, |
13 | OPTION_SET_PTR, | 14 | OPTION_SET_PTR, |
14 | /* options with arguments (usually) */ | 15 | /* options with arguments (usually) */ |
@@ -95,6 +96,7 @@ struct option { | |||
95 | #define OPT_GROUP(h) { .type = OPTION_GROUP, .help = (h) } | 96 | #define OPT_GROUP(h) { .type = OPTION_GROUP, .help = (h) } |
96 | #define OPT_BIT(s, l, v, h, b) { .type = OPTION_BIT, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (b) } | 97 | #define OPT_BIT(s, l, v, h, b) { .type = OPTION_BIT, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (b) } |
97 | #define OPT_BOOLEAN(s, l, v, h) { .type = OPTION_BOOLEAN, .short_name = (s), .long_name = (l), .value = (v), .help = (h) } | 98 | #define OPT_BOOLEAN(s, l, v, h) { .type = OPTION_BOOLEAN, .short_name = (s), .long_name = (l), .value = (v), .help = (h) } |
99 | #define OPT_INCR(s, l, v, h) { .type = OPTION_INCR, .short_name = (s), .long_name = (l), .value = (v), .help = (h) } | ||
98 | #define OPT_SET_INT(s, l, v, h, i) { .type = OPTION_SET_INT, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (i) } | 100 | #define OPT_SET_INT(s, l, v, h, i) { .type = OPTION_SET_INT, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (i) } |
99 | #define OPT_SET_PTR(s, l, v, h, p) { .type = OPTION_SET_PTR, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (p) } | 101 | #define OPT_SET_PTR(s, l, v, h, p) { .type = OPTION_SET_PTR, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (p) } |
100 | #define OPT_INTEGER(s, l, v, h) { .type = OPTION_INTEGER, .short_name = (s), .long_name = (l), .value = (v), .help = (h) } | 102 | #define OPT_INTEGER(s, l, v, h) { .type = OPTION_INTEGER, .short_name = (s), .long_name = (l), .value = (v), .help = (h) } |
diff --git a/tools/perf/util/probe-event.c b/tools/perf/util/probe-event.c index 7c004b6ef24f..914c67095d96 100644 --- a/tools/perf/util/probe-event.c +++ b/tools/perf/util/probe-event.c | |||
@@ -33,20 +33,27 @@ | |||
33 | #include <limits.h> | 33 | #include <limits.h> |
34 | 34 | ||
35 | #undef _GNU_SOURCE | 35 | #undef _GNU_SOURCE |
36 | #include "util.h" | ||
36 | #include "event.h" | 37 | #include "event.h" |
37 | #include "string.h" | 38 | #include "string.h" |
38 | #include "strlist.h" | 39 | #include "strlist.h" |
39 | #include "debug.h" | 40 | #include "debug.h" |
40 | #include "cache.h" | 41 | #include "cache.h" |
41 | #include "color.h" | 42 | #include "color.h" |
42 | #include "parse-events.h" /* For debugfs_path */ | 43 | #include "symbol.h" |
44 | #include "thread.h" | ||
45 | #include "debugfs.h" | ||
46 | #include "trace-event.h" /* For __unused */ | ||
43 | #include "probe-event.h" | 47 | #include "probe-event.h" |
48 | #include "probe-finder.h" | ||
44 | 49 | ||
45 | #define MAX_CMDLEN 256 | 50 | #define MAX_CMDLEN 256 |
46 | #define MAX_PROBE_ARGS 128 | 51 | #define MAX_PROBE_ARGS 128 |
47 | #define PERFPROBE_GROUP "probe" | 52 | #define PERFPROBE_GROUP "probe" |
48 | 53 | ||
49 | #define semantic_error(msg ...) die("Semantic error :" msg) | 54 | bool probe_event_dry_run; /* Dry run flag */ |
55 | |||
56 | #define semantic_error(msg ...) pr_err("Semantic error :" msg) | ||
50 | 57 | ||
51 | /* If there is no space to write, returns -E2BIG. */ | 58 | /* If there is no space to write, returns -E2BIG. */ |
52 | static int e_snprintf(char *str, size_t size, const char *format, ...) | 59 | static int e_snprintf(char *str, size_t size, const char *format, ...) |
@@ -64,7 +71,275 @@ static int e_snprintf(char *str, size_t size, const char *format, ...) | |||
64 | return ret; | 71 | return ret; |
65 | } | 72 | } |
66 | 73 | ||
67 | void parse_line_range_desc(const char *arg, struct line_range *lr) | 74 | static char *synthesize_perf_probe_point(struct perf_probe_point *pp); |
75 | static struct machine machine; | ||
76 | |||
77 | /* Initialize symbol maps and path of vmlinux */ | ||
78 | static int init_vmlinux(void) | ||
79 | { | ||
80 | struct dso *kernel; | ||
81 | int ret; | ||
82 | |||
83 | symbol_conf.sort_by_name = true; | ||
84 | if (symbol_conf.vmlinux_name == NULL) | ||
85 | symbol_conf.try_vmlinux_path = true; | ||
86 | else | ||
87 | pr_debug("Use vmlinux: %s\n", symbol_conf.vmlinux_name); | ||
88 | ret = symbol__init(); | ||
89 | if (ret < 0) { | ||
90 | pr_debug("Failed to init symbol map.\n"); | ||
91 | goto out; | ||
92 | } | ||
93 | |||
94 | ret = machine__init(&machine, "/", 0); | ||
95 | if (ret < 0) | ||
96 | goto out; | ||
97 | |||
98 | kernel = dso__new_kernel(symbol_conf.vmlinux_name); | ||
99 | if (kernel == NULL) | ||
100 | die("Failed to create kernel dso."); | ||
101 | |||
102 | ret = __machine__create_kernel_maps(&machine, kernel); | ||
103 | if (ret < 0) | ||
104 | pr_debug("Failed to create kernel maps.\n"); | ||
105 | |||
106 | out: | ||
107 | if (ret < 0) | ||
108 | pr_warning("Failed to init vmlinux path.\n"); | ||
109 | return ret; | ||
110 | } | ||
111 | |||
112 | #ifdef DWARF_SUPPORT | ||
113 | static int open_vmlinux(void) | ||
114 | { | ||
115 | if (map__load(machine.vmlinux_maps[MAP__FUNCTION], NULL) < 0) { | ||
116 | pr_debug("Failed to load kernel map.\n"); | ||
117 | return -EINVAL; | ||
118 | } | ||
119 | pr_debug("Try to open %s\n", machine.vmlinux_maps[MAP__FUNCTION]->dso->long_name); | ||
120 | return open(machine.vmlinux_maps[MAP__FUNCTION]->dso->long_name, O_RDONLY); | ||
121 | } | ||
122 | |||
123 | /* Convert trace point to probe point with debuginfo */ | ||
124 | static int convert_to_perf_probe_point(struct kprobe_trace_point *tp, | ||
125 | struct perf_probe_point *pp) | ||
126 | { | ||
127 | struct symbol *sym; | ||
128 | int fd, ret = -ENOENT; | ||
129 | |||
130 | sym = map__find_symbol_by_name(machine.vmlinux_maps[MAP__FUNCTION], | ||
131 | tp->symbol, NULL); | ||
132 | if (sym) { | ||
133 | fd = open_vmlinux(); | ||
134 | if (fd >= 0) { | ||
135 | ret = find_perf_probe_point(fd, | ||
136 | sym->start + tp->offset, pp); | ||
137 | close(fd); | ||
138 | } | ||
139 | } | ||
140 | if (ret <= 0) { | ||
141 | pr_debug("Failed to find corresponding probes from " | ||
142 | "debuginfo. Use kprobe event information.\n"); | ||
143 | pp->function = strdup(tp->symbol); | ||
144 | if (pp->function == NULL) | ||
145 | return -ENOMEM; | ||
146 | pp->offset = tp->offset; | ||
147 | } | ||
148 | pp->retprobe = tp->retprobe; | ||
149 | |||
150 | return 0; | ||
151 | } | ||
152 | |||
153 | /* Try to find perf_probe_event with debuginfo */ | ||
154 | static int try_to_find_kprobe_trace_events(struct perf_probe_event *pev, | ||
155 | struct kprobe_trace_event **tevs, | ||
156 | int max_tevs) | ||
157 | { | ||
158 | bool need_dwarf = perf_probe_event_need_dwarf(pev); | ||
159 | int fd, ntevs; | ||
160 | |||
161 | fd = open_vmlinux(); | ||
162 | if (fd < 0) { | ||
163 | if (need_dwarf) { | ||
164 | pr_warning("Failed to open debuginfo file.\n"); | ||
165 | return fd; | ||
166 | } | ||
167 | pr_debug("Could not open vmlinux. Try to use symbols.\n"); | ||
168 | return 0; | ||
169 | } | ||
170 | |||
171 | /* Searching trace events corresponding to probe event */ | ||
172 | ntevs = find_kprobe_trace_events(fd, pev, tevs, max_tevs); | ||
173 | close(fd); | ||
174 | |||
175 | if (ntevs > 0) { /* Succeeded to find trace events */ | ||
176 | pr_debug("find %d kprobe_trace_events.\n", ntevs); | ||
177 | return ntevs; | ||
178 | } | ||
179 | |||
180 | if (ntevs == 0) { /* No error but failed to find probe point. */ | ||
181 | pr_warning("Probe point '%s' not found.\n", | ||
182 | synthesize_perf_probe_point(&pev->point)); | ||
183 | return -ENOENT; | ||
184 | } | ||
185 | /* Error path : ntevs < 0 */ | ||
186 | pr_debug("An error occurred in debuginfo analysis (%d).\n", ntevs); | ||
187 | if (ntevs == -EBADF) { | ||
188 | pr_warning("Warning: No dwarf info found in the vmlinux - " | ||
189 | "please rebuild kernel with CONFIG_DEBUG_INFO=y.\n"); | ||
190 | if (!need_dwarf) { | ||
191 | pr_debug("Trying to use symbols.\nn"); | ||
192 | return 0; | ||
193 | } | ||
194 | } | ||
195 | return ntevs; | ||
196 | } | ||
197 | |||
198 | #define LINEBUF_SIZE 256 | ||
199 | #define NR_ADDITIONAL_LINES 2 | ||
200 | |||
201 | static int show_one_line(FILE *fp, int l, bool skip, bool show_num) | ||
202 | { | ||
203 | char buf[LINEBUF_SIZE]; | ||
204 | const char *color = PERF_COLOR_BLUE; | ||
205 | |||
206 | if (fgets(buf, LINEBUF_SIZE, fp) == NULL) | ||
207 | goto error; | ||
208 | if (!skip) { | ||
209 | if (show_num) | ||
210 | fprintf(stdout, "%7d %s", l, buf); | ||
211 | else | ||
212 | color_fprintf(stdout, color, " %s", buf); | ||
213 | } | ||
214 | |||
215 | while (strlen(buf) == LINEBUF_SIZE - 1 && | ||
216 | buf[LINEBUF_SIZE - 2] != '\n') { | ||
217 | if (fgets(buf, LINEBUF_SIZE, fp) == NULL) | ||
218 | goto error; | ||
219 | if (!skip) { | ||
220 | if (show_num) | ||
221 | fprintf(stdout, "%s", buf); | ||
222 | else | ||
223 | color_fprintf(stdout, color, "%s", buf); | ||
224 | } | ||
225 | } | ||
226 | |||
227 | return 0; | ||
228 | error: | ||
229 | if (feof(fp)) | ||
230 | pr_warning("Source file is shorter than expected.\n"); | ||
231 | else | ||
232 | pr_warning("File read error: %s\n", strerror(errno)); | ||
233 | |||
234 | return -1; | ||
235 | } | ||
236 | |||
237 | /* | ||
238 | * Show line-range always requires debuginfo to find source file and | ||
239 | * line number. | ||
240 | */ | ||
241 | int show_line_range(struct line_range *lr) | ||
242 | { | ||
243 | int l = 1; | ||
244 | struct line_node *ln; | ||
245 | FILE *fp; | ||
246 | int fd, ret; | ||
247 | |||
248 | /* Search a line range */ | ||
249 | ret = init_vmlinux(); | ||
250 | if (ret < 0) | ||
251 | return ret; | ||
252 | |||
253 | fd = open_vmlinux(); | ||
254 | if (fd < 0) { | ||
255 | pr_warning("Failed to open debuginfo file.\n"); | ||
256 | return fd; | ||
257 | } | ||
258 | |||
259 | ret = find_line_range(fd, lr); | ||
260 | close(fd); | ||
261 | if (ret == 0) { | ||
262 | pr_warning("Specified source line is not found.\n"); | ||
263 | return -ENOENT; | ||
264 | } else if (ret < 0) { | ||
265 | pr_warning("Debuginfo analysis failed. (%d)\n", ret); | ||
266 | return ret; | ||
267 | } | ||
268 | |||
269 | setup_pager(); | ||
270 | |||
271 | if (lr->function) | ||
272 | fprintf(stdout, "<%s:%d>\n", lr->function, | ||
273 | lr->start - lr->offset); | ||
274 | else | ||
275 | fprintf(stdout, "<%s:%d>\n", lr->file, lr->start); | ||
276 | |||
277 | fp = fopen(lr->path, "r"); | ||
278 | if (fp == NULL) { | ||
279 | pr_warning("Failed to open %s: %s\n", lr->path, | ||
280 | strerror(errno)); | ||
281 | return -errno; | ||
282 | } | ||
283 | /* Skip to starting line number */ | ||
284 | while (l < lr->start && ret >= 0) | ||
285 | ret = show_one_line(fp, l++, true, false); | ||
286 | if (ret < 0) | ||
287 | goto end; | ||
288 | |||
289 | list_for_each_entry(ln, &lr->line_list, list) { | ||
290 | while (ln->line > l && ret >= 0) | ||
291 | ret = show_one_line(fp, (l++) - lr->offset, | ||
292 | false, false); | ||
293 | if (ret >= 0) | ||
294 | ret = show_one_line(fp, (l++) - lr->offset, | ||
295 | false, true); | ||
296 | if (ret < 0) | ||
297 | goto end; | ||
298 | } | ||
299 | |||
300 | if (lr->end == INT_MAX) | ||
301 | lr->end = l + NR_ADDITIONAL_LINES; | ||
302 | while (l <= lr->end && !feof(fp) && ret >= 0) | ||
303 | ret = show_one_line(fp, (l++) - lr->offset, false, false); | ||
304 | end: | ||
305 | fclose(fp); | ||
306 | return ret; | ||
307 | } | ||
308 | |||
309 | #else /* !DWARF_SUPPORT */ | ||
310 | |||
311 | static int convert_to_perf_probe_point(struct kprobe_trace_point *tp, | ||
312 | struct perf_probe_point *pp) | ||
313 | { | ||
314 | pp->function = strdup(tp->symbol); | ||
315 | if (pp->function == NULL) | ||
316 | return -ENOMEM; | ||
317 | pp->offset = tp->offset; | ||
318 | pp->retprobe = tp->retprobe; | ||
319 | |||
320 | return 0; | ||
321 | } | ||
322 | |||
323 | static int try_to_find_kprobe_trace_events(struct perf_probe_event *pev, | ||
324 | struct kprobe_trace_event **tevs __unused, | ||
325 | int max_tevs __unused) | ||
326 | { | ||
327 | if (perf_probe_event_need_dwarf(pev)) { | ||
328 | pr_warning("Debuginfo-analysis is not supported.\n"); | ||
329 | return -ENOSYS; | ||
330 | } | ||
331 | return 0; | ||
332 | } | ||
333 | |||
334 | int show_line_range(struct line_range *lr __unused) | ||
335 | { | ||
336 | pr_warning("Debuginfo-analysis is not supported.\n"); | ||
337 | return -ENOSYS; | ||
338 | } | ||
339 | |||
340 | #endif | ||
341 | |||
342 | int parse_line_range_desc(const char *arg, struct line_range *lr) | ||
68 | { | 343 | { |
69 | const char *ptr; | 344 | const char *ptr; |
70 | char *tmp; | 345 | char *tmp; |
@@ -75,29 +350,45 @@ void parse_line_range_desc(const char *arg, struct line_range *lr) | |||
75 | */ | 350 | */ |
76 | ptr = strchr(arg, ':'); | 351 | ptr = strchr(arg, ':'); |
77 | if (ptr) { | 352 | if (ptr) { |
78 | lr->start = (unsigned int)strtoul(ptr + 1, &tmp, 0); | 353 | lr->start = (int)strtoul(ptr + 1, &tmp, 0); |
79 | if (*tmp == '+') | 354 | if (*tmp == '+') { |
80 | lr->end = lr->start + (unsigned int)strtoul(tmp + 1, | 355 | lr->end = lr->start + (int)strtoul(tmp + 1, &tmp, 0); |
81 | &tmp, 0); | 356 | lr->end--; /* |
82 | else if (*tmp == '-') | 357 | * Adjust the number of lines here. |
83 | lr->end = (unsigned int)strtoul(tmp + 1, &tmp, 0); | 358 | * If the number of lines == 1, the |
359 | * the end of line should be equal to | ||
360 | * the start of line. | ||
361 | */ | ||
362 | } else if (*tmp == '-') | ||
363 | lr->end = (int)strtoul(tmp + 1, &tmp, 0); | ||
84 | else | 364 | else |
85 | lr->end = 0; | 365 | lr->end = INT_MAX; |
86 | pr_debug("Line range is %u to %u\n", lr->start, lr->end); | 366 | pr_debug("Line range is %d to %d\n", lr->start, lr->end); |
87 | if (lr->end && lr->start > lr->end) | 367 | if (lr->start > lr->end) { |
88 | semantic_error("Start line must be smaller" | 368 | semantic_error("Start line must be smaller" |
89 | " than end line."); | 369 | " than end line.\n"); |
90 | if (*tmp != '\0') | 370 | return -EINVAL; |
91 | semantic_error("Tailing with invalid character '%d'.", | 371 | } |
372 | if (*tmp != '\0') { | ||
373 | semantic_error("Tailing with invalid character '%d'.\n", | ||
92 | *tmp); | 374 | *tmp); |
375 | return -EINVAL; | ||
376 | } | ||
93 | tmp = strndup(arg, (ptr - arg)); | 377 | tmp = strndup(arg, (ptr - arg)); |
94 | } else | 378 | } else { |
95 | tmp = strdup(arg); | 379 | tmp = strdup(arg); |
380 | lr->end = INT_MAX; | ||
381 | } | ||
382 | |||
383 | if (tmp == NULL) | ||
384 | return -ENOMEM; | ||
96 | 385 | ||
97 | if (strchr(tmp, '.')) | 386 | if (strchr(tmp, '.')) |
98 | lr->file = tmp; | 387 | lr->file = tmp; |
99 | else | 388 | else |
100 | lr->function = tmp; | 389 | lr->function = tmp; |
390 | |||
391 | return 0; | ||
101 | } | 392 | } |
102 | 393 | ||
103 | /* Check the name is good for event/group */ | 394 | /* Check the name is good for event/group */ |
@@ -113,8 +404,9 @@ static bool check_event_name(const char *name) | |||
113 | } | 404 | } |
114 | 405 | ||
115 | /* Parse probepoint definition. */ | 406 | /* Parse probepoint definition. */ |
116 | static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp) | 407 | static int parse_perf_probe_point(char *arg, struct perf_probe_event *pev) |
117 | { | 408 | { |
409 | struct perf_probe_point *pp = &pev->point; | ||
118 | char *ptr, *tmp; | 410 | char *ptr, *tmp; |
119 | char c, nc = 0; | 411 | char c, nc = 0; |
120 | /* | 412 | /* |
@@ -129,13 +421,19 @@ static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp) | |||
129 | if (ptr && *ptr == '=') { /* Event name */ | 421 | if (ptr && *ptr == '=') { /* Event name */ |
130 | *ptr = '\0'; | 422 | *ptr = '\0'; |
131 | tmp = ptr + 1; | 423 | tmp = ptr + 1; |
132 | ptr = strchr(arg, ':'); | 424 | if (strchr(arg, ':')) { |
133 | if (ptr) /* Group name is not supported yet. */ | 425 | semantic_error("Group name is not supported yet.\n"); |
134 | semantic_error("Group name is not supported yet."); | 426 | return -ENOTSUP; |
135 | if (!check_event_name(arg)) | 427 | } |
428 | if (!check_event_name(arg)) { | ||
136 | semantic_error("%s is bad for event name -it must " | 429 | semantic_error("%s is bad for event name -it must " |
137 | "follow C symbol-naming rule.", arg); | 430 | "follow C symbol-naming rule.\n", arg); |
138 | pp->event = strdup(arg); | 431 | return -EINVAL; |
432 | } | ||
433 | pev->event = strdup(arg); | ||
434 | if (pev->event == NULL) | ||
435 | return -ENOMEM; | ||
436 | pev->group = NULL; | ||
139 | arg = tmp; | 437 | arg = tmp; |
140 | } | 438 | } |
141 | 439 | ||
@@ -145,12 +443,15 @@ static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp) | |||
145 | *ptr++ = '\0'; | 443 | *ptr++ = '\0'; |
146 | } | 444 | } |
147 | 445 | ||
446 | tmp = strdup(arg); | ||
447 | if (tmp == NULL) | ||
448 | return -ENOMEM; | ||
449 | |||
148 | /* Check arg is function or file and copy it */ | 450 | /* Check arg is function or file and copy it */ |
149 | if (strchr(arg, '.')) /* File */ | 451 | if (strchr(tmp, '.')) /* File */ |
150 | pp->file = strdup(arg); | 452 | pp->file = tmp; |
151 | else /* Function */ | 453 | else /* Function */ |
152 | pp->function = strdup(arg); | 454 | pp->function = tmp; |
153 | DIE_IF(pp->file == NULL && pp->function == NULL); | ||
154 | 455 | ||
155 | /* Parse other options */ | 456 | /* Parse other options */ |
156 | while (ptr) { | 457 | while (ptr) { |
@@ -158,6 +459,8 @@ static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp) | |||
158 | c = nc; | 459 | c = nc; |
159 | if (c == ';') { /* Lazy pattern must be the last part */ | 460 | if (c == ';') { /* Lazy pattern must be the last part */ |
160 | pp->lazy_line = strdup(arg); | 461 | pp->lazy_line = strdup(arg); |
462 | if (pp->lazy_line == NULL) | ||
463 | return -ENOMEM; | ||
161 | break; | 464 | break; |
162 | } | 465 | } |
163 | ptr = strpbrk(arg, ";:+@%"); | 466 | ptr = strpbrk(arg, ";:+@%"); |
@@ -168,266 +471,658 @@ static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp) | |||
168 | switch (c) { | 471 | switch (c) { |
169 | case ':': /* Line number */ | 472 | case ':': /* Line number */ |
170 | pp->line = strtoul(arg, &tmp, 0); | 473 | pp->line = strtoul(arg, &tmp, 0); |
171 | if (*tmp != '\0') | 474 | if (*tmp != '\0') { |
172 | semantic_error("There is non-digit char" | 475 | semantic_error("There is non-digit char" |
173 | " in line number."); | 476 | " in line number.\n"); |
477 | return -EINVAL; | ||
478 | } | ||
174 | break; | 479 | break; |
175 | case '+': /* Byte offset from a symbol */ | 480 | case '+': /* Byte offset from a symbol */ |
176 | pp->offset = strtoul(arg, &tmp, 0); | 481 | pp->offset = strtoul(arg, &tmp, 0); |
177 | if (*tmp != '\0') | 482 | if (*tmp != '\0') { |
178 | semantic_error("There is non-digit character" | 483 | semantic_error("There is non-digit character" |
179 | " in offset."); | 484 | " in offset.\n"); |
485 | return -EINVAL; | ||
486 | } | ||
180 | break; | 487 | break; |
181 | case '@': /* File name */ | 488 | case '@': /* File name */ |
182 | if (pp->file) | 489 | if (pp->file) { |
183 | semantic_error("SRC@SRC is not allowed."); | 490 | semantic_error("SRC@SRC is not allowed.\n"); |
491 | return -EINVAL; | ||
492 | } | ||
184 | pp->file = strdup(arg); | 493 | pp->file = strdup(arg); |
185 | DIE_IF(pp->file == NULL); | 494 | if (pp->file == NULL) |
495 | return -ENOMEM; | ||
186 | break; | 496 | break; |
187 | case '%': /* Probe places */ | 497 | case '%': /* Probe places */ |
188 | if (strcmp(arg, "return") == 0) { | 498 | if (strcmp(arg, "return") == 0) { |
189 | pp->retprobe = 1; | 499 | pp->retprobe = 1; |
190 | } else /* Others not supported yet */ | 500 | } else { /* Others not supported yet */ |
191 | semantic_error("%%%s is not supported.", arg); | 501 | semantic_error("%%%s is not supported.\n", arg); |
502 | return -ENOTSUP; | ||
503 | } | ||
192 | break; | 504 | break; |
193 | default: | 505 | default: /* Buggy case */ |
194 | DIE_IF("Program has a bug."); | 506 | pr_err("This program has a bug at %s:%d.\n", |
507 | __FILE__, __LINE__); | ||
508 | return -ENOTSUP; | ||
195 | break; | 509 | break; |
196 | } | 510 | } |
197 | } | 511 | } |
198 | 512 | ||
199 | /* Exclusion check */ | 513 | /* Exclusion check */ |
200 | if (pp->lazy_line && pp->line) | 514 | if (pp->lazy_line && pp->line) { |
201 | semantic_error("Lazy pattern can't be used with line number."); | 515 | semantic_error("Lazy pattern can't be used with line number."); |
516 | return -EINVAL; | ||
517 | } | ||
202 | 518 | ||
203 | if (pp->lazy_line && pp->offset) | 519 | if (pp->lazy_line && pp->offset) { |
204 | semantic_error("Lazy pattern can't be used with offset."); | 520 | semantic_error("Lazy pattern can't be used with offset."); |
521 | return -EINVAL; | ||
522 | } | ||
205 | 523 | ||
206 | if (pp->line && pp->offset) | 524 | if (pp->line && pp->offset) { |
207 | semantic_error("Offset can't be used with line number."); | 525 | semantic_error("Offset can't be used with line number."); |
526 | return -EINVAL; | ||
527 | } | ||
208 | 528 | ||
209 | if (!pp->line && !pp->lazy_line && pp->file && !pp->function) | 529 | if (!pp->line && !pp->lazy_line && pp->file && !pp->function) { |
210 | semantic_error("File always requires line number or " | 530 | semantic_error("File always requires line number or " |
211 | "lazy pattern."); | 531 | "lazy pattern."); |
532 | return -EINVAL; | ||
533 | } | ||
212 | 534 | ||
213 | if (pp->offset && !pp->function) | 535 | if (pp->offset && !pp->function) { |
214 | semantic_error("Offset requires an entry function."); | 536 | semantic_error("Offset requires an entry function."); |
537 | return -EINVAL; | ||
538 | } | ||
215 | 539 | ||
216 | if (pp->retprobe && !pp->function) | 540 | if (pp->retprobe && !pp->function) { |
217 | semantic_error("Return probe requires an entry function."); | 541 | semantic_error("Return probe requires an entry function."); |
542 | return -EINVAL; | ||
543 | } | ||
218 | 544 | ||
219 | if ((pp->offset || pp->line || pp->lazy_line) && pp->retprobe) | 545 | if ((pp->offset || pp->line || pp->lazy_line) && pp->retprobe) { |
220 | semantic_error("Offset/Line/Lazy pattern can't be used with " | 546 | semantic_error("Offset/Line/Lazy pattern can't be used with " |
221 | "return probe."); | 547 | "return probe."); |
548 | return -EINVAL; | ||
549 | } | ||
222 | 550 | ||
223 | pr_debug("symbol:%s file:%s line:%d offset:%d return:%d lazy:%s\n", | 551 | pr_debug("symbol:%s file:%s line:%d offset:%lu return:%d lazy:%s\n", |
224 | pp->function, pp->file, pp->line, pp->offset, pp->retprobe, | 552 | pp->function, pp->file, pp->line, pp->offset, pp->retprobe, |
225 | pp->lazy_line); | 553 | pp->lazy_line); |
554 | return 0; | ||
226 | } | 555 | } |
227 | 556 | ||
228 | /* Parse perf-probe event definition */ | 557 | /* Parse perf-probe event argument */ |
229 | void parse_perf_probe_event(const char *str, struct probe_point *pp, | 558 | static int parse_perf_probe_arg(char *str, struct perf_probe_arg *arg) |
230 | bool *need_dwarf) | ||
231 | { | 559 | { |
232 | char **argv; | 560 | char *tmp; |
233 | int argc, i; | 561 | struct perf_probe_arg_field **fieldp; |
562 | |||
563 | pr_debug("parsing arg: %s into ", str); | ||
234 | 564 | ||
235 | *need_dwarf = false; | 565 | tmp = strchr(str, '='); |
566 | if (tmp) { | ||
567 | arg->name = strndup(str, tmp - str); | ||
568 | if (arg->name == NULL) | ||
569 | return -ENOMEM; | ||
570 | pr_debug("name:%s ", arg->name); | ||
571 | str = tmp + 1; | ||
572 | } | ||
236 | 573 | ||
237 | argv = argv_split(str, &argc); | 574 | tmp = strchr(str, ':'); |
238 | if (!argv) | 575 | if (tmp) { /* Type setting */ |
239 | die("argv_split failed."); | 576 | *tmp = '\0'; |
240 | if (argc > MAX_PROBE_ARGS + 1) | 577 | arg->type = strdup(tmp + 1); |
241 | semantic_error("Too many arguments"); | 578 | if (arg->type == NULL) |
579 | return -ENOMEM; | ||
580 | pr_debug("type:%s ", arg->type); | ||
581 | } | ||
242 | 582 | ||
583 | tmp = strpbrk(str, "-."); | ||
584 | if (!is_c_varname(str) || !tmp) { | ||
585 | /* A variable, register, symbol or special value */ | ||
586 | arg->var = strdup(str); | ||
587 | if (arg->var == NULL) | ||
588 | return -ENOMEM; | ||
589 | pr_debug("%s\n", arg->var); | ||
590 | return 0; | ||
591 | } | ||
592 | |||
593 | /* Structure fields */ | ||
594 | arg->var = strndup(str, tmp - str); | ||
595 | if (arg->var == NULL) | ||
596 | return -ENOMEM; | ||
597 | pr_debug("%s, ", arg->var); | ||
598 | fieldp = &arg->field; | ||
599 | |||
600 | do { | ||
601 | *fieldp = zalloc(sizeof(struct perf_probe_arg_field)); | ||
602 | if (*fieldp == NULL) | ||
603 | return -ENOMEM; | ||
604 | if (*tmp == '.') { | ||
605 | str = tmp + 1; | ||
606 | (*fieldp)->ref = false; | ||
607 | } else if (tmp[1] == '>') { | ||
608 | str = tmp + 2; | ||
609 | (*fieldp)->ref = true; | ||
610 | } else { | ||
611 | semantic_error("Argument parse error: %s\n", str); | ||
612 | return -EINVAL; | ||
613 | } | ||
614 | |||
615 | tmp = strpbrk(str, "-."); | ||
616 | if (tmp) { | ||
617 | (*fieldp)->name = strndup(str, tmp - str); | ||
618 | if ((*fieldp)->name == NULL) | ||
619 | return -ENOMEM; | ||
620 | pr_debug("%s(%d), ", (*fieldp)->name, (*fieldp)->ref); | ||
621 | fieldp = &(*fieldp)->next; | ||
622 | } | ||
623 | } while (tmp); | ||
624 | (*fieldp)->name = strdup(str); | ||
625 | if ((*fieldp)->name == NULL) | ||
626 | return -ENOMEM; | ||
627 | pr_debug("%s(%d)\n", (*fieldp)->name, (*fieldp)->ref); | ||
628 | |||
629 | /* If no name is specified, set the last field name */ | ||
630 | if (!arg->name) { | ||
631 | arg->name = strdup((*fieldp)->name); | ||
632 | if (arg->name == NULL) | ||
633 | return -ENOMEM; | ||
634 | } | ||
635 | return 0; | ||
636 | } | ||
637 | |||
638 | /* Parse perf-probe event command */ | ||
639 | int parse_perf_probe_command(const char *cmd, struct perf_probe_event *pev) | ||
640 | { | ||
641 | char **argv; | ||
642 | int argc, i, ret = 0; | ||
643 | |||
644 | argv = argv_split(cmd, &argc); | ||
645 | if (!argv) { | ||
646 | pr_debug("Failed to split arguments.\n"); | ||
647 | return -ENOMEM; | ||
648 | } | ||
649 | if (argc - 1 > MAX_PROBE_ARGS) { | ||
650 | semantic_error("Too many probe arguments (%d).\n", argc - 1); | ||
651 | ret = -ERANGE; | ||
652 | goto out; | ||
653 | } | ||
243 | /* Parse probe point */ | 654 | /* Parse probe point */ |
244 | parse_perf_probe_probepoint(argv[0], pp); | 655 | ret = parse_perf_probe_point(argv[0], pev); |
245 | if (pp->file || pp->line || pp->lazy_line) | 656 | if (ret < 0) |
246 | *need_dwarf = true; | 657 | goto out; |
247 | 658 | ||
248 | /* Copy arguments and ensure return probe has no C argument */ | 659 | /* Copy arguments and ensure return probe has no C argument */ |
249 | pp->nr_args = argc - 1; | 660 | pev->nargs = argc - 1; |
250 | pp->args = zalloc(sizeof(char *) * pp->nr_args); | 661 | pev->args = zalloc(sizeof(struct perf_probe_arg) * pev->nargs); |
251 | for (i = 0; i < pp->nr_args; i++) { | 662 | if (pev->args == NULL) { |
252 | pp->args[i] = strdup(argv[i + 1]); | 663 | ret = -ENOMEM; |
253 | if (!pp->args[i]) | 664 | goto out; |
254 | die("Failed to copy argument."); | 665 | } |
255 | if (is_c_varname(pp->args[i])) { | 666 | for (i = 0; i < pev->nargs && ret >= 0; i++) { |
256 | if (pp->retprobe) | 667 | ret = parse_perf_probe_arg(argv[i + 1], &pev->args[i]); |
257 | semantic_error("You can't specify local" | 668 | if (ret >= 0 && |
258 | " variable for kretprobe"); | 669 | is_c_varname(pev->args[i].var) && pev->point.retprobe) { |
259 | *need_dwarf = true; | 670 | semantic_error("You can't specify local variable for" |
671 | " kretprobe.\n"); | ||
672 | ret = -EINVAL; | ||
260 | } | 673 | } |
261 | } | 674 | } |
262 | 675 | out: | |
263 | argv_free(argv); | 676 | argv_free(argv); |
677 | |||
678 | return ret; | ||
679 | } | ||
680 | |||
681 | /* Return true if this perf_probe_event requires debuginfo */ | ||
682 | bool perf_probe_event_need_dwarf(struct perf_probe_event *pev) | ||
683 | { | ||
684 | int i; | ||
685 | |||
686 | if (pev->point.file || pev->point.line || pev->point.lazy_line) | ||
687 | return true; | ||
688 | |||
689 | for (i = 0; i < pev->nargs; i++) | ||
690 | if (is_c_varname(pev->args[i].var)) | ||
691 | return true; | ||
692 | |||
693 | return false; | ||
264 | } | 694 | } |
265 | 695 | ||
266 | /* Parse kprobe_events event into struct probe_point */ | 696 | /* Parse kprobe_events event into struct probe_point */ |
267 | void parse_trace_kprobe_event(const char *str, struct probe_point *pp) | 697 | int parse_kprobe_trace_command(const char *cmd, struct kprobe_trace_event *tev) |
268 | { | 698 | { |
699 | struct kprobe_trace_point *tp = &tev->point; | ||
269 | char pr; | 700 | char pr; |
270 | char *p; | 701 | char *p; |
271 | int ret, i, argc; | 702 | int ret, i, argc; |
272 | char **argv; | 703 | char **argv; |
273 | 704 | ||
274 | pr_debug("Parsing kprobe_events: %s\n", str); | 705 | pr_debug("Parsing kprobe_events: %s\n", cmd); |
275 | argv = argv_split(str, &argc); | 706 | argv = argv_split(cmd, &argc); |
276 | if (!argv) | 707 | if (!argv) { |
277 | die("argv_split failed."); | 708 | pr_debug("Failed to split arguments.\n"); |
278 | if (argc < 2) | 709 | return -ENOMEM; |
279 | semantic_error("Too less arguments."); | 710 | } |
711 | if (argc < 2) { | ||
712 | semantic_error("Too few probe arguments.\n"); | ||
713 | ret = -ERANGE; | ||
714 | goto out; | ||
715 | } | ||
280 | 716 | ||
281 | /* Scan event and group name. */ | 717 | /* Scan event and group name. */ |
282 | ret = sscanf(argv[0], "%c:%a[^/ \t]/%a[^ \t]", | 718 | ret = sscanf(argv[0], "%c:%a[^/ \t]/%a[^ \t]", |
283 | &pr, (float *)(void *)&pp->group, | 719 | &pr, (float *)(void *)&tev->group, |
284 | (float *)(void *)&pp->event); | 720 | (float *)(void *)&tev->event); |
285 | if (ret != 3) | 721 | if (ret != 3) { |
286 | semantic_error("Failed to parse event name: %s", argv[0]); | 722 | semantic_error("Failed to parse event name: %s\n", argv[0]); |
287 | pr_debug("Group:%s Event:%s probe:%c\n", pp->group, pp->event, pr); | 723 | ret = -EINVAL; |
724 | goto out; | ||
725 | } | ||
726 | pr_debug("Group:%s Event:%s probe:%c\n", tev->group, tev->event, pr); | ||
288 | 727 | ||
289 | pp->retprobe = (pr == 'r'); | 728 | tp->retprobe = (pr == 'r'); |
290 | 729 | ||
291 | /* Scan function name and offset */ | 730 | /* Scan function name and offset */ |
292 | ret = sscanf(argv[1], "%a[^+]+%d", (float *)(void *)&pp->function, | 731 | ret = sscanf(argv[1], "%a[^+]+%lu", (float *)(void *)&tp->symbol, |
293 | &pp->offset); | 732 | &tp->offset); |
294 | if (ret == 1) | 733 | if (ret == 1) |
295 | pp->offset = 0; | 734 | tp->offset = 0; |
296 | |||
297 | /* kprobe_events doesn't have this information */ | ||
298 | pp->line = 0; | ||
299 | pp->file = NULL; | ||
300 | 735 | ||
301 | pp->nr_args = argc - 2; | 736 | tev->nargs = argc - 2; |
302 | pp->args = zalloc(sizeof(char *) * pp->nr_args); | 737 | tev->args = zalloc(sizeof(struct kprobe_trace_arg) * tev->nargs); |
303 | for (i = 0; i < pp->nr_args; i++) { | 738 | if (tev->args == NULL) { |
739 | ret = -ENOMEM; | ||
740 | goto out; | ||
741 | } | ||
742 | for (i = 0; i < tev->nargs; i++) { | ||
304 | p = strchr(argv[i + 2], '='); | 743 | p = strchr(argv[i + 2], '='); |
305 | if (p) /* We don't need which register is assigned. */ | 744 | if (p) /* We don't need which register is assigned. */ |
306 | *p = '\0'; | 745 | *p++ = '\0'; |
307 | pp->args[i] = strdup(argv[i + 2]); | 746 | else |
308 | if (!pp->args[i]) | 747 | p = argv[i + 2]; |
309 | die("Failed to copy argument."); | 748 | tev->args[i].name = strdup(argv[i + 2]); |
749 | /* TODO: parse regs and offset */ | ||
750 | tev->args[i].value = strdup(p); | ||
751 | if (tev->args[i].name == NULL || tev->args[i].value == NULL) { | ||
752 | ret = -ENOMEM; | ||
753 | goto out; | ||
754 | } | ||
310 | } | 755 | } |
311 | 756 | ret = 0; | |
757 | out: | ||
312 | argv_free(argv); | 758 | argv_free(argv); |
759 | return ret; | ||
313 | } | 760 | } |
314 | 761 | ||
315 | /* Synthesize only probe point (not argument) */ | 762 | /* Compose only probe arg */ |
316 | int synthesize_perf_probe_point(struct probe_point *pp) | 763 | int synthesize_perf_probe_arg(struct perf_probe_arg *pa, char *buf, size_t len) |
317 | { | 764 | { |
318 | char *buf; | 765 | struct perf_probe_arg_field *field = pa->field; |
319 | char offs[64] = "", line[64] = ""; | ||
320 | int ret; | 766 | int ret; |
767 | char *tmp = buf; | ||
321 | 768 | ||
322 | pp->probes[0] = buf = zalloc(MAX_CMDLEN); | 769 | if (pa->name && pa->var) |
323 | pp->found = 1; | 770 | ret = e_snprintf(tmp, len, "%s=%s", pa->name, pa->var); |
324 | if (!buf) | 771 | else |
325 | die("Failed to allocate memory by zalloc."); | 772 | ret = e_snprintf(tmp, len, "%s", pa->name ? pa->name : pa->var); |
773 | if (ret <= 0) | ||
774 | goto error; | ||
775 | tmp += ret; | ||
776 | len -= ret; | ||
777 | |||
778 | while (field) { | ||
779 | ret = e_snprintf(tmp, len, "%s%s", field->ref ? "->" : ".", | ||
780 | field->name); | ||
781 | if (ret <= 0) | ||
782 | goto error; | ||
783 | tmp += ret; | ||
784 | len -= ret; | ||
785 | field = field->next; | ||
786 | } | ||
787 | |||
788 | if (pa->type) { | ||
789 | ret = e_snprintf(tmp, len, ":%s", pa->type); | ||
790 | if (ret <= 0) | ||
791 | goto error; | ||
792 | tmp += ret; | ||
793 | len -= ret; | ||
794 | } | ||
795 | |||
796 | return tmp - buf; | ||
797 | error: | ||
798 | pr_debug("Failed to synthesize perf probe argument: %s", | ||
799 | strerror(-ret)); | ||
800 | return ret; | ||
801 | } | ||
802 | |||
803 | /* Compose only probe point (not argument) */ | ||
804 | static char *synthesize_perf_probe_point(struct perf_probe_point *pp) | ||
805 | { | ||
806 | char *buf, *tmp; | ||
807 | char offs[32] = "", line[32] = "", file[32] = ""; | ||
808 | int ret, len; | ||
809 | |||
810 | buf = zalloc(MAX_CMDLEN); | ||
811 | if (buf == NULL) { | ||
812 | ret = -ENOMEM; | ||
813 | goto error; | ||
814 | } | ||
326 | if (pp->offset) { | 815 | if (pp->offset) { |
327 | ret = e_snprintf(offs, 64, "+%d", pp->offset); | 816 | ret = e_snprintf(offs, 32, "+%lu", pp->offset); |
328 | if (ret <= 0) | 817 | if (ret <= 0) |
329 | goto error; | 818 | goto error; |
330 | } | 819 | } |
331 | if (pp->line) { | 820 | if (pp->line) { |
332 | ret = e_snprintf(line, 64, ":%d", pp->line); | 821 | ret = e_snprintf(line, 32, ":%d", pp->line); |
822 | if (ret <= 0) | ||
823 | goto error; | ||
824 | } | ||
825 | if (pp->file) { | ||
826 | len = strlen(pp->file) - 31; | ||
827 | if (len < 0) | ||
828 | len = 0; | ||
829 | tmp = strchr(pp->file + len, '/'); | ||
830 | if (!tmp) | ||
831 | tmp = pp->file + len; | ||
832 | ret = e_snprintf(file, 32, "@%s", tmp + 1); | ||
333 | if (ret <= 0) | 833 | if (ret <= 0) |
334 | goto error; | 834 | goto error; |
335 | } | 835 | } |
336 | 836 | ||
337 | if (pp->function) | 837 | if (pp->function) |
338 | ret = e_snprintf(buf, MAX_CMDLEN, "%s%s%s%s", pp->function, | 838 | ret = e_snprintf(buf, MAX_CMDLEN, "%s%s%s%s%s", pp->function, |
339 | offs, pp->retprobe ? "%return" : "", line); | 839 | offs, pp->retprobe ? "%return" : "", line, |
840 | file); | ||
340 | else | 841 | else |
341 | ret = e_snprintf(buf, MAX_CMDLEN, "%s%s", pp->file, line); | 842 | ret = e_snprintf(buf, MAX_CMDLEN, "%s%s", file, line); |
342 | if (ret <= 0) { | 843 | if (ret <= 0) |
844 | goto error; | ||
845 | |||
846 | return buf; | ||
343 | error: | 847 | error: |
344 | free(pp->probes[0]); | 848 | pr_debug("Failed to synthesize perf probe point: %s", |
345 | pp->probes[0] = NULL; | 849 | strerror(-ret)); |
346 | pp->found = 0; | 850 | if (buf) |
347 | } | 851 | free(buf); |
348 | return ret; | 852 | return NULL; |
349 | } | 853 | } |
350 | 854 | ||
351 | int synthesize_perf_probe_event(struct probe_point *pp) | 855 | #if 0 |
856 | char *synthesize_perf_probe_command(struct perf_probe_event *pev) | ||
352 | { | 857 | { |
353 | char *buf; | 858 | char *buf; |
354 | int i, len, ret; | 859 | int i, len, ret; |
355 | 860 | ||
356 | len = synthesize_perf_probe_point(pp); | 861 | buf = synthesize_perf_probe_point(&pev->point); |
357 | if (len < 0) | 862 | if (!buf) |
358 | return 0; | 863 | return NULL; |
359 | 864 | ||
360 | buf = pp->probes[0]; | 865 | len = strlen(buf); |
361 | for (i = 0; i < pp->nr_args; i++) { | 866 | for (i = 0; i < pev->nargs; i++) { |
362 | ret = e_snprintf(&buf[len], MAX_CMDLEN - len, " %s", | 867 | ret = e_snprintf(&buf[len], MAX_CMDLEN - len, " %s", |
363 | pp->args[i]); | 868 | pev->args[i].name); |
364 | if (ret <= 0) | 869 | if (ret <= 0) { |
365 | goto error; | 870 | free(buf); |
871 | return NULL; | ||
872 | } | ||
366 | len += ret; | 873 | len += ret; |
367 | } | 874 | } |
368 | pp->found = 1; | ||
369 | 875 | ||
370 | return pp->found; | 876 | return buf; |
371 | error: | 877 | } |
372 | free(pp->probes[0]); | 878 | #endif |
373 | pp->probes[0] = NULL; | 879 | |
880 | static int __synthesize_kprobe_trace_arg_ref(struct kprobe_trace_arg_ref *ref, | ||
881 | char **buf, size_t *buflen, | ||
882 | int depth) | ||
883 | { | ||
884 | int ret; | ||
885 | if (ref->next) { | ||
886 | depth = __synthesize_kprobe_trace_arg_ref(ref->next, buf, | ||
887 | buflen, depth + 1); | ||
888 | if (depth < 0) | ||
889 | goto out; | ||
890 | } | ||
891 | |||
892 | ret = e_snprintf(*buf, *buflen, "%+ld(", ref->offset); | ||
893 | if (ret < 0) | ||
894 | depth = ret; | ||
895 | else { | ||
896 | *buf += ret; | ||
897 | *buflen -= ret; | ||
898 | } | ||
899 | out: | ||
900 | return depth; | ||
374 | 901 | ||
375 | return ret; | ||
376 | } | 902 | } |
377 | 903 | ||
378 | int synthesize_trace_kprobe_event(struct probe_point *pp) | 904 | static int synthesize_kprobe_trace_arg(struct kprobe_trace_arg *arg, |
905 | char *buf, size_t buflen) | ||
379 | { | 906 | { |
907 | int ret, depth = 0; | ||
908 | char *tmp = buf; | ||
909 | |||
910 | /* Argument name or separator */ | ||
911 | if (arg->name) | ||
912 | ret = e_snprintf(buf, buflen, " %s=", arg->name); | ||
913 | else | ||
914 | ret = e_snprintf(buf, buflen, " "); | ||
915 | if (ret < 0) | ||
916 | return ret; | ||
917 | buf += ret; | ||
918 | buflen -= ret; | ||
919 | |||
920 | /* Dereferencing arguments */ | ||
921 | if (arg->ref) { | ||
922 | depth = __synthesize_kprobe_trace_arg_ref(arg->ref, &buf, | ||
923 | &buflen, 1); | ||
924 | if (depth < 0) | ||
925 | return depth; | ||
926 | } | ||
927 | |||
928 | /* Print argument value */ | ||
929 | ret = e_snprintf(buf, buflen, "%s", arg->value); | ||
930 | if (ret < 0) | ||
931 | return ret; | ||
932 | buf += ret; | ||
933 | buflen -= ret; | ||
934 | |||
935 | /* Closing */ | ||
936 | while (depth--) { | ||
937 | ret = e_snprintf(buf, buflen, ")"); | ||
938 | if (ret < 0) | ||
939 | return ret; | ||
940 | buf += ret; | ||
941 | buflen -= ret; | ||
942 | } | ||
943 | /* Print argument type */ | ||
944 | if (arg->type) { | ||
945 | ret = e_snprintf(buf, buflen, ":%s", arg->type); | ||
946 | if (ret <= 0) | ||
947 | return ret; | ||
948 | buf += ret; | ||
949 | } | ||
950 | |||
951 | return buf - tmp; | ||
952 | } | ||
953 | |||
954 | char *synthesize_kprobe_trace_command(struct kprobe_trace_event *tev) | ||
955 | { | ||
956 | struct kprobe_trace_point *tp = &tev->point; | ||
380 | char *buf; | 957 | char *buf; |
381 | int i, len, ret; | 958 | int i, len, ret; |
382 | 959 | ||
383 | pp->probes[0] = buf = zalloc(MAX_CMDLEN); | 960 | buf = zalloc(MAX_CMDLEN); |
384 | if (!buf) | 961 | if (buf == NULL) |
385 | die("Failed to allocate memory by zalloc."); | 962 | return NULL; |
386 | ret = e_snprintf(buf, MAX_CMDLEN, "%s+%d", pp->function, pp->offset); | 963 | |
387 | if (ret <= 0) | 964 | len = e_snprintf(buf, MAX_CMDLEN, "%c:%s/%s %s+%lu", |
965 | tp->retprobe ? 'r' : 'p', | ||
966 | tev->group, tev->event, | ||
967 | tp->symbol, tp->offset); | ||
968 | if (len <= 0) | ||
388 | goto error; | 969 | goto error; |
389 | len = ret; | ||
390 | 970 | ||
391 | for (i = 0; i < pp->nr_args; i++) { | 971 | for (i = 0; i < tev->nargs; i++) { |
392 | ret = e_snprintf(&buf[len], MAX_CMDLEN - len, " %s", | 972 | ret = synthesize_kprobe_trace_arg(&tev->args[i], buf + len, |
393 | pp->args[i]); | 973 | MAX_CMDLEN - len); |
394 | if (ret <= 0) | 974 | if (ret <= 0) |
395 | goto error; | 975 | goto error; |
396 | len += ret; | 976 | len += ret; |
397 | } | 977 | } |
398 | pp->found = 1; | ||
399 | 978 | ||
400 | return pp->found; | 979 | return buf; |
401 | error: | 980 | error: |
402 | free(pp->probes[0]); | 981 | free(buf); |
403 | pp->probes[0] = NULL; | 982 | return NULL; |
983 | } | ||
984 | |||
985 | int convert_to_perf_probe_event(struct kprobe_trace_event *tev, | ||
986 | struct perf_probe_event *pev) | ||
987 | { | ||
988 | char buf[64] = ""; | ||
989 | int i, ret; | ||
990 | |||
991 | /* Convert event/group name */ | ||
992 | pev->event = strdup(tev->event); | ||
993 | pev->group = strdup(tev->group); | ||
994 | if (pev->event == NULL || pev->group == NULL) | ||
995 | return -ENOMEM; | ||
996 | |||
997 | /* Convert trace_point to probe_point */ | ||
998 | ret = convert_to_perf_probe_point(&tev->point, &pev->point); | ||
999 | if (ret < 0) | ||
1000 | return ret; | ||
1001 | |||
1002 | /* Convert trace_arg to probe_arg */ | ||
1003 | pev->nargs = tev->nargs; | ||
1004 | pev->args = zalloc(sizeof(struct perf_probe_arg) * pev->nargs); | ||
1005 | if (pev->args == NULL) | ||
1006 | return -ENOMEM; | ||
1007 | for (i = 0; i < tev->nargs && ret >= 0; i++) { | ||
1008 | if (tev->args[i].name) | ||
1009 | pev->args[i].name = strdup(tev->args[i].name); | ||
1010 | else { | ||
1011 | ret = synthesize_kprobe_trace_arg(&tev->args[i], | ||
1012 | buf, 64); | ||
1013 | pev->args[i].name = strdup(buf); | ||
1014 | } | ||
1015 | if (pev->args[i].name == NULL && ret >= 0) | ||
1016 | ret = -ENOMEM; | ||
1017 | } | ||
1018 | |||
1019 | if (ret < 0) | ||
1020 | clear_perf_probe_event(pev); | ||
404 | 1021 | ||
405 | return ret; | 1022 | return ret; |
406 | } | 1023 | } |
407 | 1024 | ||
408 | static int open_kprobe_events(int flags, int mode) | 1025 | void clear_perf_probe_event(struct perf_probe_event *pev) |
1026 | { | ||
1027 | struct perf_probe_point *pp = &pev->point; | ||
1028 | struct perf_probe_arg_field *field, *next; | ||
1029 | int i; | ||
1030 | |||
1031 | if (pev->event) | ||
1032 | free(pev->event); | ||
1033 | if (pev->group) | ||
1034 | free(pev->group); | ||
1035 | if (pp->file) | ||
1036 | free(pp->file); | ||
1037 | if (pp->function) | ||
1038 | free(pp->function); | ||
1039 | if (pp->lazy_line) | ||
1040 | free(pp->lazy_line); | ||
1041 | for (i = 0; i < pev->nargs; i++) { | ||
1042 | if (pev->args[i].name) | ||
1043 | free(pev->args[i].name); | ||
1044 | if (pev->args[i].var) | ||
1045 | free(pev->args[i].var); | ||
1046 | if (pev->args[i].type) | ||
1047 | free(pev->args[i].type); | ||
1048 | field = pev->args[i].field; | ||
1049 | while (field) { | ||
1050 | next = field->next; | ||
1051 | if (field->name) | ||
1052 | free(field->name); | ||
1053 | free(field); | ||
1054 | field = next; | ||
1055 | } | ||
1056 | } | ||
1057 | if (pev->args) | ||
1058 | free(pev->args); | ||
1059 | memset(pev, 0, sizeof(*pev)); | ||
1060 | } | ||
1061 | |||
1062 | void clear_kprobe_trace_event(struct kprobe_trace_event *tev) | ||
1063 | { | ||
1064 | struct kprobe_trace_arg_ref *ref, *next; | ||
1065 | int i; | ||
1066 | |||
1067 | if (tev->event) | ||
1068 | free(tev->event); | ||
1069 | if (tev->group) | ||
1070 | free(tev->group); | ||
1071 | if (tev->point.symbol) | ||
1072 | free(tev->point.symbol); | ||
1073 | for (i = 0; i < tev->nargs; i++) { | ||
1074 | if (tev->args[i].name) | ||
1075 | free(tev->args[i].name); | ||
1076 | if (tev->args[i].value) | ||
1077 | free(tev->args[i].value); | ||
1078 | if (tev->args[i].type) | ||
1079 | free(tev->args[i].type); | ||
1080 | ref = tev->args[i].ref; | ||
1081 | while (ref) { | ||
1082 | next = ref->next; | ||
1083 | free(ref); | ||
1084 | ref = next; | ||
1085 | } | ||
1086 | } | ||
1087 | if (tev->args) | ||
1088 | free(tev->args); | ||
1089 | memset(tev, 0, sizeof(*tev)); | ||
1090 | } | ||
1091 | |||
1092 | static int open_kprobe_events(bool readwrite) | ||
409 | { | 1093 | { |
410 | char buf[PATH_MAX]; | 1094 | char buf[PATH_MAX]; |
1095 | const char *__debugfs; | ||
411 | int ret; | 1096 | int ret; |
412 | 1097 | ||
413 | ret = e_snprintf(buf, PATH_MAX, "%s/../kprobe_events", debugfs_path); | 1098 | __debugfs = debugfs_find_mountpoint(); |
414 | if (ret < 0) | 1099 | if (__debugfs == NULL) { |
415 | die("Failed to make kprobe_events path."); | 1100 | pr_warning("Debugfs is not mounted.\n"); |
1101 | return -ENOENT; | ||
1102 | } | ||
1103 | |||
1104 | ret = e_snprintf(buf, PATH_MAX, "%stracing/kprobe_events", __debugfs); | ||
1105 | if (ret >= 0) { | ||
1106 | pr_debug("Opening %s write=%d\n", buf, readwrite); | ||
1107 | if (readwrite && !probe_event_dry_run) | ||
1108 | ret = open(buf, O_RDWR, O_APPEND); | ||
1109 | else | ||
1110 | ret = open(buf, O_RDONLY, 0); | ||
1111 | } | ||
416 | 1112 | ||
417 | ret = open(buf, flags, mode); | ||
418 | if (ret < 0) { | 1113 | if (ret < 0) { |
419 | if (errno == ENOENT) | 1114 | if (errno == ENOENT) |
420 | die("kprobe_events file does not exist -" | 1115 | pr_warning("kprobe_events file does not exist - please" |
421 | " please rebuild with CONFIG_KPROBE_EVENT."); | 1116 | " rebuild kernel with CONFIG_KPROBE_EVENT.\n"); |
422 | else | 1117 | else |
423 | die("Could not open kprobe_events file: %s", | 1118 | pr_warning("Failed to open kprobe_events file: %s\n", |
424 | strerror(errno)); | 1119 | strerror(errno)); |
425 | } | 1120 | } |
426 | return ret; | 1121 | return ret; |
427 | } | 1122 | } |
428 | 1123 | ||
429 | /* Get raw string list of current kprobe_events */ | 1124 | /* Get raw string list of current kprobe_events */ |
430 | static struct strlist *get_trace_kprobe_event_rawlist(int fd) | 1125 | static struct strlist *get_kprobe_trace_command_rawlist(int fd) |
431 | { | 1126 | { |
432 | int ret, idx; | 1127 | int ret, idx; |
433 | FILE *fp; | 1128 | FILE *fp; |
@@ -447,271 +1142,486 @@ static struct strlist *get_trace_kprobe_event_rawlist(int fd) | |||
447 | if (p[idx] == '\n') | 1142 | if (p[idx] == '\n') |
448 | p[idx] = '\0'; | 1143 | p[idx] = '\0'; |
449 | ret = strlist__add(sl, buf); | 1144 | ret = strlist__add(sl, buf); |
450 | if (ret < 0) | 1145 | if (ret < 0) { |
451 | die("strlist__add failed: %s", strerror(-ret)); | 1146 | pr_debug("strlist__add failed: %s\n", strerror(-ret)); |
1147 | strlist__delete(sl); | ||
1148 | return NULL; | ||
1149 | } | ||
452 | } | 1150 | } |
453 | fclose(fp); | 1151 | fclose(fp); |
454 | 1152 | ||
455 | return sl; | 1153 | return sl; |
456 | } | 1154 | } |
457 | 1155 | ||
458 | /* Free and zero clear probe_point */ | ||
459 | static void clear_probe_point(struct probe_point *pp) | ||
460 | { | ||
461 | int i; | ||
462 | |||
463 | if (pp->event) | ||
464 | free(pp->event); | ||
465 | if (pp->group) | ||
466 | free(pp->group); | ||
467 | if (pp->function) | ||
468 | free(pp->function); | ||
469 | if (pp->file) | ||
470 | free(pp->file); | ||
471 | if (pp->lazy_line) | ||
472 | free(pp->lazy_line); | ||
473 | for (i = 0; i < pp->nr_args; i++) | ||
474 | free(pp->args[i]); | ||
475 | if (pp->args) | ||
476 | free(pp->args); | ||
477 | for (i = 0; i < pp->found; i++) | ||
478 | free(pp->probes[i]); | ||
479 | memset(pp, 0, sizeof(*pp)); | ||
480 | } | ||
481 | |||
482 | /* Show an event */ | 1156 | /* Show an event */ |
483 | static void show_perf_probe_event(const char *event, const char *place, | 1157 | static int show_perf_probe_event(struct perf_probe_event *pev) |
484 | struct probe_point *pp) | ||
485 | { | 1158 | { |
486 | int i, ret; | 1159 | int i, ret; |
487 | char buf[128]; | 1160 | char buf[128]; |
1161 | char *place; | ||
1162 | |||
1163 | /* Synthesize only event probe point */ | ||
1164 | place = synthesize_perf_probe_point(&pev->point); | ||
1165 | if (!place) | ||
1166 | return -EINVAL; | ||
488 | 1167 | ||
489 | ret = e_snprintf(buf, 128, "%s:%s", pp->group, event); | 1168 | ret = e_snprintf(buf, 128, "%s:%s", pev->group, pev->event); |
490 | if (ret < 0) | 1169 | if (ret < 0) |
491 | die("Failed to copy event: %s", strerror(-ret)); | 1170 | return ret; |
492 | printf(" %-40s (on %s", buf, place); | 1171 | |
1172 | printf(" %-20s (on %s", buf, place); | ||
493 | 1173 | ||
494 | if (pp->nr_args > 0) { | 1174 | if (pev->nargs > 0) { |
495 | printf(" with"); | 1175 | printf(" with"); |
496 | for (i = 0; i < pp->nr_args; i++) | 1176 | for (i = 0; i < pev->nargs; i++) { |
497 | printf(" %s", pp->args[i]); | 1177 | ret = synthesize_perf_probe_arg(&pev->args[i], |
1178 | buf, 128); | ||
1179 | if (ret < 0) | ||
1180 | break; | ||
1181 | printf(" %s", buf); | ||
1182 | } | ||
498 | } | 1183 | } |
499 | printf(")\n"); | 1184 | printf(")\n"); |
1185 | free(place); | ||
1186 | return ret; | ||
500 | } | 1187 | } |
501 | 1188 | ||
502 | /* List up current perf-probe events */ | 1189 | /* List up current perf-probe events */ |
503 | void show_perf_probe_events(void) | 1190 | int show_perf_probe_events(void) |
504 | { | 1191 | { |
505 | int fd; | 1192 | int fd, ret; |
506 | struct probe_point pp; | 1193 | struct kprobe_trace_event tev; |
1194 | struct perf_probe_event pev; | ||
507 | struct strlist *rawlist; | 1195 | struct strlist *rawlist; |
508 | struct str_node *ent; | 1196 | struct str_node *ent; |
509 | 1197 | ||
510 | setup_pager(); | 1198 | setup_pager(); |
511 | memset(&pp, 0, sizeof(pp)); | 1199 | ret = init_vmlinux(); |
1200 | if (ret < 0) | ||
1201 | return ret; | ||
1202 | |||
1203 | memset(&tev, 0, sizeof(tev)); | ||
1204 | memset(&pev, 0, sizeof(pev)); | ||
512 | 1205 | ||
513 | fd = open_kprobe_events(O_RDONLY, 0); | 1206 | fd = open_kprobe_events(false); |
514 | rawlist = get_trace_kprobe_event_rawlist(fd); | 1207 | if (fd < 0) |
1208 | return fd; | ||
1209 | |||
1210 | rawlist = get_kprobe_trace_command_rawlist(fd); | ||
515 | close(fd); | 1211 | close(fd); |
1212 | if (!rawlist) | ||
1213 | return -ENOENT; | ||
516 | 1214 | ||
517 | strlist__for_each(ent, rawlist) { | 1215 | strlist__for_each(ent, rawlist) { |
518 | parse_trace_kprobe_event(ent->s, &pp); | 1216 | ret = parse_kprobe_trace_command(ent->s, &tev); |
519 | /* Synthesize only event probe point */ | 1217 | if (ret >= 0) { |
520 | synthesize_perf_probe_point(&pp); | 1218 | ret = convert_to_perf_probe_event(&tev, &pev); |
521 | /* Show an event */ | 1219 | if (ret >= 0) |
522 | show_perf_probe_event(pp.event, pp.probes[0], &pp); | 1220 | ret = show_perf_probe_event(&pev); |
523 | clear_probe_point(&pp); | 1221 | } |
1222 | clear_perf_probe_event(&pev); | ||
1223 | clear_kprobe_trace_event(&tev); | ||
1224 | if (ret < 0) | ||
1225 | break; | ||
524 | } | 1226 | } |
525 | |||
526 | strlist__delete(rawlist); | 1227 | strlist__delete(rawlist); |
1228 | |||
1229 | return ret; | ||
527 | } | 1230 | } |
528 | 1231 | ||
529 | /* Get current perf-probe event names */ | 1232 | /* Get current perf-probe event names */ |
530 | static struct strlist *get_perf_event_names(int fd, bool include_group) | 1233 | static struct strlist *get_kprobe_trace_event_names(int fd, bool include_group) |
531 | { | 1234 | { |
532 | char buf[128]; | 1235 | char buf[128]; |
533 | struct strlist *sl, *rawlist; | 1236 | struct strlist *sl, *rawlist; |
534 | struct str_node *ent; | 1237 | struct str_node *ent; |
535 | struct probe_point pp; | 1238 | struct kprobe_trace_event tev; |
1239 | int ret = 0; | ||
536 | 1240 | ||
537 | memset(&pp, 0, sizeof(pp)); | 1241 | memset(&tev, 0, sizeof(tev)); |
538 | rawlist = get_trace_kprobe_event_rawlist(fd); | ||
539 | 1242 | ||
1243 | rawlist = get_kprobe_trace_command_rawlist(fd); | ||
540 | sl = strlist__new(true, NULL); | 1244 | sl = strlist__new(true, NULL); |
541 | strlist__for_each(ent, rawlist) { | 1245 | strlist__for_each(ent, rawlist) { |
542 | parse_trace_kprobe_event(ent->s, &pp); | 1246 | ret = parse_kprobe_trace_command(ent->s, &tev); |
1247 | if (ret < 0) | ||
1248 | break; | ||
543 | if (include_group) { | 1249 | if (include_group) { |
544 | if (e_snprintf(buf, 128, "%s:%s", pp.group, | 1250 | ret = e_snprintf(buf, 128, "%s:%s", tev.group, |
545 | pp.event) < 0) | 1251 | tev.event); |
546 | die("Failed to copy group:event name."); | 1252 | if (ret >= 0) |
547 | strlist__add(sl, buf); | 1253 | ret = strlist__add(sl, buf); |
548 | } else | 1254 | } else |
549 | strlist__add(sl, pp.event); | 1255 | ret = strlist__add(sl, tev.event); |
550 | clear_probe_point(&pp); | 1256 | clear_kprobe_trace_event(&tev); |
1257 | if (ret < 0) | ||
1258 | break; | ||
551 | } | 1259 | } |
552 | |||
553 | strlist__delete(rawlist); | 1260 | strlist__delete(rawlist); |
554 | 1261 | ||
1262 | if (ret < 0) { | ||
1263 | strlist__delete(sl); | ||
1264 | return NULL; | ||
1265 | } | ||
555 | return sl; | 1266 | return sl; |
556 | } | 1267 | } |
557 | 1268 | ||
558 | static void write_trace_kprobe_event(int fd, const char *buf) | 1269 | static int write_kprobe_trace_event(int fd, struct kprobe_trace_event *tev) |
559 | { | 1270 | { |
560 | int ret; | 1271 | int ret = 0; |
1272 | char *buf = synthesize_kprobe_trace_command(tev); | ||
1273 | |||
1274 | if (!buf) { | ||
1275 | pr_debug("Failed to synthesize kprobe trace event.\n"); | ||
1276 | return -EINVAL; | ||
1277 | } | ||
561 | 1278 | ||
562 | pr_debug("Writing event: %s\n", buf); | 1279 | pr_debug("Writing event: %s\n", buf); |
563 | ret = write(fd, buf, strlen(buf)); | 1280 | if (!probe_event_dry_run) { |
564 | if (ret <= 0) | 1281 | ret = write(fd, buf, strlen(buf)); |
565 | die("Failed to write event: %s", strerror(errno)); | 1282 | if (ret <= 0) |
1283 | pr_warning("Failed to write event: %s\n", | ||
1284 | strerror(errno)); | ||
1285 | } | ||
1286 | free(buf); | ||
1287 | return ret; | ||
566 | } | 1288 | } |
567 | 1289 | ||
568 | static void get_new_event_name(char *buf, size_t len, const char *base, | 1290 | static int get_new_event_name(char *buf, size_t len, const char *base, |
569 | struct strlist *namelist, bool allow_suffix) | 1291 | struct strlist *namelist, bool allow_suffix) |
570 | { | 1292 | { |
571 | int i, ret; | 1293 | int i, ret; |
572 | 1294 | ||
573 | /* Try no suffix */ | 1295 | /* Try no suffix */ |
574 | ret = e_snprintf(buf, len, "%s", base); | 1296 | ret = e_snprintf(buf, len, "%s", base); |
575 | if (ret < 0) | 1297 | if (ret < 0) { |
576 | die("snprintf() failed: %s", strerror(-ret)); | 1298 | pr_debug("snprintf() failed: %s\n", strerror(-ret)); |
1299 | return ret; | ||
1300 | } | ||
577 | if (!strlist__has_entry(namelist, buf)) | 1301 | if (!strlist__has_entry(namelist, buf)) |
578 | return; | 1302 | return 0; |
579 | 1303 | ||
580 | if (!allow_suffix) { | 1304 | if (!allow_suffix) { |
581 | pr_warning("Error: event \"%s\" already exists. " | 1305 | pr_warning("Error: event \"%s\" already exists. " |
582 | "(Use -f to force duplicates.)\n", base); | 1306 | "(Use -f to force duplicates.)\n", base); |
583 | die("Can't add new event."); | 1307 | return -EEXIST; |
584 | } | 1308 | } |
585 | 1309 | ||
586 | /* Try to add suffix */ | 1310 | /* Try to add suffix */ |
587 | for (i = 1; i < MAX_EVENT_INDEX; i++) { | 1311 | for (i = 1; i < MAX_EVENT_INDEX; i++) { |
588 | ret = e_snprintf(buf, len, "%s_%d", base, i); | 1312 | ret = e_snprintf(buf, len, "%s_%d", base, i); |
589 | if (ret < 0) | 1313 | if (ret < 0) { |
590 | die("snprintf() failed: %s", strerror(-ret)); | 1314 | pr_debug("snprintf() failed: %s\n", strerror(-ret)); |
1315 | return ret; | ||
1316 | } | ||
591 | if (!strlist__has_entry(namelist, buf)) | 1317 | if (!strlist__has_entry(namelist, buf)) |
592 | break; | 1318 | break; |
593 | } | 1319 | } |
594 | if (i == MAX_EVENT_INDEX) | 1320 | if (i == MAX_EVENT_INDEX) { |
595 | die("Too many events are on the same function."); | 1321 | pr_warning("Too many events are on the same function.\n"); |
1322 | ret = -ERANGE; | ||
1323 | } | ||
1324 | |||
1325 | return ret; | ||
596 | } | 1326 | } |
597 | 1327 | ||
598 | void add_trace_kprobe_events(struct probe_point *probes, int nr_probes, | 1328 | static int __add_kprobe_trace_events(struct perf_probe_event *pev, |
599 | bool force_add) | 1329 | struct kprobe_trace_event *tevs, |
1330 | int ntevs, bool allow_suffix) | ||
600 | { | 1331 | { |
601 | int i, j, fd; | 1332 | int i, fd, ret; |
602 | struct probe_point *pp; | 1333 | struct kprobe_trace_event *tev = NULL; |
603 | char buf[MAX_CMDLEN]; | 1334 | char buf[64]; |
604 | char event[64]; | 1335 | const char *event, *group; |
605 | struct strlist *namelist; | 1336 | struct strlist *namelist; |
606 | bool allow_suffix; | ||
607 | 1337 | ||
608 | fd = open_kprobe_events(O_RDWR, O_APPEND); | 1338 | fd = open_kprobe_events(true); |
1339 | if (fd < 0) | ||
1340 | return fd; | ||
609 | /* Get current event names */ | 1341 | /* Get current event names */ |
610 | namelist = get_perf_event_names(fd, false); | 1342 | namelist = get_kprobe_trace_event_names(fd, false); |
611 | 1343 | if (!namelist) { | |
612 | for (j = 0; j < nr_probes; j++) { | 1344 | pr_debug("Failed to get current event list.\n"); |
613 | pp = probes + j; | 1345 | return -EIO; |
614 | if (!pp->event) | 1346 | } |
615 | pp->event = strdup(pp->function); | 1347 | |
616 | if (!pp->group) | 1348 | ret = 0; |
617 | pp->group = strdup(PERFPROBE_GROUP); | 1349 | printf("Add new event%s\n", (ntevs > 1) ? "s:" : ":"); |
618 | DIE_IF(!pp->event || !pp->group); | 1350 | for (i = 0; i < ntevs; i++) { |
619 | /* If force_add is true, suffix search is allowed */ | 1351 | tev = &tevs[i]; |
620 | allow_suffix = force_add; | 1352 | if (pev->event) |
621 | for (i = 0; i < pp->found; i++) { | 1353 | event = pev->event; |
622 | /* Get an unused new event name */ | 1354 | else |
623 | get_new_event_name(event, 64, pp->event, namelist, | 1355 | if (pev->point.function) |
624 | allow_suffix); | 1356 | event = pev->point.function; |
625 | snprintf(buf, MAX_CMDLEN, "%c:%s/%s %s\n", | 1357 | else |
626 | pp->retprobe ? 'r' : 'p', | 1358 | event = tev->point.symbol; |
627 | pp->group, event, | 1359 | if (pev->group) |
628 | pp->probes[i]); | 1360 | group = pev->group; |
629 | write_trace_kprobe_event(fd, buf); | 1361 | else |
630 | printf("Added new event:\n"); | 1362 | group = PERFPROBE_GROUP; |
631 | /* Get the first parameter (probe-point) */ | 1363 | |
632 | sscanf(pp->probes[i], "%s", buf); | 1364 | /* Get an unused new event name */ |
633 | show_perf_probe_event(event, buf, pp); | 1365 | ret = get_new_event_name(buf, 64, event, |
634 | /* Add added event name to namelist */ | 1366 | namelist, allow_suffix); |
635 | strlist__add(namelist, event); | 1367 | if (ret < 0) |
636 | /* | 1368 | break; |
637 | * Probes after the first probe which comes from same | 1369 | event = buf; |
638 | * user input are always allowed to add suffix, because | 1370 | |
639 | * there might be several addresses corresponding to | 1371 | tev->event = strdup(event); |
640 | * one code line. | 1372 | tev->group = strdup(group); |
641 | */ | 1373 | if (tev->event == NULL || tev->group == NULL) { |
642 | allow_suffix = true; | 1374 | ret = -ENOMEM; |
1375 | break; | ||
643 | } | 1376 | } |
1377 | ret = write_kprobe_trace_event(fd, tev); | ||
1378 | if (ret < 0) | ||
1379 | break; | ||
1380 | /* Add added event name to namelist */ | ||
1381 | strlist__add(namelist, event); | ||
1382 | |||
1383 | /* Trick here - save current event/group */ | ||
1384 | event = pev->event; | ||
1385 | group = pev->group; | ||
1386 | pev->event = tev->event; | ||
1387 | pev->group = tev->group; | ||
1388 | show_perf_probe_event(pev); | ||
1389 | /* Trick here - restore current event/group */ | ||
1390 | pev->event = (char *)event; | ||
1391 | pev->group = (char *)group; | ||
1392 | |||
1393 | /* | ||
1394 | * Probes after the first probe which comes from same | ||
1395 | * user input are always allowed to add suffix, because | ||
1396 | * there might be several addresses corresponding to | ||
1397 | * one code line. | ||
1398 | */ | ||
1399 | allow_suffix = true; | ||
1400 | } | ||
1401 | |||
1402 | if (ret >= 0) { | ||
1403 | /* Show how to use the event. */ | ||
1404 | printf("\nYou can now use it on all perf tools, such as:\n\n"); | ||
1405 | printf("\tperf record -e %s:%s -aR sleep 1\n\n", tev->group, | ||
1406 | tev->event); | ||
644 | } | 1407 | } |
645 | /* Show how to use the event. */ | ||
646 | printf("\nYou can now use it on all perf tools, such as:\n\n"); | ||
647 | printf("\tperf record -e %s:%s -a sleep 1\n\n", PERFPROBE_GROUP, event); | ||
648 | 1408 | ||
649 | strlist__delete(namelist); | 1409 | strlist__delete(namelist); |
650 | close(fd); | 1410 | close(fd); |
1411 | return ret; | ||
1412 | } | ||
1413 | |||
1414 | static int convert_to_kprobe_trace_events(struct perf_probe_event *pev, | ||
1415 | struct kprobe_trace_event **tevs, | ||
1416 | int max_tevs) | ||
1417 | { | ||
1418 | struct symbol *sym; | ||
1419 | int ret = 0, i; | ||
1420 | struct kprobe_trace_event *tev; | ||
1421 | |||
1422 | /* Convert perf_probe_event with debuginfo */ | ||
1423 | ret = try_to_find_kprobe_trace_events(pev, tevs, max_tevs); | ||
1424 | if (ret != 0) | ||
1425 | return ret; | ||
1426 | |||
1427 | /* Allocate trace event buffer */ | ||
1428 | tev = *tevs = zalloc(sizeof(struct kprobe_trace_event)); | ||
1429 | if (tev == NULL) | ||
1430 | return -ENOMEM; | ||
1431 | |||
1432 | /* Copy parameters */ | ||
1433 | tev->point.symbol = strdup(pev->point.function); | ||
1434 | if (tev->point.symbol == NULL) { | ||
1435 | ret = -ENOMEM; | ||
1436 | goto error; | ||
1437 | } | ||
1438 | tev->point.offset = pev->point.offset; | ||
1439 | tev->nargs = pev->nargs; | ||
1440 | if (tev->nargs) { | ||
1441 | tev->args = zalloc(sizeof(struct kprobe_trace_arg) | ||
1442 | * tev->nargs); | ||
1443 | if (tev->args == NULL) { | ||
1444 | ret = -ENOMEM; | ||
1445 | goto error; | ||
1446 | } | ||
1447 | for (i = 0; i < tev->nargs; i++) { | ||
1448 | if (pev->args[i].name) { | ||
1449 | tev->args[i].name = strdup(pev->args[i].name); | ||
1450 | if (tev->args[i].name == NULL) { | ||
1451 | ret = -ENOMEM; | ||
1452 | goto error; | ||
1453 | } | ||
1454 | } | ||
1455 | tev->args[i].value = strdup(pev->args[i].var); | ||
1456 | if (tev->args[i].value == NULL) { | ||
1457 | ret = -ENOMEM; | ||
1458 | goto error; | ||
1459 | } | ||
1460 | if (pev->args[i].type) { | ||
1461 | tev->args[i].type = strdup(pev->args[i].type); | ||
1462 | if (tev->args[i].type == NULL) { | ||
1463 | ret = -ENOMEM; | ||
1464 | goto error; | ||
1465 | } | ||
1466 | } | ||
1467 | } | ||
1468 | } | ||
1469 | |||
1470 | /* Currently just checking function name from symbol map */ | ||
1471 | sym = map__find_symbol_by_name(machine.vmlinux_maps[MAP__FUNCTION], | ||
1472 | tev->point.symbol, NULL); | ||
1473 | if (!sym) { | ||
1474 | pr_warning("Kernel symbol \'%s\' not found.\n", | ||
1475 | tev->point.symbol); | ||
1476 | ret = -ENOENT; | ||
1477 | goto error; | ||
1478 | } | ||
1479 | |||
1480 | return 1; | ||
1481 | error: | ||
1482 | clear_kprobe_trace_event(tev); | ||
1483 | free(tev); | ||
1484 | *tevs = NULL; | ||
1485 | return ret; | ||
1486 | } | ||
1487 | |||
1488 | struct __event_package { | ||
1489 | struct perf_probe_event *pev; | ||
1490 | struct kprobe_trace_event *tevs; | ||
1491 | int ntevs; | ||
1492 | }; | ||
1493 | |||
1494 | int add_perf_probe_events(struct perf_probe_event *pevs, int npevs, | ||
1495 | bool force_add, int max_tevs) | ||
1496 | { | ||
1497 | int i, j, ret; | ||
1498 | struct __event_package *pkgs; | ||
1499 | |||
1500 | pkgs = zalloc(sizeof(struct __event_package) * npevs); | ||
1501 | if (pkgs == NULL) | ||
1502 | return -ENOMEM; | ||
1503 | |||
1504 | /* Init vmlinux path */ | ||
1505 | ret = init_vmlinux(); | ||
1506 | if (ret < 0) | ||
1507 | return ret; | ||
1508 | |||
1509 | /* Loop 1: convert all events */ | ||
1510 | for (i = 0; i < npevs; i++) { | ||
1511 | pkgs[i].pev = &pevs[i]; | ||
1512 | /* Convert with or without debuginfo */ | ||
1513 | ret = convert_to_kprobe_trace_events(pkgs[i].pev, | ||
1514 | &pkgs[i].tevs, max_tevs); | ||
1515 | if (ret < 0) | ||
1516 | goto end; | ||
1517 | pkgs[i].ntevs = ret; | ||
1518 | } | ||
1519 | |||
1520 | /* Loop 2: add all events */ | ||
1521 | for (i = 0; i < npevs && ret >= 0; i++) | ||
1522 | ret = __add_kprobe_trace_events(pkgs[i].pev, pkgs[i].tevs, | ||
1523 | pkgs[i].ntevs, force_add); | ||
1524 | end: | ||
1525 | /* Loop 3: cleanup trace events */ | ||
1526 | for (i = 0; i < npevs; i++) | ||
1527 | for (j = 0; j < pkgs[i].ntevs; j++) | ||
1528 | clear_kprobe_trace_event(&pkgs[i].tevs[j]); | ||
1529 | |||
1530 | return ret; | ||
651 | } | 1531 | } |
652 | 1532 | ||
653 | static void __del_trace_kprobe_event(int fd, struct str_node *ent) | 1533 | static int __del_trace_kprobe_event(int fd, struct str_node *ent) |
654 | { | 1534 | { |
655 | char *p; | 1535 | char *p; |
656 | char buf[128]; | 1536 | char buf[128]; |
1537 | int ret; | ||
657 | 1538 | ||
658 | /* Convert from perf-probe event to trace-kprobe event */ | 1539 | /* Convert from perf-probe event to trace-kprobe event */ |
659 | if (e_snprintf(buf, 128, "-:%s", ent->s) < 0) | 1540 | ret = e_snprintf(buf, 128, "-:%s", ent->s); |
660 | die("Failed to copy event."); | 1541 | if (ret < 0) |
1542 | goto error; | ||
1543 | |||
661 | p = strchr(buf + 2, ':'); | 1544 | p = strchr(buf + 2, ':'); |
662 | if (!p) | 1545 | if (!p) { |
663 | die("Internal error: %s should have ':' but not.", ent->s); | 1546 | pr_debug("Internal error: %s should have ':' but not.\n", |
1547 | ent->s); | ||
1548 | ret = -ENOTSUP; | ||
1549 | goto error; | ||
1550 | } | ||
664 | *p = '/'; | 1551 | *p = '/'; |
665 | 1552 | ||
666 | write_trace_kprobe_event(fd, buf); | 1553 | pr_debug("Writing event: %s\n", buf); |
1554 | ret = write(fd, buf, strlen(buf)); | ||
1555 | if (ret < 0) | ||
1556 | goto error; | ||
1557 | |||
667 | printf("Remove event: %s\n", ent->s); | 1558 | printf("Remove event: %s\n", ent->s); |
1559 | return 0; | ||
1560 | error: | ||
1561 | pr_warning("Failed to delete event: %s\n", strerror(-ret)); | ||
1562 | return ret; | ||
668 | } | 1563 | } |
669 | 1564 | ||
670 | static void del_trace_kprobe_event(int fd, const char *group, | 1565 | static int del_trace_kprobe_event(int fd, const char *group, |
671 | const char *event, struct strlist *namelist) | 1566 | const char *event, struct strlist *namelist) |
672 | { | 1567 | { |
673 | char buf[128]; | 1568 | char buf[128]; |
674 | struct str_node *ent, *n; | 1569 | struct str_node *ent, *n; |
675 | int found = 0; | 1570 | int found = 0, ret = 0; |
676 | 1571 | ||
677 | if (e_snprintf(buf, 128, "%s:%s", group, event) < 0) | 1572 | ret = e_snprintf(buf, 128, "%s:%s", group, event); |
678 | die("Failed to copy event."); | 1573 | if (ret < 0) { |
1574 | pr_err("Failed to copy event."); | ||
1575 | return ret; | ||
1576 | } | ||
679 | 1577 | ||
680 | if (strpbrk(buf, "*?")) { /* Glob-exp */ | 1578 | if (strpbrk(buf, "*?")) { /* Glob-exp */ |
681 | strlist__for_each_safe(ent, n, namelist) | 1579 | strlist__for_each_safe(ent, n, namelist) |
682 | if (strglobmatch(ent->s, buf)) { | 1580 | if (strglobmatch(ent->s, buf)) { |
683 | found++; | 1581 | found++; |
684 | __del_trace_kprobe_event(fd, ent); | 1582 | ret = __del_trace_kprobe_event(fd, ent); |
1583 | if (ret < 0) | ||
1584 | break; | ||
685 | strlist__remove(namelist, ent); | 1585 | strlist__remove(namelist, ent); |
686 | } | 1586 | } |
687 | } else { | 1587 | } else { |
688 | ent = strlist__find(namelist, buf); | 1588 | ent = strlist__find(namelist, buf); |
689 | if (ent) { | 1589 | if (ent) { |
690 | found++; | 1590 | found++; |
691 | __del_trace_kprobe_event(fd, ent); | 1591 | ret = __del_trace_kprobe_event(fd, ent); |
692 | strlist__remove(namelist, ent); | 1592 | if (ret >= 0) |
1593 | strlist__remove(namelist, ent); | ||
693 | } | 1594 | } |
694 | } | 1595 | } |
695 | if (found == 0) | 1596 | if (found == 0 && ret >= 0) |
696 | pr_info("Info: event \"%s\" does not exist, could not remove it.\n", buf); | 1597 | pr_info("Info: Event \"%s\" does not exist.\n", buf); |
1598 | |||
1599 | return ret; | ||
697 | } | 1600 | } |
698 | 1601 | ||
699 | void del_trace_kprobe_events(struct strlist *dellist) | 1602 | int del_perf_probe_events(struct strlist *dellist) |
700 | { | 1603 | { |
701 | int fd; | 1604 | int fd, ret = 0; |
702 | const char *group, *event; | 1605 | const char *group, *event; |
703 | char *p, *str; | 1606 | char *p, *str; |
704 | struct str_node *ent; | 1607 | struct str_node *ent; |
705 | struct strlist *namelist; | 1608 | struct strlist *namelist; |
706 | 1609 | ||
707 | fd = open_kprobe_events(O_RDWR, O_APPEND); | 1610 | fd = open_kprobe_events(true); |
1611 | if (fd < 0) | ||
1612 | return fd; | ||
1613 | |||
708 | /* Get current event names */ | 1614 | /* Get current event names */ |
709 | namelist = get_perf_event_names(fd, true); | 1615 | namelist = get_kprobe_trace_event_names(fd, true); |
1616 | if (namelist == NULL) | ||
1617 | return -EINVAL; | ||
710 | 1618 | ||
711 | strlist__for_each(ent, dellist) { | 1619 | strlist__for_each(ent, dellist) { |
712 | str = strdup(ent->s); | 1620 | str = strdup(ent->s); |
713 | if (!str) | 1621 | if (str == NULL) { |
714 | die("Failed to copy event."); | 1622 | ret = -ENOMEM; |
1623 | break; | ||
1624 | } | ||
715 | pr_debug("Parsing: %s\n", str); | 1625 | pr_debug("Parsing: %s\n", str); |
716 | p = strchr(str, ':'); | 1626 | p = strchr(str, ':'); |
717 | if (p) { | 1627 | if (p) { |
@@ -723,80 +1633,14 @@ void del_trace_kprobe_events(struct strlist *dellist) | |||
723 | event = str; | 1633 | event = str; |
724 | } | 1634 | } |
725 | pr_debug("Group: %s, Event: %s\n", group, event); | 1635 | pr_debug("Group: %s, Event: %s\n", group, event); |
726 | del_trace_kprobe_event(fd, group, event, namelist); | 1636 | ret = del_trace_kprobe_event(fd, group, event, namelist); |
727 | free(str); | 1637 | free(str); |
1638 | if (ret < 0) | ||
1639 | break; | ||
728 | } | 1640 | } |
729 | strlist__delete(namelist); | 1641 | strlist__delete(namelist); |
730 | close(fd); | 1642 | close(fd); |
731 | } | ||
732 | 1643 | ||
733 | #define LINEBUF_SIZE 256 | 1644 | return ret; |
734 | #define NR_ADDITIONAL_LINES 2 | ||
735 | |||
736 | static void show_one_line(FILE *fp, unsigned int l, bool skip, bool show_num) | ||
737 | { | ||
738 | char buf[LINEBUF_SIZE]; | ||
739 | const char *color = PERF_COLOR_BLUE; | ||
740 | |||
741 | if (fgets(buf, LINEBUF_SIZE, fp) == NULL) | ||
742 | goto error; | ||
743 | if (!skip) { | ||
744 | if (show_num) | ||
745 | fprintf(stdout, "%7u %s", l, buf); | ||
746 | else | ||
747 | color_fprintf(stdout, color, " %s", buf); | ||
748 | } | ||
749 | |||
750 | while (strlen(buf) == LINEBUF_SIZE - 1 && | ||
751 | buf[LINEBUF_SIZE - 2] != '\n') { | ||
752 | if (fgets(buf, LINEBUF_SIZE, fp) == NULL) | ||
753 | goto error; | ||
754 | if (!skip) { | ||
755 | if (show_num) | ||
756 | fprintf(stdout, "%s", buf); | ||
757 | else | ||
758 | color_fprintf(stdout, color, "%s", buf); | ||
759 | } | ||
760 | } | ||
761 | return; | ||
762 | error: | ||
763 | if (feof(fp)) | ||
764 | die("Source file is shorter than expected."); | ||
765 | else | ||
766 | die("File read error: %s", strerror(errno)); | ||
767 | } | 1645 | } |
768 | 1646 | ||
769 | void show_line_range(struct line_range *lr) | ||
770 | { | ||
771 | unsigned int l = 1; | ||
772 | struct line_node *ln; | ||
773 | FILE *fp; | ||
774 | |||
775 | setup_pager(); | ||
776 | |||
777 | if (lr->function) | ||
778 | fprintf(stdout, "<%s:%d>\n", lr->function, | ||
779 | lr->start - lr->offset); | ||
780 | else | ||
781 | fprintf(stdout, "<%s:%d>\n", lr->file, lr->start); | ||
782 | |||
783 | fp = fopen(lr->path, "r"); | ||
784 | if (fp == NULL) | ||
785 | die("Failed to open %s: %s", lr->path, strerror(errno)); | ||
786 | /* Skip to starting line number */ | ||
787 | while (l < lr->start) | ||
788 | show_one_line(fp, l++, true, false); | ||
789 | |||
790 | list_for_each_entry(ln, &lr->line_list, list) { | ||
791 | while (ln->line > l) | ||
792 | show_one_line(fp, (l++) - lr->offset, false, false); | ||
793 | show_one_line(fp, (l++) - lr->offset, false, true); | ||
794 | } | ||
795 | |||
796 | if (lr->end == INT_MAX) | ||
797 | lr->end = l + NR_ADDITIONAL_LINES; | ||
798 | while (l < lr->end && !feof(fp)) | ||
799 | show_one_line(fp, (l++) - lr->offset, false, false); | ||
800 | |||
801 | fclose(fp); | ||
802 | } | ||
diff --git a/tools/perf/util/probe-event.h b/tools/perf/util/probe-event.h index 711287d4baea..e9db1a214ca4 100644 --- a/tools/perf/util/probe-event.h +++ b/tools/perf/util/probe-event.h | |||
@@ -2,21 +2,125 @@ | |||
2 | #define _PROBE_EVENT_H | 2 | #define _PROBE_EVENT_H |
3 | 3 | ||
4 | #include <stdbool.h> | 4 | #include <stdbool.h> |
5 | #include "probe-finder.h" | ||
6 | #include "strlist.h" | 5 | #include "strlist.h" |
7 | 6 | ||
8 | extern void parse_line_range_desc(const char *arg, struct line_range *lr); | 7 | extern bool probe_event_dry_run; |
9 | extern void parse_perf_probe_event(const char *str, struct probe_point *pp, | 8 | |
10 | bool *need_dwarf); | 9 | /* kprobe-tracer tracing point */ |
11 | extern int synthesize_perf_probe_point(struct probe_point *pp); | 10 | struct kprobe_trace_point { |
12 | extern int synthesize_perf_probe_event(struct probe_point *pp); | 11 | char *symbol; /* Base symbol */ |
13 | extern void parse_trace_kprobe_event(const char *str, struct probe_point *pp); | 12 | unsigned long offset; /* Offset from symbol */ |
14 | extern int synthesize_trace_kprobe_event(struct probe_point *pp); | 13 | bool retprobe; /* Return probe flag */ |
15 | extern void add_trace_kprobe_events(struct probe_point *probes, int nr_probes, | 14 | }; |
16 | bool force_add); | 15 | |
17 | extern void del_trace_kprobe_events(struct strlist *dellist); | 16 | /* kprobe-tracer tracing argument referencing offset */ |
18 | extern void show_perf_probe_events(void); | 17 | struct kprobe_trace_arg_ref { |
19 | extern void show_line_range(struct line_range *lr); | 18 | struct kprobe_trace_arg_ref *next; /* Next reference */ |
19 | long offset; /* Offset value */ | ||
20 | }; | ||
21 | |||
22 | /* kprobe-tracer tracing argument */ | ||
23 | struct kprobe_trace_arg { | ||
24 | char *name; /* Argument name */ | ||
25 | char *value; /* Base value */ | ||
26 | char *type; /* Type name */ | ||
27 | struct kprobe_trace_arg_ref *ref; /* Referencing offset */ | ||
28 | }; | ||
29 | |||
30 | /* kprobe-tracer tracing event (point + arg) */ | ||
31 | struct kprobe_trace_event { | ||
32 | char *event; /* Event name */ | ||
33 | char *group; /* Group name */ | ||
34 | struct kprobe_trace_point point; /* Trace point */ | ||
35 | int nargs; /* Number of args */ | ||
36 | struct kprobe_trace_arg *args; /* Arguments */ | ||
37 | }; | ||
38 | |||
39 | /* Perf probe probing point */ | ||
40 | struct perf_probe_point { | ||
41 | char *file; /* File path */ | ||
42 | char *function; /* Function name */ | ||
43 | int line; /* Line number */ | ||
44 | bool retprobe; /* Return probe flag */ | ||
45 | char *lazy_line; /* Lazy matching pattern */ | ||
46 | unsigned long offset; /* Offset from function entry */ | ||
47 | }; | ||
48 | |||
49 | /* Perf probe probing argument field chain */ | ||
50 | struct perf_probe_arg_field { | ||
51 | struct perf_probe_arg_field *next; /* Next field */ | ||
52 | char *name; /* Name of the field */ | ||
53 | bool ref; /* Referencing flag */ | ||
54 | }; | ||
55 | |||
56 | /* Perf probe probing argument */ | ||
57 | struct perf_probe_arg { | ||
58 | char *name; /* Argument name */ | ||
59 | char *var; /* Variable name */ | ||
60 | char *type; /* Type name */ | ||
61 | struct perf_probe_arg_field *field; /* Structure fields */ | ||
62 | }; | ||
63 | |||
64 | /* Perf probe probing event (point + arg) */ | ||
65 | struct perf_probe_event { | ||
66 | char *event; /* Event name */ | ||
67 | char *group; /* Group name */ | ||
68 | struct perf_probe_point point; /* Probe point */ | ||
69 | int nargs; /* Number of arguments */ | ||
70 | struct perf_probe_arg *args; /* Arguments */ | ||
71 | }; | ||
72 | |||
73 | |||
74 | /* Line number container */ | ||
75 | struct line_node { | ||
76 | struct list_head list; | ||
77 | int line; | ||
78 | }; | ||
79 | |||
80 | /* Line range */ | ||
81 | struct line_range { | ||
82 | char *file; /* File name */ | ||
83 | char *function; /* Function name */ | ||
84 | int start; /* Start line number */ | ||
85 | int end; /* End line number */ | ||
86 | int offset; /* Start line offset */ | ||
87 | char *path; /* Real path name */ | ||
88 | struct list_head line_list; /* Visible lines */ | ||
89 | }; | ||
90 | |||
91 | /* Command string to events */ | ||
92 | extern int parse_perf_probe_command(const char *cmd, | ||
93 | struct perf_probe_event *pev); | ||
94 | extern int parse_kprobe_trace_command(const char *cmd, | ||
95 | struct kprobe_trace_event *tev); | ||
96 | |||
97 | /* Events to command string */ | ||
98 | extern char *synthesize_perf_probe_command(struct perf_probe_event *pev); | ||
99 | extern char *synthesize_kprobe_trace_command(struct kprobe_trace_event *tev); | ||
100 | extern int synthesize_perf_probe_arg(struct perf_probe_arg *pa, char *buf, | ||
101 | size_t len); | ||
102 | |||
103 | /* Check the perf_probe_event needs debuginfo */ | ||
104 | extern bool perf_probe_event_need_dwarf(struct perf_probe_event *pev); | ||
105 | |||
106 | /* Convert from kprobe_trace_event to perf_probe_event */ | ||
107 | extern int convert_to_perf_probe_event(struct kprobe_trace_event *tev, | ||
108 | struct perf_probe_event *pev); | ||
109 | |||
110 | /* Release event contents */ | ||
111 | extern void clear_perf_probe_event(struct perf_probe_event *pev); | ||
112 | extern void clear_kprobe_trace_event(struct kprobe_trace_event *tev); | ||
113 | |||
114 | /* Command string to line-range */ | ||
115 | extern int parse_line_range_desc(const char *cmd, struct line_range *lr); | ||
116 | |||
117 | |||
118 | extern int add_perf_probe_events(struct perf_probe_event *pevs, int npevs, | ||
119 | bool force_add, int max_probe_points); | ||
120 | extern int del_perf_probe_events(struct strlist *dellist); | ||
121 | extern int show_perf_probe_events(void); | ||
122 | extern int show_line_range(struct line_range *lr); | ||
123 | |||
20 | 124 | ||
21 | /* Maximum index number of event-name postfix */ | 125 | /* Maximum index number of event-name postfix */ |
22 | #define MAX_EVENT_INDEX 1024 | 126 | #define MAX_EVENT_INDEX 1024 |
diff --git a/tools/perf/util/probe-finder.c b/tools/perf/util/probe-finder.c index c171a243d05b..562b1443e785 100644 --- a/tools/perf/util/probe-finder.c +++ b/tools/perf/util/probe-finder.c | |||
@@ -31,6 +31,7 @@ | |||
31 | #include <string.h> | 31 | #include <string.h> |
32 | #include <stdarg.h> | 32 | #include <stdarg.h> |
33 | #include <ctype.h> | 33 | #include <ctype.h> |
34 | #include <dwarf-regs.h> | ||
34 | 35 | ||
35 | #include "string.h" | 36 | #include "string.h" |
36 | #include "event.h" | 37 | #include "event.h" |
@@ -38,57 +39,8 @@ | |||
38 | #include "util.h" | 39 | #include "util.h" |
39 | #include "probe-finder.h" | 40 | #include "probe-finder.h" |
40 | 41 | ||
41 | 42 | /* Kprobe tracer basic type is up to u64 */ | |
42 | /* | 43 | #define MAX_BASIC_TYPE_BITS 64 |
43 | * Generic dwarf analysis helpers | ||
44 | */ | ||
45 | |||
46 | #define X86_32_MAX_REGS 8 | ||
47 | const char *x86_32_regs_table[X86_32_MAX_REGS] = { | ||
48 | "%ax", | ||
49 | "%cx", | ||
50 | "%dx", | ||
51 | "%bx", | ||
52 | "$stack", /* Stack address instead of %sp */ | ||
53 | "%bp", | ||
54 | "%si", | ||
55 | "%di", | ||
56 | }; | ||
57 | |||
58 | #define X86_64_MAX_REGS 16 | ||
59 | const char *x86_64_regs_table[X86_64_MAX_REGS] = { | ||
60 | "%ax", | ||
61 | "%dx", | ||
62 | "%cx", | ||
63 | "%bx", | ||
64 | "%si", | ||
65 | "%di", | ||
66 | "%bp", | ||
67 | "%sp", | ||
68 | "%r8", | ||
69 | "%r9", | ||
70 | "%r10", | ||
71 | "%r11", | ||
72 | "%r12", | ||
73 | "%r13", | ||
74 | "%r14", | ||
75 | "%r15", | ||
76 | }; | ||
77 | |||
78 | /* TODO: switching by dwarf address size */ | ||
79 | #ifdef __x86_64__ | ||
80 | #define ARCH_MAX_REGS X86_64_MAX_REGS | ||
81 | #define arch_regs_table x86_64_regs_table | ||
82 | #else | ||
83 | #define ARCH_MAX_REGS X86_32_MAX_REGS | ||
84 | #define arch_regs_table x86_32_regs_table | ||
85 | #endif | ||
86 | |||
87 | /* Return architecture dependent register string (for kprobe-tracer) */ | ||
88 | static const char *get_arch_regstr(unsigned int n) | ||
89 | { | ||
90 | return (n <= ARCH_MAX_REGS) ? arch_regs_table[n] : NULL; | ||
91 | } | ||
92 | 44 | ||
93 | /* | 45 | /* |
94 | * Compare the tail of two strings. | 46 | * Compare the tail of two strings. |
@@ -108,7 +60,7 @@ static int strtailcmp(const char *s1, const char *s2) | |||
108 | /* Line number list operations */ | 60 | /* Line number list operations */ |
109 | 61 | ||
110 | /* Add a line to line number list */ | 62 | /* Add a line to line number list */ |
111 | static void line_list__add_line(struct list_head *head, unsigned int line) | 63 | static int line_list__add_line(struct list_head *head, int line) |
112 | { | 64 | { |
113 | struct line_node *ln; | 65 | struct line_node *ln; |
114 | struct list_head *p; | 66 | struct list_head *p; |
@@ -119,21 +71,23 @@ static void line_list__add_line(struct list_head *head, unsigned int line) | |||
119 | p = &ln->list; | 71 | p = &ln->list; |
120 | goto found; | 72 | goto found; |
121 | } else if (ln->line == line) /* Already exist */ | 73 | } else if (ln->line == line) /* Already exist */ |
122 | return ; | 74 | return 1; |
123 | } | 75 | } |
124 | /* List is empty, or the smallest entry */ | 76 | /* List is empty, or the smallest entry */ |
125 | p = head; | 77 | p = head; |
126 | found: | 78 | found: |
127 | pr_debug("line list: add a line %u\n", line); | 79 | pr_debug("line list: add a line %u\n", line); |
128 | ln = zalloc(sizeof(struct line_node)); | 80 | ln = zalloc(sizeof(struct line_node)); |
129 | DIE_IF(ln == NULL); | 81 | if (ln == NULL) |
82 | return -ENOMEM; | ||
130 | ln->line = line; | 83 | ln->line = line; |
131 | INIT_LIST_HEAD(&ln->list); | 84 | INIT_LIST_HEAD(&ln->list); |
132 | list_add(&ln->list, p); | 85 | list_add(&ln->list, p); |
86 | return 0; | ||
133 | } | 87 | } |
134 | 88 | ||
135 | /* Check if the line in line number list */ | 89 | /* Check if the line in line number list */ |
136 | static int line_list__has_line(struct list_head *head, unsigned int line) | 90 | static int line_list__has_line(struct list_head *head, int line) |
137 | { | 91 | { |
138 | struct line_node *ln; | 92 | struct line_node *ln; |
139 | 93 | ||
@@ -184,9 +138,129 @@ static const char *cu_find_realpath(Dwarf_Die *cu_die, const char *fname) | |||
184 | if (strtailcmp(src, fname) == 0) | 138 | if (strtailcmp(src, fname) == 0) |
185 | break; | 139 | break; |
186 | } | 140 | } |
141 | if (i == nfiles) | ||
142 | return NULL; | ||
187 | return src; | 143 | return src; |
188 | } | 144 | } |
189 | 145 | ||
146 | /* Compare diename and tname */ | ||
147 | static bool die_compare_name(Dwarf_Die *dw_die, const char *tname) | ||
148 | { | ||
149 | const char *name; | ||
150 | name = dwarf_diename(dw_die); | ||
151 | return name ? strcmp(tname, name) : -1; | ||
152 | } | ||
153 | |||
154 | /* Get type die, but skip qualifiers and typedef */ | ||
155 | static Dwarf_Die *die_get_real_type(Dwarf_Die *vr_die, Dwarf_Die *die_mem) | ||
156 | { | ||
157 | Dwarf_Attribute attr; | ||
158 | int tag; | ||
159 | |||
160 | do { | ||
161 | if (dwarf_attr(vr_die, DW_AT_type, &attr) == NULL || | ||
162 | dwarf_formref_die(&attr, die_mem) == NULL) | ||
163 | return NULL; | ||
164 | |||
165 | tag = dwarf_tag(die_mem); | ||
166 | vr_die = die_mem; | ||
167 | } while (tag == DW_TAG_const_type || | ||
168 | tag == DW_TAG_restrict_type || | ||
169 | tag == DW_TAG_volatile_type || | ||
170 | tag == DW_TAG_shared_type || | ||
171 | tag == DW_TAG_typedef); | ||
172 | |||
173 | return die_mem; | ||
174 | } | ||
175 | |||
176 | static bool die_is_signed_type(Dwarf_Die *tp_die) | ||
177 | { | ||
178 | Dwarf_Attribute attr; | ||
179 | Dwarf_Word ret; | ||
180 | |||
181 | if (dwarf_attr(tp_die, DW_AT_encoding, &attr) == NULL || | ||
182 | dwarf_formudata(&attr, &ret) != 0) | ||
183 | return false; | ||
184 | |||
185 | return (ret == DW_ATE_signed_char || ret == DW_ATE_signed || | ||
186 | ret == DW_ATE_signed_fixed); | ||
187 | } | ||
188 | |||
189 | static int die_get_byte_size(Dwarf_Die *tp_die) | ||
190 | { | ||
191 | Dwarf_Attribute attr; | ||
192 | Dwarf_Word ret; | ||
193 | |||
194 | if (dwarf_attr(tp_die, DW_AT_byte_size, &attr) == NULL || | ||
195 | dwarf_formudata(&attr, &ret) != 0) | ||
196 | return 0; | ||
197 | |||
198 | return (int)ret; | ||
199 | } | ||
200 | |||
201 | /* Get data_member_location offset */ | ||
202 | static int die_get_data_member_location(Dwarf_Die *mb_die, Dwarf_Word *offs) | ||
203 | { | ||
204 | Dwarf_Attribute attr; | ||
205 | Dwarf_Op *expr; | ||
206 | size_t nexpr; | ||
207 | int ret; | ||
208 | |||
209 | if (dwarf_attr(mb_die, DW_AT_data_member_location, &attr) == NULL) | ||
210 | return -ENOENT; | ||
211 | |||
212 | if (dwarf_formudata(&attr, offs) != 0) { | ||
213 | /* DW_AT_data_member_location should be DW_OP_plus_uconst */ | ||
214 | ret = dwarf_getlocation(&attr, &expr, &nexpr); | ||
215 | if (ret < 0 || nexpr == 0) | ||
216 | return -ENOENT; | ||
217 | |||
218 | if (expr[0].atom != DW_OP_plus_uconst || nexpr != 1) { | ||
219 | pr_debug("Unable to get offset:Unexpected OP %x (%zd)\n", | ||
220 | expr[0].atom, nexpr); | ||
221 | return -ENOTSUP; | ||
222 | } | ||
223 | *offs = (Dwarf_Word)expr[0].number; | ||
224 | } | ||
225 | return 0; | ||
226 | } | ||
227 | |||
228 | /* Return values for die_find callbacks */ | ||
229 | enum { | ||
230 | DIE_FIND_CB_FOUND = 0, /* End of Search */ | ||
231 | DIE_FIND_CB_CHILD = 1, /* Search only children */ | ||
232 | DIE_FIND_CB_SIBLING = 2, /* Search only siblings */ | ||
233 | DIE_FIND_CB_CONTINUE = 3, /* Search children and siblings */ | ||
234 | }; | ||
235 | |||
236 | /* Search a child die */ | ||
237 | static Dwarf_Die *die_find_child(Dwarf_Die *rt_die, | ||
238 | int (*callback)(Dwarf_Die *, void *), | ||
239 | void *data, Dwarf_Die *die_mem) | ||
240 | { | ||
241 | Dwarf_Die child_die; | ||
242 | int ret; | ||
243 | |||
244 | ret = dwarf_child(rt_die, die_mem); | ||
245 | if (ret != 0) | ||
246 | return NULL; | ||
247 | |||
248 | do { | ||
249 | ret = callback(die_mem, data); | ||
250 | if (ret == DIE_FIND_CB_FOUND) | ||
251 | return die_mem; | ||
252 | |||
253 | if ((ret & DIE_FIND_CB_CHILD) && | ||
254 | die_find_child(die_mem, callback, data, &child_die)) { | ||
255 | memcpy(die_mem, &child_die, sizeof(Dwarf_Die)); | ||
256 | return die_mem; | ||
257 | } | ||
258 | } while ((ret & DIE_FIND_CB_SIBLING) && | ||
259 | dwarf_siblingof(die_mem, die_mem) == 0); | ||
260 | |||
261 | return NULL; | ||
262 | } | ||
263 | |||
190 | struct __addr_die_search_param { | 264 | struct __addr_die_search_param { |
191 | Dwarf_Addr addr; | 265 | Dwarf_Addr addr; |
192 | Dwarf_Die *die_mem; | 266 | Dwarf_Die *die_mem; |
@@ -205,8 +279,8 @@ static int __die_search_func_cb(Dwarf_Die *fn_die, void *data) | |||
205 | } | 279 | } |
206 | 280 | ||
207 | /* Search a real subprogram including this line, */ | 281 | /* Search a real subprogram including this line, */ |
208 | static Dwarf_Die *die_get_real_subprogram(Dwarf_Die *cu_die, Dwarf_Addr addr, | 282 | static Dwarf_Die *die_find_real_subprogram(Dwarf_Die *cu_die, Dwarf_Addr addr, |
209 | Dwarf_Die *die_mem) | 283 | Dwarf_Die *die_mem) |
210 | { | 284 | { |
211 | struct __addr_die_search_param ad; | 285 | struct __addr_die_search_param ad; |
212 | ad.addr = addr; | 286 | ad.addr = addr; |
@@ -218,77 +292,64 @@ static Dwarf_Die *die_get_real_subprogram(Dwarf_Die *cu_die, Dwarf_Addr addr, | |||
218 | return die_mem; | 292 | return die_mem; |
219 | } | 293 | } |
220 | 294 | ||
221 | /* Similar to dwarf_getfuncs, but returns inlined_subroutine if exists. */ | 295 | /* die_find callback for inline function search */ |
222 | static Dwarf_Die *die_get_inlinefunc(Dwarf_Die *sp_die, Dwarf_Addr addr, | 296 | static int __die_find_inline_cb(Dwarf_Die *die_mem, void *data) |
223 | Dwarf_Die *die_mem) | ||
224 | { | 297 | { |
225 | Dwarf_Die child_die; | 298 | Dwarf_Addr *addr = data; |
226 | int ret; | ||
227 | 299 | ||
228 | ret = dwarf_child(sp_die, die_mem); | 300 | if (dwarf_tag(die_mem) == DW_TAG_inlined_subroutine && |
229 | if (ret != 0) | 301 | dwarf_haspc(die_mem, *addr)) |
230 | return NULL; | 302 | return DIE_FIND_CB_FOUND; |
231 | 303 | ||
232 | do { | 304 | return DIE_FIND_CB_CONTINUE; |
233 | if (dwarf_tag(die_mem) == DW_TAG_inlined_subroutine && | ||
234 | dwarf_haspc(die_mem, addr)) | ||
235 | return die_mem; | ||
236 | |||
237 | if (die_get_inlinefunc(die_mem, addr, &child_die)) { | ||
238 | memcpy(die_mem, &child_die, sizeof(Dwarf_Die)); | ||
239 | return die_mem; | ||
240 | } | ||
241 | } while (dwarf_siblingof(die_mem, die_mem) == 0); | ||
242 | |||
243 | return NULL; | ||
244 | } | 305 | } |
245 | 306 | ||
246 | /* Compare diename and tname */ | 307 | /* Similar to dwarf_getfuncs, but returns inlined_subroutine if exists. */ |
247 | static bool die_compare_name(Dwarf_Die *dw_die, const char *tname) | 308 | static Dwarf_Die *die_find_inlinefunc(Dwarf_Die *sp_die, Dwarf_Addr addr, |
309 | Dwarf_Die *die_mem) | ||
248 | { | 310 | { |
249 | const char *name; | 311 | return die_find_child(sp_die, __die_find_inline_cb, &addr, die_mem); |
250 | name = dwarf_diename(dw_die); | ||
251 | DIE_IF(name == NULL); | ||
252 | return strcmp(tname, name); | ||
253 | } | 312 | } |
254 | 313 | ||
255 | /* Get entry pc(or low pc, 1st entry of ranges) of the die */ | 314 | static int __die_find_variable_cb(Dwarf_Die *die_mem, void *data) |
256 | static Dwarf_Addr die_get_entrypc(Dwarf_Die *dw_die) | ||
257 | { | 315 | { |
258 | Dwarf_Addr epc; | 316 | const char *name = data; |
259 | int ret; | 317 | int tag; |
260 | 318 | ||
261 | ret = dwarf_entrypc(dw_die, &epc); | 319 | tag = dwarf_tag(die_mem); |
262 | DIE_IF(ret == -1); | 320 | if ((tag == DW_TAG_formal_parameter || |
263 | return epc; | 321 | tag == DW_TAG_variable) && |
322 | (die_compare_name(die_mem, name) == 0)) | ||
323 | return DIE_FIND_CB_FOUND; | ||
324 | |||
325 | return DIE_FIND_CB_CONTINUE; | ||
264 | } | 326 | } |
265 | 327 | ||
266 | /* Get a variable die */ | 328 | /* Find a variable called 'name' */ |
267 | static Dwarf_Die *die_find_variable(Dwarf_Die *sp_die, const char *name, | 329 | static Dwarf_Die *die_find_variable(Dwarf_Die *sp_die, const char *name, |
268 | Dwarf_Die *die_mem) | 330 | Dwarf_Die *die_mem) |
269 | { | 331 | { |
270 | Dwarf_Die child_die; | 332 | return die_find_child(sp_die, __die_find_variable_cb, (void *)name, |
271 | int tag; | 333 | die_mem); |
272 | int ret; | 334 | } |
273 | 335 | ||
274 | ret = dwarf_child(sp_die, die_mem); | 336 | static int __die_find_member_cb(Dwarf_Die *die_mem, void *data) |
275 | if (ret != 0) | 337 | { |
276 | return NULL; | 338 | const char *name = data; |
277 | 339 | ||
278 | do { | 340 | if ((dwarf_tag(die_mem) == DW_TAG_member) && |
279 | tag = dwarf_tag(die_mem); | 341 | (die_compare_name(die_mem, name) == 0)) |
280 | if ((tag == DW_TAG_formal_parameter || | 342 | return DIE_FIND_CB_FOUND; |
281 | tag == DW_TAG_variable) && | ||
282 | (die_compare_name(die_mem, name) == 0)) | ||
283 | return die_mem; | ||
284 | 343 | ||
285 | if (die_find_variable(die_mem, name, &child_die)) { | 344 | return DIE_FIND_CB_SIBLING; |
286 | memcpy(die_mem, &child_die, sizeof(Dwarf_Die)); | 345 | } |
287 | return die_mem; | ||
288 | } | ||
289 | } while (dwarf_siblingof(die_mem, die_mem) == 0); | ||
290 | 346 | ||
291 | return NULL; | 347 | /* Find a member called 'name' */ |
348 | static Dwarf_Die *die_find_member(Dwarf_Die *st_die, const char *name, | ||
349 | Dwarf_Die *die_mem) | ||
350 | { | ||
351 | return die_find_child(st_die, __die_find_member_cb, (void *)name, | ||
352 | die_mem); | ||
292 | } | 353 | } |
293 | 354 | ||
294 | /* | 355 | /* |
@@ -296,19 +357,22 @@ static Dwarf_Die *die_find_variable(Dwarf_Die *sp_die, const char *name, | |||
296 | */ | 357 | */ |
297 | 358 | ||
298 | /* Show a location */ | 359 | /* Show a location */ |
299 | static void show_location(Dwarf_Op *op, struct probe_finder *pf) | 360 | static int convert_location(Dwarf_Op *op, struct probe_finder *pf) |
300 | { | 361 | { |
301 | unsigned int regn; | 362 | unsigned int regn; |
302 | Dwarf_Word offs = 0; | 363 | Dwarf_Word offs = 0; |
303 | int deref = 0, ret; | 364 | bool ref = false; |
304 | const char *regs; | 365 | const char *regs; |
366 | struct kprobe_trace_arg *tvar = pf->tvar; | ||
305 | 367 | ||
306 | /* TODO: support CFA */ | ||
307 | /* If this is based on frame buffer, set the offset */ | 368 | /* If this is based on frame buffer, set the offset */ |
308 | if (op->atom == DW_OP_fbreg) { | 369 | if (op->atom == DW_OP_fbreg) { |
309 | if (pf->fb_ops == NULL) | 370 | if (pf->fb_ops == NULL) { |
310 | die("The attribute of frame base is not supported.\n"); | 371 | pr_warning("The attribute of frame base is not " |
311 | deref = 1; | 372 | "supported.\n"); |
373 | return -ENOTSUP; | ||
374 | } | ||
375 | ref = true; | ||
312 | offs = op->number; | 376 | offs = op->number; |
313 | op = &pf->fb_ops[0]; | 377 | op = &pf->fb_ops[0]; |
314 | } | 378 | } |
@@ -316,35 +380,164 @@ static void show_location(Dwarf_Op *op, struct probe_finder *pf) | |||
316 | if (op->atom >= DW_OP_breg0 && op->atom <= DW_OP_breg31) { | 380 | if (op->atom >= DW_OP_breg0 && op->atom <= DW_OP_breg31) { |
317 | regn = op->atom - DW_OP_breg0; | 381 | regn = op->atom - DW_OP_breg0; |
318 | offs += op->number; | 382 | offs += op->number; |
319 | deref = 1; | 383 | ref = true; |
320 | } else if (op->atom >= DW_OP_reg0 && op->atom <= DW_OP_reg31) { | 384 | } else if (op->atom >= DW_OP_reg0 && op->atom <= DW_OP_reg31) { |
321 | regn = op->atom - DW_OP_reg0; | 385 | regn = op->atom - DW_OP_reg0; |
322 | } else if (op->atom == DW_OP_bregx) { | 386 | } else if (op->atom == DW_OP_bregx) { |
323 | regn = op->number; | 387 | regn = op->number; |
324 | offs += op->number2; | 388 | offs += op->number2; |
325 | deref = 1; | 389 | ref = true; |
326 | } else if (op->atom == DW_OP_regx) { | 390 | } else if (op->atom == DW_OP_regx) { |
327 | regn = op->number; | 391 | regn = op->number; |
328 | } else | 392 | } else { |
329 | die("DW_OP %d is not supported.", op->atom); | 393 | pr_warning("DW_OP %x is not supported.\n", op->atom); |
394 | return -ENOTSUP; | ||
395 | } | ||
330 | 396 | ||
331 | regs = get_arch_regstr(regn); | 397 | regs = get_arch_regstr(regn); |
332 | if (!regs) | 398 | if (!regs) { |
333 | die("%u exceeds max register number.", regn); | 399 | pr_warning("Mapping for DWARF register number %u missing on this architecture.", regn); |
400 | return -ERANGE; | ||
401 | } | ||
402 | |||
403 | tvar->value = strdup(regs); | ||
404 | if (tvar->value == NULL) | ||
405 | return -ENOMEM; | ||
406 | |||
407 | if (ref) { | ||
408 | tvar->ref = zalloc(sizeof(struct kprobe_trace_arg_ref)); | ||
409 | if (tvar->ref == NULL) | ||
410 | return -ENOMEM; | ||
411 | tvar->ref->offset = (long)offs; | ||
412 | } | ||
413 | return 0; | ||
414 | } | ||
415 | |||
416 | static int convert_variable_type(Dwarf_Die *vr_die, | ||
417 | struct kprobe_trace_arg *targ) | ||
418 | { | ||
419 | Dwarf_Die type; | ||
420 | char buf[16]; | ||
421 | int ret; | ||
422 | |||
423 | if (die_get_real_type(vr_die, &type) == NULL) { | ||
424 | pr_warning("Failed to get a type information of %s.\n", | ||
425 | dwarf_diename(vr_die)); | ||
426 | return -ENOENT; | ||
427 | } | ||
428 | |||
429 | ret = die_get_byte_size(&type) * 8; | ||
430 | if (ret) { | ||
431 | /* Check the bitwidth */ | ||
432 | if (ret > MAX_BASIC_TYPE_BITS) { | ||
433 | pr_info("%s exceeds max-bitwidth." | ||
434 | " Cut down to %d bits.\n", | ||
435 | dwarf_diename(&type), MAX_BASIC_TYPE_BITS); | ||
436 | ret = MAX_BASIC_TYPE_BITS; | ||
437 | } | ||
438 | |||
439 | ret = snprintf(buf, 16, "%c%d", | ||
440 | die_is_signed_type(&type) ? 's' : 'u', ret); | ||
441 | if (ret < 0 || ret >= 16) { | ||
442 | if (ret >= 16) | ||
443 | ret = -E2BIG; | ||
444 | pr_warning("Failed to convert variable type: %s\n", | ||
445 | strerror(-ret)); | ||
446 | return ret; | ||
447 | } | ||
448 | targ->type = strdup(buf); | ||
449 | if (targ->type == NULL) | ||
450 | return -ENOMEM; | ||
451 | } | ||
452 | return 0; | ||
453 | } | ||
454 | |||
455 | static int convert_variable_fields(Dwarf_Die *vr_die, const char *varname, | ||
456 | struct perf_probe_arg_field *field, | ||
457 | struct kprobe_trace_arg_ref **ref_ptr, | ||
458 | Dwarf_Die *die_mem) | ||
459 | { | ||
460 | struct kprobe_trace_arg_ref *ref = *ref_ptr; | ||
461 | Dwarf_Die type; | ||
462 | Dwarf_Word offs; | ||
463 | int ret; | ||
464 | |||
465 | pr_debug("converting %s in %s\n", field->name, varname); | ||
466 | if (die_get_real_type(vr_die, &type) == NULL) { | ||
467 | pr_warning("Failed to get the type of %s.\n", varname); | ||
468 | return -ENOENT; | ||
469 | } | ||
470 | |||
471 | /* Check the pointer and dereference */ | ||
472 | if (dwarf_tag(&type) == DW_TAG_pointer_type) { | ||
473 | if (!field->ref) { | ||
474 | pr_err("Semantic error: %s must be referred by '->'\n", | ||
475 | field->name); | ||
476 | return -EINVAL; | ||
477 | } | ||
478 | /* Get the type pointed by this pointer */ | ||
479 | if (die_get_real_type(&type, &type) == NULL) { | ||
480 | pr_warning("Failed to get the type of %s.\n", varname); | ||
481 | return -ENOENT; | ||
482 | } | ||
483 | /* Verify it is a data structure */ | ||
484 | if (dwarf_tag(&type) != DW_TAG_structure_type) { | ||
485 | pr_warning("%s is not a data structure.\n", varname); | ||
486 | return -EINVAL; | ||
487 | } | ||
488 | |||
489 | ref = zalloc(sizeof(struct kprobe_trace_arg_ref)); | ||
490 | if (ref == NULL) | ||
491 | return -ENOMEM; | ||
492 | if (*ref_ptr) | ||
493 | (*ref_ptr)->next = ref; | ||
494 | else | ||
495 | *ref_ptr = ref; | ||
496 | } else { | ||
497 | /* Verify it is a data structure */ | ||
498 | if (dwarf_tag(&type) != DW_TAG_structure_type) { | ||
499 | pr_warning("%s is not a data structure.\n", varname); | ||
500 | return -EINVAL; | ||
501 | } | ||
502 | if (field->ref) { | ||
503 | pr_err("Semantic error: %s must be referred by '.'\n", | ||
504 | field->name); | ||
505 | return -EINVAL; | ||
506 | } | ||
507 | if (!ref) { | ||
508 | pr_warning("Structure on a register is not " | ||
509 | "supported yet.\n"); | ||
510 | return -ENOTSUP; | ||
511 | } | ||
512 | } | ||
513 | |||
514 | if (die_find_member(&type, field->name, die_mem) == NULL) { | ||
515 | pr_warning("%s(tyep:%s) has no member %s.\n", varname, | ||
516 | dwarf_diename(&type), field->name); | ||
517 | return -EINVAL; | ||
518 | } | ||
334 | 519 | ||
335 | if (deref) | 520 | /* Get the offset of the field */ |
336 | ret = snprintf(pf->buf, pf->len, " %s=%+jd(%s)", | 521 | ret = die_get_data_member_location(die_mem, &offs); |
337 | pf->var, (intmax_t)offs, regs); | 522 | if (ret < 0) { |
523 | pr_warning("Failed to get the offset of %s.\n", field->name); | ||
524 | return ret; | ||
525 | } | ||
526 | ref->offset += (long)offs; | ||
527 | |||
528 | /* Converting next field */ | ||
529 | if (field->next) | ||
530 | return convert_variable_fields(die_mem, field->name, | ||
531 | field->next, &ref, die_mem); | ||
338 | else | 532 | else |
339 | ret = snprintf(pf->buf, pf->len, " %s=%s", pf->var, regs); | 533 | return 0; |
340 | DIE_IF(ret < 0); | ||
341 | DIE_IF(ret >= pf->len); | ||
342 | } | 534 | } |
343 | 535 | ||
344 | /* Show a variables in kprobe event format */ | 536 | /* Show a variables in kprobe event format */ |
345 | static void show_variable(Dwarf_Die *vr_die, struct probe_finder *pf) | 537 | static int convert_variable(Dwarf_Die *vr_die, struct probe_finder *pf) |
346 | { | 538 | { |
347 | Dwarf_Attribute attr; | 539 | Dwarf_Attribute attr; |
540 | Dwarf_Die die_mem; | ||
348 | Dwarf_Op *expr; | 541 | Dwarf_Op *expr; |
349 | size_t nexpr; | 542 | size_t nexpr; |
350 | int ret; | 543 | int ret; |
@@ -356,142 +549,191 @@ static void show_variable(Dwarf_Die *vr_die, struct probe_finder *pf) | |||
356 | if (ret <= 0 || nexpr == 0) | 549 | if (ret <= 0 || nexpr == 0) |
357 | goto error; | 550 | goto error; |
358 | 551 | ||
359 | show_location(expr, pf); | 552 | ret = convert_location(expr, pf); |
553 | if (ret == 0 && pf->pvar->field) { | ||
554 | ret = convert_variable_fields(vr_die, pf->pvar->var, | ||
555 | pf->pvar->field, &pf->tvar->ref, | ||
556 | &die_mem); | ||
557 | vr_die = &die_mem; | ||
558 | } | ||
559 | if (ret == 0) { | ||
560 | if (pf->pvar->type) { | ||
561 | pf->tvar->type = strdup(pf->pvar->type); | ||
562 | if (pf->tvar->type == NULL) | ||
563 | ret = -ENOMEM; | ||
564 | } else | ||
565 | ret = convert_variable_type(vr_die, pf->tvar); | ||
566 | } | ||
360 | /* *expr will be cached in libdw. Don't free it. */ | 567 | /* *expr will be cached in libdw. Don't free it. */ |
361 | return ; | 568 | return ret; |
362 | error: | 569 | error: |
363 | /* TODO: Support const_value */ | 570 | /* TODO: Support const_value */ |
364 | die("Failed to find the location of %s at this address.\n" | 571 | pr_err("Failed to find the location of %s at this address.\n" |
365 | " Perhaps, it has been optimized out.", pf->var); | 572 | " Perhaps, it has been optimized out.\n", pf->pvar->var); |
573 | return -ENOENT; | ||
366 | } | 574 | } |
367 | 575 | ||
368 | /* Find a variable in a subprogram die */ | 576 | /* Find a variable in a subprogram die */ |
369 | static void find_variable(Dwarf_Die *sp_die, struct probe_finder *pf) | 577 | static int find_variable(Dwarf_Die *sp_die, struct probe_finder *pf) |
370 | { | 578 | { |
371 | int ret; | ||
372 | Dwarf_Die vr_die; | 579 | Dwarf_Die vr_die; |
580 | char buf[32], *ptr; | ||
581 | int ret; | ||
373 | 582 | ||
374 | /* TODO: Support struct members and arrays */ | 583 | /* TODO: Support arrays */ |
375 | if (!is_c_varname(pf->var)) { | 584 | if (pf->pvar->name) |
376 | /* Output raw parameters */ | 585 | pf->tvar->name = strdup(pf->pvar->name); |
377 | ret = snprintf(pf->buf, pf->len, " %s", pf->var); | 586 | else { |
378 | DIE_IF(ret < 0); | 587 | ret = synthesize_perf_probe_arg(pf->pvar, buf, 32); |
379 | DIE_IF(ret >= pf->len); | 588 | if (ret < 0) |
380 | return ; | 589 | return ret; |
590 | ptr = strchr(buf, ':'); /* Change type separator to _ */ | ||
591 | if (ptr) | ||
592 | *ptr = '_'; | ||
593 | pf->tvar->name = strdup(buf); | ||
594 | } | ||
595 | if (pf->tvar->name == NULL) | ||
596 | return -ENOMEM; | ||
597 | |||
598 | if (!is_c_varname(pf->pvar->var)) { | ||
599 | /* Copy raw parameters */ | ||
600 | pf->tvar->value = strdup(pf->pvar->var); | ||
601 | if (pf->tvar->value == NULL) | ||
602 | return -ENOMEM; | ||
603 | else | ||
604 | return 0; | ||
381 | } | 605 | } |
382 | 606 | ||
383 | pr_debug("Searching '%s' variable in context.\n", pf->var); | 607 | pr_debug("Searching '%s' variable in context.\n", |
608 | pf->pvar->var); | ||
384 | /* Search child die for local variables and parameters. */ | 609 | /* Search child die for local variables and parameters. */ |
385 | if (!die_find_variable(sp_die, pf->var, &vr_die)) | 610 | if (!die_find_variable(sp_die, pf->pvar->var, &vr_die)) { |
386 | die("Failed to find '%s' in this function.", pf->var); | 611 | pr_warning("Failed to find '%s' in this function.\n", |
387 | 612 | pf->pvar->var); | |
388 | show_variable(&vr_die, pf); | 613 | return -ENOENT; |
614 | } | ||
615 | return convert_variable(&vr_die, pf); | ||
389 | } | 616 | } |
390 | 617 | ||
391 | /* Show a probe point to output buffer */ | 618 | /* Show a probe point to output buffer */ |
392 | static void show_probe_point(Dwarf_Die *sp_die, struct probe_finder *pf) | 619 | static int convert_probe_point(Dwarf_Die *sp_die, struct probe_finder *pf) |
393 | { | 620 | { |
394 | struct probe_point *pp = pf->pp; | 621 | struct kprobe_trace_event *tev; |
395 | Dwarf_Addr eaddr; | 622 | Dwarf_Addr eaddr; |
396 | Dwarf_Die die_mem; | 623 | Dwarf_Die die_mem; |
397 | const char *name; | 624 | const char *name; |
398 | char tmp[MAX_PROBE_BUFFER]; | 625 | int ret, i; |
399 | int ret, i, len; | ||
400 | Dwarf_Attribute fb_attr; | 626 | Dwarf_Attribute fb_attr; |
401 | size_t nops; | 627 | size_t nops; |
402 | 628 | ||
629 | if (pf->ntevs == pf->max_tevs) { | ||
630 | pr_warning("Too many( > %d) probe point found.\n", | ||
631 | pf->max_tevs); | ||
632 | return -ERANGE; | ||
633 | } | ||
634 | tev = &pf->tevs[pf->ntevs++]; | ||
635 | |||
403 | /* If no real subprogram, find a real one */ | 636 | /* If no real subprogram, find a real one */ |
404 | if (!sp_die || dwarf_tag(sp_die) != DW_TAG_subprogram) { | 637 | if (!sp_die || dwarf_tag(sp_die) != DW_TAG_subprogram) { |
405 | sp_die = die_get_real_subprogram(&pf->cu_die, | 638 | sp_die = die_find_real_subprogram(&pf->cu_die, |
406 | pf->addr, &die_mem); | 639 | pf->addr, &die_mem); |
407 | if (!sp_die) | 640 | if (!sp_die) { |
408 | die("Probe point is not found in subprograms."); | 641 | pr_warning("Failed to find probe point in any " |
642 | "functions.\n"); | ||
643 | return -ENOENT; | ||
644 | } | ||
409 | } | 645 | } |
410 | 646 | ||
411 | /* Output name of probe point */ | 647 | /* Copy the name of probe point */ |
412 | name = dwarf_diename(sp_die); | 648 | name = dwarf_diename(sp_die); |
413 | if (name) { | 649 | if (name) { |
414 | dwarf_entrypc(sp_die, &eaddr); | 650 | if (dwarf_entrypc(sp_die, &eaddr) != 0) { |
415 | ret = snprintf(tmp, MAX_PROBE_BUFFER, "%s+%lu", name, | 651 | pr_warning("Failed to get entry pc of %s\n", |
416 | (unsigned long)(pf->addr - eaddr)); | 652 | dwarf_diename(sp_die)); |
417 | /* Copy the function name if possible */ | 653 | return -ENOENT; |
418 | if (!pp->function) { | ||
419 | pp->function = strdup(name); | ||
420 | pp->offset = (size_t)(pf->addr - eaddr); | ||
421 | } | 654 | } |
422 | } else { | 655 | tev->point.symbol = strdup(name); |
656 | if (tev->point.symbol == NULL) | ||
657 | return -ENOMEM; | ||
658 | tev->point.offset = (unsigned long)(pf->addr - eaddr); | ||
659 | } else | ||
423 | /* This function has no name. */ | 660 | /* This function has no name. */ |
424 | ret = snprintf(tmp, MAX_PROBE_BUFFER, "0x%jx", | 661 | tev->point.offset = (unsigned long)pf->addr; |
425 | (uintmax_t)pf->addr); | 662 | |
426 | if (!pp->function) { | 663 | pr_debug("Probe point found: %s+%lu\n", tev->point.symbol, |
427 | /* TODO: Use _stext */ | 664 | tev->point.offset); |
428 | pp->function = strdup(""); | ||
429 | pp->offset = (size_t)pf->addr; | ||
430 | } | ||
431 | } | ||
432 | DIE_IF(ret < 0); | ||
433 | DIE_IF(ret >= MAX_PROBE_BUFFER); | ||
434 | len = ret; | ||
435 | pr_debug("Probe point found: %s\n", tmp); | ||
436 | 665 | ||
437 | /* Get the frame base attribute/ops */ | 666 | /* Get the frame base attribute/ops */ |
438 | dwarf_attr(sp_die, DW_AT_frame_base, &fb_attr); | 667 | dwarf_attr(sp_die, DW_AT_frame_base, &fb_attr); |
439 | ret = dwarf_getlocation_addr(&fb_attr, pf->addr, &pf->fb_ops, &nops, 1); | 668 | ret = dwarf_getlocation_addr(&fb_attr, pf->addr, &pf->fb_ops, &nops, 1); |
440 | if (ret <= 0 || nops == 0) | 669 | if (ret <= 0 || nops == 0) { |
441 | pf->fb_ops = NULL; | 670 | pf->fb_ops = NULL; |
671 | } else if (nops == 1 && pf->fb_ops[0].atom == DW_OP_call_frame_cfa && | ||
672 | pf->cfi != NULL) { | ||
673 | Dwarf_Frame *frame; | ||
674 | if (dwarf_cfi_addrframe(pf->cfi, pf->addr, &frame) != 0 || | ||
675 | dwarf_frame_cfa(frame, &pf->fb_ops, &nops) != 0) { | ||
676 | pr_warning("Failed to get CFA on 0x%jx\n", | ||
677 | (uintmax_t)pf->addr); | ||
678 | return -ENOENT; | ||
679 | } | ||
680 | } | ||
442 | 681 | ||
443 | /* Find each argument */ | 682 | /* Find each argument */ |
444 | /* TODO: use dwarf_cfi_addrframe */ | 683 | tev->nargs = pf->pev->nargs; |
445 | for (i = 0; i < pp->nr_args; i++) { | 684 | tev->args = zalloc(sizeof(struct kprobe_trace_arg) * tev->nargs); |
446 | pf->var = pp->args[i]; | 685 | if (tev->args == NULL) |
447 | pf->buf = &tmp[len]; | 686 | return -ENOMEM; |
448 | pf->len = MAX_PROBE_BUFFER - len; | 687 | for (i = 0; i < pf->pev->nargs; i++) { |
449 | find_variable(sp_die, pf); | 688 | pf->pvar = &pf->pev->args[i]; |
450 | len += strlen(pf->buf); | 689 | pf->tvar = &tev->args[i]; |
690 | ret = find_variable(sp_die, pf); | ||
691 | if (ret != 0) | ||
692 | return ret; | ||
451 | } | 693 | } |
452 | 694 | ||
453 | /* *pf->fb_ops will be cached in libdw. Don't free it. */ | 695 | /* *pf->fb_ops will be cached in libdw. Don't free it. */ |
454 | pf->fb_ops = NULL; | 696 | pf->fb_ops = NULL; |
455 | 697 | return 0; | |
456 | if (pp->found == MAX_PROBES) | ||
457 | die("Too many( > %d) probe point found.\n", MAX_PROBES); | ||
458 | |||
459 | pp->probes[pp->found] = strdup(tmp); | ||
460 | pp->found++; | ||
461 | } | 698 | } |
462 | 699 | ||
463 | /* Find probe point from its line number */ | 700 | /* Find probe point from its line number */ |
464 | static void find_probe_point_by_line(struct probe_finder *pf) | 701 | static int find_probe_point_by_line(struct probe_finder *pf) |
465 | { | 702 | { |
466 | Dwarf_Lines *lines; | 703 | Dwarf_Lines *lines; |
467 | Dwarf_Line *line; | 704 | Dwarf_Line *line; |
468 | size_t nlines, i; | 705 | size_t nlines, i; |
469 | Dwarf_Addr addr; | 706 | Dwarf_Addr addr; |
470 | int lineno; | 707 | int lineno; |
471 | int ret; | 708 | int ret = 0; |
472 | 709 | ||
473 | ret = dwarf_getsrclines(&pf->cu_die, &lines, &nlines); | 710 | if (dwarf_getsrclines(&pf->cu_die, &lines, &nlines) != 0) { |
474 | DIE_IF(ret != 0); | 711 | pr_warning("No source lines found in this CU.\n"); |
712 | return -ENOENT; | ||
713 | } | ||
475 | 714 | ||
476 | for (i = 0; i < nlines; i++) { | 715 | for (i = 0; i < nlines && ret == 0; i++) { |
477 | line = dwarf_onesrcline(lines, i); | 716 | line = dwarf_onesrcline(lines, i); |
478 | dwarf_lineno(line, &lineno); | 717 | if (dwarf_lineno(line, &lineno) != 0 || |
479 | if (lineno != pf->lno) | 718 | lineno != pf->lno) |
480 | continue; | 719 | continue; |
481 | 720 | ||
482 | /* TODO: Get fileno from line, but how? */ | 721 | /* TODO: Get fileno from line, but how? */ |
483 | if (strtailcmp(dwarf_linesrc(line, NULL, NULL), pf->fname) != 0) | 722 | if (strtailcmp(dwarf_linesrc(line, NULL, NULL), pf->fname) != 0) |
484 | continue; | 723 | continue; |
485 | 724 | ||
486 | ret = dwarf_lineaddr(line, &addr); | 725 | if (dwarf_lineaddr(line, &addr) != 0) { |
487 | DIE_IF(ret != 0); | 726 | pr_warning("Failed to get the address of the line.\n"); |
727 | return -ENOENT; | ||
728 | } | ||
488 | pr_debug("Probe line found: line[%d]:%d addr:0x%jx\n", | 729 | pr_debug("Probe line found: line[%d]:%d addr:0x%jx\n", |
489 | (int)i, lineno, (uintmax_t)addr); | 730 | (int)i, lineno, (uintmax_t)addr); |
490 | pf->addr = addr; | 731 | pf->addr = addr; |
491 | 732 | ||
492 | show_probe_point(NULL, pf); | 733 | ret = convert_probe_point(NULL, pf); |
493 | /* Continuing, because target line might be inlined. */ | 734 | /* Continuing, because target line might be inlined. */ |
494 | } | 735 | } |
736 | return ret; | ||
495 | } | 737 | } |
496 | 738 | ||
497 | /* Find lines which match lazy pattern */ | 739 | /* Find lines which match lazy pattern */ |
@@ -499,16 +741,27 @@ static int find_lazy_match_lines(struct list_head *head, | |||
499 | const char *fname, const char *pat) | 741 | const char *fname, const char *pat) |
500 | { | 742 | { |
501 | char *fbuf, *p1, *p2; | 743 | char *fbuf, *p1, *p2; |
502 | int fd, line, nlines = 0; | 744 | int fd, ret, line, nlines = 0; |
503 | struct stat st; | 745 | struct stat st; |
504 | 746 | ||
505 | fd = open(fname, O_RDONLY); | 747 | fd = open(fname, O_RDONLY); |
506 | if (fd < 0) | 748 | if (fd < 0) { |
507 | die("failed to open %s", fname); | 749 | pr_warning("Failed to open %s: %s\n", fname, strerror(-fd)); |
508 | DIE_IF(fstat(fd, &st) < 0); | 750 | return fd; |
509 | fbuf = malloc(st.st_size + 2); | 751 | } |
510 | DIE_IF(fbuf == NULL); | 752 | |
511 | DIE_IF(read(fd, fbuf, st.st_size) < 0); | 753 | ret = fstat(fd, &st); |
754 | if (ret < 0) { | ||
755 | pr_warning("Failed to get the size of %s: %s\n", | ||
756 | fname, strerror(errno)); | ||
757 | return ret; | ||
758 | } | ||
759 | fbuf = xmalloc(st.st_size + 2); | ||
760 | ret = read(fd, fbuf, st.st_size); | ||
761 | if (ret < 0) { | ||
762 | pr_warning("Failed to read %s: %s\n", fname, strerror(errno)); | ||
763 | return ret; | ||
764 | } | ||
512 | close(fd); | 765 | close(fd); |
513 | fbuf[st.st_size] = '\n'; /* Dummy line */ | 766 | fbuf[st.st_size] = '\n'; /* Dummy line */ |
514 | fbuf[st.st_size + 1] = '\0'; | 767 | fbuf[st.st_size + 1] = '\0'; |
@@ -528,7 +781,7 @@ static int find_lazy_match_lines(struct list_head *head, | |||
528 | } | 781 | } |
529 | 782 | ||
530 | /* Find probe points from lazy pattern */ | 783 | /* Find probe points from lazy pattern */ |
531 | static void find_probe_point_lazy(Dwarf_Die *sp_die, struct probe_finder *pf) | 784 | static int find_probe_point_lazy(Dwarf_Die *sp_die, struct probe_finder *pf) |
532 | { | 785 | { |
533 | Dwarf_Lines *lines; | 786 | Dwarf_Lines *lines; |
534 | Dwarf_Line *line; | 787 | Dwarf_Line *line; |
@@ -536,37 +789,46 @@ static void find_probe_point_lazy(Dwarf_Die *sp_die, struct probe_finder *pf) | |||
536 | Dwarf_Addr addr; | 789 | Dwarf_Addr addr; |
537 | Dwarf_Die die_mem; | 790 | Dwarf_Die die_mem; |
538 | int lineno; | 791 | int lineno; |
539 | int ret; | 792 | int ret = 0; |
540 | 793 | ||
541 | if (list_empty(&pf->lcache)) { | 794 | if (list_empty(&pf->lcache)) { |
542 | /* Matching lazy line pattern */ | 795 | /* Matching lazy line pattern */ |
543 | ret = find_lazy_match_lines(&pf->lcache, pf->fname, | 796 | ret = find_lazy_match_lines(&pf->lcache, pf->fname, |
544 | pf->pp->lazy_line); | 797 | pf->pev->point.lazy_line); |
545 | if (ret <= 0) | 798 | if (ret == 0) { |
546 | die("No matched lines found in %s.", pf->fname); | 799 | pr_debug("No matched lines found in %s.\n", pf->fname); |
800 | return 0; | ||
801 | } else if (ret < 0) | ||
802 | return ret; | ||
547 | } | 803 | } |
548 | 804 | ||
549 | ret = dwarf_getsrclines(&pf->cu_die, &lines, &nlines); | 805 | if (dwarf_getsrclines(&pf->cu_die, &lines, &nlines) != 0) { |
550 | DIE_IF(ret != 0); | 806 | pr_warning("No source lines found in this CU.\n"); |
551 | for (i = 0; i < nlines; i++) { | 807 | return -ENOENT; |
808 | } | ||
809 | |||
810 | for (i = 0; i < nlines && ret >= 0; i++) { | ||
552 | line = dwarf_onesrcline(lines, i); | 811 | line = dwarf_onesrcline(lines, i); |
553 | 812 | ||
554 | dwarf_lineno(line, &lineno); | 813 | if (dwarf_lineno(line, &lineno) != 0 || |
555 | if (!line_list__has_line(&pf->lcache, lineno)) | 814 | !line_list__has_line(&pf->lcache, lineno)) |
556 | continue; | 815 | continue; |
557 | 816 | ||
558 | /* TODO: Get fileno from line, but how? */ | 817 | /* TODO: Get fileno from line, but how? */ |
559 | if (strtailcmp(dwarf_linesrc(line, NULL, NULL), pf->fname) != 0) | 818 | if (strtailcmp(dwarf_linesrc(line, NULL, NULL), pf->fname) != 0) |
560 | continue; | 819 | continue; |
561 | 820 | ||
562 | ret = dwarf_lineaddr(line, &addr); | 821 | if (dwarf_lineaddr(line, &addr) != 0) { |
563 | DIE_IF(ret != 0); | 822 | pr_debug("Failed to get the address of line %d.\n", |
823 | lineno); | ||
824 | continue; | ||
825 | } | ||
564 | if (sp_die) { | 826 | if (sp_die) { |
565 | /* Address filtering 1: does sp_die include addr? */ | 827 | /* Address filtering 1: does sp_die include addr? */ |
566 | if (!dwarf_haspc(sp_die, addr)) | 828 | if (!dwarf_haspc(sp_die, addr)) |
567 | continue; | 829 | continue; |
568 | /* Address filtering 2: No child include addr? */ | 830 | /* Address filtering 2: No child include addr? */ |
569 | if (die_get_inlinefunc(sp_die, addr, &die_mem)) | 831 | if (die_find_inlinefunc(sp_die, addr, &die_mem)) |
570 | continue; | 832 | continue; |
571 | } | 833 | } |
572 | 834 | ||
@@ -574,27 +836,44 @@ static void find_probe_point_lazy(Dwarf_Die *sp_die, struct probe_finder *pf) | |||
574 | (int)i, lineno, (unsigned long long)addr); | 836 | (int)i, lineno, (unsigned long long)addr); |
575 | pf->addr = addr; | 837 | pf->addr = addr; |
576 | 838 | ||
577 | show_probe_point(sp_die, pf); | 839 | ret = convert_probe_point(sp_die, pf); |
578 | /* Continuing, because target line might be inlined. */ | 840 | /* Continuing, because target line might be inlined. */ |
579 | } | 841 | } |
580 | /* TODO: deallocate lines, but how? */ | 842 | /* TODO: deallocate lines, but how? */ |
843 | return ret; | ||
581 | } | 844 | } |
582 | 845 | ||
846 | /* Callback parameter with return value */ | ||
847 | struct dwarf_callback_param { | ||
848 | void *data; | ||
849 | int retval; | ||
850 | }; | ||
851 | |||
583 | static int probe_point_inline_cb(Dwarf_Die *in_die, void *data) | 852 | static int probe_point_inline_cb(Dwarf_Die *in_die, void *data) |
584 | { | 853 | { |
585 | struct probe_finder *pf = (struct probe_finder *)data; | 854 | struct dwarf_callback_param *param = data; |
586 | struct probe_point *pp = pf->pp; | 855 | struct probe_finder *pf = param->data; |
856 | struct perf_probe_point *pp = &pf->pev->point; | ||
857 | Dwarf_Addr addr; | ||
587 | 858 | ||
588 | if (pp->lazy_line) | 859 | if (pp->lazy_line) |
589 | find_probe_point_lazy(in_die, pf); | 860 | param->retval = find_probe_point_lazy(in_die, pf); |
590 | else { | 861 | else { |
591 | /* Get probe address */ | 862 | /* Get probe address */ |
592 | pf->addr = die_get_entrypc(in_die); | 863 | if (dwarf_entrypc(in_die, &addr) != 0) { |
864 | pr_warning("Failed to get entry pc of %s.\n", | ||
865 | dwarf_diename(in_die)); | ||
866 | param->retval = -ENOENT; | ||
867 | return DWARF_CB_ABORT; | ||
868 | } | ||
869 | pf->addr = addr; | ||
593 | pf->addr += pp->offset; | 870 | pf->addr += pp->offset; |
594 | pr_debug("found inline addr: 0x%jx\n", | 871 | pr_debug("found inline addr: 0x%jx\n", |
595 | (uintmax_t)pf->addr); | 872 | (uintmax_t)pf->addr); |
596 | 873 | ||
597 | show_probe_point(in_die, pf); | 874 | param->retval = convert_probe_point(in_die, pf); |
875 | if (param->retval < 0) | ||
876 | return DWARF_CB_ABORT; | ||
598 | } | 877 | } |
599 | 878 | ||
600 | return DWARF_CB_OK; | 879 | return DWARF_CB_OK; |
@@ -603,59 +882,88 @@ static int probe_point_inline_cb(Dwarf_Die *in_die, void *data) | |||
603 | /* Search function from function name */ | 882 | /* Search function from function name */ |
604 | static int probe_point_search_cb(Dwarf_Die *sp_die, void *data) | 883 | static int probe_point_search_cb(Dwarf_Die *sp_die, void *data) |
605 | { | 884 | { |
606 | struct probe_finder *pf = (struct probe_finder *)data; | 885 | struct dwarf_callback_param *param = data; |
607 | struct probe_point *pp = pf->pp; | 886 | struct probe_finder *pf = param->data; |
887 | struct perf_probe_point *pp = &pf->pev->point; | ||
608 | 888 | ||
609 | /* Check tag and diename */ | 889 | /* Check tag and diename */ |
610 | if (dwarf_tag(sp_die) != DW_TAG_subprogram || | 890 | if (dwarf_tag(sp_die) != DW_TAG_subprogram || |
611 | die_compare_name(sp_die, pp->function) != 0) | 891 | die_compare_name(sp_die, pp->function) != 0) |
612 | return 0; | 892 | return DWARF_CB_OK; |
613 | 893 | ||
614 | pf->fname = dwarf_decl_file(sp_die); | 894 | pf->fname = dwarf_decl_file(sp_die); |
615 | if (pp->line) { /* Function relative line */ | 895 | if (pp->line) { /* Function relative line */ |
616 | dwarf_decl_line(sp_die, &pf->lno); | 896 | dwarf_decl_line(sp_die, &pf->lno); |
617 | pf->lno += pp->line; | 897 | pf->lno += pp->line; |
618 | find_probe_point_by_line(pf); | 898 | param->retval = find_probe_point_by_line(pf); |
619 | } else if (!dwarf_func_inline(sp_die)) { | 899 | } else if (!dwarf_func_inline(sp_die)) { |
620 | /* Real function */ | 900 | /* Real function */ |
621 | if (pp->lazy_line) | 901 | if (pp->lazy_line) |
622 | find_probe_point_lazy(sp_die, pf); | 902 | param->retval = find_probe_point_lazy(sp_die, pf); |
623 | else { | 903 | else { |
624 | pf->addr = die_get_entrypc(sp_die); | 904 | if (dwarf_entrypc(sp_die, &pf->addr) != 0) { |
905 | pr_warning("Failed to get entry pc of %s.\n", | ||
906 | dwarf_diename(sp_die)); | ||
907 | param->retval = -ENOENT; | ||
908 | return DWARF_CB_ABORT; | ||
909 | } | ||
625 | pf->addr += pp->offset; | 910 | pf->addr += pp->offset; |
626 | /* TODO: Check the address in this function */ | 911 | /* TODO: Check the address in this function */ |
627 | show_probe_point(sp_die, pf); | 912 | param->retval = convert_probe_point(sp_die, pf); |
628 | } | 913 | } |
629 | } else | 914 | } else { |
915 | struct dwarf_callback_param _param = {.data = (void *)pf, | ||
916 | .retval = 0}; | ||
630 | /* Inlined function: search instances */ | 917 | /* Inlined function: search instances */ |
631 | dwarf_func_inline_instances(sp_die, probe_point_inline_cb, pf); | 918 | dwarf_func_inline_instances(sp_die, probe_point_inline_cb, |
919 | &_param); | ||
920 | param->retval = _param.retval; | ||
921 | } | ||
632 | 922 | ||
633 | return 1; /* Exit; no same symbol in this CU. */ | 923 | return DWARF_CB_ABORT; /* Exit; no same symbol in this CU. */ |
634 | } | 924 | } |
635 | 925 | ||
636 | static void find_probe_point_by_func(struct probe_finder *pf) | 926 | static int find_probe_point_by_func(struct probe_finder *pf) |
637 | { | 927 | { |
638 | dwarf_getfuncs(&pf->cu_die, probe_point_search_cb, pf, 0); | 928 | struct dwarf_callback_param _param = {.data = (void *)pf, |
929 | .retval = 0}; | ||
930 | dwarf_getfuncs(&pf->cu_die, probe_point_search_cb, &_param, 0); | ||
931 | return _param.retval; | ||
639 | } | 932 | } |
640 | 933 | ||
641 | /* Find a probe point */ | 934 | /* Find kprobe_trace_events specified by perf_probe_event from debuginfo */ |
642 | int find_probe_point(int fd, struct probe_point *pp) | 935 | int find_kprobe_trace_events(int fd, struct perf_probe_event *pev, |
936 | struct kprobe_trace_event **tevs, int max_tevs) | ||
643 | { | 937 | { |
644 | struct probe_finder pf = {.pp = pp}; | 938 | struct probe_finder pf = {.pev = pev, .max_tevs = max_tevs}; |
939 | struct perf_probe_point *pp = &pev->point; | ||
645 | Dwarf_Off off, noff; | 940 | Dwarf_Off off, noff; |
646 | size_t cuhl; | 941 | size_t cuhl; |
647 | Dwarf_Die *diep; | 942 | Dwarf_Die *diep; |
648 | Dwarf *dbg; | 943 | Dwarf *dbg; |
944 | int ret = 0; | ||
945 | |||
946 | pf.tevs = zalloc(sizeof(struct kprobe_trace_event) * max_tevs); | ||
947 | if (pf.tevs == NULL) | ||
948 | return -ENOMEM; | ||
949 | *tevs = pf.tevs; | ||
950 | pf.ntevs = 0; | ||
649 | 951 | ||
650 | dbg = dwarf_begin(fd, DWARF_C_READ); | 952 | dbg = dwarf_begin(fd, DWARF_C_READ); |
651 | if (!dbg) | 953 | if (!dbg) { |
652 | return -ENOENT; | 954 | pr_warning("No dwarf info found in the vmlinux - " |
955 | "please rebuild with CONFIG_DEBUG_INFO=y.\n"); | ||
956 | return -EBADF; | ||
957 | } | ||
958 | |||
959 | /* Get the call frame information from this dwarf */ | ||
960 | pf.cfi = dwarf_getcfi(dbg); | ||
653 | 961 | ||
654 | pp->found = 0; | ||
655 | off = 0; | 962 | off = 0; |
656 | line_list__init(&pf.lcache); | 963 | line_list__init(&pf.lcache); |
657 | /* Loop on CUs (Compilation Unit) */ | 964 | /* Loop on CUs (Compilation Unit) */ |
658 | while (!dwarf_nextcu(dbg, off, &noff, &cuhl, NULL, NULL, NULL)) { | 965 | while (!dwarf_nextcu(dbg, off, &noff, &cuhl, NULL, NULL, NULL) && |
966 | ret >= 0) { | ||
659 | /* Get the DIE(Debugging Information Entry) of this CU */ | 967 | /* Get the DIE(Debugging Information Entry) of this CU */ |
660 | diep = dwarf_offdie(dbg, off + cuhl, &pf.cu_die); | 968 | diep = dwarf_offdie(dbg, off + cuhl, &pf.cu_die); |
661 | if (!diep) | 969 | if (!diep) |
@@ -669,12 +977,12 @@ int find_probe_point(int fd, struct probe_point *pp) | |||
669 | 977 | ||
670 | if (!pp->file || pf.fname) { | 978 | if (!pp->file || pf.fname) { |
671 | if (pp->function) | 979 | if (pp->function) |
672 | find_probe_point_by_func(&pf); | 980 | ret = find_probe_point_by_func(&pf); |
673 | else if (pp->lazy_line) | 981 | else if (pp->lazy_line) |
674 | find_probe_point_lazy(NULL, &pf); | 982 | ret = find_probe_point_lazy(NULL, &pf); |
675 | else { | 983 | else { |
676 | pf.lno = pp->line; | 984 | pf.lno = pp->line; |
677 | find_probe_point_by_line(&pf); | 985 | ret = find_probe_point_by_line(&pf); |
678 | } | 986 | } |
679 | } | 987 | } |
680 | off = noff; | 988 | off = noff; |
@@ -682,41 +990,169 @@ int find_probe_point(int fd, struct probe_point *pp) | |||
682 | line_list__free(&pf.lcache); | 990 | line_list__free(&pf.lcache); |
683 | dwarf_end(dbg); | 991 | dwarf_end(dbg); |
684 | 992 | ||
685 | return pp->found; | 993 | return (ret < 0) ? ret : pf.ntevs; |
994 | } | ||
995 | |||
996 | /* Reverse search */ | ||
997 | int find_perf_probe_point(int fd, unsigned long addr, | ||
998 | struct perf_probe_point *ppt) | ||
999 | { | ||
1000 | Dwarf_Die cudie, spdie, indie; | ||
1001 | Dwarf *dbg; | ||
1002 | Dwarf_Line *line; | ||
1003 | Dwarf_Addr laddr, eaddr; | ||
1004 | const char *tmp; | ||
1005 | int lineno, ret = 0; | ||
1006 | bool found = false; | ||
1007 | |||
1008 | dbg = dwarf_begin(fd, DWARF_C_READ); | ||
1009 | if (!dbg) | ||
1010 | return -EBADF; | ||
1011 | |||
1012 | /* Find cu die */ | ||
1013 | if (!dwarf_addrdie(dbg, (Dwarf_Addr)addr, &cudie)) { | ||
1014 | ret = -EINVAL; | ||
1015 | goto end; | ||
1016 | } | ||
1017 | |||
1018 | /* Find a corresponding line */ | ||
1019 | line = dwarf_getsrc_die(&cudie, (Dwarf_Addr)addr); | ||
1020 | if (line) { | ||
1021 | if (dwarf_lineaddr(line, &laddr) == 0 && | ||
1022 | (Dwarf_Addr)addr == laddr && | ||
1023 | dwarf_lineno(line, &lineno) == 0) { | ||
1024 | tmp = dwarf_linesrc(line, NULL, NULL); | ||
1025 | if (tmp) { | ||
1026 | ppt->line = lineno; | ||
1027 | ppt->file = strdup(tmp); | ||
1028 | if (ppt->file == NULL) { | ||
1029 | ret = -ENOMEM; | ||
1030 | goto end; | ||
1031 | } | ||
1032 | found = true; | ||
1033 | } | ||
1034 | } | ||
1035 | } | ||
1036 | |||
1037 | /* Find a corresponding function */ | ||
1038 | if (die_find_real_subprogram(&cudie, (Dwarf_Addr)addr, &spdie)) { | ||
1039 | tmp = dwarf_diename(&spdie); | ||
1040 | if (!tmp || dwarf_entrypc(&spdie, &eaddr) != 0) | ||
1041 | goto end; | ||
1042 | |||
1043 | if (ppt->line) { | ||
1044 | if (die_find_inlinefunc(&spdie, (Dwarf_Addr)addr, | ||
1045 | &indie)) { | ||
1046 | /* addr in an inline function */ | ||
1047 | tmp = dwarf_diename(&indie); | ||
1048 | if (!tmp) | ||
1049 | goto end; | ||
1050 | ret = dwarf_decl_line(&indie, &lineno); | ||
1051 | } else { | ||
1052 | if (eaddr == addr) { /* Function entry */ | ||
1053 | lineno = ppt->line; | ||
1054 | ret = 0; | ||
1055 | } else | ||
1056 | ret = dwarf_decl_line(&spdie, &lineno); | ||
1057 | } | ||
1058 | if (ret == 0) { | ||
1059 | /* Make a relative line number */ | ||
1060 | ppt->line -= lineno; | ||
1061 | goto found; | ||
1062 | } | ||
1063 | } | ||
1064 | /* We don't have a line number, let's use offset */ | ||
1065 | ppt->offset = addr - (unsigned long)eaddr; | ||
1066 | found: | ||
1067 | ppt->function = strdup(tmp); | ||
1068 | if (ppt->function == NULL) { | ||
1069 | ret = -ENOMEM; | ||
1070 | goto end; | ||
1071 | } | ||
1072 | found = true; | ||
1073 | } | ||
1074 | |||
1075 | end: | ||
1076 | dwarf_end(dbg); | ||
1077 | if (ret >= 0) | ||
1078 | ret = found ? 1 : 0; | ||
1079 | return ret; | ||
1080 | } | ||
1081 | |||
1082 | /* Add a line and store the src path */ | ||
1083 | static int line_range_add_line(const char *src, unsigned int lineno, | ||
1084 | struct line_range *lr) | ||
1085 | { | ||
1086 | /* Copy real path */ | ||
1087 | if (!lr->path) { | ||
1088 | lr->path = strdup(src); | ||
1089 | if (lr->path == NULL) | ||
1090 | return -ENOMEM; | ||
1091 | } | ||
1092 | return line_list__add_line(&lr->line_list, lineno); | ||
1093 | } | ||
1094 | |||
1095 | /* Search function declaration lines */ | ||
1096 | static int line_range_funcdecl_cb(Dwarf_Die *sp_die, void *data) | ||
1097 | { | ||
1098 | struct dwarf_callback_param *param = data; | ||
1099 | struct line_finder *lf = param->data; | ||
1100 | const char *src; | ||
1101 | int lineno; | ||
1102 | |||
1103 | src = dwarf_decl_file(sp_die); | ||
1104 | if (src && strtailcmp(src, lf->fname) != 0) | ||
1105 | return DWARF_CB_OK; | ||
1106 | |||
1107 | if (dwarf_decl_line(sp_die, &lineno) != 0 || | ||
1108 | (lf->lno_s > lineno || lf->lno_e < lineno)) | ||
1109 | return DWARF_CB_OK; | ||
1110 | |||
1111 | param->retval = line_range_add_line(src, lineno, lf->lr); | ||
1112 | if (param->retval < 0) | ||
1113 | return DWARF_CB_ABORT; | ||
1114 | return DWARF_CB_OK; | ||
1115 | } | ||
1116 | |||
1117 | static int find_line_range_func_decl_lines(struct line_finder *lf) | ||
1118 | { | ||
1119 | struct dwarf_callback_param param = {.data = (void *)lf, .retval = 0}; | ||
1120 | dwarf_getfuncs(&lf->cu_die, line_range_funcdecl_cb, ¶m, 0); | ||
1121 | return param.retval; | ||
686 | } | 1122 | } |
687 | 1123 | ||
688 | /* Find line range from its line number */ | 1124 | /* Find line range from its line number */ |
689 | static void find_line_range_by_line(Dwarf_Die *sp_die, struct line_finder *lf) | 1125 | static int find_line_range_by_line(Dwarf_Die *sp_die, struct line_finder *lf) |
690 | { | 1126 | { |
691 | Dwarf_Lines *lines; | 1127 | Dwarf_Lines *lines; |
692 | Dwarf_Line *line; | 1128 | Dwarf_Line *line; |
693 | size_t nlines, i; | 1129 | size_t nlines, i; |
694 | Dwarf_Addr addr; | 1130 | Dwarf_Addr addr; |
695 | int lineno; | 1131 | int lineno, ret = 0; |
696 | int ret; | ||
697 | const char *src; | 1132 | const char *src; |
698 | Dwarf_Die die_mem; | 1133 | Dwarf_Die die_mem; |
699 | 1134 | ||
700 | line_list__init(&lf->lr->line_list); | 1135 | line_list__init(&lf->lr->line_list); |
701 | ret = dwarf_getsrclines(&lf->cu_die, &lines, &nlines); | 1136 | if (dwarf_getsrclines(&lf->cu_die, &lines, &nlines) != 0) { |
702 | DIE_IF(ret != 0); | 1137 | pr_warning("No source lines found in this CU.\n"); |
1138 | return -ENOENT; | ||
1139 | } | ||
703 | 1140 | ||
1141 | /* Search probable lines on lines list */ | ||
704 | for (i = 0; i < nlines; i++) { | 1142 | for (i = 0; i < nlines; i++) { |
705 | line = dwarf_onesrcline(lines, i); | 1143 | line = dwarf_onesrcline(lines, i); |
706 | ret = dwarf_lineno(line, &lineno); | 1144 | if (dwarf_lineno(line, &lineno) != 0 || |
707 | DIE_IF(ret != 0); | 1145 | (lf->lno_s > lineno || lf->lno_e < lineno)) |
708 | if (lf->lno_s > lineno || lf->lno_e < lineno) | ||
709 | continue; | 1146 | continue; |
710 | 1147 | ||
711 | if (sp_die) { | 1148 | if (sp_die) { |
712 | /* Address filtering 1: does sp_die include addr? */ | 1149 | /* Address filtering 1: does sp_die include addr? */ |
713 | ret = dwarf_lineaddr(line, &addr); | 1150 | if (dwarf_lineaddr(line, &addr) != 0 || |
714 | DIE_IF(ret != 0); | 1151 | !dwarf_haspc(sp_die, addr)) |
715 | if (!dwarf_haspc(sp_die, addr)) | ||
716 | continue; | 1152 | continue; |
717 | 1153 | ||
718 | /* Address filtering 2: No child include addr? */ | 1154 | /* Address filtering 2: No child include addr? */ |
719 | if (die_get_inlinefunc(sp_die, addr, &die_mem)) | 1155 | if (die_find_inlinefunc(sp_die, addr, &die_mem)) |
720 | continue; | 1156 | continue; |
721 | } | 1157 | } |
722 | 1158 | ||
@@ -725,30 +1161,49 @@ static void find_line_range_by_line(Dwarf_Die *sp_die, struct line_finder *lf) | |||
725 | if (strtailcmp(src, lf->fname) != 0) | 1161 | if (strtailcmp(src, lf->fname) != 0) |
726 | continue; | 1162 | continue; |
727 | 1163 | ||
728 | /* Copy real path */ | 1164 | ret = line_range_add_line(src, lineno, lf->lr); |
729 | if (!lf->lr->path) | 1165 | if (ret < 0) |
730 | lf->lr->path = strdup(src); | 1166 | return ret; |
731 | line_list__add_line(&lf->lr->line_list, (unsigned int)lineno); | ||
732 | } | 1167 | } |
1168 | |||
1169 | /* | ||
1170 | * Dwarf lines doesn't include function declarations. We have to | ||
1171 | * check functions list or given function. | ||
1172 | */ | ||
1173 | if (sp_die) { | ||
1174 | src = dwarf_decl_file(sp_die); | ||
1175 | if (src && dwarf_decl_line(sp_die, &lineno) == 0 && | ||
1176 | (lf->lno_s <= lineno && lf->lno_e >= lineno)) | ||
1177 | ret = line_range_add_line(src, lineno, lf->lr); | ||
1178 | } else | ||
1179 | ret = find_line_range_func_decl_lines(lf); | ||
1180 | |||
733 | /* Update status */ | 1181 | /* Update status */ |
734 | if (!list_empty(&lf->lr->line_list)) | 1182 | if (ret >= 0) |
735 | lf->found = 1; | 1183 | if (!list_empty(&lf->lr->line_list)) |
1184 | ret = lf->found = 1; | ||
1185 | else | ||
1186 | ret = 0; /* Lines are not found */ | ||
736 | else { | 1187 | else { |
737 | free(lf->lr->path); | 1188 | free(lf->lr->path); |
738 | lf->lr->path = NULL; | 1189 | lf->lr->path = NULL; |
739 | } | 1190 | } |
1191 | return ret; | ||
740 | } | 1192 | } |
741 | 1193 | ||
742 | static int line_range_inline_cb(Dwarf_Die *in_die, void *data) | 1194 | static int line_range_inline_cb(Dwarf_Die *in_die, void *data) |
743 | { | 1195 | { |
744 | find_line_range_by_line(in_die, (struct line_finder *)data); | 1196 | struct dwarf_callback_param *param = data; |
1197 | |||
1198 | param->retval = find_line_range_by_line(in_die, param->data); | ||
745 | return DWARF_CB_ABORT; /* No need to find other instances */ | 1199 | return DWARF_CB_ABORT; /* No need to find other instances */ |
746 | } | 1200 | } |
747 | 1201 | ||
748 | /* Search function from function name */ | 1202 | /* Search function from function name */ |
749 | static int line_range_search_cb(Dwarf_Die *sp_die, void *data) | 1203 | static int line_range_search_cb(Dwarf_Die *sp_die, void *data) |
750 | { | 1204 | { |
751 | struct line_finder *lf = (struct line_finder *)data; | 1205 | struct dwarf_callback_param *param = data; |
1206 | struct line_finder *lf = param->data; | ||
752 | struct line_range *lr = lf->lr; | 1207 | struct line_range *lr = lf->lr; |
753 | 1208 | ||
754 | if (dwarf_tag(sp_die) == DW_TAG_subprogram && | 1209 | if (dwarf_tag(sp_die) == DW_TAG_subprogram && |
@@ -757,44 +1212,55 @@ static int line_range_search_cb(Dwarf_Die *sp_die, void *data) | |||
757 | dwarf_decl_line(sp_die, &lr->offset); | 1212 | dwarf_decl_line(sp_die, &lr->offset); |
758 | pr_debug("fname: %s, lineno:%d\n", lf->fname, lr->offset); | 1213 | pr_debug("fname: %s, lineno:%d\n", lf->fname, lr->offset); |
759 | lf->lno_s = lr->offset + lr->start; | 1214 | lf->lno_s = lr->offset + lr->start; |
760 | if (!lr->end) | 1215 | if (lf->lno_s < 0) /* Overflow */ |
1216 | lf->lno_s = INT_MAX; | ||
1217 | lf->lno_e = lr->offset + lr->end; | ||
1218 | if (lf->lno_e < 0) /* Overflow */ | ||
761 | lf->lno_e = INT_MAX; | 1219 | lf->lno_e = INT_MAX; |
762 | else | 1220 | pr_debug("New line range: %d to %d\n", lf->lno_s, lf->lno_e); |
763 | lf->lno_e = lr->offset + lr->end; | ||
764 | lr->start = lf->lno_s; | 1221 | lr->start = lf->lno_s; |
765 | lr->end = lf->lno_e; | 1222 | lr->end = lf->lno_e; |
766 | if (dwarf_func_inline(sp_die)) | 1223 | if (dwarf_func_inline(sp_die)) { |
1224 | struct dwarf_callback_param _param; | ||
1225 | _param.data = (void *)lf; | ||
1226 | _param.retval = 0; | ||
767 | dwarf_func_inline_instances(sp_die, | 1227 | dwarf_func_inline_instances(sp_die, |
768 | line_range_inline_cb, lf); | 1228 | line_range_inline_cb, |
769 | else | 1229 | &_param); |
770 | find_line_range_by_line(sp_die, lf); | 1230 | param->retval = _param.retval; |
771 | return 1; | 1231 | } else |
1232 | param->retval = find_line_range_by_line(sp_die, lf); | ||
1233 | return DWARF_CB_ABORT; | ||
772 | } | 1234 | } |
773 | return 0; | 1235 | return DWARF_CB_OK; |
774 | } | 1236 | } |
775 | 1237 | ||
776 | static void find_line_range_by_func(struct line_finder *lf) | 1238 | static int find_line_range_by_func(struct line_finder *lf) |
777 | { | 1239 | { |
778 | dwarf_getfuncs(&lf->cu_die, line_range_search_cb, lf, 0); | 1240 | struct dwarf_callback_param param = {.data = (void *)lf, .retval = 0}; |
1241 | dwarf_getfuncs(&lf->cu_die, line_range_search_cb, ¶m, 0); | ||
1242 | return param.retval; | ||
779 | } | 1243 | } |
780 | 1244 | ||
781 | int find_line_range(int fd, struct line_range *lr) | 1245 | int find_line_range(int fd, struct line_range *lr) |
782 | { | 1246 | { |
783 | struct line_finder lf = {.lr = lr, .found = 0}; | 1247 | struct line_finder lf = {.lr = lr, .found = 0}; |
784 | int ret; | 1248 | int ret = 0; |
785 | Dwarf_Off off = 0, noff; | 1249 | Dwarf_Off off = 0, noff; |
786 | size_t cuhl; | 1250 | size_t cuhl; |
787 | Dwarf_Die *diep; | 1251 | Dwarf_Die *diep; |
788 | Dwarf *dbg; | 1252 | Dwarf *dbg; |
789 | 1253 | ||
790 | dbg = dwarf_begin(fd, DWARF_C_READ); | 1254 | dbg = dwarf_begin(fd, DWARF_C_READ); |
791 | if (!dbg) | 1255 | if (!dbg) { |
792 | return -ENOENT; | 1256 | pr_warning("No dwarf info found in the vmlinux - " |
1257 | "please rebuild with CONFIG_DEBUG_INFO=y.\n"); | ||
1258 | return -EBADF; | ||
1259 | } | ||
793 | 1260 | ||
794 | /* Loop on CUs (Compilation Unit) */ | 1261 | /* Loop on CUs (Compilation Unit) */ |
795 | while (!lf.found) { | 1262 | while (!lf.found && ret >= 0) { |
796 | ret = dwarf_nextcu(dbg, off, &noff, &cuhl, NULL, NULL, NULL); | 1263 | if (dwarf_nextcu(dbg, off, &noff, &cuhl, NULL, NULL, NULL) != 0) |
797 | if (ret != 0) | ||
798 | break; | 1264 | break; |
799 | 1265 | ||
800 | /* Get the DIE(Debugging Information Entry) of this CU */ | 1266 | /* Get the DIE(Debugging Information Entry) of this CU */ |
@@ -810,20 +1276,18 @@ int find_line_range(int fd, struct line_range *lr) | |||
810 | 1276 | ||
811 | if (!lr->file || lf.fname) { | 1277 | if (!lr->file || lf.fname) { |
812 | if (lr->function) | 1278 | if (lr->function) |
813 | find_line_range_by_func(&lf); | 1279 | ret = find_line_range_by_func(&lf); |
814 | else { | 1280 | else { |
815 | lf.lno_s = lr->start; | 1281 | lf.lno_s = lr->start; |
816 | if (!lr->end) | 1282 | lf.lno_e = lr->end; |
817 | lf.lno_e = INT_MAX; | 1283 | ret = find_line_range_by_line(NULL, &lf); |
818 | else | ||
819 | lf.lno_e = lr->end; | ||
820 | find_line_range_by_line(NULL, &lf); | ||
821 | } | 1284 | } |
822 | } | 1285 | } |
823 | off = noff; | 1286 | off = noff; |
824 | } | 1287 | } |
825 | pr_debug("path: %lx\n", (unsigned long)lr->path); | 1288 | pr_debug("path: %lx\n", (unsigned long)lr->path); |
826 | dwarf_end(dbg); | 1289 | dwarf_end(dbg); |
827 | return lf.found; | 1290 | |
1291 | return (ret < 0) ? ret : lf.found; | ||
828 | } | 1292 | } |
829 | 1293 | ||
diff --git a/tools/perf/util/probe-finder.h b/tools/perf/util/probe-finder.h index 21f7354397b4..66f1980e3855 100644 --- a/tools/perf/util/probe-finder.h +++ b/tools/perf/util/probe-finder.h | |||
@@ -3,6 +3,7 @@ | |||
3 | 3 | ||
4 | #include <stdbool.h> | 4 | #include <stdbool.h> |
5 | #include "util.h" | 5 | #include "util.h" |
6 | #include "probe-event.h" | ||
6 | 7 | ||
7 | #define MAX_PATH_LEN 256 | 8 | #define MAX_PATH_LEN 256 |
8 | #define MAX_PROBE_BUFFER 1024 | 9 | #define MAX_PROBE_BUFFER 1024 |
@@ -14,67 +15,39 @@ static inline int is_c_varname(const char *name) | |||
14 | return isalpha(name[0]) || name[0] == '_'; | 15 | return isalpha(name[0]) || name[0] == '_'; |
15 | } | 16 | } |
16 | 17 | ||
17 | struct probe_point { | 18 | #ifdef DWARF_SUPPORT |
18 | char *event; /* Event name */ | 19 | /* Find kprobe_trace_events specified by perf_probe_event from debuginfo */ |
19 | char *group; /* Event group */ | 20 | extern int find_kprobe_trace_events(int fd, struct perf_probe_event *pev, |
21 | struct kprobe_trace_event **tevs, | ||
22 | int max_tevs); | ||
20 | 23 | ||
21 | /* Inputs */ | 24 | /* Find a perf_probe_point from debuginfo */ |
22 | char *file; /* File name */ | 25 | extern int find_perf_probe_point(int fd, unsigned long addr, |
23 | int line; /* Line number */ | 26 | struct perf_probe_point *ppt); |
24 | char *lazy_line; /* Lazy line pattern */ | ||
25 | 27 | ||
26 | char *function; /* Function name */ | ||
27 | int offset; /* Offset bytes */ | ||
28 | |||
29 | int nr_args; /* Number of arguments */ | ||
30 | char **args; /* Arguments */ | ||
31 | |||
32 | int retprobe; /* Return probe */ | ||
33 | |||
34 | /* Output */ | ||
35 | int found; /* Number of found probe points */ | ||
36 | char *probes[MAX_PROBES]; /* Output buffers (will be allocated)*/ | ||
37 | }; | ||
38 | |||
39 | /* Line number container */ | ||
40 | struct line_node { | ||
41 | struct list_head list; | ||
42 | unsigned int line; | ||
43 | }; | ||
44 | |||
45 | /* Line range */ | ||
46 | struct line_range { | ||
47 | char *file; /* File name */ | ||
48 | char *function; /* Function name */ | ||
49 | unsigned int start; /* Start line number */ | ||
50 | unsigned int end; /* End line number */ | ||
51 | int offset; /* Start line offset */ | ||
52 | char *path; /* Real path name */ | ||
53 | struct list_head line_list; /* Visible lines */ | ||
54 | }; | ||
55 | |||
56 | #ifndef NO_DWARF_SUPPORT | ||
57 | extern int find_probe_point(int fd, struct probe_point *pp); | ||
58 | extern int find_line_range(int fd, struct line_range *lr); | 28 | extern int find_line_range(int fd, struct line_range *lr); |
59 | 29 | ||
60 | #include <dwarf.h> | 30 | #include <dwarf.h> |
61 | #include <libdw.h> | 31 | #include <libdw.h> |
62 | 32 | ||
63 | struct probe_finder { | 33 | struct probe_finder { |
64 | struct probe_point *pp; /* Target probe point */ | 34 | struct perf_probe_event *pev; /* Target probe event */ |
35 | struct kprobe_trace_event *tevs; /* Result trace events */ | ||
36 | int ntevs; /* Number of trace events */ | ||
37 | int max_tevs; /* Max number of trace events */ | ||
65 | 38 | ||
66 | /* For function searching */ | 39 | /* For function searching */ |
67 | Dwarf_Addr addr; /* Address */ | ||
68 | const char *fname; /* File name */ | ||
69 | int lno; /* Line number */ | 40 | int lno; /* Line number */ |
41 | Dwarf_Addr addr; /* Address */ | ||
42 | const char *fname; /* Real file name */ | ||
70 | Dwarf_Die cu_die; /* Current CU */ | 43 | Dwarf_Die cu_die; /* Current CU */ |
44 | struct list_head lcache; /* Line cache for lazy match */ | ||
71 | 45 | ||
72 | /* For variable searching */ | 46 | /* For variable searching */ |
47 | Dwarf_CFI *cfi; /* Call Frame Information */ | ||
73 | Dwarf_Op *fb_ops; /* Frame base attribute */ | 48 | Dwarf_Op *fb_ops; /* Frame base attribute */ |
74 | const char *var; /* Current variable name */ | 49 | struct perf_probe_arg *pvar; /* Current target variable */ |
75 | char *buf; /* Current output buffer */ | 50 | struct kprobe_trace_arg *tvar; /* Current result variable */ |
76 | int len; /* Length of output buffer */ | ||
77 | struct list_head lcache; /* Line cache for lazy match */ | ||
78 | }; | 51 | }; |
79 | 52 | ||
80 | struct line_finder { | 53 | struct line_finder { |
@@ -87,6 +60,6 @@ struct line_finder { | |||
87 | int found; | 60 | int found; |
88 | }; | 61 | }; |
89 | 62 | ||
90 | #endif /* NO_DWARF_SUPPORT */ | 63 | #endif /* DWARF_SUPPORT */ |
91 | 64 | ||
92 | #endif /*_PROBE_FINDER_H */ | 65 | #endif /*_PROBE_FINDER_H */ |
diff --git a/tools/perf/util/pstack.c b/tools/perf/util/pstack.c new file mode 100644 index 000000000000..13d36faf64eb --- /dev/null +++ b/tools/perf/util/pstack.c | |||
@@ -0,0 +1,75 @@ | |||
1 | /* | ||
2 | * Simple pointer stack | ||
3 | * | ||
4 | * (c) 2010 Arnaldo Carvalho de Melo <acme@redhat.com> | ||
5 | */ | ||
6 | |||
7 | #include "util.h" | ||
8 | #include "pstack.h" | ||
9 | #include <linux/kernel.h> | ||
10 | #include <stdlib.h> | ||
11 | |||
12 | struct pstack { | ||
13 | unsigned short top; | ||
14 | unsigned short max_nr_entries; | ||
15 | void *entries[0]; | ||
16 | }; | ||
17 | |||
18 | struct pstack *pstack__new(unsigned short max_nr_entries) | ||
19 | { | ||
20 | struct pstack *self = zalloc((sizeof(*self) + | ||
21 | max_nr_entries * sizeof(void *))); | ||
22 | if (self != NULL) | ||
23 | self->max_nr_entries = max_nr_entries; | ||
24 | return self; | ||
25 | } | ||
26 | |||
27 | void pstack__delete(struct pstack *self) | ||
28 | { | ||
29 | free(self); | ||
30 | } | ||
31 | |||
32 | bool pstack__empty(const struct pstack *self) | ||
33 | { | ||
34 | return self->top == 0; | ||
35 | } | ||
36 | |||
37 | void pstack__remove(struct pstack *self, void *key) | ||
38 | { | ||
39 | unsigned short i = self->top, last_index = self->top - 1; | ||
40 | |||
41 | while (i-- != 0) { | ||
42 | if (self->entries[i] == key) { | ||
43 | if (i < last_index) | ||
44 | memmove(self->entries + i, | ||
45 | self->entries + i + 1, | ||
46 | (last_index - i) * sizeof(void *)); | ||
47 | --self->top; | ||
48 | return; | ||
49 | } | ||
50 | } | ||
51 | pr_err("%s: %p not on the pstack!\n", __func__, key); | ||
52 | } | ||
53 | |||
54 | void pstack__push(struct pstack *self, void *key) | ||
55 | { | ||
56 | if (self->top == self->max_nr_entries) { | ||
57 | pr_err("%s: top=%d, overflow!\n", __func__, self->top); | ||
58 | return; | ||
59 | } | ||
60 | self->entries[self->top++] = key; | ||
61 | } | ||
62 | |||
63 | void *pstack__pop(struct pstack *self) | ||
64 | { | ||
65 | void *ret; | ||
66 | |||
67 | if (self->top == 0) { | ||
68 | pr_err("%s: underflow!\n", __func__); | ||
69 | return NULL; | ||
70 | } | ||
71 | |||
72 | ret = self->entries[--self->top]; | ||
73 | self->entries[self->top] = NULL; | ||
74 | return ret; | ||
75 | } | ||
diff --git a/tools/perf/util/pstack.h b/tools/perf/util/pstack.h new file mode 100644 index 000000000000..5ad07023504b --- /dev/null +++ b/tools/perf/util/pstack.h | |||
@@ -0,0 +1,12 @@ | |||
1 | #ifndef _PERF_PSTACK_ | ||
2 | #define _PERF_PSTACK_ | ||
3 | |||
4 | struct pstack; | ||
5 | struct pstack *pstack__new(unsigned short max_nr_entries); | ||
6 | void pstack__delete(struct pstack *self); | ||
7 | bool pstack__empty(const struct pstack *self); | ||
8 | void pstack__remove(struct pstack *self, void *key); | ||
9 | void pstack__push(struct pstack *self, void *key); | ||
10 | void *pstack__pop(struct pstack *self); | ||
11 | |||
12 | #endif /* _PERF_PSTACK_ */ | ||
diff --git a/tools/perf/util/scripting-engines/trace-event-perl.c b/tools/perf/util/scripting-engines/trace-event-perl.c index 5376378e0cfc..b059dc50cc2d 100644 --- a/tools/perf/util/scripting-engines/trace-event-perl.c +++ b/tools/perf/util/scripting-engines/trace-event-perl.c | |||
@@ -371,7 +371,6 @@ static int perl_start_script(const char *script, int argc, const char **argv) | |||
371 | run_start_sub(); | 371 | run_start_sub(); |
372 | 372 | ||
373 | free(command_line); | 373 | free(command_line); |
374 | fprintf(stderr, "perf trace started with Perl script %s\n\n", script); | ||
375 | return 0; | 374 | return 0; |
376 | error: | 375 | error: |
377 | perl_free(my_perl); | 376 | perl_free(my_perl); |
@@ -394,8 +393,6 @@ static int perl_stop_script(void) | |||
394 | perl_destruct(my_perl); | 393 | perl_destruct(my_perl); |
395 | perl_free(my_perl); | 394 | perl_free(my_perl); |
396 | 395 | ||
397 | fprintf(stderr, "\nperf trace Perl script stopped\n"); | ||
398 | |||
399 | return 0; | 396 | return 0; |
400 | } | 397 | } |
401 | 398 | ||
diff --git a/tools/perf/util/scripting-engines/trace-event-python.c b/tools/perf/util/scripting-engines/trace-event-python.c index 6a72f14c5986..81f39cab3aaa 100644 --- a/tools/perf/util/scripting-engines/trace-event-python.c +++ b/tools/perf/util/scripting-engines/trace-event-python.c | |||
@@ -374,8 +374,6 @@ static int python_start_script(const char *script, int argc, const char **argv) | |||
374 | } | 374 | } |
375 | 375 | ||
376 | free(command_line); | 376 | free(command_line); |
377 | fprintf(stderr, "perf trace started with Python script %s\n\n", | ||
378 | script); | ||
379 | 377 | ||
380 | return err; | 378 | return err; |
381 | error: | 379 | error: |
@@ -407,8 +405,6 @@ out: | |||
407 | Py_XDECREF(main_module); | 405 | Py_XDECREF(main_module); |
408 | Py_Finalize(); | 406 | Py_Finalize(); |
409 | 407 | ||
410 | fprintf(stderr, "\nperf trace Python script stopped\n"); | ||
411 | |||
412 | return err; | 408 | return err; |
413 | } | 409 | } |
414 | 410 | ||
diff --git a/tools/perf/util/session.c b/tools/perf/util/session.c index eed1cb889008..25bfca4f10f0 100644 --- a/tools/perf/util/session.c +++ b/tools/perf/util/session.c | |||
@@ -14,6 +14,16 @@ static int perf_session__open(struct perf_session *self, bool force) | |||
14 | { | 14 | { |
15 | struct stat input_stat; | 15 | struct stat input_stat; |
16 | 16 | ||
17 | if (!strcmp(self->filename, "-")) { | ||
18 | self->fd_pipe = true; | ||
19 | self->fd = STDIN_FILENO; | ||
20 | |||
21 | if (perf_header__read(self, self->fd) < 0) | ||
22 | pr_err("incompatible file format"); | ||
23 | |||
24 | return 0; | ||
25 | } | ||
26 | |||
17 | self->fd = open(self->filename, O_RDONLY); | 27 | self->fd = open(self->filename, O_RDONLY); |
18 | if (self->fd < 0) { | 28 | if (self->fd < 0) { |
19 | pr_err("failed to open file: %s", self->filename); | 29 | pr_err("failed to open file: %s", self->filename); |
@@ -38,7 +48,7 @@ static int perf_session__open(struct perf_session *self, bool force) | |||
38 | goto out_close; | 48 | goto out_close; |
39 | } | 49 | } |
40 | 50 | ||
41 | if (perf_header__read(&self->header, self->fd) < 0) { | 51 | if (perf_header__read(self, self->fd) < 0) { |
42 | pr_err("incompatible file format"); | 52 | pr_err("incompatible file format"); |
43 | goto out_close; | 53 | goto out_close; |
44 | } | 54 | } |
@@ -52,12 +62,21 @@ out_close: | |||
52 | return -1; | 62 | return -1; |
53 | } | 63 | } |
54 | 64 | ||
55 | static inline int perf_session__create_kernel_maps(struct perf_session *self) | 65 | void perf_session__update_sample_type(struct perf_session *self) |
66 | { | ||
67 | self->sample_type = perf_header__sample_type(&self->header); | ||
68 | } | ||
69 | |||
70 | int perf_session__create_kernel_maps(struct perf_session *self) | ||
56 | { | 71 | { |
57 | return map_groups__create_kernel_maps(&self->kmaps, self->vmlinux_maps); | 72 | int ret = machine__create_kernel_maps(&self->host_machine); |
73 | |||
74 | if (ret >= 0) | ||
75 | ret = machines__create_guest_kernel_maps(&self->machines); | ||
76 | return ret; | ||
58 | } | 77 | } |
59 | 78 | ||
60 | struct perf_session *perf_session__new(const char *filename, int mode, bool force) | 79 | struct perf_session *perf_session__new(const char *filename, int mode, bool force, bool repipe) |
61 | { | 80 | { |
62 | size_t len = filename ? strlen(filename) + 1 : 0; | 81 | size_t len = filename ? strlen(filename) + 1 : 0; |
63 | struct perf_session *self = zalloc(sizeof(*self) + len); | 82 | struct perf_session *self = zalloc(sizeof(*self) + len); |
@@ -70,13 +89,15 @@ struct perf_session *perf_session__new(const char *filename, int mode, bool forc | |||
70 | 89 | ||
71 | memcpy(self->filename, filename, len); | 90 | memcpy(self->filename, filename, len); |
72 | self->threads = RB_ROOT; | 91 | self->threads = RB_ROOT; |
73 | self->stats_by_id = RB_ROOT; | 92 | self->hists_tree = RB_ROOT; |
74 | self->last_match = NULL; | 93 | self->last_match = NULL; |
75 | self->mmap_window = 32; | 94 | self->mmap_window = 32; |
76 | self->cwd = NULL; | 95 | self->cwd = NULL; |
77 | self->cwdlen = 0; | 96 | self->cwdlen = 0; |
78 | self->unknown_events = 0; | 97 | self->machines = RB_ROOT; |
79 | map_groups__init(&self->kmaps); | 98 | self->repipe = repipe; |
99 | INIT_LIST_HEAD(&self->ordered_samples.samples_head); | ||
100 | machine__init(&self->host_machine, "", HOST_KERNEL_ID); | ||
80 | 101 | ||
81 | if (mode == O_RDONLY) { | 102 | if (mode == O_RDONLY) { |
82 | if (perf_session__open(self, force) < 0) | 103 | if (perf_session__open(self, force) < 0) |
@@ -90,7 +111,7 @@ struct perf_session *perf_session__new(const char *filename, int mode, bool forc | |||
90 | goto out_delete; | 111 | goto out_delete; |
91 | } | 112 | } |
92 | 113 | ||
93 | self->sample_type = perf_header__sample_type(&self->header); | 114 | perf_session__update_sample_type(self); |
94 | out: | 115 | out: |
95 | return self; | 116 | return self; |
96 | out_free: | 117 | out_free: |
@@ -117,22 +138,17 @@ static bool symbol__match_parent_regex(struct symbol *sym) | |||
117 | return 0; | 138 | return 0; |
118 | } | 139 | } |
119 | 140 | ||
120 | struct symbol **perf_session__resolve_callchain(struct perf_session *self, | 141 | struct map_symbol *perf_session__resolve_callchain(struct perf_session *self, |
121 | struct thread *thread, | 142 | struct thread *thread, |
122 | struct ip_callchain *chain, | 143 | struct ip_callchain *chain, |
123 | struct symbol **parent) | 144 | struct symbol **parent) |
124 | { | 145 | { |
125 | u8 cpumode = PERF_RECORD_MISC_USER; | 146 | u8 cpumode = PERF_RECORD_MISC_USER; |
126 | struct symbol **syms = NULL; | ||
127 | unsigned int i; | 147 | unsigned int i; |
148 | struct map_symbol *syms = calloc(chain->nr, sizeof(*syms)); | ||
128 | 149 | ||
129 | if (symbol_conf.use_callchain) { | 150 | if (!syms) |
130 | syms = calloc(chain->nr, sizeof(*syms)); | 151 | return NULL; |
131 | if (!syms) { | ||
132 | fprintf(stderr, "Can't allocate memory for symbols\n"); | ||
133 | exit(-1); | ||
134 | } | ||
135 | } | ||
136 | 152 | ||
137 | for (i = 0; i < chain->nr; i++) { | 153 | for (i = 0; i < chain->nr; i++) { |
138 | u64 ip = chain->ips[i]; | 154 | u64 ip = chain->ips[i]; |
@@ -152,15 +168,17 @@ struct symbol **perf_session__resolve_callchain(struct perf_session *self, | |||
152 | continue; | 168 | continue; |
153 | } | 169 | } |
154 | 170 | ||
171 | al.filtered = false; | ||
155 | thread__find_addr_location(thread, self, cpumode, | 172 | thread__find_addr_location(thread, self, cpumode, |
156 | MAP__FUNCTION, ip, &al, NULL); | 173 | MAP__FUNCTION, thread->pid, ip, &al, NULL); |
157 | if (al.sym != NULL) { | 174 | if (al.sym != NULL) { |
158 | if (sort__has_parent && !*parent && | 175 | if (sort__has_parent && !*parent && |
159 | symbol__match_parent_regex(al.sym)) | 176 | symbol__match_parent_regex(al.sym)) |
160 | *parent = al.sym; | 177 | *parent = al.sym; |
161 | if (!symbol_conf.use_callchain) | 178 | if (!symbol_conf.use_callchain) |
162 | break; | 179 | break; |
163 | syms[i] = al.sym; | 180 | syms[i].map = al.map; |
181 | syms[i].sym = al.sym; | ||
164 | } | 182 | } |
165 | } | 183 | } |
166 | 184 | ||
@@ -174,6 +192,18 @@ static int process_event_stub(event_t *event __used, | |||
174 | return 0; | 192 | return 0; |
175 | } | 193 | } |
176 | 194 | ||
195 | static int process_finished_round_stub(event_t *event __used, | ||
196 | struct perf_session *session __used, | ||
197 | struct perf_event_ops *ops __used) | ||
198 | { | ||
199 | dump_printf(": unhandled!\n"); | ||
200 | return 0; | ||
201 | } | ||
202 | |||
203 | static int process_finished_round(event_t *event, | ||
204 | struct perf_session *session, | ||
205 | struct perf_event_ops *ops); | ||
206 | |||
177 | static void perf_event_ops__fill_defaults(struct perf_event_ops *handler) | 207 | static void perf_event_ops__fill_defaults(struct perf_event_ops *handler) |
178 | { | 208 | { |
179 | if (handler->sample == NULL) | 209 | if (handler->sample == NULL) |
@@ -194,29 +224,20 @@ static void perf_event_ops__fill_defaults(struct perf_event_ops *handler) | |||
194 | handler->throttle = process_event_stub; | 224 | handler->throttle = process_event_stub; |
195 | if (handler->unthrottle == NULL) | 225 | if (handler->unthrottle == NULL) |
196 | handler->unthrottle = process_event_stub; | 226 | handler->unthrottle = process_event_stub; |
197 | } | 227 | if (handler->attr == NULL) |
198 | 228 | handler->attr = process_event_stub; | |
199 | static const char *event__name[] = { | 229 | if (handler->event_type == NULL) |
200 | [0] = "TOTAL", | 230 | handler->event_type = process_event_stub; |
201 | [PERF_RECORD_MMAP] = "MMAP", | 231 | if (handler->tracing_data == NULL) |
202 | [PERF_RECORD_LOST] = "LOST", | 232 | handler->tracing_data = process_event_stub; |
203 | [PERF_RECORD_COMM] = "COMM", | 233 | if (handler->build_id == NULL) |
204 | [PERF_RECORD_EXIT] = "EXIT", | 234 | handler->build_id = process_event_stub; |
205 | [PERF_RECORD_THROTTLE] = "THROTTLE", | 235 | if (handler->finished_round == NULL) { |
206 | [PERF_RECORD_UNTHROTTLE] = "UNTHROTTLE", | 236 | if (handler->ordered_samples) |
207 | [PERF_RECORD_FORK] = "FORK", | 237 | handler->finished_round = process_finished_round; |
208 | [PERF_RECORD_READ] = "READ", | 238 | else |
209 | [PERF_RECORD_SAMPLE] = "SAMPLE", | 239 | handler->finished_round = process_finished_round_stub; |
210 | }; | 240 | } |
211 | |||
212 | unsigned long event__total[PERF_RECORD_MAX]; | ||
213 | |||
214 | void event__print_totals(void) | ||
215 | { | ||
216 | int i; | ||
217 | for (i = 0; i < PERF_RECORD_MAX; ++i) | ||
218 | pr_info("%10s events: %10ld\n", | ||
219 | event__name[i], event__total[i]); | ||
220 | } | 241 | } |
221 | 242 | ||
222 | void mem_bswap_64(void *src, int byte_size) | 243 | void mem_bswap_64(void *src, int byte_size) |
@@ -270,6 +291,37 @@ static void event__read_swap(event_t *self) | |||
270 | self->read.id = bswap_64(self->read.id); | 291 | self->read.id = bswap_64(self->read.id); |
271 | } | 292 | } |
272 | 293 | ||
294 | static void event__attr_swap(event_t *self) | ||
295 | { | ||
296 | size_t size; | ||
297 | |||
298 | self->attr.attr.type = bswap_32(self->attr.attr.type); | ||
299 | self->attr.attr.size = bswap_32(self->attr.attr.size); | ||
300 | self->attr.attr.config = bswap_64(self->attr.attr.config); | ||
301 | self->attr.attr.sample_period = bswap_64(self->attr.attr.sample_period); | ||
302 | self->attr.attr.sample_type = bswap_64(self->attr.attr.sample_type); | ||
303 | self->attr.attr.read_format = bswap_64(self->attr.attr.read_format); | ||
304 | self->attr.attr.wakeup_events = bswap_32(self->attr.attr.wakeup_events); | ||
305 | self->attr.attr.bp_type = bswap_32(self->attr.attr.bp_type); | ||
306 | self->attr.attr.bp_addr = bswap_64(self->attr.attr.bp_addr); | ||
307 | self->attr.attr.bp_len = bswap_64(self->attr.attr.bp_len); | ||
308 | |||
309 | size = self->header.size; | ||
310 | size -= (void *)&self->attr.id - (void *)self; | ||
311 | mem_bswap_64(self->attr.id, size); | ||
312 | } | ||
313 | |||
314 | static void event__event_type_swap(event_t *self) | ||
315 | { | ||
316 | self->event_type.event_type.event_id = | ||
317 | bswap_64(self->event_type.event_type.event_id); | ||
318 | } | ||
319 | |||
320 | static void event__tracing_data_swap(event_t *self) | ||
321 | { | ||
322 | self->tracing_data.size = bswap_32(self->tracing_data.size); | ||
323 | } | ||
324 | |||
273 | typedef void (*event__swap_op)(event_t *self); | 325 | typedef void (*event__swap_op)(event_t *self); |
274 | 326 | ||
275 | static event__swap_op event__swap_ops[] = { | 327 | static event__swap_op event__swap_ops[] = { |
@@ -280,9 +332,212 @@ static event__swap_op event__swap_ops[] = { | |||
280 | [PERF_RECORD_LOST] = event__all64_swap, | 332 | [PERF_RECORD_LOST] = event__all64_swap, |
281 | [PERF_RECORD_READ] = event__read_swap, | 333 | [PERF_RECORD_READ] = event__read_swap, |
282 | [PERF_RECORD_SAMPLE] = event__all64_swap, | 334 | [PERF_RECORD_SAMPLE] = event__all64_swap, |
283 | [PERF_RECORD_MAX] = NULL, | 335 | [PERF_RECORD_HEADER_ATTR] = event__attr_swap, |
336 | [PERF_RECORD_HEADER_EVENT_TYPE] = event__event_type_swap, | ||
337 | [PERF_RECORD_HEADER_TRACING_DATA] = event__tracing_data_swap, | ||
338 | [PERF_RECORD_HEADER_BUILD_ID] = NULL, | ||
339 | [PERF_RECORD_HEADER_MAX] = NULL, | ||
284 | }; | 340 | }; |
285 | 341 | ||
342 | struct sample_queue { | ||
343 | u64 timestamp; | ||
344 | struct sample_event *event; | ||
345 | struct list_head list; | ||
346 | }; | ||
347 | |||
348 | static void flush_sample_queue(struct perf_session *s, | ||
349 | struct perf_event_ops *ops) | ||
350 | { | ||
351 | struct list_head *head = &s->ordered_samples.samples_head; | ||
352 | u64 limit = s->ordered_samples.next_flush; | ||
353 | struct sample_queue *tmp, *iter; | ||
354 | |||
355 | if (!ops->ordered_samples || !limit) | ||
356 | return; | ||
357 | |||
358 | list_for_each_entry_safe(iter, tmp, head, list) { | ||
359 | if (iter->timestamp > limit) | ||
360 | return; | ||
361 | |||
362 | if (iter == s->ordered_samples.last_inserted) | ||
363 | s->ordered_samples.last_inserted = NULL; | ||
364 | |||
365 | ops->sample((event_t *)iter->event, s); | ||
366 | |||
367 | s->ordered_samples.last_flush = iter->timestamp; | ||
368 | list_del(&iter->list); | ||
369 | free(iter->event); | ||
370 | free(iter); | ||
371 | } | ||
372 | } | ||
373 | |||
374 | /* | ||
375 | * When perf record finishes a pass on every buffers, it records this pseudo | ||
376 | * event. | ||
377 | * We record the max timestamp t found in the pass n. | ||
378 | * Assuming these timestamps are monotonic across cpus, we know that if | ||
379 | * a buffer still has events with timestamps below t, they will be all | ||
380 | * available and then read in the pass n + 1. | ||
381 | * Hence when we start to read the pass n + 2, we can safely flush every | ||
382 | * events with timestamps below t. | ||
383 | * | ||
384 | * ============ PASS n ================= | ||
385 | * CPU 0 | CPU 1 | ||
386 | * | | ||
387 | * cnt1 timestamps | cnt2 timestamps | ||
388 | * 1 | 2 | ||
389 | * 2 | 3 | ||
390 | * - | 4 <--- max recorded | ||
391 | * | ||
392 | * ============ PASS n + 1 ============== | ||
393 | * CPU 0 | CPU 1 | ||
394 | * | | ||
395 | * cnt1 timestamps | cnt2 timestamps | ||
396 | * 3 | 5 | ||
397 | * 4 | 6 | ||
398 | * 5 | 7 <---- max recorded | ||
399 | * | ||
400 | * Flush every events below timestamp 4 | ||
401 | * | ||
402 | * ============ PASS n + 2 ============== | ||
403 | * CPU 0 | CPU 1 | ||
404 | * | | ||
405 | * cnt1 timestamps | cnt2 timestamps | ||
406 | * 6 | 8 | ||
407 | * 7 | 9 | ||
408 | * - | 10 | ||
409 | * | ||
410 | * Flush every events below timestamp 7 | ||
411 | * etc... | ||
412 | */ | ||
413 | static int process_finished_round(event_t *event __used, | ||
414 | struct perf_session *session, | ||
415 | struct perf_event_ops *ops) | ||
416 | { | ||
417 | flush_sample_queue(session, ops); | ||
418 | session->ordered_samples.next_flush = session->ordered_samples.max_timestamp; | ||
419 | |||
420 | return 0; | ||
421 | } | ||
422 | |||
423 | static void __queue_sample_end(struct sample_queue *new, struct list_head *head) | ||
424 | { | ||
425 | struct sample_queue *iter; | ||
426 | |||
427 | list_for_each_entry_reverse(iter, head, list) { | ||
428 | if (iter->timestamp < new->timestamp) { | ||
429 | list_add(&new->list, &iter->list); | ||
430 | return; | ||
431 | } | ||
432 | } | ||
433 | |||
434 | list_add(&new->list, head); | ||
435 | } | ||
436 | |||
437 | static void __queue_sample_before(struct sample_queue *new, | ||
438 | struct sample_queue *iter, | ||
439 | struct list_head *head) | ||
440 | { | ||
441 | list_for_each_entry_continue_reverse(iter, head, list) { | ||
442 | if (iter->timestamp < new->timestamp) { | ||
443 | list_add(&new->list, &iter->list); | ||
444 | return; | ||
445 | } | ||
446 | } | ||
447 | |||
448 | list_add(&new->list, head); | ||
449 | } | ||
450 | |||
451 | static void __queue_sample_after(struct sample_queue *new, | ||
452 | struct sample_queue *iter, | ||
453 | struct list_head *head) | ||
454 | { | ||
455 | list_for_each_entry_continue(iter, head, list) { | ||
456 | if (iter->timestamp > new->timestamp) { | ||
457 | list_add_tail(&new->list, &iter->list); | ||
458 | return; | ||
459 | } | ||
460 | } | ||
461 | list_add_tail(&new->list, head); | ||
462 | } | ||
463 | |||
464 | /* The queue is ordered by time */ | ||
465 | static void __queue_sample_event(struct sample_queue *new, | ||
466 | struct perf_session *s) | ||
467 | { | ||
468 | struct sample_queue *last_inserted = s->ordered_samples.last_inserted; | ||
469 | struct list_head *head = &s->ordered_samples.samples_head; | ||
470 | |||
471 | |||
472 | if (!last_inserted) { | ||
473 | __queue_sample_end(new, head); | ||
474 | return; | ||
475 | } | ||
476 | |||
477 | /* | ||
478 | * Most of the time the current event has a timestamp | ||
479 | * very close to the last event inserted, unless we just switched | ||
480 | * to another event buffer. Having a sorting based on a list and | ||
481 | * on the last inserted event that is close to the current one is | ||
482 | * probably more efficient than an rbtree based sorting. | ||
483 | */ | ||
484 | if (last_inserted->timestamp >= new->timestamp) | ||
485 | __queue_sample_before(new, last_inserted, head); | ||
486 | else | ||
487 | __queue_sample_after(new, last_inserted, head); | ||
488 | } | ||
489 | |||
490 | static int queue_sample_event(event_t *event, struct sample_data *data, | ||
491 | struct perf_session *s) | ||
492 | { | ||
493 | u64 timestamp = data->time; | ||
494 | struct sample_queue *new; | ||
495 | |||
496 | |||
497 | if (timestamp < s->ordered_samples.last_flush) { | ||
498 | printf("Warning: Timestamp below last timeslice flush\n"); | ||
499 | return -EINVAL; | ||
500 | } | ||
501 | |||
502 | new = malloc(sizeof(*new)); | ||
503 | if (!new) | ||
504 | return -ENOMEM; | ||
505 | |||
506 | new->timestamp = timestamp; | ||
507 | |||
508 | new->event = malloc(event->header.size); | ||
509 | if (!new->event) { | ||
510 | free(new); | ||
511 | return -ENOMEM; | ||
512 | } | ||
513 | |||
514 | memcpy(new->event, event, event->header.size); | ||
515 | |||
516 | __queue_sample_event(new, s); | ||
517 | s->ordered_samples.last_inserted = new; | ||
518 | |||
519 | if (new->timestamp > s->ordered_samples.max_timestamp) | ||
520 | s->ordered_samples.max_timestamp = new->timestamp; | ||
521 | |||
522 | return 0; | ||
523 | } | ||
524 | |||
525 | static int perf_session__process_sample(event_t *event, struct perf_session *s, | ||
526 | struct perf_event_ops *ops) | ||
527 | { | ||
528 | struct sample_data data; | ||
529 | |||
530 | if (!ops->ordered_samples) | ||
531 | return ops->sample(event, s); | ||
532 | |||
533 | bzero(&data, sizeof(struct sample_data)); | ||
534 | event__parse_sample(event, s->sample_type, &data); | ||
535 | |||
536 | queue_sample_event(event, &data, s); | ||
537 | |||
538 | return 0; | ||
539 | } | ||
540 | |||
286 | static int perf_session__process_event(struct perf_session *self, | 541 | static int perf_session__process_event(struct perf_session *self, |
287 | event_t *event, | 542 | event_t *event, |
288 | struct perf_event_ops *ops, | 543 | struct perf_event_ops *ops, |
@@ -290,12 +545,11 @@ static int perf_session__process_event(struct perf_session *self, | |||
290 | { | 545 | { |
291 | trace_event(event); | 546 | trace_event(event); |
292 | 547 | ||
293 | if (event->header.type < PERF_RECORD_MAX) { | 548 | if (event->header.type < PERF_RECORD_HEADER_MAX) { |
294 | dump_printf("%#Lx [%#x]: PERF_RECORD_%s", | 549 | dump_printf("%#Lx [%#x]: PERF_RECORD_%s", |
295 | offset + head, event->header.size, | 550 | offset + head, event->header.size, |
296 | event__name[event->header.type]); | 551 | event__name[event->header.type]); |
297 | ++event__total[0]; | 552 | hists__inc_nr_events(&self->hists, event->header.type); |
298 | ++event__total[event->header.type]; | ||
299 | } | 553 | } |
300 | 554 | ||
301 | if (self->header.needs_swap && event__swap_ops[event->header.type]) | 555 | if (self->header.needs_swap && event__swap_ops[event->header.type]) |
@@ -303,7 +557,7 @@ static int perf_session__process_event(struct perf_session *self, | |||
303 | 557 | ||
304 | switch (event->header.type) { | 558 | switch (event->header.type) { |
305 | case PERF_RECORD_SAMPLE: | 559 | case PERF_RECORD_SAMPLE: |
306 | return ops->sample(event, self); | 560 | return perf_session__process_sample(event, self, ops); |
307 | case PERF_RECORD_MMAP: | 561 | case PERF_RECORD_MMAP: |
308 | return ops->mmap(event, self); | 562 | return ops->mmap(event, self); |
309 | case PERF_RECORD_COMM: | 563 | case PERF_RECORD_COMM: |
@@ -320,8 +574,20 @@ static int perf_session__process_event(struct perf_session *self, | |||
320 | return ops->throttle(event, self); | 574 | return ops->throttle(event, self); |
321 | case PERF_RECORD_UNTHROTTLE: | 575 | case PERF_RECORD_UNTHROTTLE: |
322 | return ops->unthrottle(event, self); | 576 | return ops->unthrottle(event, self); |
577 | case PERF_RECORD_HEADER_ATTR: | ||
578 | return ops->attr(event, self); | ||
579 | case PERF_RECORD_HEADER_EVENT_TYPE: | ||
580 | return ops->event_type(event, self); | ||
581 | case PERF_RECORD_HEADER_TRACING_DATA: | ||
582 | /* setup for reading amidst mmap */ | ||
583 | lseek(self->fd, offset + head, SEEK_SET); | ||
584 | return ops->tracing_data(event, self); | ||
585 | case PERF_RECORD_HEADER_BUILD_ID: | ||
586 | return ops->build_id(event, self); | ||
587 | case PERF_RECORD_FINISHED_ROUND: | ||
588 | return ops->finished_round(event, self, ops); | ||
323 | default: | 589 | default: |
324 | self->unknown_events++; | 590 | ++self->hists.stats.nr_unknown_events; |
325 | return -1; | 591 | return -1; |
326 | } | 592 | } |
327 | } | 593 | } |
@@ -333,56 +599,114 @@ void perf_event_header__bswap(struct perf_event_header *self) | |||
333 | self->size = bswap_16(self->size); | 599 | self->size = bswap_16(self->size); |
334 | } | 600 | } |
335 | 601 | ||
336 | int perf_header__read_build_ids(struct perf_header *self, | 602 | static struct thread *perf_session__register_idle_thread(struct perf_session *self) |
337 | int input, u64 offset, u64 size) | ||
338 | { | 603 | { |
339 | struct build_id_event bev; | 604 | struct thread *thread = perf_session__findnew(self, 0); |
340 | char filename[PATH_MAX]; | ||
341 | u64 limit = offset + size; | ||
342 | int err = -1; | ||
343 | |||
344 | while (offset < limit) { | ||
345 | struct dso *dso; | ||
346 | ssize_t len; | ||
347 | struct list_head *head = &dsos__user; | ||
348 | 605 | ||
349 | if (read(input, &bev, sizeof(bev)) != sizeof(bev)) | 606 | if (thread == NULL || thread__set_comm(thread, "swapper")) { |
350 | goto out; | 607 | pr_err("problem inserting idle task.\n"); |
608 | thread = NULL; | ||
609 | } | ||
351 | 610 | ||
352 | if (self->needs_swap) | 611 | return thread; |
353 | perf_event_header__bswap(&bev.header); | 612 | } |
354 | 613 | ||
355 | len = bev.header.size - sizeof(bev); | 614 | int do_read(int fd, void *buf, size_t size) |
356 | if (read(input, filename, len) != len) | 615 | { |
357 | goto out; | 616 | void *buf_start = buf; |
358 | 617 | ||
359 | if (bev.header.misc & PERF_RECORD_MISC_KERNEL) | 618 | while (size) { |
360 | head = &dsos__kernel; | 619 | int ret = read(fd, buf, size); |
361 | 620 | ||
362 | dso = __dsos__findnew(head, filename); | 621 | if (ret <= 0) |
363 | if (dso != NULL) { | 622 | return ret; |
364 | dso__set_build_id(dso, &bev.build_id); | ||
365 | if (head == &dsos__kernel && filename[0] == '[') | ||
366 | dso->kernel = 1; | ||
367 | } | ||
368 | 623 | ||
369 | offset += bev.header.size; | 624 | size -= ret; |
625 | buf += ret; | ||
370 | } | 626 | } |
371 | err = 0; | 627 | |
372 | out: | 628 | return buf - buf_start; |
373 | return err; | ||
374 | } | 629 | } |
375 | 630 | ||
376 | static struct thread *perf_session__register_idle_thread(struct perf_session *self) | 631 | #define session_done() (*(volatile int *)(&session_done)) |
632 | volatile int session_done; | ||
633 | |||
634 | static int __perf_session__process_pipe_events(struct perf_session *self, | ||
635 | struct perf_event_ops *ops) | ||
377 | { | 636 | { |
378 | struct thread *thread = perf_session__findnew(self, 0); | 637 | event_t event; |
638 | uint32_t size; | ||
639 | int skip = 0; | ||
640 | u64 head; | ||
641 | int err; | ||
642 | void *p; | ||
379 | 643 | ||
380 | if (thread == NULL || thread__set_comm(thread, "swapper")) { | 644 | perf_event_ops__fill_defaults(ops); |
381 | pr_err("problem inserting idle task.\n"); | 645 | |
382 | thread = NULL; | 646 | head = 0; |
647 | more: | ||
648 | err = do_read(self->fd, &event, sizeof(struct perf_event_header)); | ||
649 | if (err <= 0) { | ||
650 | if (err == 0) | ||
651 | goto done; | ||
652 | |||
653 | pr_err("failed to read event header\n"); | ||
654 | goto out_err; | ||
383 | } | 655 | } |
384 | 656 | ||
385 | return thread; | 657 | if (self->header.needs_swap) |
658 | perf_event_header__bswap(&event.header); | ||
659 | |||
660 | size = event.header.size; | ||
661 | if (size == 0) | ||
662 | size = 8; | ||
663 | |||
664 | p = &event; | ||
665 | p += sizeof(struct perf_event_header); | ||
666 | |||
667 | if (size - sizeof(struct perf_event_header)) { | ||
668 | err = do_read(self->fd, p, | ||
669 | size - sizeof(struct perf_event_header)); | ||
670 | if (err <= 0) { | ||
671 | if (err == 0) { | ||
672 | pr_err("unexpected end of event stream\n"); | ||
673 | goto done; | ||
674 | } | ||
675 | |||
676 | pr_err("failed to read event data\n"); | ||
677 | goto out_err; | ||
678 | } | ||
679 | } | ||
680 | |||
681 | if (size == 0 || | ||
682 | (skip = perf_session__process_event(self, &event, ops, | ||
683 | 0, head)) < 0) { | ||
684 | dump_printf("%#Lx [%#x]: skipping unknown header type: %d\n", | ||
685 | head, event.header.size, event.header.type); | ||
686 | /* | ||
687 | * assume we lost track of the stream, check alignment, and | ||
688 | * increment a single u64 in the hope to catch on again 'soon'. | ||
689 | */ | ||
690 | if (unlikely(head & 7)) | ||
691 | head &= ~7ULL; | ||
692 | |||
693 | size = 8; | ||
694 | } | ||
695 | |||
696 | head += size; | ||
697 | |||
698 | dump_printf("\n%#Lx [%#x]: event: %d\n", | ||
699 | head, event.header.size, event.header.type); | ||
700 | |||
701 | if (skip > 0) | ||
702 | head += skip; | ||
703 | |||
704 | if (!session_done()) | ||
705 | goto more; | ||
706 | done: | ||
707 | err = 0; | ||
708 | out_err: | ||
709 | return err; | ||
386 | } | 710 | } |
387 | 711 | ||
388 | int __perf_session__process_events(struct perf_session *self, | 712 | int __perf_session__process_events(struct perf_session *self, |
@@ -396,6 +720,10 @@ int __perf_session__process_events(struct perf_session *self, | |||
396 | event_t *event; | 720 | event_t *event; |
397 | uint32_t size; | 721 | uint32_t size; |
398 | char *buf; | 722 | char *buf; |
723 | struct ui_progress *progress = ui_progress__new("Processing events...", | ||
724 | self->size); | ||
725 | if (progress == NULL) | ||
726 | return -1; | ||
399 | 727 | ||
400 | perf_event_ops__fill_defaults(ops); | 728 | perf_event_ops__fill_defaults(ops); |
401 | 729 | ||
@@ -424,6 +752,7 @@ remap: | |||
424 | 752 | ||
425 | more: | 753 | more: |
426 | event = (event_t *)(buf + head); | 754 | event = (event_t *)(buf + head); |
755 | ui_progress__update(progress, offset); | ||
427 | 756 | ||
428 | if (self->header.needs_swap) | 757 | if (self->header.needs_swap) |
429 | perf_event_header__bswap(&event->header); | 758 | perf_event_header__bswap(&event->header); |
@@ -473,7 +802,11 @@ more: | |||
473 | goto more; | 802 | goto more; |
474 | done: | 803 | done: |
475 | err = 0; | 804 | err = 0; |
805 | /* do the final flush for ordered samples */ | ||
806 | self->ordered_samples.next_flush = ULLONG_MAX; | ||
807 | flush_sample_queue(self, ops); | ||
476 | out_err: | 808 | out_err: |
809 | ui_progress__delete(progress); | ||
477 | return err; | 810 | return err; |
478 | } | 811 | } |
479 | 812 | ||
@@ -502,9 +835,13 @@ out_getcwd_err: | |||
502 | self->cwdlen = strlen(self->cwd); | 835 | self->cwdlen = strlen(self->cwd); |
503 | } | 836 | } |
504 | 837 | ||
505 | err = __perf_session__process_events(self, self->header.data_offset, | 838 | if (!self->fd_pipe) |
506 | self->header.data_size, | 839 | err = __perf_session__process_events(self, |
507 | self->size, ops); | 840 | self->header.data_offset, |
841 | self->header.data_size, | ||
842 | self->size, ops); | ||
843 | else | ||
844 | err = __perf_session__process_pipe_events(self, ops); | ||
508 | out_err: | 845 | out_err: |
509 | return err; | 846 | return err; |
510 | } | 847 | } |
@@ -519,56 +856,41 @@ bool perf_session__has_traces(struct perf_session *self, const char *msg) | |||
519 | return true; | 856 | return true; |
520 | } | 857 | } |
521 | 858 | ||
522 | int perf_session__set_kallsyms_ref_reloc_sym(struct perf_session *self, | 859 | int perf_session__set_kallsyms_ref_reloc_sym(struct map **maps, |
523 | const char *symbol_name, | 860 | const char *symbol_name, |
524 | u64 addr) | 861 | u64 addr) |
525 | { | 862 | { |
526 | char *bracket; | 863 | char *bracket; |
527 | enum map_type i; | 864 | enum map_type i; |
865 | struct ref_reloc_sym *ref; | ||
528 | 866 | ||
529 | self->ref_reloc_sym.name = strdup(symbol_name); | 867 | ref = zalloc(sizeof(struct ref_reloc_sym)); |
530 | if (self->ref_reloc_sym.name == NULL) | 868 | if (ref == NULL) |
531 | return -ENOMEM; | 869 | return -ENOMEM; |
532 | 870 | ||
533 | bracket = strchr(self->ref_reloc_sym.name, ']'); | 871 | ref->name = strdup(symbol_name); |
872 | if (ref->name == NULL) { | ||
873 | free(ref); | ||
874 | return -ENOMEM; | ||
875 | } | ||
876 | |||
877 | bracket = strchr(ref->name, ']'); | ||
534 | if (bracket) | 878 | if (bracket) |
535 | *bracket = '\0'; | 879 | *bracket = '\0'; |
536 | 880 | ||
537 | self->ref_reloc_sym.addr = addr; | 881 | ref->addr = addr; |
538 | 882 | ||
539 | for (i = 0; i < MAP__NR_TYPES; ++i) { | 883 | for (i = 0; i < MAP__NR_TYPES; ++i) { |
540 | struct kmap *kmap = map__kmap(self->vmlinux_maps[i]); | 884 | struct kmap *kmap = map__kmap(maps[i]); |
541 | kmap->ref_reloc_sym = &self->ref_reloc_sym; | 885 | kmap->ref_reloc_sym = ref; |
542 | } | 886 | } |
543 | 887 | ||
544 | return 0; | 888 | return 0; |
545 | } | 889 | } |
546 | 890 | ||
547 | static u64 map__reloc_map_ip(struct map *map, u64 ip) | 891 | size_t perf_session__fprintf_dsos(struct perf_session *self, FILE *fp) |
548 | { | ||
549 | return ip + (s64)map->pgoff; | ||
550 | } | ||
551 | |||
552 | static u64 map__reloc_unmap_ip(struct map *map, u64 ip) | ||
553 | { | ||
554 | return ip - (s64)map->pgoff; | ||
555 | } | ||
556 | |||
557 | void map__reloc_vmlinux(struct map *self) | ||
558 | { | 892 | { |
559 | struct kmap *kmap = map__kmap(self); | 893 | return __dsos__fprintf(&self->host_machine.kernel_dsos, fp) + |
560 | s64 reloc; | 894 | __dsos__fprintf(&self->host_machine.user_dsos, fp) + |
561 | 895 | machines__fprintf_dsos(&self->machines, fp); | |
562 | if (!kmap->ref_reloc_sym || !kmap->ref_reloc_sym->unrelocated_addr) | ||
563 | return; | ||
564 | |||
565 | reloc = (kmap->ref_reloc_sym->unrelocated_addr - | ||
566 | kmap->ref_reloc_sym->addr); | ||
567 | |||
568 | if (!reloc) | ||
569 | return; | ||
570 | |||
571 | self->map_ip = map__reloc_map_ip; | ||
572 | self->unmap_ip = map__reloc_unmap_ip; | ||
573 | self->pgoff = reloc; | ||
574 | } | 896 | } |
diff --git a/tools/perf/util/session.h b/tools/perf/util/session.h index 5c33417eebb3..e7fce486ebe2 100644 --- a/tools/perf/util/session.h +++ b/tools/perf/util/session.h | |||
@@ -1,6 +1,7 @@ | |||
1 | #ifndef __PERF_SESSION_H | 1 | #ifndef __PERF_SESSION_H |
2 | #define __PERF_SESSION_H | 2 | #define __PERF_SESSION_H |
3 | 3 | ||
4 | #include "hist.h" | ||
4 | #include "event.h" | 5 | #include "event.h" |
5 | #include "header.h" | 6 | #include "header.h" |
6 | #include "symbol.h" | 7 | #include "symbol.h" |
@@ -8,45 +9,69 @@ | |||
8 | #include <linux/rbtree.h> | 9 | #include <linux/rbtree.h> |
9 | #include "../../../include/linux/perf_event.h" | 10 | #include "../../../include/linux/perf_event.h" |
10 | 11 | ||
12 | struct sample_queue; | ||
11 | struct ip_callchain; | 13 | struct ip_callchain; |
12 | struct thread; | 14 | struct thread; |
13 | 15 | ||
16 | struct ordered_samples { | ||
17 | u64 last_flush; | ||
18 | u64 next_flush; | ||
19 | u64 max_timestamp; | ||
20 | struct list_head samples_head; | ||
21 | struct sample_queue *last_inserted; | ||
22 | }; | ||
23 | |||
14 | struct perf_session { | 24 | struct perf_session { |
15 | struct perf_header header; | 25 | struct perf_header header; |
16 | unsigned long size; | 26 | unsigned long size; |
17 | unsigned long mmap_window; | 27 | unsigned long mmap_window; |
18 | struct map_groups kmaps; | ||
19 | struct rb_root threads; | 28 | struct rb_root threads; |
20 | struct thread *last_match; | 29 | struct thread *last_match; |
21 | struct map *vmlinux_maps[MAP__NR_TYPES]; | 30 | struct machine host_machine; |
22 | struct events_stats events_stats; | 31 | struct rb_root machines; |
23 | struct rb_root stats_by_id; | 32 | struct rb_root hists_tree; |
24 | unsigned long event_total[PERF_RECORD_MAX]; | 33 | /* |
25 | unsigned long unknown_events; | 34 | * FIXME: should point to the first entry in hists_tree and |
26 | struct rb_root hists; | 35 | * be a hists instance. Right now its only 'report' |
36 | * that is using ->hists_tree while all the rest use | ||
37 | * ->hists. | ||
38 | */ | ||
39 | struct hists hists; | ||
27 | u64 sample_type; | 40 | u64 sample_type; |
28 | struct ref_reloc_sym ref_reloc_sym; | ||
29 | int fd; | 41 | int fd; |
42 | bool fd_pipe; | ||
43 | bool repipe; | ||
30 | int cwdlen; | 44 | int cwdlen; |
31 | char *cwd; | 45 | char *cwd; |
46 | struct ordered_samples ordered_samples; | ||
32 | char filename[0]; | 47 | char filename[0]; |
33 | }; | 48 | }; |
34 | 49 | ||
50 | struct perf_event_ops; | ||
51 | |||
35 | typedef int (*event_op)(event_t *self, struct perf_session *session); | 52 | typedef int (*event_op)(event_t *self, struct perf_session *session); |
53 | typedef int (*event_op2)(event_t *self, struct perf_session *session, | ||
54 | struct perf_event_ops *ops); | ||
36 | 55 | ||
37 | struct perf_event_ops { | 56 | struct perf_event_ops { |
38 | event_op sample, | 57 | event_op sample, |
39 | mmap, | 58 | mmap, |
40 | comm, | 59 | comm, |
41 | fork, | 60 | fork, |
42 | exit, | 61 | exit, |
43 | lost, | 62 | lost, |
44 | read, | 63 | read, |
45 | throttle, | 64 | throttle, |
46 | unthrottle; | 65 | unthrottle, |
66 | attr, | ||
67 | event_type, | ||
68 | tracing_data, | ||
69 | build_id; | ||
70 | event_op2 finished_round; | ||
71 | bool ordered_samples; | ||
47 | }; | 72 | }; |
48 | 73 | ||
49 | struct perf_session *perf_session__new(const char *filename, int mode, bool force); | 74 | struct perf_session *perf_session__new(const char *filename, int mode, bool force, bool repipe); |
50 | void perf_session__delete(struct perf_session *self); | 75 | void perf_session__delete(struct perf_session *self); |
51 | 76 | ||
52 | void perf_event_header__bswap(struct perf_event_header *self); | 77 | void perf_event_header__bswap(struct perf_event_header *self); |
@@ -57,33 +82,66 @@ int __perf_session__process_events(struct perf_session *self, | |||
57 | int perf_session__process_events(struct perf_session *self, | 82 | int perf_session__process_events(struct perf_session *self, |
58 | struct perf_event_ops *event_ops); | 83 | struct perf_event_ops *event_ops); |
59 | 84 | ||
60 | struct symbol **perf_session__resolve_callchain(struct perf_session *self, | 85 | struct map_symbol *perf_session__resolve_callchain(struct perf_session *self, |
61 | struct thread *thread, | 86 | struct thread *thread, |
62 | struct ip_callchain *chain, | 87 | struct ip_callchain *chain, |
63 | struct symbol **parent); | 88 | struct symbol **parent); |
64 | 89 | ||
65 | bool perf_session__has_traces(struct perf_session *self, const char *msg); | 90 | bool perf_session__has_traces(struct perf_session *self, const char *msg); |
66 | 91 | ||
67 | int perf_header__read_build_ids(struct perf_header *self, int input, | 92 | int perf_session__set_kallsyms_ref_reloc_sym(struct map **maps, |
68 | u64 offset, u64 file_size); | ||
69 | |||
70 | int perf_session__set_kallsyms_ref_reloc_sym(struct perf_session *self, | ||
71 | const char *symbol_name, | 93 | const char *symbol_name, |
72 | u64 addr); | 94 | u64 addr); |
73 | 95 | ||
74 | void mem_bswap_64(void *src, int byte_size); | 96 | void mem_bswap_64(void *src, int byte_size); |
75 | 97 | ||
76 | static inline int __perf_session__create_kernel_maps(struct perf_session *self, | 98 | int perf_session__create_kernel_maps(struct perf_session *self); |
77 | struct dso *kernel) | 99 | |
100 | int do_read(int fd, void *buf, size_t size); | ||
101 | void perf_session__update_sample_type(struct perf_session *self); | ||
102 | |||
103 | static inline | ||
104 | struct machine *perf_session__find_host_machine(struct perf_session *self) | ||
105 | { | ||
106 | return &self->host_machine; | ||
107 | } | ||
108 | |||
109 | static inline | ||
110 | struct machine *perf_session__find_machine(struct perf_session *self, pid_t pid) | ||
111 | { | ||
112 | if (pid == HOST_KERNEL_ID) | ||
113 | return &self->host_machine; | ||
114 | return machines__find(&self->machines, pid); | ||
115 | } | ||
116 | |||
117 | static inline | ||
118 | struct machine *perf_session__findnew_machine(struct perf_session *self, pid_t pid) | ||
119 | { | ||
120 | if (pid == HOST_KERNEL_ID) | ||
121 | return &self->host_machine; | ||
122 | return machines__findnew(&self->machines, pid); | ||
123 | } | ||
124 | |||
125 | static inline | ||
126 | void perf_session__process_machines(struct perf_session *self, | ||
127 | machine__process_t process) | ||
128 | { | ||
129 | process(&self->host_machine, self); | ||
130 | return machines__process(&self->machines, process, self); | ||
131 | } | ||
132 | |||
133 | size_t perf_session__fprintf_dsos(struct perf_session *self, FILE *fp); | ||
134 | |||
135 | static inline | ||
136 | size_t perf_session__fprintf_dsos_buildid(struct perf_session *self, FILE *fp, | ||
137 | bool with_hits) | ||
78 | { | 138 | { |
79 | return __map_groups__create_kernel_maps(&self->kmaps, | 139 | return machines__fprintf_dsos_buildid(&self->machines, fp, with_hits); |
80 | self->vmlinux_maps, kernel); | ||
81 | } | 140 | } |
82 | 141 | ||
83 | static inline struct map * | 142 | static inline |
84 | perf_session__new_module_map(struct perf_session *self, | 143 | size_t perf_session__fprintf_nr_events(struct perf_session *self, FILE *fp) |
85 | u64 start, const char *filename) | ||
86 | { | 144 | { |
87 | return map_groups__new_module(&self->kmaps, start, filename); | 145 | return hists__fprintf_nr_events(&self->hists, fp); |
88 | } | 146 | } |
89 | #endif /* __PERF_SESSION_H */ | 147 | #endif /* __PERF_SESSION_H */ |
diff --git a/tools/perf/util/sort.c b/tools/perf/util/sort.c index cb0f327de9e8..da30b305fba0 100644 --- a/tools/perf/util/sort.c +++ b/tools/perf/util/sort.c | |||
@@ -18,39 +18,50 @@ char * field_sep; | |||
18 | 18 | ||
19 | LIST_HEAD(hist_entry__sort_list); | 19 | LIST_HEAD(hist_entry__sort_list); |
20 | 20 | ||
21 | static int hist_entry__thread_snprintf(struct hist_entry *self, char *bf, | ||
22 | size_t size, unsigned int width); | ||
23 | static int hist_entry__comm_snprintf(struct hist_entry *self, char *bf, | ||
24 | size_t size, unsigned int width); | ||
25 | static int hist_entry__dso_snprintf(struct hist_entry *self, char *bf, | ||
26 | size_t size, unsigned int width); | ||
27 | static int hist_entry__sym_snprintf(struct hist_entry *self, char *bf, | ||
28 | size_t size, unsigned int width); | ||
29 | static int hist_entry__parent_snprintf(struct hist_entry *self, char *bf, | ||
30 | size_t size, unsigned int width); | ||
31 | |||
21 | struct sort_entry sort_thread = { | 32 | struct sort_entry sort_thread = { |
22 | .header = "Command: Pid", | 33 | .se_header = "Command: Pid", |
23 | .cmp = sort__thread_cmp, | 34 | .se_cmp = sort__thread_cmp, |
24 | .print = sort__thread_print, | 35 | .se_snprintf = hist_entry__thread_snprintf, |
25 | .width = &threads__col_width, | 36 | .se_width = &threads__col_width, |
26 | }; | 37 | }; |
27 | 38 | ||
28 | struct sort_entry sort_comm = { | 39 | struct sort_entry sort_comm = { |
29 | .header = "Command", | 40 | .se_header = "Command", |
30 | .cmp = sort__comm_cmp, | 41 | .se_cmp = sort__comm_cmp, |
31 | .collapse = sort__comm_collapse, | 42 | .se_collapse = sort__comm_collapse, |
32 | .print = sort__comm_print, | 43 | .se_snprintf = hist_entry__comm_snprintf, |
33 | .width = &comms__col_width, | 44 | .se_width = &comms__col_width, |
34 | }; | 45 | }; |
35 | 46 | ||
36 | struct sort_entry sort_dso = { | 47 | struct sort_entry sort_dso = { |
37 | .header = "Shared Object", | 48 | .se_header = "Shared Object", |
38 | .cmp = sort__dso_cmp, | 49 | .se_cmp = sort__dso_cmp, |
39 | .print = sort__dso_print, | 50 | .se_snprintf = hist_entry__dso_snprintf, |
40 | .width = &dsos__col_width, | 51 | .se_width = &dsos__col_width, |
41 | }; | 52 | }; |
42 | 53 | ||
43 | struct sort_entry sort_sym = { | 54 | struct sort_entry sort_sym = { |
44 | .header = "Symbol", | 55 | .se_header = "Symbol", |
45 | .cmp = sort__sym_cmp, | 56 | .se_cmp = sort__sym_cmp, |
46 | .print = sort__sym_print, | 57 | .se_snprintf = hist_entry__sym_snprintf, |
47 | }; | 58 | }; |
48 | 59 | ||
49 | struct sort_entry sort_parent = { | 60 | struct sort_entry sort_parent = { |
50 | .header = "Parent symbol", | 61 | .se_header = "Parent symbol", |
51 | .cmp = sort__parent_cmp, | 62 | .se_cmp = sort__parent_cmp, |
52 | .print = sort__parent_print, | 63 | .se_snprintf = hist_entry__parent_snprintf, |
53 | .width = &parent_symbol__col_width, | 64 | .se_width = &parent_symbol__col_width, |
54 | }; | 65 | }; |
55 | 66 | ||
56 | struct sort_dimension { | 67 | struct sort_dimension { |
@@ -85,45 +96,38 @@ sort__thread_cmp(struct hist_entry *left, struct hist_entry *right) | |||
85 | return right->thread->pid - left->thread->pid; | 96 | return right->thread->pid - left->thread->pid; |
86 | } | 97 | } |
87 | 98 | ||
88 | int repsep_fprintf(FILE *fp, const char *fmt, ...) | 99 | static int repsep_snprintf(char *bf, size_t size, const char *fmt, ...) |
89 | { | 100 | { |
90 | int n; | 101 | int n; |
91 | va_list ap; | 102 | va_list ap; |
92 | 103 | ||
93 | va_start(ap, fmt); | 104 | va_start(ap, fmt); |
94 | if (!field_sep) | 105 | n = vsnprintf(bf, size, fmt, ap); |
95 | n = vfprintf(fp, fmt, ap); | 106 | if (field_sep && n > 0) { |
96 | else { | 107 | char *sep = bf; |
97 | char *bf = NULL; | 108 | |
98 | n = vasprintf(&bf, fmt, ap); | 109 | while (1) { |
99 | if (n > 0) { | 110 | sep = strchr(sep, *field_sep); |
100 | char *sep = bf; | 111 | if (sep == NULL) |
101 | 112 | break; | |
102 | while (1) { | 113 | *sep = '.'; |
103 | sep = strchr(sep, *field_sep); | ||
104 | if (sep == NULL) | ||
105 | break; | ||
106 | *sep = '.'; | ||
107 | } | ||
108 | } | 114 | } |
109 | fputs(bf, fp); | ||
110 | free(bf); | ||
111 | } | 115 | } |
112 | va_end(ap); | 116 | va_end(ap); |
113 | return n; | 117 | return n; |
114 | } | 118 | } |
115 | 119 | ||
116 | size_t | 120 | static int hist_entry__thread_snprintf(struct hist_entry *self, char *bf, |
117 | sort__thread_print(FILE *fp, struct hist_entry *self, unsigned int width) | 121 | size_t size, unsigned int width) |
118 | { | 122 | { |
119 | return repsep_fprintf(fp, "%*s:%5d", width - 6, | 123 | return repsep_snprintf(bf, size, "%*s:%5d", width, |
120 | self->thread->comm ?: "", self->thread->pid); | 124 | self->thread->comm ?: "", self->thread->pid); |
121 | } | 125 | } |
122 | 126 | ||
123 | size_t | 127 | static int hist_entry__comm_snprintf(struct hist_entry *self, char *bf, |
124 | sort__comm_print(FILE *fp, struct hist_entry *self, unsigned int width) | 128 | size_t size, unsigned int width) |
125 | { | 129 | { |
126 | return repsep_fprintf(fp, "%*s", width, self->thread->comm); | 130 | return repsep_snprintf(bf, size, "%*s", width, self->thread->comm); |
127 | } | 131 | } |
128 | 132 | ||
129 | /* --sort dso */ | 133 | /* --sort dso */ |
@@ -131,8 +135,8 @@ sort__comm_print(FILE *fp, struct hist_entry *self, unsigned int width) | |||
131 | int64_t | 135 | int64_t |
132 | sort__dso_cmp(struct hist_entry *left, struct hist_entry *right) | 136 | sort__dso_cmp(struct hist_entry *left, struct hist_entry *right) |
133 | { | 137 | { |
134 | struct dso *dso_l = left->map ? left->map->dso : NULL; | 138 | struct dso *dso_l = left->ms.map ? left->ms.map->dso : NULL; |
135 | struct dso *dso_r = right->map ? right->map->dso : NULL; | 139 | struct dso *dso_r = right->ms.map ? right->ms.map->dso : NULL; |
136 | const char *dso_name_l, *dso_name_r; | 140 | const char *dso_name_l, *dso_name_r; |
137 | 141 | ||
138 | if (!dso_l || !dso_r) | 142 | if (!dso_l || !dso_r) |
@@ -149,16 +153,16 @@ sort__dso_cmp(struct hist_entry *left, struct hist_entry *right) | |||
149 | return strcmp(dso_name_l, dso_name_r); | 153 | return strcmp(dso_name_l, dso_name_r); |
150 | } | 154 | } |
151 | 155 | ||
152 | size_t | 156 | static int hist_entry__dso_snprintf(struct hist_entry *self, char *bf, |
153 | sort__dso_print(FILE *fp, struct hist_entry *self, unsigned int width) | 157 | size_t size, unsigned int width) |
154 | { | 158 | { |
155 | if (self->map && self->map->dso) { | 159 | if (self->ms.map && self->ms.map->dso) { |
156 | const char *dso_name = !verbose ? self->map->dso->short_name : | 160 | const char *dso_name = !verbose ? self->ms.map->dso->short_name : |
157 | self->map->dso->long_name; | 161 | self->ms.map->dso->long_name; |
158 | return repsep_fprintf(fp, "%-*s", width, dso_name); | 162 | return repsep_snprintf(bf, size, "%-*s", width, dso_name); |
159 | } | 163 | } |
160 | 164 | ||
161 | return repsep_fprintf(fp, "%*llx", width, (u64)self->ip); | 165 | return repsep_snprintf(bf, size, "%*Lx", width, self->ip); |
162 | } | 166 | } |
163 | 167 | ||
164 | /* --sort symbol */ | 168 | /* --sort symbol */ |
@@ -168,31 +172,31 @@ sort__sym_cmp(struct hist_entry *left, struct hist_entry *right) | |||
168 | { | 172 | { |
169 | u64 ip_l, ip_r; | 173 | u64 ip_l, ip_r; |
170 | 174 | ||
171 | if (left->sym == right->sym) | 175 | if (left->ms.sym == right->ms.sym) |
172 | return 0; | 176 | return 0; |
173 | 177 | ||
174 | ip_l = left->sym ? left->sym->start : left->ip; | 178 | ip_l = left->ms.sym ? left->ms.sym->start : left->ip; |
175 | ip_r = right->sym ? right->sym->start : right->ip; | 179 | ip_r = right->ms.sym ? right->ms.sym->start : right->ip; |
176 | 180 | ||
177 | return (int64_t)(ip_r - ip_l); | 181 | return (int64_t)(ip_r - ip_l); |
178 | } | 182 | } |
179 | 183 | ||
180 | 184 | static int hist_entry__sym_snprintf(struct hist_entry *self, char *bf, | |
181 | size_t | 185 | size_t size, unsigned int width __used) |
182 | sort__sym_print(FILE *fp, struct hist_entry *self, unsigned int width __used) | ||
183 | { | 186 | { |
184 | size_t ret = 0; | 187 | size_t ret = 0; |
185 | 188 | ||
186 | if (verbose) { | 189 | if (verbose) { |
187 | char o = self->map ? dso__symtab_origin(self->map->dso) : '!'; | 190 | char o = self->ms.map ? dso__symtab_origin(self->ms.map->dso) : '!'; |
188 | ret += repsep_fprintf(fp, "%#018llx %c ", (u64)self->ip, o); | 191 | ret += repsep_snprintf(bf, size, "%#018llx %c ", self->ip, o); |
189 | } | 192 | } |
190 | 193 | ||
191 | ret += repsep_fprintf(fp, "[%c] ", self->level); | 194 | ret += repsep_snprintf(bf + ret, size - ret, "[%c] ", self->level); |
192 | if (self->sym) | 195 | if (self->ms.sym) |
193 | ret += repsep_fprintf(fp, "%s", self->sym->name); | 196 | ret += repsep_snprintf(bf + ret, size - ret, "%s", |
197 | self->ms.sym->name); | ||
194 | else | 198 | else |
195 | ret += repsep_fprintf(fp, "%#016llx", (u64)self->ip); | 199 | ret += repsep_snprintf(bf + ret, size - ret, "%#016llx", self->ip); |
196 | 200 | ||
197 | return ret; | 201 | return ret; |
198 | } | 202 | } |
@@ -231,10 +235,10 @@ sort__parent_cmp(struct hist_entry *left, struct hist_entry *right) | |||
231 | return strcmp(sym_l->name, sym_r->name); | 235 | return strcmp(sym_l->name, sym_r->name); |
232 | } | 236 | } |
233 | 237 | ||
234 | size_t | 238 | static int hist_entry__parent_snprintf(struct hist_entry *self, char *bf, |
235 | sort__parent_print(FILE *fp, struct hist_entry *self, unsigned int width) | 239 | size_t size, unsigned int width) |
236 | { | 240 | { |
237 | return repsep_fprintf(fp, "%-*s", width, | 241 | return repsep_snprintf(bf, size, "%-*s", width, |
238 | self->parent ? self->parent->name : "[other]"); | 242 | self->parent ? self->parent->name : "[other]"); |
239 | } | 243 | } |
240 | 244 | ||
@@ -251,7 +255,7 @@ int sort_dimension__add(const char *tok) | |||
251 | if (strncasecmp(tok, sd->name, strlen(tok))) | 255 | if (strncasecmp(tok, sd->name, strlen(tok))) |
252 | continue; | 256 | continue; |
253 | 257 | ||
254 | if (sd->entry->collapse) | 258 | if (sd->entry->se_collapse) |
255 | sort__need_collapse = 1; | 259 | sort__need_collapse = 1; |
256 | 260 | ||
257 | if (sd->entry == &sort_parent) { | 261 | if (sd->entry == &sort_parent) { |
@@ -260,9 +264,8 @@ int sort_dimension__add(const char *tok) | |||
260 | char err[BUFSIZ]; | 264 | char err[BUFSIZ]; |
261 | 265 | ||
262 | regerror(ret, &parent_regex, err, sizeof(err)); | 266 | regerror(ret, &parent_regex, err, sizeof(err)); |
263 | fprintf(stderr, "Invalid regex: %s\n%s", | 267 | pr_err("Invalid regex: %s\n%s", parent_pattern, err); |
264 | parent_pattern, err); | 268 | return -EINVAL; |
265 | exit(-1); | ||
266 | } | 269 | } |
267 | sort__has_parent = 1; | 270 | sort__has_parent = 1; |
268 | } | 271 | } |
diff --git a/tools/perf/util/sort.h b/tools/perf/util/sort.h index 753f9ea99fb0..eab2e0b3b74e 100644 --- a/tools/perf/util/sort.h +++ b/tools/perf/util/sort.h | |||
@@ -43,19 +43,24 @@ extern enum sort_type sort__first_dimension; | |||
43 | 43 | ||
44 | struct hist_entry { | 44 | struct hist_entry { |
45 | struct rb_node rb_node; | 45 | struct rb_node rb_node; |
46 | u64 count; | 46 | u64 period; |
47 | u64 period_sys; | ||
48 | u64 period_us; | ||
49 | u64 period_guest_sys; | ||
50 | u64 period_guest_us; | ||
51 | struct map_symbol ms; | ||
47 | struct thread *thread; | 52 | struct thread *thread; |
48 | struct map *map; | ||
49 | struct symbol *sym; | ||
50 | u64 ip; | 53 | u64 ip; |
54 | u32 nr_events; | ||
51 | char level; | 55 | char level; |
52 | struct symbol *parent; | 56 | u8 filtered; |
53 | struct callchain_node callchain; | 57 | struct symbol *parent; |
54 | union { | 58 | union { |
55 | unsigned long position; | 59 | unsigned long position; |
56 | struct hist_entry *pair; | 60 | struct hist_entry *pair; |
57 | struct rb_root sorted_chain; | 61 | struct rb_root sorted_chain; |
58 | }; | 62 | }; |
63 | struct callchain_node callchain[0]; | ||
59 | }; | 64 | }; |
60 | 65 | ||
61 | enum sort_type { | 66 | enum sort_type { |
@@ -73,12 +78,13 @@ enum sort_type { | |||
73 | struct sort_entry { | 78 | struct sort_entry { |
74 | struct list_head list; | 79 | struct list_head list; |
75 | 80 | ||
76 | const char *header; | 81 | const char *se_header; |
77 | 82 | ||
78 | int64_t (*cmp)(struct hist_entry *, struct hist_entry *); | 83 | int64_t (*se_cmp)(struct hist_entry *, struct hist_entry *); |
79 | int64_t (*collapse)(struct hist_entry *, struct hist_entry *); | 84 | int64_t (*se_collapse)(struct hist_entry *, struct hist_entry *); |
80 | size_t (*print)(FILE *fp, struct hist_entry *, unsigned int width); | 85 | int (*se_snprintf)(struct hist_entry *self, char *bf, size_t size, |
81 | unsigned int *width; | 86 | unsigned int width); |
87 | unsigned int *se_width; | ||
82 | bool elide; | 88 | bool elide; |
83 | }; | 89 | }; |
84 | 90 | ||
@@ -87,7 +93,6 @@ extern struct list_head hist_entry__sort_list; | |||
87 | 93 | ||
88 | void setup_sorting(const char * const usagestr[], const struct option *opts); | 94 | void setup_sorting(const char * const usagestr[], const struct option *opts); |
89 | 95 | ||
90 | extern int repsep_fprintf(FILE *fp, const char *fmt, ...); | ||
91 | extern size_t sort__thread_print(FILE *, struct hist_entry *, unsigned int); | 96 | extern size_t sort__thread_print(FILE *, struct hist_entry *, unsigned int); |
92 | extern size_t sort__comm_print(FILE *, struct hist_entry *, unsigned int); | 97 | extern size_t sort__comm_print(FILE *, struct hist_entry *, unsigned int); |
93 | extern size_t sort__dso_print(FILE *, struct hist_entry *, unsigned int); | 98 | extern size_t sort__dso_print(FILE *, struct hist_entry *, unsigned int); |
diff --git a/tools/perf/util/string.c b/tools/perf/util/string.c index a175949ed216..0409fc7c0058 100644 --- a/tools/perf/util/string.c +++ b/tools/perf/util/string.c | |||
@@ -1,48 +1,5 @@ | |||
1 | #include "string.h" | ||
2 | #include "util.h" | 1 | #include "util.h" |
3 | 2 | #include "string.h" | |
4 | static int hex(char ch) | ||
5 | { | ||
6 | if ((ch >= '0') && (ch <= '9')) | ||
7 | return ch - '0'; | ||
8 | if ((ch >= 'a') && (ch <= 'f')) | ||
9 | return ch - 'a' + 10; | ||
10 | if ((ch >= 'A') && (ch <= 'F')) | ||
11 | return ch - 'A' + 10; | ||
12 | return -1; | ||
13 | } | ||
14 | |||
15 | /* | ||
16 | * While we find nice hex chars, build a long_val. | ||
17 | * Return number of chars processed. | ||
18 | */ | ||
19 | int hex2u64(const char *ptr, u64 *long_val) | ||
20 | { | ||
21 | const char *p = ptr; | ||
22 | *long_val = 0; | ||
23 | |||
24 | while (*p) { | ||
25 | const int hex_val = hex(*p); | ||
26 | |||
27 | if (hex_val < 0) | ||
28 | break; | ||
29 | |||
30 | *long_val = (*long_val << 4) | hex_val; | ||
31 | p++; | ||
32 | } | ||
33 | |||
34 | return p - ptr; | ||
35 | } | ||
36 | |||
37 | char *strxfrchar(char *s, char from, char to) | ||
38 | { | ||
39 | char *p = s; | ||
40 | |||
41 | while ((p = strchr(p, from)) != NULL) | ||
42 | *p++ = to; | ||
43 | |||
44 | return s; | ||
45 | } | ||
46 | 3 | ||
47 | #define K 1024LL | 4 | #define K 1024LL |
48 | /* | 5 | /* |
diff --git a/tools/perf/util/string.h b/tools/perf/util/string.h deleted file mode 100644 index 542e44de3719..000000000000 --- a/tools/perf/util/string.h +++ /dev/null | |||
@@ -1,18 +0,0 @@ | |||
1 | #ifndef __PERF_STRING_H_ | ||
2 | #define __PERF_STRING_H_ | ||
3 | |||
4 | #include <stdbool.h> | ||
5 | #include "types.h" | ||
6 | |||
7 | int hex2u64(const char *ptr, u64 *val); | ||
8 | char *strxfrchar(char *s, char from, char to); | ||
9 | s64 perf_atoll(const char *str); | ||
10 | char **argv_split(const char *str, int *argcp); | ||
11 | void argv_free(char **argv); | ||
12 | bool strglobmatch(const char *str, const char *pat); | ||
13 | bool strlazymatch(const char *str, const char *pat); | ||
14 | |||
15 | #define _STR(x) #x | ||
16 | #define STR(x) _STR(x) | ||
17 | |||
18 | #endif /* __PERF_STRING_H */ | ||
diff --git a/tools/perf/util/symbol.c b/tools/perf/util/symbol.c index c458c4a371d1..ecccc8df128e 100644 --- a/tools/perf/util/symbol.c +++ b/tools/perf/util/symbol.c | |||
@@ -1,13 +1,19 @@ | |||
1 | #include "util.h" | 1 | #define _GNU_SOURCE |
2 | #include "../perf.h" | 2 | #include <ctype.h> |
3 | #include "sort.h" | 3 | #include <dirent.h> |
4 | #include "string.h" | 4 | #include <errno.h> |
5 | #include <libgen.h> | ||
6 | #include <stdlib.h> | ||
7 | #include <stdio.h> | ||
8 | #include <string.h> | ||
9 | #include <sys/types.h> | ||
10 | #include <sys/stat.h> | ||
11 | #include <sys/param.h> | ||
12 | #include <fcntl.h> | ||
13 | #include <unistd.h> | ||
5 | #include "symbol.h" | 14 | #include "symbol.h" |
6 | #include "thread.h" | 15 | #include "strlist.h" |
7 | 16 | ||
8 | #include "debug.h" | ||
9 | |||
10 | #include <asm/bug.h> | ||
11 | #include <libelf.h> | 17 | #include <libelf.h> |
12 | #include <gelf.h> | 18 | #include <gelf.h> |
13 | #include <elf.h> | 19 | #include <elf.h> |
@@ -18,22 +24,12 @@ | |||
18 | #define NT_GNU_BUILD_ID 3 | 24 | #define NT_GNU_BUILD_ID 3 |
19 | #endif | 25 | #endif |
20 | 26 | ||
21 | enum dso_origin { | ||
22 | DSO__ORIG_KERNEL = 0, | ||
23 | DSO__ORIG_JAVA_JIT, | ||
24 | DSO__ORIG_BUILD_ID_CACHE, | ||
25 | DSO__ORIG_FEDORA, | ||
26 | DSO__ORIG_UBUNTU, | ||
27 | DSO__ORIG_BUILDID, | ||
28 | DSO__ORIG_DSO, | ||
29 | DSO__ORIG_KMODULE, | ||
30 | DSO__ORIG_NOT_FOUND, | ||
31 | }; | ||
32 | |||
33 | static void dsos__add(struct list_head *head, struct dso *dso); | 27 | static void dsos__add(struct list_head *head, struct dso *dso); |
34 | static struct map *map__new2(u64 start, struct dso *dso, enum map_type type); | 28 | static struct map *map__new2(u64 start, struct dso *dso, enum map_type type); |
35 | static int dso__load_kernel_sym(struct dso *self, struct map *map, | 29 | static int dso__load_kernel_sym(struct dso *self, struct map *map, |
36 | symbol_filter_t filter); | 30 | symbol_filter_t filter); |
31 | static int dso__load_guest_kernel_sym(struct dso *self, struct map *map, | ||
32 | symbol_filter_t filter); | ||
37 | static int vmlinux_path__nr_entries; | 33 | static int vmlinux_path__nr_entries; |
38 | static char **vmlinux_path; | 34 | static char **vmlinux_path; |
39 | 35 | ||
@@ -126,16 +122,17 @@ static void map_groups__fixup_end(struct map_groups *self) | |||
126 | static struct symbol *symbol__new(u64 start, u64 len, const char *name) | 122 | static struct symbol *symbol__new(u64 start, u64 len, const char *name) |
127 | { | 123 | { |
128 | size_t namelen = strlen(name) + 1; | 124 | size_t namelen = strlen(name) + 1; |
129 | struct symbol *self = zalloc(symbol_conf.priv_size + | 125 | struct symbol *self = calloc(1, (symbol_conf.priv_size + |
130 | sizeof(*self) + namelen); | 126 | sizeof(*self) + namelen)); |
131 | if (self == NULL) | 127 | if (self == NULL) |
132 | return NULL; | 128 | return NULL; |
133 | 129 | ||
134 | if (symbol_conf.priv_size) | 130 | if (symbol_conf.priv_size) |
135 | self = ((void *)self) + symbol_conf.priv_size; | 131 | self = ((void *)self) + symbol_conf.priv_size; |
136 | 132 | ||
137 | self->start = start; | 133 | self->start = start; |
138 | self->end = len ? start + len - 1 : start; | 134 | self->end = len ? start + len - 1 : start; |
135 | self->namelen = namelen - 1; | ||
139 | 136 | ||
140 | pr_debug4("%s: %s %#Lx-%#Lx\n", __func__, name, start, self->end); | 137 | pr_debug4("%s: %s %#Lx-%#Lx\n", __func__, name, start, self->end); |
141 | 138 | ||
@@ -178,7 +175,7 @@ static void dso__set_basename(struct dso *self) | |||
178 | 175 | ||
179 | struct dso *dso__new(const char *name) | 176 | struct dso *dso__new(const char *name) |
180 | { | 177 | { |
181 | struct dso *self = zalloc(sizeof(*self) + strlen(name) + 1); | 178 | struct dso *self = calloc(1, sizeof(*self) + strlen(name) + 1); |
182 | 179 | ||
183 | if (self != NULL) { | 180 | if (self != NULL) { |
184 | int i; | 181 | int i; |
@@ -192,6 +189,8 @@ struct dso *dso__new(const char *name) | |||
192 | self->loaded = 0; | 189 | self->loaded = 0; |
193 | self->sorted_by_name = 0; | 190 | self->sorted_by_name = 0; |
194 | self->has_build_id = 0; | 191 | self->has_build_id = 0; |
192 | self->kernel = DSO_TYPE_USER; | ||
193 | INIT_LIST_HEAD(&self->node); | ||
195 | } | 194 | } |
196 | 195 | ||
197 | return self; | 196 | return self; |
@@ -408,12 +407,9 @@ int kallsyms__parse(const char *filename, void *arg, | |||
408 | char *symbol_name; | 407 | char *symbol_name; |
409 | 408 | ||
410 | line_len = getline(&line, &n, file); | 409 | line_len = getline(&line, &n, file); |
411 | if (line_len < 0) | 410 | if (line_len < 0 || !line) |
412 | break; | 411 | break; |
413 | 412 | ||
414 | if (!line) | ||
415 | goto out_failure; | ||
416 | |||
417 | line[--line_len] = '\0'; /* \n */ | 413 | line[--line_len] = '\0'; /* \n */ |
418 | 414 | ||
419 | len = hex2u64(line, &start); | 415 | len = hex2u64(line, &start); |
@@ -465,6 +461,7 @@ static int map__process_kallsym_symbol(void *arg, const char *name, | |||
465 | * map__split_kallsyms, when we have split the maps per module | 461 | * map__split_kallsyms, when we have split the maps per module |
466 | */ | 462 | */ |
467 | symbols__insert(root, sym); | 463 | symbols__insert(root, sym); |
464 | |||
468 | return 0; | 465 | return 0; |
469 | } | 466 | } |
470 | 467 | ||
@@ -489,6 +486,7 @@ static int dso__split_kallsyms(struct dso *self, struct map *map, | |||
489 | symbol_filter_t filter) | 486 | symbol_filter_t filter) |
490 | { | 487 | { |
491 | struct map_groups *kmaps = map__kmap(map)->kmaps; | 488 | struct map_groups *kmaps = map__kmap(map)->kmaps; |
489 | struct machine *machine = kmaps->machine; | ||
492 | struct map *curr_map = map; | 490 | struct map *curr_map = map; |
493 | struct symbol *pos; | 491 | struct symbol *pos; |
494 | int count = 0; | 492 | int count = 0; |
@@ -510,15 +508,33 @@ static int dso__split_kallsyms(struct dso *self, struct map *map, | |||
510 | *module++ = '\0'; | 508 | *module++ = '\0'; |
511 | 509 | ||
512 | if (strcmp(curr_map->dso->short_name, module)) { | 510 | if (strcmp(curr_map->dso->short_name, module)) { |
513 | curr_map = map_groups__find_by_name(kmaps, map->type, module); | 511 | if (curr_map != map && |
512 | self->kernel == DSO_TYPE_GUEST_KERNEL && | ||
513 | machine__is_default_guest(machine)) { | ||
514 | /* | ||
515 | * We assume all symbols of a module are | ||
516 | * contiguous in kallsyms, so curr_map | ||
517 | * points to a module and all its | ||
518 | * symbols are in its kmap. Mark it as | ||
519 | * loaded. | ||
520 | */ | ||
521 | dso__set_loaded(curr_map->dso, | ||
522 | curr_map->type); | ||
523 | } | ||
524 | |||
525 | curr_map = map_groups__find_by_name(kmaps, | ||
526 | map->type, module); | ||
514 | if (curr_map == NULL) { | 527 | if (curr_map == NULL) { |
515 | pr_debug("/proc/{kallsyms,modules} " | 528 | pr_err("%s/proc/{kallsyms,modules} " |
516 | "inconsistency while looking " | 529 | "inconsistency while looking " |
517 | "for \"%s\" module!\n", module); | 530 | "for \"%s\" module!\n", |
518 | return -1; | 531 | machine->root_dir, module); |
532 | curr_map = map; | ||
533 | goto discard_symbol; | ||
519 | } | 534 | } |
520 | 535 | ||
521 | if (curr_map->dso->loaded) | 536 | if (curr_map->dso->loaded && |
537 | !machine__is_default_guest(machine)) | ||
522 | goto discard_symbol; | 538 | goto discard_symbol; |
523 | } | 539 | } |
524 | /* | 540 | /* |
@@ -531,13 +547,21 @@ static int dso__split_kallsyms(struct dso *self, struct map *map, | |||
531 | char dso_name[PATH_MAX]; | 547 | char dso_name[PATH_MAX]; |
532 | struct dso *dso; | 548 | struct dso *dso; |
533 | 549 | ||
534 | snprintf(dso_name, sizeof(dso_name), "[kernel].%d", | 550 | if (self->kernel == DSO_TYPE_GUEST_KERNEL) |
535 | kernel_range++); | 551 | snprintf(dso_name, sizeof(dso_name), |
552 | "[guest.kernel].%d", | ||
553 | kernel_range++); | ||
554 | else | ||
555 | snprintf(dso_name, sizeof(dso_name), | ||
556 | "[kernel].%d", | ||
557 | kernel_range++); | ||
536 | 558 | ||
537 | dso = dso__new(dso_name); | 559 | dso = dso__new(dso_name); |
538 | if (dso == NULL) | 560 | if (dso == NULL) |
539 | return -1; | 561 | return -1; |
540 | 562 | ||
563 | dso->kernel = self->kernel; | ||
564 | |||
541 | curr_map = map__new2(pos->start, dso, map->type); | 565 | curr_map = map__new2(pos->start, dso, map->type); |
542 | if (curr_map == NULL) { | 566 | if (curr_map == NULL) { |
543 | dso__delete(dso); | 567 | dso__delete(dso); |
@@ -561,6 +585,12 @@ discard_symbol: rb_erase(&pos->rb_node, root); | |||
561 | } | 585 | } |
562 | } | 586 | } |
563 | 587 | ||
588 | if (curr_map != map && | ||
589 | self->kernel == DSO_TYPE_GUEST_KERNEL && | ||
590 | machine__is_default_guest(kmaps->machine)) { | ||
591 | dso__set_loaded(curr_map->dso, curr_map->type); | ||
592 | } | ||
593 | |||
564 | return count; | 594 | return count; |
565 | } | 595 | } |
566 | 596 | ||
@@ -571,7 +601,10 @@ int dso__load_kallsyms(struct dso *self, const char *filename, | |||
571 | return -1; | 601 | return -1; |
572 | 602 | ||
573 | symbols__fixup_end(&self->symbols[map->type]); | 603 | symbols__fixup_end(&self->symbols[map->type]); |
574 | self->origin = DSO__ORIG_KERNEL; | 604 | if (self->kernel == DSO_TYPE_GUEST_KERNEL) |
605 | self->origin = DSO__ORIG_GUEST_KERNEL; | ||
606 | else | ||
607 | self->origin = DSO__ORIG_KERNEL; | ||
575 | 608 | ||
576 | return dso__split_kallsyms(self, map, filter); | 609 | return dso__split_kallsyms(self, map, filter); |
577 | } | 610 | } |
@@ -870,8 +903,8 @@ out_close: | |||
870 | if (err == 0) | 903 | if (err == 0) |
871 | return nr; | 904 | return nr; |
872 | out: | 905 | out: |
873 | pr_warning("%s: problems reading %s PLT info.\n", | 906 | pr_debug("%s: problems reading %s PLT info.\n", |
874 | __func__, self->long_name); | 907 | __func__, self->long_name); |
875 | return 0; | 908 | return 0; |
876 | } | 909 | } |
877 | 910 | ||
@@ -958,7 +991,7 @@ static int dso__load_sym(struct dso *self, struct map *map, const char *name, | |||
958 | nr_syms = shdr.sh_size / shdr.sh_entsize; | 991 | nr_syms = shdr.sh_size / shdr.sh_entsize; |
959 | 992 | ||
960 | memset(&sym, 0, sizeof(sym)); | 993 | memset(&sym, 0, sizeof(sym)); |
961 | if (!self->kernel) { | 994 | if (self->kernel == DSO_TYPE_USER) { |
962 | self->adjust_symbols = (ehdr.e_type == ET_EXEC || | 995 | self->adjust_symbols = (ehdr.e_type == ET_EXEC || |
963 | elf_section_by_name(elf, &ehdr, &shdr, | 996 | elf_section_by_name(elf, &ehdr, &shdr, |
964 | ".gnu.prelink_undo", | 997 | ".gnu.prelink_undo", |
@@ -990,7 +1023,7 @@ static int dso__load_sym(struct dso *self, struct map *map, const char *name, | |||
990 | 1023 | ||
991 | section_name = elf_sec__name(&shdr, secstrs); | 1024 | section_name = elf_sec__name(&shdr, secstrs); |
992 | 1025 | ||
993 | if (self->kernel || kmodule) { | 1026 | if (self->kernel != DSO_TYPE_USER || kmodule) { |
994 | char dso_name[PATH_MAX]; | 1027 | char dso_name[PATH_MAX]; |
995 | 1028 | ||
996 | if (strcmp(section_name, | 1029 | if (strcmp(section_name, |
@@ -1017,6 +1050,7 @@ static int dso__load_sym(struct dso *self, struct map *map, const char *name, | |||
1017 | curr_dso = dso__new(dso_name); | 1050 | curr_dso = dso__new(dso_name); |
1018 | if (curr_dso == NULL) | 1051 | if (curr_dso == NULL) |
1019 | goto out_elf_end; | 1052 | goto out_elf_end; |
1053 | curr_dso->kernel = self->kernel; | ||
1020 | curr_map = map__new2(start, curr_dso, | 1054 | curr_map = map__new2(start, curr_dso, |
1021 | map->type); | 1055 | map->type); |
1022 | if (curr_map == NULL) { | 1056 | if (curr_map == NULL) { |
@@ -1025,9 +1059,9 @@ static int dso__load_sym(struct dso *self, struct map *map, const char *name, | |||
1025 | } | 1059 | } |
1026 | curr_map->map_ip = identity__map_ip; | 1060 | curr_map->map_ip = identity__map_ip; |
1027 | curr_map->unmap_ip = identity__map_ip; | 1061 | curr_map->unmap_ip = identity__map_ip; |
1028 | curr_dso->origin = DSO__ORIG_KERNEL; | 1062 | curr_dso->origin = self->origin; |
1029 | map_groups__insert(kmap->kmaps, curr_map); | 1063 | map_groups__insert(kmap->kmaps, curr_map); |
1030 | dsos__add(&dsos__kernel, curr_dso); | 1064 | dsos__add(&self->node, curr_dso); |
1031 | dso__set_loaded(curr_dso, map->type); | 1065 | dso__set_loaded(curr_dso, map->type); |
1032 | } else | 1066 | } else |
1033 | curr_dso = curr_map->dso; | 1067 | curr_dso = curr_map->dso; |
@@ -1089,7 +1123,7 @@ static bool dso__build_id_equal(const struct dso *self, u8 *build_id) | |||
1089 | return memcmp(self->build_id, build_id, sizeof(self->build_id)) == 0; | 1123 | return memcmp(self->build_id, build_id, sizeof(self->build_id)) == 0; |
1090 | } | 1124 | } |
1091 | 1125 | ||
1092 | static bool __dsos__read_build_ids(struct list_head *head, bool with_hits) | 1126 | bool __dsos__read_build_ids(struct list_head *head, bool with_hits) |
1093 | { | 1127 | { |
1094 | bool have_build_id = false; | 1128 | bool have_build_id = false; |
1095 | struct dso *pos; | 1129 | struct dso *pos; |
@@ -1107,13 +1141,6 @@ static bool __dsos__read_build_ids(struct list_head *head, bool with_hits) | |||
1107 | return have_build_id; | 1141 | return have_build_id; |
1108 | } | 1142 | } |
1109 | 1143 | ||
1110 | bool dsos__read_build_ids(bool with_hits) | ||
1111 | { | ||
1112 | bool kbuildids = __dsos__read_build_ids(&dsos__kernel, with_hits), | ||
1113 | ubuildids = __dsos__read_build_ids(&dsos__user, with_hits); | ||
1114 | return kbuildids || ubuildids; | ||
1115 | } | ||
1116 | |||
1117 | /* | 1144 | /* |
1118 | * Align offset to 4 bytes as needed for note name and descriptor data. | 1145 | * Align offset to 4 bytes as needed for note name and descriptor data. |
1119 | */ | 1146 | */ |
@@ -1248,6 +1275,8 @@ char dso__symtab_origin(const struct dso *self) | |||
1248 | [DSO__ORIG_BUILDID] = 'b', | 1275 | [DSO__ORIG_BUILDID] = 'b', |
1249 | [DSO__ORIG_DSO] = 'd', | 1276 | [DSO__ORIG_DSO] = 'd', |
1250 | [DSO__ORIG_KMODULE] = 'K', | 1277 | [DSO__ORIG_KMODULE] = 'K', |
1278 | [DSO__ORIG_GUEST_KERNEL] = 'g', | ||
1279 | [DSO__ORIG_GUEST_KMODULE] = 'G', | ||
1251 | }; | 1280 | }; |
1252 | 1281 | ||
1253 | if (self == NULL || self->origin == DSO__ORIG_NOT_FOUND) | 1282 | if (self == NULL || self->origin == DSO__ORIG_NOT_FOUND) |
@@ -1263,11 +1292,20 @@ int dso__load(struct dso *self, struct map *map, symbol_filter_t filter) | |||
1263 | char build_id_hex[BUILD_ID_SIZE * 2 + 1]; | 1292 | char build_id_hex[BUILD_ID_SIZE * 2 + 1]; |
1264 | int ret = -1; | 1293 | int ret = -1; |
1265 | int fd; | 1294 | int fd; |
1295 | struct machine *machine; | ||
1296 | const char *root_dir; | ||
1266 | 1297 | ||
1267 | dso__set_loaded(self, map->type); | 1298 | dso__set_loaded(self, map->type); |
1268 | 1299 | ||
1269 | if (self->kernel) | 1300 | if (self->kernel == DSO_TYPE_KERNEL) |
1270 | return dso__load_kernel_sym(self, map, filter); | 1301 | return dso__load_kernel_sym(self, map, filter); |
1302 | else if (self->kernel == DSO_TYPE_GUEST_KERNEL) | ||
1303 | return dso__load_guest_kernel_sym(self, map, filter); | ||
1304 | |||
1305 | if (map->groups && map->groups->machine) | ||
1306 | machine = map->groups->machine; | ||
1307 | else | ||
1308 | machine = NULL; | ||
1271 | 1309 | ||
1272 | name = malloc(size); | 1310 | name = malloc(size); |
1273 | if (!name) | 1311 | if (!name) |
@@ -1321,6 +1359,13 @@ more: | |||
1321 | case DSO__ORIG_DSO: | 1359 | case DSO__ORIG_DSO: |
1322 | snprintf(name, size, "%s", self->long_name); | 1360 | snprintf(name, size, "%s", self->long_name); |
1323 | break; | 1361 | break; |
1362 | case DSO__ORIG_GUEST_KMODULE: | ||
1363 | if (map->groups && map->groups->machine) | ||
1364 | root_dir = map->groups->machine->root_dir; | ||
1365 | else | ||
1366 | root_dir = ""; | ||
1367 | snprintf(name, size, "%s%s", root_dir, self->long_name); | ||
1368 | break; | ||
1324 | 1369 | ||
1325 | default: | 1370 | default: |
1326 | goto out; | 1371 | goto out; |
@@ -1374,7 +1419,8 @@ struct map *map_groups__find_by_name(struct map_groups *self, | |||
1374 | return NULL; | 1419 | return NULL; |
1375 | } | 1420 | } |
1376 | 1421 | ||
1377 | static int dso__kernel_module_get_build_id(struct dso *self) | 1422 | static int dso__kernel_module_get_build_id(struct dso *self, |
1423 | const char *root_dir) | ||
1378 | { | 1424 | { |
1379 | char filename[PATH_MAX]; | 1425 | char filename[PATH_MAX]; |
1380 | /* | 1426 | /* |
@@ -1384,8 +1430,8 @@ static int dso__kernel_module_get_build_id(struct dso *self) | |||
1384 | const char *name = self->short_name + 1; | 1430 | const char *name = self->short_name + 1; |
1385 | 1431 | ||
1386 | snprintf(filename, sizeof(filename), | 1432 | snprintf(filename, sizeof(filename), |
1387 | "/sys/module/%.*s/notes/.note.gnu.build-id", | 1433 | "%s/sys/module/%.*s/notes/.note.gnu.build-id", |
1388 | (int)strlen(name - 1), name); | 1434 | root_dir, (int)strlen(name) - 1, name); |
1389 | 1435 | ||
1390 | if (sysfs__read_build_id(filename, self->build_id, | 1436 | if (sysfs__read_build_id(filename, self->build_id, |
1391 | sizeof(self->build_id)) == 0) | 1437 | sizeof(self->build_id)) == 0) |
@@ -1394,26 +1440,33 @@ static int dso__kernel_module_get_build_id(struct dso *self) | |||
1394 | return 0; | 1440 | return 0; |
1395 | } | 1441 | } |
1396 | 1442 | ||
1397 | static int map_groups__set_modules_path_dir(struct map_groups *self, char *dirname) | 1443 | static int map_groups__set_modules_path_dir(struct map_groups *self, |
1444 | const char *dir_name) | ||
1398 | { | 1445 | { |
1399 | struct dirent *dent; | 1446 | struct dirent *dent; |
1400 | DIR *dir = opendir(dirname); | 1447 | DIR *dir = opendir(dir_name); |
1401 | 1448 | ||
1402 | if (!dir) { | 1449 | if (!dir) { |
1403 | pr_debug("%s: cannot open %s dir\n", __func__, dirname); | 1450 | pr_debug("%s: cannot open %s dir\n", __func__, dir_name); |
1404 | return -1; | 1451 | return -1; |
1405 | } | 1452 | } |
1406 | 1453 | ||
1407 | while ((dent = readdir(dir)) != NULL) { | 1454 | while ((dent = readdir(dir)) != NULL) { |
1408 | char path[PATH_MAX]; | 1455 | char path[PATH_MAX]; |
1456 | struct stat st; | ||
1409 | 1457 | ||
1410 | if (dent->d_type == DT_DIR) { | 1458 | /*sshfs might return bad dent->d_type, so we have to stat*/ |
1459 | sprintf(path, "%s/%s", dir_name, dent->d_name); | ||
1460 | if (stat(path, &st)) | ||
1461 | continue; | ||
1462 | |||
1463 | if (S_ISDIR(st.st_mode)) { | ||
1411 | if (!strcmp(dent->d_name, ".") || | 1464 | if (!strcmp(dent->d_name, ".") || |
1412 | !strcmp(dent->d_name, "..")) | 1465 | !strcmp(dent->d_name, "..")) |
1413 | continue; | 1466 | continue; |
1414 | 1467 | ||
1415 | snprintf(path, sizeof(path), "%s/%s", | 1468 | snprintf(path, sizeof(path), "%s/%s", |
1416 | dirname, dent->d_name); | 1469 | dir_name, dent->d_name); |
1417 | if (map_groups__set_modules_path_dir(self, path) < 0) | 1470 | if (map_groups__set_modules_path_dir(self, path) < 0) |
1418 | goto failure; | 1471 | goto failure; |
1419 | } else { | 1472 | } else { |
@@ -1433,13 +1486,13 @@ static int map_groups__set_modules_path_dir(struct map_groups *self, char *dirna | |||
1433 | continue; | 1486 | continue; |
1434 | 1487 | ||
1435 | snprintf(path, sizeof(path), "%s/%s", | 1488 | snprintf(path, sizeof(path), "%s/%s", |
1436 | dirname, dent->d_name); | 1489 | dir_name, dent->d_name); |
1437 | 1490 | ||
1438 | long_name = strdup(path); | 1491 | long_name = strdup(path); |
1439 | if (long_name == NULL) | 1492 | if (long_name == NULL) |
1440 | goto failure; | 1493 | goto failure; |
1441 | dso__set_long_name(map->dso, long_name); | 1494 | dso__set_long_name(map->dso, long_name); |
1442 | dso__kernel_module_get_build_id(map->dso); | 1495 | dso__kernel_module_get_build_id(map->dso, ""); |
1443 | } | 1496 | } |
1444 | } | 1497 | } |
1445 | 1498 | ||
@@ -1449,18 +1502,47 @@ failure: | |||
1449 | return -1; | 1502 | return -1; |
1450 | } | 1503 | } |
1451 | 1504 | ||
1452 | static int map_groups__set_modules_path(struct map_groups *self) | 1505 | static char *get_kernel_version(const char *root_dir) |
1453 | { | 1506 | { |
1454 | struct utsname uts; | 1507 | char version[PATH_MAX]; |
1508 | FILE *file; | ||
1509 | char *name, *tmp; | ||
1510 | const char *prefix = "Linux version "; | ||
1511 | |||
1512 | sprintf(version, "%s/proc/version", root_dir); | ||
1513 | file = fopen(version, "r"); | ||
1514 | if (!file) | ||
1515 | return NULL; | ||
1516 | |||
1517 | version[0] = '\0'; | ||
1518 | tmp = fgets(version, sizeof(version), file); | ||
1519 | fclose(file); | ||
1520 | |||
1521 | name = strstr(version, prefix); | ||
1522 | if (!name) | ||
1523 | return NULL; | ||
1524 | name += strlen(prefix); | ||
1525 | tmp = strchr(name, ' '); | ||
1526 | if (tmp) | ||
1527 | *tmp = '\0'; | ||
1528 | |||
1529 | return strdup(name); | ||
1530 | } | ||
1531 | |||
1532 | static int machine__set_modules_path(struct machine *self) | ||
1533 | { | ||
1534 | char *version; | ||
1455 | char modules_path[PATH_MAX]; | 1535 | char modules_path[PATH_MAX]; |
1456 | 1536 | ||
1457 | if (uname(&uts) < 0) | 1537 | version = get_kernel_version(self->root_dir); |
1538 | if (!version) | ||
1458 | return -1; | 1539 | return -1; |
1459 | 1540 | ||
1460 | snprintf(modules_path, sizeof(modules_path), "/lib/modules/%s/kernel", | 1541 | snprintf(modules_path, sizeof(modules_path), "%s/lib/modules/%s/kernel", |
1461 | uts.release); | 1542 | self->root_dir, version); |
1543 | free(version); | ||
1462 | 1544 | ||
1463 | return map_groups__set_modules_path_dir(self, modules_path); | 1545 | return map_groups__set_modules_path_dir(&self->kmaps, modules_path); |
1464 | } | 1546 | } |
1465 | 1547 | ||
1466 | /* | 1548 | /* |
@@ -1470,8 +1552,8 @@ static int map_groups__set_modules_path(struct map_groups *self) | |||
1470 | */ | 1552 | */ |
1471 | static struct map *map__new2(u64 start, struct dso *dso, enum map_type type) | 1553 | static struct map *map__new2(u64 start, struct dso *dso, enum map_type type) |
1472 | { | 1554 | { |
1473 | struct map *self = zalloc(sizeof(*self) + | 1555 | struct map *self = calloc(1, (sizeof(*self) + |
1474 | (dso->kernel ? sizeof(struct kmap) : 0)); | 1556 | (dso->kernel ? sizeof(struct kmap) : 0))); |
1475 | if (self != NULL) { | 1557 | if (self != NULL) { |
1476 | /* | 1558 | /* |
1477 | * ->end will be filled after we load all the symbols | 1559 | * ->end will be filled after we load all the symbols |
@@ -1482,11 +1564,11 @@ static struct map *map__new2(u64 start, struct dso *dso, enum map_type type) | |||
1482 | return self; | 1564 | return self; |
1483 | } | 1565 | } |
1484 | 1566 | ||
1485 | struct map *map_groups__new_module(struct map_groups *self, u64 start, | 1567 | struct map *machine__new_module(struct machine *self, u64 start, |
1486 | const char *filename) | 1568 | const char *filename) |
1487 | { | 1569 | { |
1488 | struct map *map; | 1570 | struct map *map; |
1489 | struct dso *dso = __dsos__findnew(&dsos__kernel, filename); | 1571 | struct dso *dso = __dsos__findnew(&self->kernel_dsos, filename); |
1490 | 1572 | ||
1491 | if (dso == NULL) | 1573 | if (dso == NULL) |
1492 | return NULL; | 1574 | return NULL; |
@@ -1495,18 +1577,31 @@ struct map *map_groups__new_module(struct map_groups *self, u64 start, | |||
1495 | if (map == NULL) | 1577 | if (map == NULL) |
1496 | return NULL; | 1578 | return NULL; |
1497 | 1579 | ||
1498 | dso->origin = DSO__ORIG_KMODULE; | 1580 | if (machine__is_host(self)) |
1499 | map_groups__insert(self, map); | 1581 | dso->origin = DSO__ORIG_KMODULE; |
1582 | else | ||
1583 | dso->origin = DSO__ORIG_GUEST_KMODULE; | ||
1584 | map_groups__insert(&self->kmaps, map); | ||
1500 | return map; | 1585 | return map; |
1501 | } | 1586 | } |
1502 | 1587 | ||
1503 | static int map_groups__create_modules(struct map_groups *self) | 1588 | static int machine__create_modules(struct machine *self) |
1504 | { | 1589 | { |
1505 | char *line = NULL; | 1590 | char *line = NULL; |
1506 | size_t n; | 1591 | size_t n; |
1507 | FILE *file = fopen("/proc/modules", "r"); | 1592 | FILE *file; |
1508 | struct map *map; | 1593 | struct map *map; |
1594 | const char *modules; | ||
1595 | char path[PATH_MAX]; | ||
1596 | |||
1597 | if (machine__is_default_guest(self)) | ||
1598 | modules = symbol_conf.default_guest_modules; | ||
1599 | else { | ||
1600 | sprintf(path, "%s/proc/modules", self->root_dir); | ||
1601 | modules = path; | ||
1602 | } | ||
1509 | 1603 | ||
1604 | file = fopen(modules, "r"); | ||
1510 | if (file == NULL) | 1605 | if (file == NULL) |
1511 | return -1; | 1606 | return -1; |
1512 | 1607 | ||
@@ -1538,16 +1633,16 @@ static int map_groups__create_modules(struct map_groups *self) | |||
1538 | *sep = '\0'; | 1633 | *sep = '\0'; |
1539 | 1634 | ||
1540 | snprintf(name, sizeof(name), "[%s]", line); | 1635 | snprintf(name, sizeof(name), "[%s]", line); |
1541 | map = map_groups__new_module(self, start, name); | 1636 | map = machine__new_module(self, start, name); |
1542 | if (map == NULL) | 1637 | if (map == NULL) |
1543 | goto out_delete_line; | 1638 | goto out_delete_line; |
1544 | dso__kernel_module_get_build_id(map->dso); | 1639 | dso__kernel_module_get_build_id(map->dso, self->root_dir); |
1545 | } | 1640 | } |
1546 | 1641 | ||
1547 | free(line); | 1642 | free(line); |
1548 | fclose(file); | 1643 | fclose(file); |
1549 | 1644 | ||
1550 | return map_groups__set_modules_path(self); | 1645 | return machine__set_modules_path(self); |
1551 | 1646 | ||
1552 | out_delete_line: | 1647 | out_delete_line: |
1553 | free(line); | 1648 | free(line); |
@@ -1714,8 +1809,56 @@ out_fixup: | |||
1714 | return err; | 1809 | return err; |
1715 | } | 1810 | } |
1716 | 1811 | ||
1717 | LIST_HEAD(dsos__user); | 1812 | static int dso__load_guest_kernel_sym(struct dso *self, struct map *map, |
1718 | LIST_HEAD(dsos__kernel); | 1813 | symbol_filter_t filter) |
1814 | { | ||
1815 | int err; | ||
1816 | const char *kallsyms_filename = NULL; | ||
1817 | struct machine *machine; | ||
1818 | char path[PATH_MAX]; | ||
1819 | |||
1820 | if (!map->groups) { | ||
1821 | pr_debug("Guest kernel map hasn't the point to groups\n"); | ||
1822 | return -1; | ||
1823 | } | ||
1824 | machine = map->groups->machine; | ||
1825 | |||
1826 | if (machine__is_default_guest(machine)) { | ||
1827 | /* | ||
1828 | * if the user specified a vmlinux filename, use it and only | ||
1829 | * it, reporting errors to the user if it cannot be used. | ||
1830 | * Or use file guest_kallsyms inputted by user on commandline | ||
1831 | */ | ||
1832 | if (symbol_conf.default_guest_vmlinux_name != NULL) { | ||
1833 | err = dso__load_vmlinux(self, map, | ||
1834 | symbol_conf.default_guest_vmlinux_name, filter); | ||
1835 | goto out_try_fixup; | ||
1836 | } | ||
1837 | |||
1838 | kallsyms_filename = symbol_conf.default_guest_kallsyms; | ||
1839 | if (!kallsyms_filename) | ||
1840 | return -1; | ||
1841 | } else { | ||
1842 | sprintf(path, "%s/proc/kallsyms", machine->root_dir); | ||
1843 | kallsyms_filename = path; | ||
1844 | } | ||
1845 | |||
1846 | err = dso__load_kallsyms(self, kallsyms_filename, map, filter); | ||
1847 | if (err > 0) | ||
1848 | pr_debug("Using %s for symbols\n", kallsyms_filename); | ||
1849 | |||
1850 | out_try_fixup: | ||
1851 | if (err > 0) { | ||
1852 | if (kallsyms_filename != NULL) { | ||
1853 | machine__mmap_name(machine, path, sizeof(path)); | ||
1854 | dso__set_long_name(self, strdup(path)); | ||
1855 | } | ||
1856 | map__fixup_start(map); | ||
1857 | map__fixup_end(map); | ||
1858 | } | ||
1859 | |||
1860 | return err; | ||
1861 | } | ||
1719 | 1862 | ||
1720 | static void dsos__add(struct list_head *head, struct dso *dso) | 1863 | static void dsos__add(struct list_head *head, struct dso *dso) |
1721 | { | 1864 | { |
@@ -1747,21 +1890,32 @@ struct dso *__dsos__findnew(struct list_head *head, const char *name) | |||
1747 | return dso; | 1890 | return dso; |
1748 | } | 1891 | } |
1749 | 1892 | ||
1750 | static void __dsos__fprintf(struct list_head *head, FILE *fp) | 1893 | size_t __dsos__fprintf(struct list_head *head, FILE *fp) |
1751 | { | 1894 | { |
1752 | struct dso *pos; | 1895 | struct dso *pos; |
1896 | size_t ret = 0; | ||
1753 | 1897 | ||
1754 | list_for_each_entry(pos, head, node) { | 1898 | list_for_each_entry(pos, head, node) { |
1755 | int i; | 1899 | int i; |
1756 | for (i = 0; i < MAP__NR_TYPES; ++i) | 1900 | for (i = 0; i < MAP__NR_TYPES; ++i) |
1757 | dso__fprintf(pos, i, fp); | 1901 | ret += dso__fprintf(pos, i, fp); |
1758 | } | 1902 | } |
1903 | |||
1904 | return ret; | ||
1759 | } | 1905 | } |
1760 | 1906 | ||
1761 | void dsos__fprintf(FILE *fp) | 1907 | size_t machines__fprintf_dsos(struct rb_root *self, FILE *fp) |
1762 | { | 1908 | { |
1763 | __dsos__fprintf(&dsos__kernel, fp); | 1909 | struct rb_node *nd; |
1764 | __dsos__fprintf(&dsos__user, fp); | 1910 | size_t ret = 0; |
1911 | |||
1912 | for (nd = rb_first(self); nd; nd = rb_next(nd)) { | ||
1913 | struct machine *pos = rb_entry(nd, struct machine, rb_node); | ||
1914 | ret += __dsos__fprintf(&pos->kernel_dsos, fp); | ||
1915 | ret += __dsos__fprintf(&pos->user_dsos, fp); | ||
1916 | } | ||
1917 | |||
1918 | return ret; | ||
1765 | } | 1919 | } |
1766 | 1920 | ||
1767 | static size_t __dsos__fprintf_buildid(struct list_head *head, FILE *fp, | 1921 | static size_t __dsos__fprintf_buildid(struct list_head *head, FILE *fp, |
@@ -1779,10 +1933,17 @@ static size_t __dsos__fprintf_buildid(struct list_head *head, FILE *fp, | |||
1779 | return ret; | 1933 | return ret; |
1780 | } | 1934 | } |
1781 | 1935 | ||
1782 | size_t dsos__fprintf_buildid(FILE *fp, bool with_hits) | 1936 | size_t machines__fprintf_dsos_buildid(struct rb_root *self, FILE *fp, bool with_hits) |
1783 | { | 1937 | { |
1784 | return (__dsos__fprintf_buildid(&dsos__kernel, fp, with_hits) + | 1938 | struct rb_node *nd; |
1785 | __dsos__fprintf_buildid(&dsos__user, fp, with_hits)); | 1939 | size_t ret = 0; |
1940 | |||
1941 | for (nd = rb_first(self); nd; nd = rb_next(nd)) { | ||
1942 | struct machine *pos = rb_entry(nd, struct machine, rb_node); | ||
1943 | ret += __dsos__fprintf_buildid(&pos->kernel_dsos, fp, with_hits); | ||
1944 | ret += __dsos__fprintf_buildid(&pos->user_dsos, fp, with_hits); | ||
1945 | } | ||
1946 | return ret; | ||
1786 | } | 1947 | } |
1787 | 1948 | ||
1788 | struct dso *dso__new_kernel(const char *name) | 1949 | struct dso *dso__new_kernel(const char *name) |
@@ -1791,55 +1952,98 @@ struct dso *dso__new_kernel(const char *name) | |||
1791 | 1952 | ||
1792 | if (self != NULL) { | 1953 | if (self != NULL) { |
1793 | dso__set_short_name(self, "[kernel]"); | 1954 | dso__set_short_name(self, "[kernel]"); |
1794 | self->kernel = 1; | 1955 | self->kernel = DSO_TYPE_KERNEL; |
1795 | } | 1956 | } |
1796 | 1957 | ||
1797 | return self; | 1958 | return self; |
1798 | } | 1959 | } |
1799 | 1960 | ||
1800 | void dso__read_running_kernel_build_id(struct dso *self) | 1961 | static struct dso *dso__new_guest_kernel(struct machine *machine, |
1962 | const char *name) | ||
1801 | { | 1963 | { |
1802 | if (sysfs__read_build_id("/sys/kernel/notes", self->build_id, | 1964 | char bf[PATH_MAX]; |
1965 | struct dso *self = dso__new(name ?: machine__mmap_name(machine, bf, sizeof(bf))); | ||
1966 | |||
1967 | if (self != NULL) { | ||
1968 | dso__set_short_name(self, "[guest.kernel]"); | ||
1969 | self->kernel = DSO_TYPE_GUEST_KERNEL; | ||
1970 | } | ||
1971 | |||
1972 | return self; | ||
1973 | } | ||
1974 | |||
1975 | void dso__read_running_kernel_build_id(struct dso *self, struct machine *machine) | ||
1976 | { | ||
1977 | char path[PATH_MAX]; | ||
1978 | |||
1979 | if (machine__is_default_guest(machine)) | ||
1980 | return; | ||
1981 | sprintf(path, "%s/sys/kernel/notes", machine->root_dir); | ||
1982 | if (sysfs__read_build_id(path, self->build_id, | ||
1803 | sizeof(self->build_id)) == 0) | 1983 | sizeof(self->build_id)) == 0) |
1804 | self->has_build_id = true; | 1984 | self->has_build_id = true; |
1805 | } | 1985 | } |
1806 | 1986 | ||
1807 | static struct dso *dsos__create_kernel(const char *vmlinux) | 1987 | static struct dso *machine__create_kernel(struct machine *self) |
1808 | { | 1988 | { |
1809 | struct dso *kernel = dso__new_kernel(vmlinux); | 1989 | const char *vmlinux_name = NULL; |
1990 | struct dso *kernel; | ||
1810 | 1991 | ||
1811 | if (kernel != NULL) { | 1992 | if (machine__is_host(self)) { |
1812 | dso__read_running_kernel_build_id(kernel); | 1993 | vmlinux_name = symbol_conf.vmlinux_name; |
1813 | dsos__add(&dsos__kernel, kernel); | 1994 | kernel = dso__new_kernel(vmlinux_name); |
1995 | } else { | ||
1996 | if (machine__is_default_guest(self)) | ||
1997 | vmlinux_name = symbol_conf.default_guest_vmlinux_name; | ||
1998 | kernel = dso__new_guest_kernel(self, vmlinux_name); | ||
1814 | } | 1999 | } |
1815 | 2000 | ||
2001 | if (kernel != NULL) { | ||
2002 | dso__read_running_kernel_build_id(kernel, self); | ||
2003 | dsos__add(&self->kernel_dsos, kernel); | ||
2004 | } | ||
1816 | return kernel; | 2005 | return kernel; |
1817 | } | 2006 | } |
1818 | 2007 | ||
1819 | int __map_groups__create_kernel_maps(struct map_groups *self, | 2008 | int __machine__create_kernel_maps(struct machine *self, struct dso *kernel) |
1820 | struct map *vmlinux_maps[MAP__NR_TYPES], | ||
1821 | struct dso *kernel) | ||
1822 | { | 2009 | { |
1823 | enum map_type type; | 2010 | enum map_type type; |
1824 | 2011 | ||
1825 | for (type = 0; type < MAP__NR_TYPES; ++type) { | 2012 | for (type = 0; type < MAP__NR_TYPES; ++type) { |
1826 | struct kmap *kmap; | 2013 | struct kmap *kmap; |
1827 | 2014 | ||
1828 | vmlinux_maps[type] = map__new2(0, kernel, type); | 2015 | self->vmlinux_maps[type] = map__new2(0, kernel, type); |
1829 | if (vmlinux_maps[type] == NULL) | 2016 | if (self->vmlinux_maps[type] == NULL) |
1830 | return -1; | 2017 | return -1; |
1831 | 2018 | ||
1832 | vmlinux_maps[type]->map_ip = | 2019 | self->vmlinux_maps[type]->map_ip = |
1833 | vmlinux_maps[type]->unmap_ip = identity__map_ip; | 2020 | self->vmlinux_maps[type]->unmap_ip = identity__map_ip; |
1834 | 2021 | ||
1835 | kmap = map__kmap(vmlinux_maps[type]); | 2022 | kmap = map__kmap(self->vmlinux_maps[type]); |
1836 | kmap->kmaps = self; | 2023 | kmap->kmaps = &self->kmaps; |
1837 | map_groups__insert(self, vmlinux_maps[type]); | 2024 | map_groups__insert(&self->kmaps, self->vmlinux_maps[type]); |
1838 | } | 2025 | } |
1839 | 2026 | ||
1840 | return 0; | 2027 | return 0; |
1841 | } | 2028 | } |
1842 | 2029 | ||
2030 | int machine__create_kernel_maps(struct machine *self) | ||
2031 | { | ||
2032 | struct dso *kernel = machine__create_kernel(self); | ||
2033 | |||
2034 | if (kernel == NULL || | ||
2035 | __machine__create_kernel_maps(self, kernel) < 0) | ||
2036 | return -1; | ||
2037 | |||
2038 | if (symbol_conf.use_modules && machine__create_modules(self) < 0) | ||
2039 | pr_debug("Problems creating module maps, continuing anyway...\n"); | ||
2040 | /* | ||
2041 | * Now that we have all the maps created, just set the ->end of them: | ||
2042 | */ | ||
2043 | map_groups__fixup_end(&self->kmaps); | ||
2044 | return 0; | ||
2045 | } | ||
2046 | |||
1843 | static void vmlinux_path__exit(void) | 2047 | static void vmlinux_path__exit(void) |
1844 | { | 2048 | { |
1845 | while (--vmlinux_path__nr_entries >= 0) { | 2049 | while (--vmlinux_path__nr_entries >= 0) { |
@@ -1895,6 +2099,17 @@ out_fail: | |||
1895 | return -1; | 2099 | return -1; |
1896 | } | 2100 | } |
1897 | 2101 | ||
2102 | size_t vmlinux_path__fprintf(FILE *fp) | ||
2103 | { | ||
2104 | int i; | ||
2105 | size_t printed = 0; | ||
2106 | |||
2107 | for (i = 0; i < vmlinux_path__nr_entries; ++i) | ||
2108 | printed += fprintf(fp, "[%d] %s\n", i, vmlinux_path[i]); | ||
2109 | |||
2110 | return printed; | ||
2111 | } | ||
2112 | |||
1898 | static int setup_list(struct strlist **list, const char *list_str, | 2113 | static int setup_list(struct strlist **list, const char *list_str, |
1899 | const char *list_name) | 2114 | const char *list_name) |
1900 | { | 2115 | { |
@@ -1945,22 +2160,129 @@ out_free_comm_list: | |||
1945 | return -1; | 2160 | return -1; |
1946 | } | 2161 | } |
1947 | 2162 | ||
1948 | int map_groups__create_kernel_maps(struct map_groups *self, | 2163 | int machines__create_kernel_maps(struct rb_root *self, pid_t pid) |
1949 | struct map *vmlinux_maps[MAP__NR_TYPES]) | ||
1950 | { | 2164 | { |
1951 | struct dso *kernel = dsos__create_kernel(symbol_conf.vmlinux_name); | 2165 | struct machine *machine = machines__findnew(self, pid); |
1952 | 2166 | ||
1953 | if (kernel == NULL) | 2167 | if (machine == NULL) |
1954 | return -1; | 2168 | return -1; |
1955 | 2169 | ||
1956 | if (__map_groups__create_kernel_maps(self, vmlinux_maps, kernel) < 0) | 2170 | return machine__create_kernel_maps(machine); |
1957 | return -1; | 2171 | } |
1958 | 2172 | ||
1959 | if (symbol_conf.use_modules && map_groups__create_modules(self) < 0) | 2173 | static int hex(char ch) |
1960 | pr_debug("Problems creating module maps, continuing anyway...\n"); | 2174 | { |
1961 | /* | 2175 | if ((ch >= '0') && (ch <= '9')) |
1962 | * Now that we have all the maps created, just set the ->end of them: | 2176 | return ch - '0'; |
1963 | */ | 2177 | if ((ch >= 'a') && (ch <= 'f')) |
1964 | map_groups__fixup_end(self); | 2178 | return ch - 'a' + 10; |
1965 | return 0; | 2179 | if ((ch >= 'A') && (ch <= 'F')) |
2180 | return ch - 'A' + 10; | ||
2181 | return -1; | ||
2182 | } | ||
2183 | |||
2184 | /* | ||
2185 | * While we find nice hex chars, build a long_val. | ||
2186 | * Return number of chars processed. | ||
2187 | */ | ||
2188 | int hex2u64(const char *ptr, u64 *long_val) | ||
2189 | { | ||
2190 | const char *p = ptr; | ||
2191 | *long_val = 0; | ||
2192 | |||
2193 | while (*p) { | ||
2194 | const int hex_val = hex(*p); | ||
2195 | |||
2196 | if (hex_val < 0) | ||
2197 | break; | ||
2198 | |||
2199 | *long_val = (*long_val << 4) | hex_val; | ||
2200 | p++; | ||
2201 | } | ||
2202 | |||
2203 | return p - ptr; | ||
2204 | } | ||
2205 | |||
2206 | char *strxfrchar(char *s, char from, char to) | ||
2207 | { | ||
2208 | char *p = s; | ||
2209 | |||
2210 | while ((p = strchr(p, from)) != NULL) | ||
2211 | *p++ = to; | ||
2212 | |||
2213 | return s; | ||
2214 | } | ||
2215 | |||
2216 | int machines__create_guest_kernel_maps(struct rb_root *self) | ||
2217 | { | ||
2218 | int ret = 0; | ||
2219 | struct dirent **namelist = NULL; | ||
2220 | int i, items = 0; | ||
2221 | char path[PATH_MAX]; | ||
2222 | pid_t pid; | ||
2223 | |||
2224 | if (symbol_conf.default_guest_vmlinux_name || | ||
2225 | symbol_conf.default_guest_modules || | ||
2226 | symbol_conf.default_guest_kallsyms) { | ||
2227 | machines__create_kernel_maps(self, DEFAULT_GUEST_KERNEL_ID); | ||
2228 | } | ||
2229 | |||
2230 | if (symbol_conf.guestmount) { | ||
2231 | items = scandir(symbol_conf.guestmount, &namelist, NULL, NULL); | ||
2232 | if (items <= 0) | ||
2233 | return -ENOENT; | ||
2234 | for (i = 0; i < items; i++) { | ||
2235 | if (!isdigit(namelist[i]->d_name[0])) { | ||
2236 | /* Filter out . and .. */ | ||
2237 | continue; | ||
2238 | } | ||
2239 | pid = atoi(namelist[i]->d_name); | ||
2240 | sprintf(path, "%s/%s/proc/kallsyms", | ||
2241 | symbol_conf.guestmount, | ||
2242 | namelist[i]->d_name); | ||
2243 | ret = access(path, R_OK); | ||
2244 | if (ret) { | ||
2245 | pr_debug("Can't access file %s\n", path); | ||
2246 | goto failure; | ||
2247 | } | ||
2248 | machines__create_kernel_maps(self, pid); | ||
2249 | } | ||
2250 | failure: | ||
2251 | free(namelist); | ||
2252 | } | ||
2253 | |||
2254 | return ret; | ||
2255 | } | ||
2256 | |||
2257 | int machine__load_kallsyms(struct machine *self, const char *filename, | ||
2258 | enum map_type type, symbol_filter_t filter) | ||
2259 | { | ||
2260 | struct map *map = self->vmlinux_maps[type]; | ||
2261 | int ret = dso__load_kallsyms(map->dso, filename, map, filter); | ||
2262 | |||
2263 | if (ret > 0) { | ||
2264 | dso__set_loaded(map->dso, type); | ||
2265 | /* | ||
2266 | * Since /proc/kallsyms will have multiple sessions for the | ||
2267 | * kernel, with modules between them, fixup the end of all | ||
2268 | * sections. | ||
2269 | */ | ||
2270 | __map_groups__fixup_end(&self->kmaps, type); | ||
2271 | } | ||
2272 | |||
2273 | return ret; | ||
2274 | } | ||
2275 | |||
2276 | int machine__load_vmlinux_path(struct machine *self, enum map_type type, | ||
2277 | symbol_filter_t filter) | ||
2278 | { | ||
2279 | struct map *map = self->vmlinux_maps[type]; | ||
2280 | int ret = dso__load_vmlinux_path(map->dso, map, filter); | ||
2281 | |||
2282 | if (ret > 0) { | ||
2283 | dso__set_loaded(map->dso, type); | ||
2284 | map__reloc_vmlinux(map); | ||
2285 | } | ||
2286 | |||
2287 | return ret; | ||
1966 | } | 2288 | } |
diff --git a/tools/perf/util/symbol.h b/tools/perf/util/symbol.h index f30a37428919..6389d1acaf81 100644 --- a/tools/perf/util/symbol.h +++ b/tools/perf/util/symbol.h | |||
@@ -3,10 +3,11 @@ | |||
3 | 3 | ||
4 | #include <linux/types.h> | 4 | #include <linux/types.h> |
5 | #include <stdbool.h> | 5 | #include <stdbool.h> |
6 | #include "types.h" | 6 | #include <stdint.h> |
7 | #include "map.h" | ||
7 | #include <linux/list.h> | 8 | #include <linux/list.h> |
8 | #include <linux/rbtree.h> | 9 | #include <linux/rbtree.h> |
9 | #include "event.h" | 10 | #include <stdio.h> |
10 | 11 | ||
11 | #define DEBUG_CACHE_DIR ".debug" | 12 | #define DEBUG_CACHE_DIR ".debug" |
12 | 13 | ||
@@ -29,6 +30,9 @@ static inline char *bfd_demangle(void __used *v, const char __used *c, | |||
29 | #endif | 30 | #endif |
30 | #endif | 31 | #endif |
31 | 32 | ||
33 | int hex2u64(const char *ptr, u64 *val); | ||
34 | char *strxfrchar(char *s, char from, char to); | ||
35 | |||
32 | /* | 36 | /* |
33 | * libelf 0.8.x and earlier do not support ELF_C_READ_MMAP; | 37 | * libelf 0.8.x and earlier do not support ELF_C_READ_MMAP; |
34 | * for newer versions we can use mmap to reduce memory usage: | 38 | * for newer versions we can use mmap to reduce memory usage: |
@@ -44,10 +48,13 @@ static inline char *bfd_demangle(void __used *v, const char __used *c, | |||
44 | #define DMGL_ANSI (1 << 1) /* Include const, volatile, etc */ | 48 | #define DMGL_ANSI (1 << 1) /* Include const, volatile, etc */ |
45 | #endif | 49 | #endif |
46 | 50 | ||
51 | #define BUILD_ID_SIZE 20 | ||
52 | |||
47 | struct symbol { | 53 | struct symbol { |
48 | struct rb_node rb_node; | 54 | struct rb_node rb_node; |
49 | u64 start; | 55 | u64 start; |
50 | u64 end; | 56 | u64 end; |
57 | u16 namelen; | ||
51 | char name[0]; | 58 | char name[0]; |
52 | }; | 59 | }; |
53 | 60 | ||
@@ -63,10 +70,15 @@ struct symbol_conf { | |||
63 | show_nr_samples, | 70 | show_nr_samples, |
64 | use_callchain, | 71 | use_callchain, |
65 | exclude_other, | 72 | exclude_other, |
66 | full_paths; | 73 | full_paths, |
74 | show_cpu_utilization; | ||
67 | const char *vmlinux_name, | 75 | const char *vmlinux_name, |
68 | *field_sep; | 76 | *field_sep; |
69 | char *dso_list_str, | 77 | const char *default_guest_vmlinux_name, |
78 | *default_guest_kallsyms, | ||
79 | *default_guest_modules; | ||
80 | const char *guestmount; | ||
81 | char *dso_list_str, | ||
70 | *comm_list_str, | 82 | *comm_list_str, |
71 | *sym_list_str, | 83 | *sym_list_str, |
72 | *col_width_list_str; | 84 | *col_width_list_str; |
@@ -88,6 +100,11 @@ struct ref_reloc_sym { | |||
88 | u64 unrelocated_addr; | 100 | u64 unrelocated_addr; |
89 | }; | 101 | }; |
90 | 102 | ||
103 | struct map_symbol { | ||
104 | struct map *map; | ||
105 | struct symbol *sym; | ||
106 | }; | ||
107 | |||
91 | struct addr_location { | 108 | struct addr_location { |
92 | struct thread *thread; | 109 | struct thread *thread; |
93 | struct map *map; | 110 | struct map *map; |
@@ -95,6 +112,13 @@ struct addr_location { | |||
95 | u64 addr; | 112 | u64 addr; |
96 | char level; | 113 | char level; |
97 | bool filtered; | 114 | bool filtered; |
115 | unsigned int cpumode; | ||
116 | }; | ||
117 | |||
118 | enum dso_kernel_type { | ||
119 | DSO_TYPE_USER = 0, | ||
120 | DSO_TYPE_KERNEL, | ||
121 | DSO_TYPE_GUEST_KERNEL | ||
98 | }; | 122 | }; |
99 | 123 | ||
100 | struct dso { | 124 | struct dso { |
@@ -104,8 +128,9 @@ struct dso { | |||
104 | u8 adjust_symbols:1; | 128 | u8 adjust_symbols:1; |
105 | u8 slen_calculated:1; | 129 | u8 slen_calculated:1; |
106 | u8 has_build_id:1; | 130 | u8 has_build_id:1; |
107 | u8 kernel:1; | 131 | enum dso_kernel_type kernel; |
108 | u8 hit:1; | 132 | u8 hit:1; |
133 | u8 annotate_warned:1; | ||
109 | unsigned char origin; | 134 | unsigned char origin; |
110 | u8 sorted_by_name; | 135 | u8 sorted_by_name; |
111 | u8 loaded; | 136 | u8 loaded; |
@@ -131,42 +156,65 @@ static inline void dso__set_loaded(struct dso *self, enum map_type type) | |||
131 | 156 | ||
132 | void dso__sort_by_name(struct dso *self, enum map_type type); | 157 | void dso__sort_by_name(struct dso *self, enum map_type type); |
133 | 158 | ||
134 | extern struct list_head dsos__user, dsos__kernel; | ||
135 | |||
136 | struct dso *__dsos__findnew(struct list_head *head, const char *name); | 159 | struct dso *__dsos__findnew(struct list_head *head, const char *name); |
137 | 160 | ||
138 | static inline struct dso *dsos__findnew(const char *name) | ||
139 | { | ||
140 | return __dsos__findnew(&dsos__user, name); | ||
141 | } | ||
142 | |||
143 | int dso__load(struct dso *self, struct map *map, symbol_filter_t filter); | 161 | int dso__load(struct dso *self, struct map *map, symbol_filter_t filter); |
144 | int dso__load_vmlinux_path(struct dso *self, struct map *map, | 162 | int dso__load_vmlinux_path(struct dso *self, struct map *map, |
145 | symbol_filter_t filter); | 163 | symbol_filter_t filter); |
146 | int dso__load_kallsyms(struct dso *self, const char *filename, struct map *map, | 164 | int dso__load_kallsyms(struct dso *self, const char *filename, struct map *map, |
147 | symbol_filter_t filter); | 165 | symbol_filter_t filter); |
148 | void dsos__fprintf(FILE *fp); | 166 | int machine__load_kallsyms(struct machine *self, const char *filename, |
149 | size_t dsos__fprintf_buildid(FILE *fp, bool with_hits); | 167 | enum map_type type, symbol_filter_t filter); |
168 | int machine__load_vmlinux_path(struct machine *self, enum map_type type, | ||
169 | symbol_filter_t filter); | ||
170 | |||
171 | size_t __dsos__fprintf(struct list_head *head, FILE *fp); | ||
172 | |||
173 | size_t machines__fprintf_dsos(struct rb_root *self, FILE *fp); | ||
174 | size_t machines__fprintf_dsos_buildid(struct rb_root *self, FILE *fp, bool with_hits); | ||
150 | 175 | ||
151 | size_t dso__fprintf_buildid(struct dso *self, FILE *fp); | 176 | size_t dso__fprintf_buildid(struct dso *self, FILE *fp); |
152 | size_t dso__fprintf(struct dso *self, enum map_type type, FILE *fp); | 177 | size_t dso__fprintf(struct dso *self, enum map_type type, FILE *fp); |
178 | |||
179 | enum dso_origin { | ||
180 | DSO__ORIG_KERNEL = 0, | ||
181 | DSO__ORIG_GUEST_KERNEL, | ||
182 | DSO__ORIG_JAVA_JIT, | ||
183 | DSO__ORIG_BUILD_ID_CACHE, | ||
184 | DSO__ORIG_FEDORA, | ||
185 | DSO__ORIG_UBUNTU, | ||
186 | DSO__ORIG_BUILDID, | ||
187 | DSO__ORIG_DSO, | ||
188 | DSO__ORIG_GUEST_KMODULE, | ||
189 | DSO__ORIG_KMODULE, | ||
190 | DSO__ORIG_NOT_FOUND, | ||
191 | }; | ||
192 | |||
153 | char dso__symtab_origin(const struct dso *self); | 193 | char dso__symtab_origin(const struct dso *self); |
154 | void dso__set_long_name(struct dso *self, char *name); | 194 | void dso__set_long_name(struct dso *self, char *name); |
155 | void dso__set_build_id(struct dso *self, void *build_id); | 195 | void dso__set_build_id(struct dso *self, void *build_id); |
156 | void dso__read_running_kernel_build_id(struct dso *self); | 196 | void dso__read_running_kernel_build_id(struct dso *self, struct machine *machine); |
157 | struct symbol *dso__find_symbol(struct dso *self, enum map_type type, u64 addr); | 197 | struct symbol *dso__find_symbol(struct dso *self, enum map_type type, u64 addr); |
158 | struct symbol *dso__find_symbol_by_name(struct dso *self, enum map_type type, | 198 | struct symbol *dso__find_symbol_by_name(struct dso *self, enum map_type type, |
159 | const char *name); | 199 | const char *name); |
160 | 200 | ||
161 | int filename__read_build_id(const char *filename, void *bf, size_t size); | 201 | int filename__read_build_id(const char *filename, void *bf, size_t size); |
162 | int sysfs__read_build_id(const char *filename, void *bf, size_t size); | 202 | int sysfs__read_build_id(const char *filename, void *bf, size_t size); |
163 | bool dsos__read_build_ids(bool with_hits); | 203 | bool __dsos__read_build_ids(struct list_head *head, bool with_hits); |
164 | int build_id__sprintf(const u8 *self, int len, char *bf); | 204 | int build_id__sprintf(const u8 *self, int len, char *bf); |
165 | int kallsyms__parse(const char *filename, void *arg, | 205 | int kallsyms__parse(const char *filename, void *arg, |
166 | int (*process_symbol)(void *arg, const char *name, | 206 | int (*process_symbol)(void *arg, const char *name, |
167 | char type, u64 start)); | 207 | char type, u64 start)); |
168 | 208 | ||
209 | int __machine__create_kernel_maps(struct machine *self, struct dso *kernel); | ||
210 | int machine__create_kernel_maps(struct machine *self); | ||
211 | |||
212 | int machines__create_kernel_maps(struct rb_root *self, pid_t pid); | ||
213 | int machines__create_guest_kernel_maps(struct rb_root *self); | ||
214 | |||
169 | int symbol__init(void); | 215 | int symbol__init(void); |
170 | bool symbol_type__is_a(char symbol_type, enum map_type map_type); | 216 | bool symbol_type__is_a(char symbol_type, enum map_type map_type); |
171 | 217 | ||
218 | size_t vmlinux_path__fprintf(FILE *fp); | ||
219 | |||
172 | #endif /* __PERF_SYMBOL */ | 220 | #endif /* __PERF_SYMBOL */ |
diff --git a/tools/perf/util/thread.c b/tools/perf/util/thread.c index fa968312ee7d..1f7ecd47f499 100644 --- a/tools/perf/util/thread.c +++ b/tools/perf/util/thread.c | |||
@@ -7,13 +7,35 @@ | |||
7 | #include "util.h" | 7 | #include "util.h" |
8 | #include "debug.h" | 8 | #include "debug.h" |
9 | 9 | ||
10 | void map_groups__init(struct map_groups *self) | 10 | int find_all_tid(int pid, pid_t ** all_tid) |
11 | { | 11 | { |
12 | char name[256]; | ||
13 | int items; | ||
14 | struct dirent **namelist = NULL; | ||
15 | int ret = 0; | ||
12 | int i; | 16 | int i; |
13 | for (i = 0; i < MAP__NR_TYPES; ++i) { | 17 | |
14 | self->maps[i] = RB_ROOT; | 18 | sprintf(name, "/proc/%d/task", pid); |
15 | INIT_LIST_HEAD(&self->removed_maps[i]); | 19 | items = scandir(name, &namelist, NULL, NULL); |
20 | if (items <= 0) | ||
21 | return -ENOENT; | ||
22 | *all_tid = malloc(sizeof(pid_t) * items); | ||
23 | if (!*all_tid) { | ||
24 | ret = -ENOMEM; | ||
25 | goto failure; | ||
16 | } | 26 | } |
27 | |||
28 | for (i = 0; i < items; i++) | ||
29 | (*all_tid)[i] = atoi(namelist[i]->d_name); | ||
30 | |||
31 | ret = items; | ||
32 | |||
33 | failure: | ||
34 | for (i=0; i<items; i++) | ||
35 | free(namelist[i]); | ||
36 | free(namelist); | ||
37 | |||
38 | return ret; | ||
17 | } | 39 | } |
18 | 40 | ||
19 | static struct thread *thread__new(pid_t pid) | 41 | static struct thread *thread__new(pid_t pid) |
@@ -31,28 +53,6 @@ static struct thread *thread__new(pid_t pid) | |||
31 | return self; | 53 | return self; |
32 | } | 54 | } |
33 | 55 | ||
34 | static void map_groups__flush(struct map_groups *self) | ||
35 | { | ||
36 | int type; | ||
37 | |||
38 | for (type = 0; type < MAP__NR_TYPES; type++) { | ||
39 | struct rb_root *root = &self->maps[type]; | ||
40 | struct rb_node *next = rb_first(root); | ||
41 | |||
42 | while (next) { | ||
43 | struct map *pos = rb_entry(next, struct map, rb_node); | ||
44 | next = rb_next(&pos->rb_node); | ||
45 | rb_erase(&pos->rb_node, root); | ||
46 | /* | ||
47 | * We may have references to this map, for | ||
48 | * instance in some hist_entry instances, so | ||
49 | * just move them to a separate list. | ||
50 | */ | ||
51 | list_add_tail(&pos->node, &self->removed_maps[pos->type]); | ||
52 | } | ||
53 | } | ||
54 | } | ||
55 | |||
56 | int thread__set_comm(struct thread *self, const char *comm) | 56 | int thread__set_comm(struct thread *self, const char *comm) |
57 | { | 57 | { |
58 | int err; | 58 | int err; |
@@ -79,69 +79,10 @@ int thread__comm_len(struct thread *self) | |||
79 | return self->comm_len; | 79 | return self->comm_len; |
80 | } | 80 | } |
81 | 81 | ||
82 | size_t __map_groups__fprintf_maps(struct map_groups *self, | ||
83 | enum map_type type, FILE *fp) | ||
84 | { | ||
85 | size_t printed = fprintf(fp, "%s:\n", map_type__name[type]); | ||
86 | struct rb_node *nd; | ||
87 | |||
88 | for (nd = rb_first(&self->maps[type]); nd; nd = rb_next(nd)) { | ||
89 | struct map *pos = rb_entry(nd, struct map, rb_node); | ||
90 | printed += fprintf(fp, "Map:"); | ||
91 | printed += map__fprintf(pos, fp); | ||
92 | if (verbose > 2) { | ||
93 | printed += dso__fprintf(pos->dso, type, fp); | ||
94 | printed += fprintf(fp, "--\n"); | ||
95 | } | ||
96 | } | ||
97 | |||
98 | return printed; | ||
99 | } | ||
100 | |||
101 | size_t map_groups__fprintf_maps(struct map_groups *self, FILE *fp) | ||
102 | { | ||
103 | size_t printed = 0, i; | ||
104 | for (i = 0; i < MAP__NR_TYPES; ++i) | ||
105 | printed += __map_groups__fprintf_maps(self, i, fp); | ||
106 | return printed; | ||
107 | } | ||
108 | |||
109 | static size_t __map_groups__fprintf_removed_maps(struct map_groups *self, | ||
110 | enum map_type type, FILE *fp) | ||
111 | { | ||
112 | struct map *pos; | ||
113 | size_t printed = 0; | ||
114 | |||
115 | list_for_each_entry(pos, &self->removed_maps[type], node) { | ||
116 | printed += fprintf(fp, "Map:"); | ||
117 | printed += map__fprintf(pos, fp); | ||
118 | if (verbose > 1) { | ||
119 | printed += dso__fprintf(pos->dso, type, fp); | ||
120 | printed += fprintf(fp, "--\n"); | ||
121 | } | ||
122 | } | ||
123 | return printed; | ||
124 | } | ||
125 | |||
126 | static size_t map_groups__fprintf_removed_maps(struct map_groups *self, FILE *fp) | ||
127 | { | ||
128 | size_t printed = 0, i; | ||
129 | for (i = 0; i < MAP__NR_TYPES; ++i) | ||
130 | printed += __map_groups__fprintf_removed_maps(self, i, fp); | ||
131 | return printed; | ||
132 | } | ||
133 | |||
134 | static size_t map_groups__fprintf(struct map_groups *self, FILE *fp) | ||
135 | { | ||
136 | size_t printed = map_groups__fprintf_maps(self, fp); | ||
137 | printed += fprintf(fp, "Removed maps:\n"); | ||
138 | return printed + map_groups__fprintf_removed_maps(self, fp); | ||
139 | } | ||
140 | |||
141 | static size_t thread__fprintf(struct thread *self, FILE *fp) | 82 | static size_t thread__fprintf(struct thread *self, FILE *fp) |
142 | { | 83 | { |
143 | return fprintf(fp, "Thread %d %s\n", self->pid, self->comm) + | 84 | return fprintf(fp, "Thread %d %s\n", self->pid, self->comm) + |
144 | map_groups__fprintf(&self->mg, fp); | 85 | map_groups__fprintf(&self->mg, verbose, fp); |
145 | } | 86 | } |
146 | 87 | ||
147 | struct thread *perf_session__findnew(struct perf_session *self, pid_t pid) | 88 | struct thread *perf_session__findnew(struct perf_session *self, pid_t pid) |
@@ -183,127 +124,12 @@ struct thread *perf_session__findnew(struct perf_session *self, pid_t pid) | |||
183 | return th; | 124 | return th; |
184 | } | 125 | } |
185 | 126 | ||
186 | static int map_groups__fixup_overlappings(struct map_groups *self, | ||
187 | struct map *map) | ||
188 | { | ||
189 | struct rb_root *root = &self->maps[map->type]; | ||
190 | struct rb_node *next = rb_first(root); | ||
191 | |||
192 | while (next) { | ||
193 | struct map *pos = rb_entry(next, struct map, rb_node); | ||
194 | next = rb_next(&pos->rb_node); | ||
195 | |||
196 | if (!map__overlap(pos, map)) | ||
197 | continue; | ||
198 | |||
199 | if (verbose >= 2) { | ||
200 | fputs("overlapping maps:\n", stderr); | ||
201 | map__fprintf(map, stderr); | ||
202 | map__fprintf(pos, stderr); | ||
203 | } | ||
204 | |||
205 | rb_erase(&pos->rb_node, root); | ||
206 | /* | ||
207 | * We may have references to this map, for instance in some | ||
208 | * hist_entry instances, so just move them to a separate | ||
209 | * list. | ||
210 | */ | ||
211 | list_add_tail(&pos->node, &self->removed_maps[map->type]); | ||
212 | /* | ||
213 | * Now check if we need to create new maps for areas not | ||
214 | * overlapped by the new map: | ||
215 | */ | ||
216 | if (map->start > pos->start) { | ||
217 | struct map *before = map__clone(pos); | ||
218 | |||
219 | if (before == NULL) | ||
220 | return -ENOMEM; | ||
221 | |||
222 | before->end = map->start - 1; | ||
223 | map_groups__insert(self, before); | ||
224 | if (verbose >= 2) | ||
225 | map__fprintf(before, stderr); | ||
226 | } | ||
227 | |||
228 | if (map->end < pos->end) { | ||
229 | struct map *after = map__clone(pos); | ||
230 | |||
231 | if (after == NULL) | ||
232 | return -ENOMEM; | ||
233 | |||
234 | after->start = map->end + 1; | ||
235 | map_groups__insert(self, after); | ||
236 | if (verbose >= 2) | ||
237 | map__fprintf(after, stderr); | ||
238 | } | ||
239 | } | ||
240 | |||
241 | return 0; | ||
242 | } | ||
243 | |||
244 | void maps__insert(struct rb_root *maps, struct map *map) | ||
245 | { | ||
246 | struct rb_node **p = &maps->rb_node; | ||
247 | struct rb_node *parent = NULL; | ||
248 | const u64 ip = map->start; | ||
249 | struct map *m; | ||
250 | |||
251 | while (*p != NULL) { | ||
252 | parent = *p; | ||
253 | m = rb_entry(parent, struct map, rb_node); | ||
254 | if (ip < m->start) | ||
255 | p = &(*p)->rb_left; | ||
256 | else | ||
257 | p = &(*p)->rb_right; | ||
258 | } | ||
259 | |||
260 | rb_link_node(&map->rb_node, parent, p); | ||
261 | rb_insert_color(&map->rb_node, maps); | ||
262 | } | ||
263 | |||
264 | struct map *maps__find(struct rb_root *maps, u64 ip) | ||
265 | { | ||
266 | struct rb_node **p = &maps->rb_node; | ||
267 | struct rb_node *parent = NULL; | ||
268 | struct map *m; | ||
269 | |||
270 | while (*p != NULL) { | ||
271 | parent = *p; | ||
272 | m = rb_entry(parent, struct map, rb_node); | ||
273 | if (ip < m->start) | ||
274 | p = &(*p)->rb_left; | ||
275 | else if (ip > m->end) | ||
276 | p = &(*p)->rb_right; | ||
277 | else | ||
278 | return m; | ||
279 | } | ||
280 | |||
281 | return NULL; | ||
282 | } | ||
283 | |||
284 | void thread__insert_map(struct thread *self, struct map *map) | 127 | void thread__insert_map(struct thread *self, struct map *map) |
285 | { | 128 | { |
286 | map_groups__fixup_overlappings(&self->mg, map); | 129 | map_groups__fixup_overlappings(&self->mg, map, verbose, stderr); |
287 | map_groups__insert(&self->mg, map); | 130 | map_groups__insert(&self->mg, map); |
288 | } | 131 | } |
289 | 132 | ||
290 | /* | ||
291 | * XXX This should not really _copy_ te maps, but refcount them. | ||
292 | */ | ||
293 | static int map_groups__clone(struct map_groups *self, | ||
294 | struct map_groups *parent, enum map_type type) | ||
295 | { | ||
296 | struct rb_node *nd; | ||
297 | for (nd = rb_first(&parent->maps[type]); nd; nd = rb_next(nd)) { | ||
298 | struct map *map = rb_entry(nd, struct map, rb_node); | ||
299 | struct map *new = map__clone(map); | ||
300 | if (new == NULL) | ||
301 | return -ENOMEM; | ||
302 | map_groups__insert(self, new); | ||
303 | } | ||
304 | return 0; | ||
305 | } | ||
306 | |||
307 | int thread__fork(struct thread *self, struct thread *parent) | 133 | int thread__fork(struct thread *self, struct thread *parent) |
308 | { | 134 | { |
309 | int i; | 135 | int i; |
@@ -336,15 +162,3 @@ size_t perf_session__fprintf(struct perf_session *self, FILE *fp) | |||
336 | 162 | ||
337 | return ret; | 163 | return ret; |
338 | } | 164 | } |
339 | |||
340 | struct symbol *map_groups__find_symbol(struct map_groups *self, | ||
341 | enum map_type type, u64 addr, | ||
342 | symbol_filter_t filter) | ||
343 | { | ||
344 | struct map *map = map_groups__find(self, type, addr); | ||
345 | |||
346 | if (map != NULL) | ||
347 | return map__find_symbol(map, map->map_ip(map, addr), filter); | ||
348 | |||
349 | return NULL; | ||
350 | } | ||
diff --git a/tools/perf/util/thread.h b/tools/perf/util/thread.h index dcf70303e58e..1dfd9ff8bdcd 100644 --- a/tools/perf/util/thread.h +++ b/tools/perf/util/thread.h | |||
@@ -5,14 +5,6 @@ | |||
5 | #include <unistd.h> | 5 | #include <unistd.h> |
6 | #include "symbol.h" | 6 | #include "symbol.h" |
7 | 7 | ||
8 | struct map_groups { | ||
9 | struct rb_root maps[MAP__NR_TYPES]; | ||
10 | struct list_head removed_maps[MAP__NR_TYPES]; | ||
11 | }; | ||
12 | |||
13 | size_t __map_groups__fprintf_maps(struct map_groups *self, | ||
14 | enum map_type type, FILE *fp); | ||
15 | |||
16 | struct thread { | 8 | struct thread { |
17 | struct rb_node rb_node; | 9 | struct rb_node rb_node; |
18 | struct map_groups mg; | 10 | struct map_groups mg; |
@@ -23,29 +15,16 @@ struct thread { | |||
23 | int comm_len; | 15 | int comm_len; |
24 | }; | 16 | }; |
25 | 17 | ||
26 | void map_groups__init(struct map_groups *self); | 18 | struct perf_session; |
19 | |||
20 | int find_all_tid(int pid, pid_t ** all_tid); | ||
27 | int thread__set_comm(struct thread *self, const char *comm); | 21 | int thread__set_comm(struct thread *self, const char *comm); |
28 | int thread__comm_len(struct thread *self); | 22 | int thread__comm_len(struct thread *self); |
29 | struct thread *perf_session__findnew(struct perf_session *self, pid_t pid); | 23 | struct thread *perf_session__findnew(struct perf_session *self, pid_t pid); |
30 | void thread__insert_map(struct thread *self, struct map *map); | 24 | void thread__insert_map(struct thread *self, struct map *map); |
31 | int thread__fork(struct thread *self, struct thread *parent); | 25 | int thread__fork(struct thread *self, struct thread *parent); |
32 | size_t map_groups__fprintf_maps(struct map_groups *self, FILE *fp); | ||
33 | size_t perf_session__fprintf(struct perf_session *self, FILE *fp); | 26 | size_t perf_session__fprintf(struct perf_session *self, FILE *fp); |
34 | 27 | ||
35 | void maps__insert(struct rb_root *maps, struct map *map); | ||
36 | struct map *maps__find(struct rb_root *maps, u64 addr); | ||
37 | |||
38 | static inline void map_groups__insert(struct map_groups *self, struct map *map) | ||
39 | { | ||
40 | maps__insert(&self->maps[map->type], map); | ||
41 | } | ||
42 | |||
43 | static inline struct map *map_groups__find(struct map_groups *self, | ||
44 | enum map_type type, u64 addr) | ||
45 | { | ||
46 | return maps__find(&self->maps[type], addr); | ||
47 | } | ||
48 | |||
49 | static inline struct map *thread__find_map(struct thread *self, | 28 | static inline struct map *thread__find_map(struct thread *self, |
50 | enum map_type type, u64 addr) | 29 | enum map_type type, u64 addr) |
51 | { | 30 | { |
@@ -54,34 +33,12 @@ static inline struct map *thread__find_map(struct thread *self, | |||
54 | 33 | ||
55 | void thread__find_addr_map(struct thread *self, | 34 | void thread__find_addr_map(struct thread *self, |
56 | struct perf_session *session, u8 cpumode, | 35 | struct perf_session *session, u8 cpumode, |
57 | enum map_type type, u64 addr, | 36 | enum map_type type, pid_t pid, u64 addr, |
58 | struct addr_location *al); | 37 | struct addr_location *al); |
59 | 38 | ||
60 | void thread__find_addr_location(struct thread *self, | 39 | void thread__find_addr_location(struct thread *self, |
61 | struct perf_session *session, u8 cpumode, | 40 | struct perf_session *session, u8 cpumode, |
62 | enum map_type type, u64 addr, | 41 | enum map_type type, pid_t pid, u64 addr, |
63 | struct addr_location *al, | 42 | struct addr_location *al, |
64 | symbol_filter_t filter); | 43 | symbol_filter_t filter); |
65 | struct symbol *map_groups__find_symbol(struct map_groups *self, | ||
66 | enum map_type type, u64 addr, | ||
67 | symbol_filter_t filter); | ||
68 | |||
69 | static inline struct symbol *map_groups__find_function(struct map_groups *self, | ||
70 | u64 addr, | ||
71 | symbol_filter_t filter) | ||
72 | { | ||
73 | return map_groups__find_symbol(self, MAP__FUNCTION, addr, filter); | ||
74 | } | ||
75 | |||
76 | struct map *map_groups__find_by_name(struct map_groups *self, | ||
77 | enum map_type type, const char *name); | ||
78 | |||
79 | int __map_groups__create_kernel_maps(struct map_groups *self, | ||
80 | struct map *vmlinux_maps[MAP__NR_TYPES], | ||
81 | struct dso *kernel); | ||
82 | int map_groups__create_kernel_maps(struct map_groups *self, | ||
83 | struct map *vmlinux_maps[MAP__NR_TYPES]); | ||
84 | |||
85 | struct map *map_groups__new_module(struct map_groups *self, u64 start, | ||
86 | const char *filename); | ||
87 | #endif /* __PERF_THREAD_H */ | 44 | #endif /* __PERF_THREAD_H */ |
diff --git a/tools/perf/util/trace-event-info.c b/tools/perf/util/trace-event-info.c index 5ea8973ad331..b1572601286c 100644 --- a/tools/perf/util/trace-event-info.c +++ b/tools/perf/util/trace-event-info.c | |||
@@ -154,10 +154,17 @@ static void put_tracing_file(char *file) | |||
154 | free(file); | 154 | free(file); |
155 | } | 155 | } |
156 | 156 | ||
157 | static ssize_t calc_data_size; | ||
158 | |||
157 | static ssize_t write_or_die(const void *buf, size_t len) | 159 | static ssize_t write_or_die(const void *buf, size_t len) |
158 | { | 160 | { |
159 | int ret; | 161 | int ret; |
160 | 162 | ||
163 | if (calc_data_size) { | ||
164 | calc_data_size += len; | ||
165 | return len; | ||
166 | } | ||
167 | |||
161 | ret = write(output_fd, buf, len); | 168 | ret = write(output_fd, buf, len); |
162 | if (ret < 0) | 169 | if (ret < 0) |
163 | die("writing to '%s'", output_file); | 170 | die("writing to '%s'", output_file); |
@@ -480,6 +487,17 @@ get_tracepoints_path(struct perf_event_attr *pattrs, int nb_events) | |||
480 | return nr_tracepoints > 0 ? path.next : NULL; | 487 | return nr_tracepoints > 0 ? path.next : NULL; |
481 | } | 488 | } |
482 | 489 | ||
490 | bool have_tracepoints(struct perf_event_attr *pattrs, int nb_events) | ||
491 | { | ||
492 | int i; | ||
493 | |||
494 | for (i = 0; i < nb_events; i++) | ||
495 | if (pattrs[i].type == PERF_TYPE_TRACEPOINT) | ||
496 | return true; | ||
497 | |||
498 | return false; | ||
499 | } | ||
500 | |||
483 | int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events) | 501 | int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events) |
484 | { | 502 | { |
485 | char buf[BUFSIZ]; | 503 | char buf[BUFSIZ]; |
@@ -526,3 +544,20 @@ int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events) | |||
526 | 544 | ||
527 | return 0; | 545 | return 0; |
528 | } | 546 | } |
547 | |||
548 | ssize_t read_tracing_data_size(int fd, struct perf_event_attr *pattrs, | ||
549 | int nb_events) | ||
550 | { | ||
551 | ssize_t size; | ||
552 | int err = 0; | ||
553 | |||
554 | calc_data_size = 1; | ||
555 | err = read_tracing_data(fd, pattrs, nb_events); | ||
556 | size = calc_data_size - 1; | ||
557 | calc_data_size = 0; | ||
558 | |||
559 | if (err < 0) | ||
560 | return err; | ||
561 | |||
562 | return size; | ||
563 | } | ||
diff --git a/tools/perf/util/trace-event-parse.c b/tools/perf/util/trace-event-parse.c index 9b3c20f42f98..069f261b225c 100644 --- a/tools/perf/util/trace-event-parse.c +++ b/tools/perf/util/trace-event-parse.c | |||
@@ -37,10 +37,12 @@ int header_page_ts_offset; | |||
37 | int header_page_ts_size; | 37 | int header_page_ts_size; |
38 | int header_page_size_offset; | 38 | int header_page_size_offset; |
39 | int header_page_size_size; | 39 | int header_page_size_size; |
40 | int header_page_overwrite_offset; | ||
41 | int header_page_overwrite_size; | ||
40 | int header_page_data_offset; | 42 | int header_page_data_offset; |
41 | int header_page_data_size; | 43 | int header_page_data_size; |
42 | 44 | ||
43 | int latency_format; | 45 | bool latency_format; |
44 | 46 | ||
45 | static char *input_buf; | 47 | static char *input_buf; |
46 | static unsigned long long input_buf_ptr; | 48 | static unsigned long long input_buf_ptr; |
@@ -628,23 +630,32 @@ static int test_type(enum event_type type, enum event_type expect) | |||
628 | return 0; | 630 | return 0; |
629 | } | 631 | } |
630 | 632 | ||
631 | static int test_type_token(enum event_type type, char *token, | 633 | static int __test_type_token(enum event_type type, char *token, |
632 | enum event_type expect, const char *expect_tok) | 634 | enum event_type expect, const char *expect_tok, |
635 | bool warn) | ||
633 | { | 636 | { |
634 | if (type != expect) { | 637 | if (type != expect) { |
635 | warning("Error: expected type %d but read %d", | 638 | if (warn) |
636 | expect, type); | 639 | warning("Error: expected type %d but read %d", |
640 | expect, type); | ||
637 | return -1; | 641 | return -1; |
638 | } | 642 | } |
639 | 643 | ||
640 | if (strcmp(token, expect_tok) != 0) { | 644 | if (strcmp(token, expect_tok) != 0) { |
641 | warning("Error: expected '%s' but read '%s'", | 645 | if (warn) |
642 | expect_tok, token); | 646 | warning("Error: expected '%s' but read '%s'", |
647 | expect_tok, token); | ||
643 | return -1; | 648 | return -1; |
644 | } | 649 | } |
645 | return 0; | 650 | return 0; |
646 | } | 651 | } |
647 | 652 | ||
653 | static int test_type_token(enum event_type type, char *token, | ||
654 | enum event_type expect, const char *expect_tok) | ||
655 | { | ||
656 | return __test_type_token(type, token, expect, expect_tok, true); | ||
657 | } | ||
658 | |||
648 | static int __read_expect_type(enum event_type expect, char **tok, int newline_ok) | 659 | static int __read_expect_type(enum event_type expect, char **tok, int newline_ok) |
649 | { | 660 | { |
650 | enum event_type type; | 661 | enum event_type type; |
@@ -661,7 +672,8 @@ static int read_expect_type(enum event_type expect, char **tok) | |||
661 | return __read_expect_type(expect, tok, 1); | 672 | return __read_expect_type(expect, tok, 1); |
662 | } | 673 | } |
663 | 674 | ||
664 | static int __read_expected(enum event_type expect, const char *str, int newline_ok) | 675 | static int __read_expected(enum event_type expect, const char *str, |
676 | int newline_ok, bool warn) | ||
665 | { | 677 | { |
666 | enum event_type type; | 678 | enum event_type type; |
667 | char *token; | 679 | char *token; |
@@ -672,7 +684,7 @@ static int __read_expected(enum event_type expect, const char *str, int newline_ | |||
672 | else | 684 | else |
673 | type = read_token_item(&token); | 685 | type = read_token_item(&token); |
674 | 686 | ||
675 | ret = test_type_token(type, token, expect, str); | 687 | ret = __test_type_token(type, token, expect, str, warn); |
676 | 688 | ||
677 | free_token(token); | 689 | free_token(token); |
678 | 690 | ||
@@ -681,12 +693,12 @@ static int __read_expected(enum event_type expect, const char *str, int newline_ | |||
681 | 693 | ||
682 | static int read_expected(enum event_type expect, const char *str) | 694 | static int read_expected(enum event_type expect, const char *str) |
683 | { | 695 | { |
684 | return __read_expected(expect, str, 1); | 696 | return __read_expected(expect, str, 1, true); |
685 | } | 697 | } |
686 | 698 | ||
687 | static int read_expected_item(enum event_type expect, const char *str) | 699 | static int read_expected_item(enum event_type expect, const char *str) |
688 | { | 700 | { |
689 | return __read_expected(expect, str, 0); | 701 | return __read_expected(expect, str, 0, true); |
690 | } | 702 | } |
691 | 703 | ||
692 | static char *event_read_name(void) | 704 | static char *event_read_name(void) |
@@ -744,7 +756,7 @@ static int field_is_string(struct format_field *field) | |||
744 | 756 | ||
745 | static int field_is_dynamic(struct format_field *field) | 757 | static int field_is_dynamic(struct format_field *field) |
746 | { | 758 | { |
747 | if (!strcmp(field->type, "__data_loc")) | 759 | if (!strncmp(field->type, "__data_loc", 10)) |
748 | return 1; | 760 | return 1; |
749 | 761 | ||
750 | return 0; | 762 | return 0; |
@@ -3087,88 +3099,6 @@ static void print_args(struct print_arg *args) | |||
3087 | } | 3099 | } |
3088 | } | 3100 | } |
3089 | 3101 | ||
3090 | static void parse_header_field(const char *field, | ||
3091 | int *offset, int *size) | ||
3092 | { | ||
3093 | char *token; | ||
3094 | int type; | ||
3095 | |||
3096 | if (read_expected(EVENT_ITEM, "field") < 0) | ||
3097 | return; | ||
3098 | if (read_expected(EVENT_OP, ":") < 0) | ||
3099 | return; | ||
3100 | |||
3101 | /* type */ | ||
3102 | if (read_expect_type(EVENT_ITEM, &token) < 0) | ||
3103 | goto fail; | ||
3104 | free_token(token); | ||
3105 | |||
3106 | if (read_expected(EVENT_ITEM, field) < 0) | ||
3107 | return; | ||
3108 | if (read_expected(EVENT_OP, ";") < 0) | ||
3109 | return; | ||
3110 | if (read_expected(EVENT_ITEM, "offset") < 0) | ||
3111 | return; | ||
3112 | if (read_expected(EVENT_OP, ":") < 0) | ||
3113 | return; | ||
3114 | if (read_expect_type(EVENT_ITEM, &token) < 0) | ||
3115 | goto fail; | ||
3116 | *offset = atoi(token); | ||
3117 | free_token(token); | ||
3118 | if (read_expected(EVENT_OP, ";") < 0) | ||
3119 | return; | ||
3120 | if (read_expected(EVENT_ITEM, "size") < 0) | ||
3121 | return; | ||
3122 | if (read_expected(EVENT_OP, ":") < 0) | ||
3123 | return; | ||
3124 | if (read_expect_type(EVENT_ITEM, &token) < 0) | ||
3125 | goto fail; | ||
3126 | *size = atoi(token); | ||
3127 | free_token(token); | ||
3128 | if (read_expected(EVENT_OP, ";") < 0) | ||
3129 | return; | ||
3130 | type = read_token(&token); | ||
3131 | if (type != EVENT_NEWLINE) { | ||
3132 | /* newer versions of the kernel have a "signed" type */ | ||
3133 | if (type != EVENT_ITEM) | ||
3134 | goto fail; | ||
3135 | |||
3136 | if (strcmp(token, "signed") != 0) | ||
3137 | goto fail; | ||
3138 | |||
3139 | free_token(token); | ||
3140 | |||
3141 | if (read_expected(EVENT_OP, ":") < 0) | ||
3142 | return; | ||
3143 | |||
3144 | if (read_expect_type(EVENT_ITEM, &token)) | ||
3145 | goto fail; | ||
3146 | |||
3147 | free_token(token); | ||
3148 | if (read_expected(EVENT_OP, ";") < 0) | ||
3149 | return; | ||
3150 | |||
3151 | if (read_expect_type(EVENT_NEWLINE, &token)) | ||
3152 | goto fail; | ||
3153 | } | ||
3154 | fail: | ||
3155 | free_token(token); | ||
3156 | } | ||
3157 | |||
3158 | int parse_header_page(char *buf, unsigned long size) | ||
3159 | { | ||
3160 | init_input_buf(buf, size); | ||
3161 | |||
3162 | parse_header_field("timestamp", &header_page_ts_offset, | ||
3163 | &header_page_ts_size); | ||
3164 | parse_header_field("commit", &header_page_size_offset, | ||
3165 | &header_page_size_size); | ||
3166 | parse_header_field("data", &header_page_data_offset, | ||
3167 | &header_page_data_size); | ||
3168 | |||
3169 | return 0; | ||
3170 | } | ||
3171 | |||
3172 | int parse_ftrace_file(char *buf, unsigned long size) | 3102 | int parse_ftrace_file(char *buf, unsigned long size) |
3173 | { | 3103 | { |
3174 | struct format_field *field; | 3104 | struct format_field *field; |
diff --git a/tools/perf/util/trace-event-read.c b/tools/perf/util/trace-event-read.c index 7cd1193918c7..cb54cd002f49 100644 --- a/tools/perf/util/trace-event-read.c +++ b/tools/perf/util/trace-event-read.c | |||
@@ -50,14 +50,51 @@ static int long_size; | |||
50 | 50 | ||
51 | static unsigned long page_size; | 51 | static unsigned long page_size; |
52 | 52 | ||
53 | static ssize_t calc_data_size; | ||
54 | static bool repipe; | ||
55 | |||
56 | /* If it fails, the next read will report it */ | ||
57 | static void skip(int size) | ||
58 | { | ||
59 | lseek(input_fd, size, SEEK_CUR); | ||
60 | } | ||
61 | |||
62 | static int do_read(int fd, void *buf, int size) | ||
63 | { | ||
64 | int rsize = size; | ||
65 | |||
66 | while (size) { | ||
67 | int ret = read(fd, buf, size); | ||
68 | |||
69 | if (ret <= 0) | ||
70 | return -1; | ||
71 | |||
72 | if (repipe) { | ||
73 | int retw = write(STDOUT_FILENO, buf, ret); | ||
74 | |||
75 | if (retw <= 0 || retw != ret) | ||
76 | die("repiping input file"); | ||
77 | } | ||
78 | |||
79 | size -= ret; | ||
80 | buf += ret; | ||
81 | } | ||
82 | |||
83 | return rsize; | ||
84 | } | ||
85 | |||
53 | static int read_or_die(void *data, int size) | 86 | static int read_or_die(void *data, int size) |
54 | { | 87 | { |
55 | int r; | 88 | int r; |
56 | 89 | ||
57 | r = read(input_fd, data, size); | 90 | r = do_read(input_fd, data, size); |
58 | if (r != size) | 91 | if (r <= 0) |
59 | die("reading input file (size expected=%d received=%d)", | 92 | die("reading input file (size expected=%d received=%d)", |
60 | size, r); | 93 | size, r); |
94 | |||
95 | if (calc_data_size) | ||
96 | calc_data_size += r; | ||
97 | |||
61 | return r; | 98 | return r; |
62 | } | 99 | } |
63 | 100 | ||
@@ -82,57 +119,36 @@ static char *read_string(void) | |||
82 | char buf[BUFSIZ]; | 119 | char buf[BUFSIZ]; |
83 | char *str = NULL; | 120 | char *str = NULL; |
84 | int size = 0; | 121 | int size = 0; |
85 | int i; | ||
86 | off_t r; | 122 | off_t r; |
123 | char c; | ||
87 | 124 | ||
88 | for (;;) { | 125 | for (;;) { |
89 | r = read(input_fd, buf, BUFSIZ); | 126 | r = read(input_fd, &c, 1); |
90 | if (r < 0) | 127 | if (r < 0) |
91 | die("reading input file"); | 128 | die("reading input file"); |
92 | 129 | ||
93 | if (!r) | 130 | if (!r) |
94 | die("no data"); | 131 | die("no data"); |
95 | 132 | ||
96 | for (i = 0; i < r; i++) { | 133 | if (repipe) { |
97 | if (!buf[i]) | 134 | int retw = write(STDOUT_FILENO, &c, 1); |
98 | break; | ||
99 | } | ||
100 | if (i < r) | ||
101 | break; | ||
102 | 135 | ||
103 | if (str) { | 136 | if (retw <= 0 || retw != r) |
104 | size += BUFSIZ; | 137 | die("repiping input file string"); |
105 | str = realloc(str, size); | ||
106 | if (!str) | ||
107 | die("malloc of size %d", size); | ||
108 | memcpy(str + (size - BUFSIZ), buf, BUFSIZ); | ||
109 | } else { | ||
110 | size = BUFSIZ; | ||
111 | str = malloc_or_die(size); | ||
112 | memcpy(str, buf, size); | ||
113 | } | 138 | } |
114 | } | ||
115 | 139 | ||
116 | /* trailing \0: */ | 140 | buf[size++] = c; |
117 | i++; | 141 | |
118 | 142 | if (!c) | |
119 | /* move the file descriptor to the end of the string */ | 143 | break; |
120 | r = lseek(input_fd, -(r - i), SEEK_CUR); | ||
121 | if (r == (off_t)-1) | ||
122 | die("lseek"); | ||
123 | |||
124 | if (str) { | ||
125 | size += i; | ||
126 | str = realloc(str, size); | ||
127 | if (!str) | ||
128 | die("malloc of size %d", size); | ||
129 | memcpy(str + (size - i), buf, i); | ||
130 | } else { | ||
131 | size = i; | ||
132 | str = malloc_or_die(i); | ||
133 | memcpy(str, buf, i); | ||
134 | } | 144 | } |
135 | 145 | ||
146 | if (calc_data_size) | ||
147 | calc_data_size += size; | ||
148 | |||
149 | str = malloc_or_die(size); | ||
150 | memcpy(str, buf, size); | ||
151 | |||
136 | return str; | 152 | return str; |
137 | } | 153 | } |
138 | 154 | ||
@@ -174,7 +190,6 @@ static void read_ftrace_printk(void) | |||
174 | static void read_header_files(void) | 190 | static void read_header_files(void) |
175 | { | 191 | { |
176 | unsigned long long size; | 192 | unsigned long long size; |
177 | char *header_page; | ||
178 | char *header_event; | 193 | char *header_event; |
179 | char buf[BUFSIZ]; | 194 | char buf[BUFSIZ]; |
180 | 195 | ||
@@ -184,10 +199,7 @@ static void read_header_files(void) | |||
184 | die("did not read header page"); | 199 | die("did not read header page"); |
185 | 200 | ||
186 | size = read8(); | 201 | size = read8(); |
187 | header_page = malloc_or_die(size); | 202 | skip(size); |
188 | read_or_die(header_page, size); | ||
189 | parse_header_page(header_page, size); | ||
190 | free(header_page); | ||
191 | 203 | ||
192 | /* | 204 | /* |
193 | * The size field in the page is of type long, | 205 | * The size field in the page is of type long, |
@@ -459,7 +471,7 @@ struct record *trace_read_data(int cpu) | |||
459 | return data; | 471 | return data; |
460 | } | 472 | } |
461 | 473 | ||
462 | void trace_report(int fd) | 474 | ssize_t trace_report(int fd, bool __repipe) |
463 | { | 475 | { |
464 | char buf[BUFSIZ]; | 476 | char buf[BUFSIZ]; |
465 | char test[] = { 23, 8, 68 }; | 477 | char test[] = { 23, 8, 68 }; |
@@ -467,6 +479,10 @@ void trace_report(int fd) | |||
467 | int show_version = 0; | 479 | int show_version = 0; |
468 | int show_funcs = 0; | 480 | int show_funcs = 0; |
469 | int show_printk = 0; | 481 | int show_printk = 0; |
482 | ssize_t size; | ||
483 | |||
484 | calc_data_size = 1; | ||
485 | repipe = __repipe; | ||
470 | 486 | ||
471 | input_fd = fd; | 487 | input_fd = fd; |
472 | 488 | ||
@@ -499,14 +515,18 @@ void trace_report(int fd) | |||
499 | read_proc_kallsyms(); | 515 | read_proc_kallsyms(); |
500 | read_ftrace_printk(); | 516 | read_ftrace_printk(); |
501 | 517 | ||
518 | size = calc_data_size - 1; | ||
519 | calc_data_size = 0; | ||
520 | repipe = false; | ||
521 | |||
502 | if (show_funcs) { | 522 | if (show_funcs) { |
503 | print_funcs(); | 523 | print_funcs(); |
504 | return; | 524 | return size; |
505 | } | 525 | } |
506 | if (show_printk) { | 526 | if (show_printk) { |
507 | print_printk(); | 527 | print_printk(); |
508 | return; | 528 | return size; |
509 | } | 529 | } |
510 | 530 | ||
511 | return; | 531 | return size; |
512 | } | 532 | } |
diff --git a/tools/perf/util/trace-event.h b/tools/perf/util/trace-event.h index c3269b937db4..406d452956db 100644 --- a/tools/perf/util/trace-event.h +++ b/tools/perf/util/trace-event.h | |||
@@ -1,6 +1,7 @@ | |||
1 | #ifndef __PERF_TRACE_EVENTS_H | 1 | #ifndef __PERF_TRACE_EVENTS_H |
2 | #define __PERF_TRACE_EVENTS_H | 2 | #define __PERF_TRACE_EVENTS_H |
3 | 3 | ||
4 | #include <stdbool.h> | ||
4 | #include "parse-events.h" | 5 | #include "parse-events.h" |
5 | 6 | ||
6 | #define __unused __attribute__((unused)) | 7 | #define __unused __attribute__((unused)) |
@@ -162,7 +163,7 @@ struct record *trace_read_data(int cpu); | |||
162 | 163 | ||
163 | void parse_set_info(int nr_cpus, int long_sz); | 164 | void parse_set_info(int nr_cpus, int long_sz); |
164 | 165 | ||
165 | void trace_report(int fd); | 166 | ssize_t trace_report(int fd, bool repipe); |
166 | 167 | ||
167 | void *malloc_or_die(unsigned int size); | 168 | void *malloc_or_die(unsigned int size); |
168 | 169 | ||
@@ -241,9 +242,8 @@ extern int header_page_size_size; | |||
241 | extern int header_page_data_offset; | 242 | extern int header_page_data_offset; |
242 | extern int header_page_data_size; | 243 | extern int header_page_data_size; |
243 | 244 | ||
244 | extern int latency_format; | 245 | extern bool latency_format; |
245 | 246 | ||
246 | int parse_header_page(char *buf, unsigned long size); | ||
247 | int trace_parse_common_type(void *data); | 247 | int trace_parse_common_type(void *data); |
248 | int trace_parse_common_pid(void *data); | 248 | int trace_parse_common_pid(void *data); |
249 | int parse_common_pc(void *data); | 249 | int parse_common_pc(void *data); |
@@ -258,6 +258,8 @@ void *raw_field_ptr(struct event *event, const char *name, void *data); | |||
258 | unsigned long long eval_flag(const char *flag); | 258 | unsigned long long eval_flag(const char *flag); |
259 | 259 | ||
260 | int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events); | 260 | int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events); |
261 | ssize_t read_tracing_data_size(int fd, struct perf_event_attr *pattrs, | ||
262 | int nb_events); | ||
261 | 263 | ||
262 | /* taken from kernel/trace/trace.h */ | 264 | /* taken from kernel/trace/trace.h */ |
263 | enum trace_flag_type { | 265 | enum trace_flag_type { |
diff --git a/tools/perf/util/util.c b/tools/perf/util/util.c index f9b890fde681..214265674ddd 100644 --- a/tools/perf/util/util.c +++ b/tools/perf/util/util.c | |||
@@ -92,3 +92,25 @@ out_close_from: | |||
92 | out: | 92 | out: |
93 | return err; | 93 | return err; |
94 | } | 94 | } |
95 | |||
96 | unsigned long convert_unit(unsigned long value, char *unit) | ||
97 | { | ||
98 | *unit = ' '; | ||
99 | |||
100 | if (value > 1000) { | ||
101 | value /= 1000; | ||
102 | *unit = 'K'; | ||
103 | } | ||
104 | |||
105 | if (value > 1000) { | ||
106 | value /= 1000; | ||
107 | *unit = 'M'; | ||
108 | } | ||
109 | |||
110 | if (value > 1000) { | ||
111 | value /= 1000; | ||
112 | *unit = 'G'; | ||
113 | } | ||
114 | |||
115 | return value; | ||
116 | } | ||
diff --git a/tools/perf/util/util.h b/tools/perf/util/util.h index 0f5b2a6f1080..0795bf304b19 100644 --- a/tools/perf/util/util.h +++ b/tools/perf/util/util.h | |||
@@ -42,12 +42,14 @@ | |||
42 | #define _ALL_SOURCE 1 | 42 | #define _ALL_SOURCE 1 |
43 | #define _GNU_SOURCE 1 | 43 | #define _GNU_SOURCE 1 |
44 | #define _BSD_SOURCE 1 | 44 | #define _BSD_SOURCE 1 |
45 | #define HAS_BOOL | ||
45 | 46 | ||
46 | #include <unistd.h> | 47 | #include <unistd.h> |
47 | #include <stdio.h> | 48 | #include <stdio.h> |
48 | #include <sys/stat.h> | 49 | #include <sys/stat.h> |
49 | #include <sys/statfs.h> | 50 | #include <sys/statfs.h> |
50 | #include <fcntl.h> | 51 | #include <fcntl.h> |
52 | #include <stdbool.h> | ||
51 | #include <stddef.h> | 53 | #include <stddef.h> |
52 | #include <stdlib.h> | 54 | #include <stdlib.h> |
53 | #include <stdarg.h> | 55 | #include <stdarg.h> |
@@ -78,6 +80,7 @@ | |||
78 | #include <pwd.h> | 80 | #include <pwd.h> |
79 | #include <inttypes.h> | 81 | #include <inttypes.h> |
80 | #include "../../../include/linux/magic.h" | 82 | #include "../../../include/linux/magic.h" |
83 | #include "types.h" | ||
81 | 84 | ||
82 | 85 | ||
83 | #ifndef NO_ICONV | 86 | #ifndef NO_ICONV |
@@ -295,6 +298,13 @@ extern void *xmemdupz(const void *data, size_t len); | |||
295 | extern char *xstrndup(const char *str, size_t len); | 298 | extern char *xstrndup(const char *str, size_t len); |
296 | extern void *xrealloc(void *ptr, size_t size) __attribute__((weak)); | 299 | extern void *xrealloc(void *ptr, size_t size) __attribute__((weak)); |
297 | 300 | ||
301 | static inline void *xzalloc(size_t size) | ||
302 | { | ||
303 | void *buf = xmalloc(size); | ||
304 | |||
305 | return memset(buf, 0, size); | ||
306 | } | ||
307 | |||
298 | static inline void *zalloc(size_t size) | 308 | static inline void *zalloc(size_t size) |
299 | { | 309 | { |
300 | return calloc(1, size); | 310 | return calloc(1, size); |
@@ -309,6 +319,7 @@ static inline int has_extension(const char *filename, const char *ext) | |||
309 | { | 319 | { |
310 | size_t len = strlen(filename); | 320 | size_t len = strlen(filename); |
311 | size_t extlen = strlen(ext); | 321 | size_t extlen = strlen(ext); |
322 | |||
312 | return len > extlen && !memcmp(filename + len - extlen, ext, extlen); | 323 | return len > extlen && !memcmp(filename + len - extlen, ext, extlen); |
313 | } | 324 | } |
314 | 325 | ||
@@ -322,6 +333,7 @@ static inline int has_extension(const char *filename, const char *ext) | |||
322 | #undef isalnum | 333 | #undef isalnum |
323 | #undef tolower | 334 | #undef tolower |
324 | #undef toupper | 335 | #undef toupper |
336 | |||
325 | extern unsigned char sane_ctype[256]; | 337 | extern unsigned char sane_ctype[256]; |
326 | #define GIT_SPACE 0x01 | 338 | #define GIT_SPACE 0x01 |
327 | #define GIT_DIGIT 0x02 | 339 | #define GIT_DIGIT 0x02 |
@@ -406,4 +418,14 @@ void git_qsort(void *base, size_t nmemb, size_t size, | |||
406 | int mkdir_p(char *path, mode_t mode); | 418 | int mkdir_p(char *path, mode_t mode); |
407 | int copyfile(const char *from, const char *to); | 419 | int copyfile(const char *from, const char *to); |
408 | 420 | ||
421 | s64 perf_atoll(const char *str); | ||
422 | char **argv_split(const char *str, int *argcp); | ||
423 | void argv_free(char **argv); | ||
424 | bool strglobmatch(const char *str, const char *pat); | ||
425 | bool strlazymatch(const char *str, const char *pat); | ||
426 | unsigned long convert_unit(unsigned long value, char *unit); | ||
427 | |||
428 | #define _STR(x) #x | ||
429 | #define STR(x) _STR(x) | ||
430 | |||
409 | #endif | 431 | #endif |